{"train/loss": 4.3897, "train/learning_rate": 0.00026639999999999997, "train/epoch": 1.0, "train/global_step": 446, "_runtime": 6612, "_timestamp": 1646235748, "_step": 447, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 7.0, 20.0, 25.0, 40.0, 85.0, 103.0, 116.0, 150.0, 136.0, 129.0, 87.0, 53.0, 29.0, 11.0, 12.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.08663558959961, -22.38998794555664, -21.69333839416504, -20.99669075012207, -20.30004119873047, -19.6033935546875, -18.90674591064453, -18.21009635925293, -17.513446807861328, -16.81679916381836, -16.120149612426758, -15.423501968383789, -14.726852416992188, -14.030204772949219, -13.333556175231934, -12.636907577514648, -11.94025993347168, -11.243611335754395, -10.54696273803711, -9.85031509399414, -9.153665542602539, -8.45701789855957, -7.760369300842285, -7.063720703125, -6.367072105407715, -5.67042350769043, -4.9737749099731445, -4.277126789093018, -3.5804781913757324, -2.8838295936584473, -2.1871814727783203, -1.4905328750610352, -0.79388427734375, -0.0972357988357544, 0.5994126796722412, 1.2960610389709473, 1.9927096366882324, 2.6893582344055176, 3.3860063552856445, 4.08265495300293, 4.779303550720215, 5.4759521484375, 6.172600746154785, 6.869248867034912, 7.565897464752197, 8.26254653930664, 8.95919418334961, 9.655842781066895, 10.35249137878418, 11.049139976501465, 11.74578857421875, 12.442436218261719, 13.13908576965332, 13.835733413696289, 14.532382011413574, 15.22903060913086, 15.925679206848145, 16.62232780456543, 17.3189754486084, 18.015625, 18.71227264404297, 19.40892219543457, 20.10556983947754, 20.80221939086914, 21.49886703491211]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 6.0, 7.0, 7.0, 8.0, 8.0, 15.0, 8.0, 13.0, 23.0, 20.0, 24.0, 30.0, 17.0, 32.0, 25.0, 39.0, 40.0, 29.0, 37.0, 45.0, 49.0, 52.0, 40.0, 40.0, 42.0, 29.0, 37.0, 29.0, 36.0, 26.0, 26.0, 23.0, 21.0, 18.0, 17.0, 11.0, 15.0, 11.0, 8.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-31.706920623779297, -30.750709533691406, -29.794498443603516, -28.838287353515625, -27.882076263427734, -26.925865173339844, -25.969655990600586, -25.013444900512695, -24.057233810424805, -23.101022720336914, -22.144811630249023, -21.188600540161133, -20.232391357421875, -19.276180267333984, -18.319969177246094, -17.363758087158203, -16.407546997070312, -15.451335906982422, -14.495124816894531, -13.538914680480957, -12.582703590393066, -11.626492500305176, -10.670282363891602, -9.714071273803711, -8.75786018371582, -7.80164909362793, -6.845438480377197, -5.889227867126465, -4.933016777038574, -3.9768056869506836, -3.020595073699951, -2.0643844604492188, -1.1081714630126953, -0.1519606113433838, 0.8042502403259277, 1.7604610919952393, 2.716671943664551, 3.6728830337524414, 4.629093647003174, 5.585304260253906, 6.541515350341797, 7.4977264404296875, 8.453937530517578, 9.410147666931152, 10.366358757019043, 11.322569847106934, 12.278779983520508, 13.234991073608398, 14.191202163696289, 15.14741325378418, 16.10362434387207, 17.05983543395996, 18.01604461669922, 18.97225570678711, 19.928466796875, 20.88467788696289, 21.84088897705078, 22.797100067138672, 23.753311157226562, 24.709522247314453, 25.665733337402344, 26.621944427490234, 27.578153610229492, 28.534364700317383, 29.490575790405273]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 8.0, 7.0, 5.0, 12.0, 11.0, 14.0, 21.0, 13.0, 19.0, 19.0, 26.0, 22.0, 23.0, 36.0, 45.0, 32.0, 33.0, 39.0, 43.0, 28.0, 47.0, 49.0, 52.0, 48.0, 34.0, 36.0, 35.0, 34.0, 26.0, 25.0, 21.0, 18.0, 18.0, 19.0, 17.0, 7.0, 12.0, 9.0, 9.0, 4.0, 3.0, 2.0, 5.0, 4.0, 3.0, 0.0, 1.0, 2.0, 2.0], "bins": [-0.98779296875, -0.9596405029296875, -0.931488037109375, -0.9033355712890625, -0.87518310546875, -0.8470306396484375, -0.818878173828125, -0.7907257080078125, -0.7625732421875, -0.7344207763671875, -0.706268310546875, -0.6781158447265625, -0.64996337890625, -0.6218109130859375, -0.593658447265625, -0.5655059814453125, -0.537353515625, -0.5092010498046875, -0.481048583984375, -0.4528961181640625, -0.42474365234375, -0.3965911865234375, -0.368438720703125, -0.3402862548828125, -0.3121337890625, -0.2839813232421875, -0.255828857421875, -0.2276763916015625, -0.19952392578125, -0.1713714599609375, -0.143218994140625, -0.1150665283203125, -0.0869140625, -0.0587615966796875, -0.030609130859375, -0.0024566650390625, 0.02569580078125, 0.0538482666015625, 0.082000732421875, 0.1101531982421875, 0.1383056640625, 0.1664581298828125, 0.194610595703125, 0.2227630615234375, 0.25091552734375, 0.2790679931640625, 0.307220458984375, 0.3353729248046875, 0.363525390625, 0.3916778564453125, 0.419830322265625, 0.4479827880859375, 0.47613525390625, 0.5042877197265625, 0.532440185546875, 0.5605926513671875, 0.5887451171875, 0.6168975830078125, 0.645050048828125, 0.6732025146484375, 0.70135498046875, 0.7295074462890625, 0.757659912109375, 0.7858123779296875, 0.81396484375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 5.0, 7.0, 3.0, 7.0, 10.0, 7.0, 15.0, 23.0, 30.0, 21.0, 33.0, 51.0, 65.0, 93.0, 112.0, 173.0, 210.0, 272.0, 401.0, 612.0, 947.0, 1674.0, 3295.0, 9658.0, 48150.0, 904712.0, 3084689.0, 112324.0, 16356.0, 4712.0, 1965.0, 1166.0, 782.0, 482.0, 359.0, 247.0, 156.0, 126.0, 73.0, 61.0, 57.0, 40.0, 25.0, 20.0, 14.0, 15.0, 9.0, 9.0, 6.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0], "bins": [-6.80078125, -6.60186767578125, -6.4029541015625, -6.20404052734375, -6.005126953125, -5.80621337890625, -5.6072998046875, -5.40838623046875, -5.20947265625, -5.01055908203125, -4.8116455078125, -4.61273193359375, -4.413818359375, -4.21490478515625, -4.0159912109375, -3.81707763671875, -3.6181640625, -3.41925048828125, -3.2203369140625, -3.02142333984375, -2.822509765625, -2.62359619140625, -2.4246826171875, -2.22576904296875, -2.02685546875, -1.82794189453125, -1.6290283203125, -1.43011474609375, -1.231201171875, -1.03228759765625, -0.8333740234375, -0.63446044921875, -0.435546875, -0.23663330078125, -0.0377197265625, 0.16119384765625, 0.360107421875, 0.55902099609375, 0.7579345703125, 0.95684814453125, 1.15576171875, 1.35467529296875, 1.5535888671875, 1.75250244140625, 1.951416015625, 2.15032958984375, 2.3492431640625, 2.54815673828125, 2.7470703125, 2.94598388671875, 3.1448974609375, 3.34381103515625, 3.542724609375, 3.74163818359375, 3.9405517578125, 4.13946533203125, 4.33837890625, 4.53729248046875, 4.7362060546875, 4.93511962890625, 5.134033203125, 5.33294677734375, 5.5318603515625, 5.73077392578125, 5.9296875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 8.0, 16.0, 19.0, 71.0, 133.0, 482.0, 1370.0, 1223.0, 434.0, 176.0, 75.0, 30.0, 23.0, 9.0, 11.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.75, -11.39306640625, -11.0361328125, -10.67919921875, -10.322265625, -9.96533203125, -9.6083984375, -9.25146484375, -8.89453125, -8.53759765625, -8.1806640625, -7.82373046875, -7.466796875, -7.10986328125, -6.7529296875, -6.39599609375, -6.0390625, -5.68212890625, -5.3251953125, -4.96826171875, -4.611328125, -4.25439453125, -3.8974609375, -3.54052734375, -3.18359375, -2.82666015625, -2.4697265625, -2.11279296875, -1.755859375, -1.39892578125, -1.0419921875, -0.68505859375, -0.328125, 0.02880859375, 0.3857421875, 0.74267578125, 1.099609375, 1.45654296875, 1.8134765625, 2.17041015625, 2.52734375, 2.88427734375, 3.2412109375, 3.59814453125, 3.955078125, 4.31201171875, 4.6689453125, 5.02587890625, 5.3828125, 5.73974609375, 6.0966796875, 6.45361328125, 6.810546875, 7.16748046875, 7.5244140625, 7.88134765625, 8.23828125, 8.59521484375, 8.9521484375, 9.30908203125, 9.666015625, 10.02294921875, 10.3798828125, 10.73681640625, 11.09375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 4.0, 8.0, 9.0, 26.0, 49.0, 85.0, 238.0, 697.0, 3302.0, 1963006.0, 2222055.0, 3558.0, 775.0, 262.0, 90.0, 61.0, 29.0, 21.0, 12.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-33.09375, -32.091064453125, -31.08837890625, -30.085693359375, -29.0830078125, -28.080322265625, -27.07763671875, -26.074951171875, -25.072265625, -24.069580078125, -23.06689453125, -22.064208984375, -21.0615234375, -20.058837890625, -19.05615234375, -18.053466796875, -17.05078125, -16.048095703125, -15.04541015625, -14.042724609375, -13.0400390625, -12.037353515625, -11.03466796875, -10.031982421875, -9.029296875, -8.026611328125, -7.02392578125, -6.021240234375, -5.0185546875, -4.015869140625, -3.01318359375, -2.010498046875, -1.0078125, -0.005126953125, 0.99755859375, 2.000244140625, 3.0029296875, 4.005615234375, 5.00830078125, 6.010986328125, 7.013671875, 8.016357421875, 9.01904296875, 10.021728515625, 11.0244140625, 12.027099609375, 13.02978515625, 14.032470703125, 15.03515625, 16.037841796875, 17.04052734375, 18.043212890625, 19.0458984375, 20.048583984375, 21.05126953125, 22.053955078125, 23.056640625, 24.059326171875, 25.06201171875, 26.064697265625, 27.0673828125, 28.070068359375, 29.07275390625, 30.075439453125, 31.078125]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 6.0, 234.0, 684.0, 86.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.84878540039062, -140.8623046875, -137.87582397460938, -134.8893585205078, -131.9028778076172, -128.91639709472656, -125.92992401123047, -122.94345092773438, -119.95697021484375, -116.97048950195312, -113.98401641845703, -110.99754333496094, -108.01106262207031, -105.02458190917969, -102.0381088256836, -99.0516357421875, -96.06515502929688, -93.07867431640625, -90.09220123291016, -87.10572814941406, -84.11924743652344, -81.13276672363281, -78.14629364013672, -75.15982055664062, -72.17333984375, -69.18685913085938, -66.20038604736328, -63.21390914916992, -60.22743225097656, -57.2409553527832, -54.254478454589844, -51.268001556396484, -48.281517028808594, -45.295040130615234, -42.308563232421875, -39.322086334228516, -36.335609436035156, -33.3491325378418, -30.362655639648438, -27.376178741455078, -24.38970184326172, -21.40322494506836, -18.416748046875, -15.43027114868164, -12.443794250488281, -9.457317352294922, -6.4708404541015625, -3.484363555908203, -0.49788665771484375, 2.4885902404785156, 5.475067138671875, 8.461544036865234, 11.448020935058594, 14.434497833251953, 17.420974731445312, 20.407451629638672, 23.39392852783203, 26.38040542602539, 29.36688232421875, 32.35335922241211, 35.33983612060547, 38.32631301879883, 41.31278991699219, 44.29926681518555, 47.285743713378906]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 4.0, 4.0, 12.0, 5.0, 13.0, 19.0, 29.0, 25.0, 30.0, 21.0, 33.0, 32.0, 32.0, 38.0, 58.0, 41.0, 53.0, 58.0, 66.0, 54.0, 46.0, 49.0, 43.0, 33.0, 35.0, 29.0, 39.0, 17.0, 28.0, 11.0, 12.0, 14.0, 8.0, 5.0, 6.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-30.013214111328125, -29.287200927734375, -28.561187744140625, -27.835174560546875, -27.109161376953125, -26.383148193359375, -25.657135009765625, -24.931123733520508, -24.205110549926758, -23.479097366333008, -22.753084182739258, -22.027070999145508, -21.301057815551758, -20.57504653930664, -19.84903335571289, -19.12302017211914, -18.39700698852539, -17.67099380493164, -16.94498062133789, -16.21896743774414, -15.492955207824707, -14.766942024230957, -14.040928840637207, -13.314916610717773, -12.58890151977539, -11.86288833618164, -11.13687515258789, -10.41086196899414, -9.684849739074707, -8.958836555480957, -8.232823371887207, -7.506810665130615, -6.780797958374023, -6.054784774780273, -5.328772068023682, -4.602758884429932, -3.8767459392547607, -3.15073299407959, -2.42471981048584, -1.698707103729248, -0.972693920135498, -0.24668091535568237, 0.4793320894241333, 1.2053451538085938, 1.9313580989837646, 2.6573710441589355, 3.3833842277526855, 4.109396934509277, 4.835410118103027, 5.561423301696777, 6.287436008453369, 7.013449192047119, 7.739461898803711, 8.465475082397461, 9.191488265991211, 9.917501449584961, 10.643514633178711, 11.369527816772461, 12.095541000366211, 12.821554183959961, 13.547566413879395, 14.273579597473145, 14.999592781066895, 15.725605010986328, 16.451618194580078]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 6.0, 5.0, 5.0, 3.0, 7.0, 8.0, 8.0, 17.0, 12.0, 18.0, 20.0, 21.0, 19.0, 21.0, 22.0, 42.0, 20.0, 26.0, 29.0, 28.0, 34.0, 28.0, 36.0, 46.0, 43.0, 56.0, 41.0, 51.0, 32.0, 31.0, 26.0, 31.0, 32.0, 26.0, 19.0, 15.0, 15.0, 17.0, 10.0, 12.0, 11.0, 9.0, 14.0, 6.0, 10.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.96337890625, -0.9356231689453125, -0.907867431640625, -0.8801116943359375, -0.85235595703125, -0.8246002197265625, -0.796844482421875, -0.7690887451171875, -0.7413330078125, -0.7135772705078125, -0.685821533203125, -0.6580657958984375, -0.63031005859375, -0.6025543212890625, -0.574798583984375, -0.5470428466796875, -0.519287109375, -0.4915313720703125, -0.463775634765625, -0.4360198974609375, -0.40826416015625, -0.3805084228515625, -0.352752685546875, -0.3249969482421875, -0.2972412109375, -0.2694854736328125, -0.241729736328125, -0.2139739990234375, -0.18621826171875, -0.1584625244140625, -0.130706787109375, -0.1029510498046875, -0.0751953125, -0.0474395751953125, -0.019683837890625, 0.0080718994140625, 0.03582763671875, 0.0635833740234375, 0.091339111328125, 0.1190948486328125, 0.1468505859375, 0.1746063232421875, 0.202362060546875, 0.2301177978515625, 0.25787353515625, 0.2856292724609375, 0.313385009765625, 0.3411407470703125, 0.368896484375, 0.3966522216796875, 0.424407958984375, 0.4521636962890625, 0.47991943359375, 0.5076751708984375, 0.535430908203125, 0.5631866455078125, 0.5909423828125, 0.6186981201171875, 0.646453857421875, 0.6742095947265625, 0.70196533203125, 0.7297210693359375, 0.757476806640625, 0.7852325439453125, 0.81298828125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 6.0, 5.0, 14.0, 16.0, 21.0, 37.0, 62.0, 84.0, 125.0, 170.0, 250.0, 325.0, 509.0, 680.0, 986.0, 1521.0, 2183.0, 3323.0, 4898.0, 7065.0, 10498.0, 15628.0, 23352.0, 35008.0, 51847.0, 76099.0, 109762.0, 144748.0, 156829.0, 125585.0, 89842.0, 60739.0, 41226.0, 27485.0, 18486.0, 12612.0, 8383.0, 5779.0, 3891.0, 2613.0, 1893.0, 1291.0, 871.0, 566.0, 412.0, 267.0, 172.0, 133.0, 97.0, 56.0, 45.0, 28.0, 15.0, 15.0, 7.0, 1.0, 7.0, 0.0, 0.0, 2.0], "bins": [-0.064208984375, -0.06221580505371094, -0.060222625732421875, -0.05822944641113281, -0.05623626708984375, -0.05424308776855469, -0.052249908447265625, -0.05025672912597656, -0.0482635498046875, -0.04627037048339844, -0.044277191162109375, -0.04228401184082031, -0.04029083251953125, -0.03829765319824219, -0.036304473876953125, -0.03431129455566406, -0.032318115234375, -0.030324935913085938, -0.028331756591796875, -0.026338577270507812, -0.02434539794921875, -0.022352218627929688, -0.020359039306640625, -0.018365859985351562, -0.0163726806640625, -0.014379501342773438, -0.012386322021484375, -0.010393142700195312, -0.00839996337890625, -0.0064067840576171875, -0.004413604736328125, -0.0024204254150390625, -0.00042724609375, 0.0015659332275390625, 0.003559112548828125, 0.0055522918701171875, 0.00754547119140625, 0.009538650512695312, 0.011531829833984375, 0.013525009155273438, 0.0155181884765625, 0.017511367797851562, 0.019504547119140625, 0.021497726440429688, 0.02349090576171875, 0.025484085083007812, 0.027477264404296875, 0.029470443725585938, 0.031463623046875, 0.03345680236816406, 0.035449981689453125, 0.03744316101074219, 0.03943634033203125, 0.04142951965332031, 0.043422698974609375, 0.04541587829589844, 0.0474090576171875, 0.04940223693847656, 0.051395416259765625, 0.05338859558105469, 0.05538177490234375, 0.05737495422363281, 0.059368133544921875, 0.06136131286621094, 0.0633544921875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 7.0, 1.0, 6.0, 5.0, 7.0, 7.0, 7.0, 6.0, 13.0, 11.0, 12.0, 18.0, 22.0, 22.0, 16.0, 25.0, 25.0, 22.0, 32.0, 25.0, 35.0, 33.0, 47.0, 41.0, 42.0, 1057.0, 37.0, 38.0, 30.0, 53.0, 27.0, 22.0, 44.0, 22.0, 25.0, 23.0, 24.0, 22.0, 22.0, 18.0, 16.0, 5.0, 6.0, 14.0, 10.0, 2.0, 7.0, 6.0, 7.0, 4.0, 3.0, 4.0, 0.0, 3.0], "bins": [-0.7802734375, -0.7579879760742188, -0.7357025146484375, -0.7134170532226562, -0.691131591796875, -0.6688461303710938, -0.6465606689453125, -0.6242752075195312, -0.60198974609375, -0.5797042846679688, -0.5574188232421875, -0.5351333618164062, -0.512847900390625, -0.49056243896484375, -0.4682769775390625, -0.44599151611328125, -0.4237060546875, -0.40142059326171875, -0.3791351318359375, -0.35684967041015625, -0.334564208984375, -0.31227874755859375, -0.2899932861328125, -0.26770782470703125, -0.24542236328125, -0.22313690185546875, -0.2008514404296875, -0.17856597900390625, -0.156280517578125, -0.13399505615234375, -0.1117095947265625, -0.08942413330078125, -0.067138671875, -0.04485321044921875, -0.0225677490234375, -0.00028228759765625, 0.022003173828125, 0.04428863525390625, 0.0665740966796875, 0.08885955810546875, 0.11114501953125, 0.13343048095703125, 0.1557159423828125, 0.17800140380859375, 0.200286865234375, 0.22257232666015625, 0.2448577880859375, 0.26714324951171875, 0.2894287109375, 0.31171417236328125, 0.3339996337890625, 0.35628509521484375, 0.378570556640625, 0.40085601806640625, 0.4231414794921875, 0.44542694091796875, 0.46771240234375, 0.48999786376953125, 0.5122833251953125, 0.5345687866210938, 0.556854248046875, 0.5791397094726562, 0.6014251708984375, 0.6237106323242188, 0.64599609375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 7.0, 11.0, 17.0, 22.0, 34.0, 36.0, 68.0, 112.0, 158.0, 253.0, 414.0, 617.0, 931.0, 1476.0, 2288.0, 3694.0, 5966.0, 9580.0, 15669.0, 25857.0, 41608.0, 66345.0, 104533.0, 151878.0, 1221953.0, 155576.0, 107062.0, 68455.0, 43010.0, 26597.0, 16145.0, 10081.0, 6111.0, 3826.0, 2459.0, 1496.0, 978.0, 629.0, 393.0, 259.0, 181.0, 111.0, 103.0, 54.0, 33.0, 19.0, 11.0, 6.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.050628662109375, -0.049118995666503906, -0.04760932922363281, -0.04609966278076172, -0.044589996337890625, -0.04308032989501953, -0.04157066345214844, -0.040060997009277344, -0.03855133056640625, -0.037041664123535156, -0.03553199768066406, -0.03402233123779297, -0.032512664794921875, -0.03100299835205078, -0.029493331909179688, -0.027983665466308594, -0.0264739990234375, -0.024964332580566406, -0.023454666137695312, -0.02194499969482422, -0.020435333251953125, -0.01892566680908203, -0.017416000366210938, -0.015906333923339844, -0.01439666748046875, -0.012887001037597656, -0.011377334594726562, -0.009867668151855469, -0.008358001708984375, -0.006848335266113281, -0.0053386688232421875, -0.0038290023803710938, -0.0023193359375, -0.0008096694946289062, 0.0006999969482421875, 0.0022096633911132812, 0.003719329833984375, 0.005228996276855469, 0.0067386627197265625, 0.008248329162597656, 0.00975799560546875, 0.011267662048339844, 0.012777328491210938, 0.014286994934082031, 0.015796661376953125, 0.01730632781982422, 0.018815994262695312, 0.020325660705566406, 0.0218353271484375, 0.023344993591308594, 0.024854660034179688, 0.02636432647705078, 0.027873992919921875, 0.02938365936279297, 0.030893325805664062, 0.032402992248535156, 0.03391265869140625, 0.035422325134277344, 0.03693199157714844, 0.03844165802001953, 0.039951324462890625, 0.04146099090576172, 0.04297065734863281, 0.044480323791503906, 0.045989990234375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 2.0, 0.0, 13.0, 11.0, 5.0, 7.0, 6.0, 11.0, 25.0, 22.0, 27.0, 24.0, 34.0, 45.0, 63.0, 59.0, 73.0, 73.0, 80.0, 72.0, 46.0, 57.0, 45.0, 44.0, 30.0, 28.0, 16.0, 22.0, 12.0, 8.0, 12.0, 5.0, 5.0, 3.0, 8.0, 1.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.003124237060546875, -0.003028184175491333, -0.002932131290435791, -0.002836078405380249, -0.002740025520324707, -0.002643972635269165, -0.002547919750213623, -0.002451866865158081, -0.002355813980102539, -0.002259761095046997, -0.002163708209991455, -0.002067655324935913, -0.001971602439880371, -0.001875549554824829, -0.0017794966697692871, -0.0016834437847137451, -0.0015873908996582031, -0.0014913380146026611, -0.0013952851295471191, -0.0012992322444915771, -0.0012031793594360352, -0.0011071264743804932, -0.0010110735893249512, -0.0009150207042694092, -0.0008189678192138672, -0.0007229149341583252, -0.0006268620491027832, -0.0005308091640472412, -0.0004347562789916992, -0.0003387033939361572, -0.00024265050888061523, -0.00014659762382507324, -5.054473876953125e-05, 4.550814628601074e-05, 0.00014156103134155273, 0.00023761391639709473, 0.0003336668014526367, 0.0004297196865081787, 0.0005257725715637207, 0.0006218254566192627, 0.0007178783416748047, 0.0008139312267303467, 0.0009099841117858887, 0.0010060369968414307, 0.0011020898818969727, 0.0011981427669525146, 0.0012941956520080566, 0.0013902485370635986, 0.0014863014221191406, 0.0015823543071746826, 0.0016784071922302246, 0.0017744600772857666, 0.0018705129623413086, 0.0019665658473968506, 0.0020626187324523926, 0.0021586716175079346, 0.0022547245025634766, 0.0023507773876190186, 0.0024468302726745605, 0.0025428831577301025, 0.0026389360427856445, 0.0027349889278411865, 0.0028310418128967285, 0.0029270946979522705, 0.0030231475830078125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 11.0, 10.0, 16.0, 20.0, 18.0, 25.0, 27.0, 40.0, 49.0, 77.0, 85.0, 96.0, 140.0, 184.0, 233.0, 303.0, 642.0, 64940.0, 979282.0, 944.0, 352.0, 231.0, 201.0, 115.0, 108.0, 75.0, 62.0, 60.0, 44.0, 31.0, 23.0, 21.0, 18.0, 13.0, 14.0, 13.0, 5.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.052001953125, -0.050332069396972656, -0.04866218566894531, -0.04699230194091797, -0.045322418212890625, -0.04365253448486328, -0.04198265075683594, -0.040312767028808594, -0.03864288330078125, -0.036972999572753906, -0.03530311584472656, -0.03363323211669922, -0.031963348388671875, -0.03029346466064453, -0.028623580932617188, -0.026953697204589844, -0.0252838134765625, -0.023613929748535156, -0.021944046020507812, -0.02027416229248047, -0.018604278564453125, -0.01693439483642578, -0.015264511108398438, -0.013594627380371094, -0.01192474365234375, -0.010254859924316406, -0.008584976196289062, -0.006915092468261719, -0.005245208740234375, -0.0035753250122070312, -0.0019054412841796875, -0.00023555755615234375, 0.001434326171875, 0.0031042098999023438, 0.0047740936279296875, 0.006443977355957031, 0.008113861083984375, 0.009783744812011719, 0.011453628540039062, 0.013123512268066406, 0.01479339599609375, 0.016463279724121094, 0.018133163452148438, 0.01980304718017578, 0.021472930908203125, 0.02314281463623047, 0.024812698364257812, 0.026482582092285156, 0.0281524658203125, 0.029822349548339844, 0.03149223327636719, 0.03316211700439453, 0.034832000732421875, 0.03650188446044922, 0.03817176818847656, 0.039841651916503906, 0.04151153564453125, 0.043181419372558594, 0.04485130310058594, 0.04652118682861328, 0.048191070556640625, 0.04986095428466797, 0.05153083801269531, 0.053200721740722656, 0.05487060546875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 1006.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10752854496240616, -0.10441409051418304, -0.10129962861537933, -0.09818516671657562, -0.09507071226835251, -0.0919562578201294, -0.08884179592132568, -0.08572733402252197, -0.08261287957429886, -0.07949842512607574, -0.07638396322727203, -0.07326950132846832, -0.07015504688024521, -0.0670405924320221, -0.06392613053321838, -0.06081167235970497, -0.05769721418619156, -0.054582756012678146, -0.051468297839164734, -0.04835383966565132, -0.04523938149213791, -0.042124923318624496, -0.039010465145111084, -0.03589600697159767, -0.03278154879808426, -0.029667090624570847, -0.026552632451057434, -0.02343817427754402, -0.02032371610403061, -0.017209257930517197, -0.014094799757003784, -0.010980341583490372, -0.00786588340997696, -0.004751425236463547, -0.0016369670629501343, 0.0014774911105632782, 0.004591949284076691, 0.007706407457590103, 0.010820865631103516, 0.013935323804616928, 0.01704978197813034, 0.020164240151643753, 0.023278698325157166, 0.026393156498670578, 0.02950761467218399, 0.0326220728456974, 0.035736531019210815, 0.03885098919272423, 0.04196544736623764, 0.04507990553975105, 0.048194363713264465, 0.05130882188677788, 0.05442328006029129, 0.0575377382338047, 0.060652196407318115, 0.06376665830612183, 0.06688111275434494, 0.06999556720256805, 0.07311002910137177, 0.07622449100017548, 0.07933894544839859, 0.0824533998966217, 0.08556786179542542, 0.08868232369422913, 0.09179677814245224]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 5.0, 11.0, 14.0, 22.0, 13.0, 22.0, 40.0, 30.0, 54.0, 68.0, 62.0, 50.0, 59.0, 58.0, 66.0, 55.0, 51.0, 60.0, 53.0, 40.0, 44.0, 28.0, 24.0, 25.0, 13.0, 8.0, 12.0, 10.0, 4.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.012783646583557129, -0.012492719106376171, -0.012201791629195213, -0.011910864152014256, -0.011619936674833298, -0.01132900919765234, -0.011038081720471382, -0.010747154243290424, -0.010456226766109467, -0.010165299288928509, -0.009874371811747551, -0.009583444334566593, -0.009292516857385635, -0.009001589380204678, -0.00871066190302372, -0.008419734425842762, -0.008128806948661804, -0.007837879471480846, -0.007546951994299889, -0.007256024517118931, -0.006965097039937973, -0.006674169562757015, -0.0063832420855760574, -0.0060923146083951, -0.005801387131214142, -0.005510459654033184, -0.005219532176852226, -0.0049286046996712685, -0.004637677222490311, -0.004346749745309353, -0.004055822268128395, -0.0037648947909474373, -0.0034739673137664795, -0.0031830398365855217, -0.002892112359404564, -0.002601184882223606, -0.0023102574050426483, -0.0020193299278616905, -0.0017284024506807327, -0.001437474973499775, -0.0011465474963188171, -0.0008556200191378593, -0.0005646925419569016, -0.00027376506477594376, 1.7162412405014038e-05, 0.00030808988958597183, 0.0005990173667669296, 0.0008899448439478874, 0.0011808723211288452, 0.001471799798309803, 0.0017627272754907608, 0.0020536547526717186, 0.0023445822298526764, 0.002635509707033634, 0.002926437184214592, 0.0032173646613955498, 0.0035082921385765076, 0.0037992196157574654, 0.004090147092938423, 0.004381074570119381, 0.004672002047300339, 0.0049629295244812965, 0.005253857001662254, 0.005544784478843212, 0.00583571195602417]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 6.0, 5.0, 5.0, 3.0, 7.0, 8.0, 8.0, 17.0, 12.0, 18.0, 20.0, 21.0, 19.0, 21.0, 22.0, 42.0, 20.0, 26.0, 29.0, 28.0, 34.0, 28.0, 36.0, 46.0, 43.0, 56.0, 41.0, 51.0, 32.0, 31.0, 26.0, 31.0, 32.0, 26.0, 19.0, 15.0, 15.0, 17.0, 10.0, 12.0, 11.0, 9.0, 14.0, 6.0, 10.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-0.96337890625, -0.9356231689453125, -0.907867431640625, -0.8801116943359375, -0.85235595703125, -0.8246002197265625, -0.796844482421875, -0.7690887451171875, -0.7413330078125, -0.7135772705078125, -0.685821533203125, -0.6580657958984375, -0.63031005859375, -0.6025543212890625, -0.574798583984375, -0.5470428466796875, -0.519287109375, -0.4915313720703125, -0.463775634765625, -0.4360198974609375, -0.40826416015625, -0.3805084228515625, -0.352752685546875, -0.3249969482421875, -0.2972412109375, -0.2694854736328125, -0.241729736328125, -0.2139739990234375, -0.18621826171875, -0.1584625244140625, -0.130706787109375, -0.1029510498046875, -0.0751953125, -0.0474395751953125, -0.019683837890625, 0.0080718994140625, 0.03582763671875, 0.0635833740234375, 0.091339111328125, 0.1190948486328125, 0.1468505859375, 0.1746063232421875, 0.202362060546875, 0.2301177978515625, 0.25787353515625, 0.2856292724609375, 0.313385009765625, 0.3411407470703125, 0.368896484375, 0.3966522216796875, 0.424407958984375, 0.4521636962890625, 0.47991943359375, 0.5076751708984375, 0.535430908203125, 0.5631866455078125, 0.5909423828125, 0.6186981201171875, 0.646453857421875, 0.6742095947265625, 0.70196533203125, 0.7297210693359375, 0.757476806640625, 0.7852325439453125, 0.81298828125]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 10.0, 4.0, 9.0, 11.0, 17.0, 23.0, 33.0, 42.0, 47.0, 89.0, 84.0, 119.0, 177.0, 243.0, 303.0, 436.0, 581.0, 850.0, 1248.0, 2008.0, 3235.0, 5561.0, 9989.0, 20657.0, 51473.0, 157371.0, 409026.0, 247527.0, 77142.0, 28718.0, 13318.0, 6972.0, 3845.0, 2368.0, 1501.0, 1041.0, 673.0, 472.0, 307.0, 247.0, 172.0, 151.0, 109.0, 78.0, 70.0, 54.0, 47.0, 30.0, 21.0, 21.0, 12.0, 10.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-3.265625, -3.168701171875, -3.07177734375, -2.974853515625, -2.8779296875, -2.781005859375, -2.68408203125, -2.587158203125, -2.490234375, -2.393310546875, -2.29638671875, -2.199462890625, -2.1025390625, -2.005615234375, -1.90869140625, -1.811767578125, -1.71484375, -1.617919921875, -1.52099609375, -1.424072265625, -1.3271484375, -1.230224609375, -1.13330078125, -1.036376953125, -0.939453125, -0.842529296875, -0.74560546875, -0.648681640625, -0.5517578125, -0.454833984375, -0.35791015625, -0.260986328125, -0.1640625, -0.067138671875, 0.02978515625, 0.126708984375, 0.2236328125, 0.320556640625, 0.41748046875, 0.514404296875, 0.611328125, 0.708251953125, 0.80517578125, 0.902099609375, 0.9990234375, 1.095947265625, 1.19287109375, 1.289794921875, 1.38671875, 1.483642578125, 1.58056640625, 1.677490234375, 1.7744140625, 1.871337890625, 1.96826171875, 2.065185546875, 2.162109375, 2.259033203125, 2.35595703125, 2.452880859375, 2.5498046875, 2.646728515625, 2.74365234375, 2.840576171875, 2.9375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 0.0, 3.0, 6.0, 7.0, 6.0, 2.0, 9.0, 5.0, 14.0, 15.0, 22.0, 28.0, 28.0, 31.0, 26.0, 41.0, 52.0, 62.0, 89.0, 120.0, 196.0, 1322.0, 259.0, 158.0, 120.0, 91.0, 68.0, 59.0, 33.0, 37.0, 23.0, 14.0, 23.0, 17.0, 13.0, 9.0, 11.0, 16.0, 5.0, 4.0, 5.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.9921875, -3.877777099609375, -3.76336669921875, -3.648956298828125, -3.5345458984375, -3.420135498046875, -3.30572509765625, -3.191314697265625, -3.076904296875, -2.962493896484375, -2.84808349609375, -2.733673095703125, -2.6192626953125, -2.504852294921875, -2.39044189453125, -2.276031494140625, -2.16162109375, -2.047210693359375, -1.93280029296875, -1.818389892578125, -1.7039794921875, -1.589569091796875, -1.47515869140625, -1.360748291015625, -1.246337890625, -1.131927490234375, -1.01751708984375, -0.903106689453125, -0.7886962890625, -0.674285888671875, -0.55987548828125, -0.445465087890625, -0.3310546875, -0.216644287109375, -0.10223388671875, 0.012176513671875, 0.1265869140625, 0.240997314453125, 0.35540771484375, 0.469818115234375, 0.584228515625, 0.698638916015625, 0.81304931640625, 0.927459716796875, 1.0418701171875, 1.156280517578125, 1.27069091796875, 1.385101318359375, 1.49951171875, 1.613922119140625, 1.72833251953125, 1.842742919921875, 1.9571533203125, 2.071563720703125, 2.18597412109375, 2.300384521484375, 2.414794921875, 2.529205322265625, 2.64361572265625, 2.758026123046875, 2.8724365234375, 2.986846923828125, 3.10125732421875, 3.215667724609375, 3.330078125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 7.0, 11.0, 15.0, 14.0, 10.0, 11.0, 21.0, 26.0, 29.0, 43.0, 59.0, 94.0, 164.0, 389.0, 2191.0, 285779.0, 2849555.0, 6059.0, 594.0, 200.0, 101.0, 78.0, 33.0, 37.0, 29.0, 18.0, 22.0, 20.0, 13.0, 17.0, 15.0, 6.0, 4.0, 3.0, 9.0, 3.0, 4.0, 4.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1484375, -14.6776123046875, -14.206787109375, -13.7359619140625, -13.26513671875, -12.7943115234375, -12.323486328125, -11.8526611328125, -11.3818359375, -10.9110107421875, -10.440185546875, -9.9693603515625, -9.49853515625, -9.0277099609375, -8.556884765625, -8.0860595703125, -7.615234375, -7.1444091796875, -6.673583984375, -6.2027587890625, -5.73193359375, -5.2611083984375, -4.790283203125, -4.3194580078125, -3.8486328125, -3.3778076171875, -2.906982421875, -2.4361572265625, -1.96533203125, -1.4945068359375, -1.023681640625, -0.5528564453125, -0.08203125, 0.3887939453125, 0.859619140625, 1.3304443359375, 1.80126953125, 2.2720947265625, 2.742919921875, 3.2137451171875, 3.6845703125, 4.1553955078125, 4.626220703125, 5.0970458984375, 5.56787109375, 6.0386962890625, 6.509521484375, 6.9803466796875, 7.451171875, 7.9219970703125, 8.392822265625, 8.8636474609375, 9.33447265625, 9.8052978515625, 10.276123046875, 10.7469482421875, 11.2177734375, 11.6885986328125, 12.159423828125, 12.6302490234375, 13.10107421875, 13.5718994140625, 14.042724609375, 14.5135498046875, 14.984375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [318.0, 699.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.118074417114258, -0.20041775703430176, 2.7172389030456543, 5.634895324707031, 8.552552223205566, 11.470209121704102, 14.38786506652832, 17.305522918701172, 20.22317886352539, 23.14083480834961, 26.05849266052246, 28.97614860534668, 31.89380645751953, 34.81146240234375, 37.72911834716797, 40.64677429199219, 43.564430236816406, 46.482086181640625, 49.399742126464844, 52.31739807128906, 55.23505783081055, 58.152713775634766, 61.070369720458984, 63.98802947998047, 66.90568542480469, 69.8233413696289, 72.74099731445312, 75.65865325927734, 78.57630920410156, 81.49397277832031, 84.41162109375, 87.32928466796875, 90.24694061279297, 93.16459655761719, 96.0822525024414, 98.99990844726562, 101.91756439208984, 104.83522033691406, 107.75288391113281, 110.67053985595703, 113.58819580078125, 116.50585174560547, 119.42350769042969, 122.3411636352539, 125.25881958007812, 128.17648315429688, 131.09413146972656, 134.0117950439453, 136.929443359375, 139.84710693359375, 142.76475524902344, 145.6824188232422, 148.60006713867188, 151.51773071289062, 154.4353790283203, 157.35304260253906, 160.2707061767578, 163.18836975097656, 166.10601806640625, 169.023681640625, 171.9413299560547, 174.85899353027344, 177.77664184570312, 180.69430541992188, 183.61195373535156]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 8.0, 5.0, 6.0, 7.0, 7.0, 13.0, 13.0, 7.0, 13.0, 14.0, 17.0, 27.0, 26.0, 37.0, 42.0, 39.0, 31.0, 45.0, 41.0, 34.0, 42.0, 37.0, 39.0, 40.0, 32.0, 44.0, 31.0, 40.0, 33.0, 38.0, 29.0, 19.0, 30.0, 24.0, 14.0, 13.0, 13.0, 14.0, 12.0, 5.0, 5.0, 5.0, 8.0, 5.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.944540977478027, -10.577326774597168, -10.210112571716309, -9.84289836883545, -9.47568416595459, -9.10846996307373, -8.741256713867188, -8.374042510986328, -8.006828308105469, -7.639614105224609, -7.27239990234375, -6.905185699462891, -6.537971496582031, -6.170757293701172, -5.803543567657471, -5.436329364776611, -5.069114685058594, -4.701900482177734, -4.334686279296875, -3.9674723148345947, -3.6002581119537354, -3.233043909072876, -2.8658299446105957, -2.4986157417297363, -2.131401538848877, -1.7641873359680176, -1.3969732522964478, -1.029759168624878, -0.6625449657440186, -0.2953307628631592, 0.0718832015991211, 0.43909740447998047, 0.8063125610351562, 1.1735267639160156, 1.5407408475875854, 1.9079549312591553, 2.2751691341400146, 2.642383337020874, 3.0095973014831543, 3.3768115043640137, 3.744025707244873, 4.111239910125732, 4.478454113006592, 4.845667839050293, 5.212882041931152, 5.580096244812012, 5.947310447692871, 6.3145246505737305, 6.68173885345459, 7.048953056335449, 7.416167259216309, 7.783381462097168, 8.150595664978027, 8.517809867858887, 8.88502311706543, 9.252237319946289, 9.619451522827148, 9.986665725708008, 10.353879928588867, 10.721094131469727, 11.088308334350586, 11.455522537231445, 11.822736740112305, 12.189950942993164, 12.557165145874023]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 1.0, 3.0, 0.0, 6.0, 7.0, 5.0, 6.0, 7.0, 8.0, 12.0, 9.0, 23.0, 17.0, 13.0, 21.0, 21.0, 25.0, 25.0, 29.0, 17.0, 31.0, 24.0, 32.0, 34.0, 31.0, 28.0, 45.0, 47.0, 51.0, 43.0, 49.0, 24.0, 26.0, 33.0, 26.0, 39.0, 20.0, 22.0, 17.0, 13.0, 10.0, 17.0, 18.0, 7.0, 10.0, 11.0, 5.0, 5.0, 10.0, 6.0, 7.0, 4.0, 2.0, 5.0, 1.0, 2.0], "bins": [-0.98291015625, -0.9546737670898438, -0.9264373779296875, -0.8982009887695312, -0.869964599609375, -0.8417282104492188, -0.8134918212890625, -0.7852554321289062, -0.75701904296875, -0.7287826538085938, -0.7005462646484375, -0.6723098754882812, -0.644073486328125, -0.6158370971679688, -0.5876007080078125, -0.5593643188476562, -0.5311279296875, -0.5028915405273438, -0.4746551513671875, -0.44641876220703125, -0.418182373046875, -0.38994598388671875, -0.3617095947265625, -0.33347320556640625, -0.30523681640625, -0.27700042724609375, -0.2487640380859375, -0.22052764892578125, -0.192291259765625, -0.16405487060546875, -0.1358184814453125, -0.10758209228515625, -0.079345703125, -0.05110931396484375, -0.0228729248046875, 0.00536346435546875, 0.033599853515625, 0.06183624267578125, 0.0900726318359375, 0.11830902099609375, 0.14654541015625, 0.17478179931640625, 0.2030181884765625, 0.23125457763671875, 0.259490966796875, 0.28772735595703125, 0.3159637451171875, 0.34420013427734375, 0.3724365234375, 0.40067291259765625, 0.4289093017578125, 0.45714569091796875, 0.485382080078125, 0.5136184692382812, 0.5418548583984375, 0.5700912475585938, 0.59832763671875, 0.6265640258789062, 0.6548004150390625, 0.6830368041992188, 0.711273193359375, 0.7395095825195312, 0.7677459716796875, 0.7959823608398438, 0.82421875]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 6.0, 11.0, 6.0, 6.0, 6.0, 20.0, 13.0, 20.0, 21.0, 35.0, 34.0, 35.0, 65.0, 73.0, 100.0, 155.0, 189.0, 258.0, 492.0, 996.0, 2536.0, 10960.0, 70533.0, 1035962.0, 2862913.0, 180208.0, 21203.0, 4297.0, 1347.0, 605.0, 332.0, 212.0, 142.0, 108.0, 80.0, 63.0, 46.0, 37.0, 28.0, 18.0, 26.0, 20.0, 16.0, 10.0, 10.0, 7.0, 10.0, 5.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0], "bins": [-5.73828125, -5.57049560546875, -5.4027099609375, -5.23492431640625, -5.067138671875, -4.89935302734375, -4.7315673828125, -4.56378173828125, -4.39599609375, -4.22821044921875, -4.0604248046875, -3.89263916015625, -3.724853515625, -3.55706787109375, -3.3892822265625, -3.22149658203125, -3.0537109375, -2.88592529296875, -2.7181396484375, -2.55035400390625, -2.382568359375, -2.21478271484375, -2.0469970703125, -1.87921142578125, -1.71142578125, -1.54364013671875, -1.3758544921875, -1.20806884765625, -1.040283203125, -0.87249755859375, -0.7047119140625, -0.53692626953125, -0.369140625, -0.20135498046875, -0.0335693359375, 0.13421630859375, 0.302001953125, 0.46978759765625, 0.6375732421875, 0.80535888671875, 0.97314453125, 1.14093017578125, 1.3087158203125, 1.47650146484375, 1.644287109375, 1.81207275390625, 1.9798583984375, 2.14764404296875, 2.3154296875, 2.48321533203125, 2.6510009765625, 2.81878662109375, 2.986572265625, 3.15435791015625, 3.3221435546875, 3.48992919921875, 3.65771484375, 3.82550048828125, 3.9932861328125, 4.16107177734375, 4.328857421875, 4.49664306640625, 4.6644287109375, 4.83221435546875, 5.0]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 7.0, 8.0, 12.0, 30.0, 32.0, 58.0, 125.0, 190.0, 305.0, 539.0, 813.0, 749.0, 513.0, 272.0, 166.0, 88.0, 65.0, 40.0, 20.0, 17.0, 10.0, 4.0, 4.0, 3.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.19921875, -6.021484375, -5.84375, -5.666015625, -5.48828125, -5.310546875, -5.1328125, -4.955078125, -4.77734375, -4.599609375, -4.421875, -4.244140625, -4.06640625, -3.888671875, -3.7109375, -3.533203125, -3.35546875, -3.177734375, -3.0, -2.822265625, -2.64453125, -2.466796875, -2.2890625, -2.111328125, -1.93359375, -1.755859375, -1.578125, -1.400390625, -1.22265625, -1.044921875, -0.8671875, -0.689453125, -0.51171875, -0.333984375, -0.15625, 0.021484375, 0.19921875, 0.376953125, 0.5546875, 0.732421875, 0.91015625, 1.087890625, 1.265625, 1.443359375, 1.62109375, 1.798828125, 1.9765625, 2.154296875, 2.33203125, 2.509765625, 2.6875, 2.865234375, 3.04296875, 3.220703125, 3.3984375, 3.576171875, 3.75390625, 3.931640625, 4.109375, 4.287109375, 4.46484375, 4.642578125, 4.8203125, 4.998046875, 5.17578125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 12.0, 23.0, 25.0, 31.0, 34.0, 54.0, 118.0, 150.0, 253.0, 398.0, 649.0, 1195.0, 2976.0, 10393.0, 66237.0, 703060.0, 2958775.0, 396999.0, 40653.0, 7341.0, 2385.0, 1042.0, 539.0, 319.0, 208.0, 121.0, 80.0, 58.0, 36.0, 19.0, 24.0, 20.0, 8.0, 13.0, 1.0, 4.0, 2.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.87109375, -6.63726806640625, -6.4034423828125, -6.16961669921875, -5.935791015625, -5.70196533203125, -5.4681396484375, -5.23431396484375, -5.00048828125, -4.76666259765625, -4.5328369140625, -4.29901123046875, -4.065185546875, -3.83135986328125, -3.5975341796875, -3.36370849609375, -3.1298828125, -2.89605712890625, -2.6622314453125, -2.42840576171875, -2.194580078125, -1.96075439453125, -1.7269287109375, -1.49310302734375, -1.25927734375, -1.02545166015625, -0.7916259765625, -0.55780029296875, -0.323974609375, -0.09014892578125, 0.1436767578125, 0.37750244140625, 0.611328125, 0.84515380859375, 1.0789794921875, 1.31280517578125, 1.546630859375, 1.78045654296875, 2.0142822265625, 2.24810791015625, 2.48193359375, 2.71575927734375, 2.9495849609375, 3.18341064453125, 3.417236328125, 3.65106201171875, 3.8848876953125, 4.11871337890625, 4.3525390625, 4.58636474609375, 4.8201904296875, 5.05401611328125, 5.287841796875, 5.52166748046875, 5.7554931640625, 5.98931884765625, 6.22314453125, 6.45697021484375, 6.6907958984375, 6.92462158203125, 7.158447265625, 7.39227294921875, 7.6260986328125, 7.85992431640625, 8.09375]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 43.0, 352.0, 483.0, 124.0, 9.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.517608642578125, -37.22113037109375, -34.924652099609375, -32.628173828125, -30.331695556640625, -28.03521728515625, -25.738739013671875, -23.4422607421875, -21.145782470703125, -18.84930419921875, -16.552825927734375, -14.25634765625, -11.959869384765625, -9.66339111328125, -7.366912841796875, -5.0704345703125, -2.773956298828125, -0.47747802734375, 1.819000244140625, 4.115478515625, 6.411956787109375, 8.70843505859375, 11.004913330078125, 13.3013916015625, 15.597869873046875, 17.89434814453125, 20.190826416015625, 22.4873046875, 24.783782958984375, 27.08026123046875, 29.376739501953125, 31.6732177734375, 33.969696044921875, 36.26617431640625, 38.562652587890625, 40.859130859375, 43.155609130859375, 45.45208740234375, 47.748565673828125, 50.0450439453125, 52.341522216796875, 54.63800048828125, 56.934478759765625, 59.23095703125, 61.527435302734375, 63.82391357421875, 66.12039184570312, 68.4168701171875, 70.71334838867188, 73.00982666015625, 75.30630493164062, 77.602783203125, 79.89926147460938, 82.19573974609375, 84.49221801757812, 86.7886962890625, 89.08517456054688, 91.38165283203125, 93.67813110351562, 95.974609375, 98.27108764648438, 100.56756591796875, 102.86404418945312, 105.1605224609375, 107.45700073242188]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 6.0, 1.0, 1.0, 5.0, 4.0, 11.0, 9.0, 21.0, 15.0, 12.0, 18.0, 16.0, 14.0, 22.0, 30.0, 22.0, 38.0, 30.0, 37.0, 38.0, 40.0, 31.0, 50.0, 38.0, 44.0, 39.0, 43.0, 35.0, 47.0, 34.0, 39.0, 30.0, 23.0, 21.0, 20.0, 28.0, 15.0, 12.0, 16.0, 13.0, 11.0, 14.0, 6.0, 3.0, 3.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.111221313476562, -12.712953567504883, -12.314685821533203, -11.91641902923584, -11.51815128326416, -11.11988353729248, -10.721616744995117, -10.323348999023438, -9.925081253051758, -9.526813507080078, -9.128545761108398, -8.730278968811035, -8.332011222839355, -7.933743476867676, -7.535476207733154, -7.137208938598633, -6.738941192626953, -6.340673446655273, -5.942406177520752, -5.5441389083862305, -5.145871162414551, -4.747603416442871, -4.34933614730835, -3.951068639755249, -3.5528011322021484, -3.154533624649048, -2.7562661170959473, -2.3579986095428467, -1.959731101989746, -1.5614635944366455, -1.163196086883545, -0.7649285793304443, -0.36666107177734375, 0.031606435775756836, 0.4298739433288574, 0.828141450881958, 1.2264089584350586, 1.6246764659881592, 2.0229439735412598, 2.4212114810943604, 2.819478988647461, 3.2177464962005615, 3.616014003753662, 4.014281272888184, 4.412549018859863, 4.810816764831543, 5.2090840339660645, 5.607351303100586, 6.005619049072266, 6.403886795043945, 6.802154064178467, 7.200421333312988, 7.598689079284668, 7.996956825256348, 8.395223617553711, 8.79349136352539, 9.19175910949707, 9.59002685546875, 9.98829460144043, 10.386561393737793, 10.784829139709473, 11.183096885681152, 11.581363677978516, 11.979631423950195, 12.377899169921875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 4.0, 6.0, 2.0, 5.0, 9.0, 6.0, 7.0, 12.0, 14.0, 11.0, 20.0, 14.0, 25.0, 25.0, 18.0, 33.0, 27.0, 29.0, 25.0, 35.0, 37.0, 43.0, 28.0, 47.0, 57.0, 38.0, 42.0, 43.0, 28.0, 31.0, 43.0, 19.0, 24.0, 24.0, 31.0, 13.0, 17.0, 25.0, 14.0, 13.0, 6.0, 10.0, 9.0, 10.0, 6.0, 5.0, 4.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.015625, -0.9857330322265625, -0.955841064453125, -0.9259490966796875, -0.89605712890625, -0.8661651611328125, -0.836273193359375, -0.8063812255859375, -0.7764892578125, -0.7465972900390625, -0.716705322265625, -0.6868133544921875, -0.65692138671875, -0.6270294189453125, -0.597137451171875, -0.5672454833984375, -0.537353515625, -0.5074615478515625, -0.477569580078125, -0.4476776123046875, -0.41778564453125, -0.3878936767578125, -0.358001708984375, -0.3281097412109375, -0.2982177734375, -0.2683258056640625, -0.238433837890625, -0.2085418701171875, -0.17864990234375, -0.1487579345703125, -0.118865966796875, -0.0889739990234375, -0.05908203125, -0.0291900634765625, 0.000701904296875, 0.0305938720703125, 0.06048583984375, 0.0903778076171875, 0.120269775390625, 0.1501617431640625, 0.1800537109375, 0.2099456787109375, 0.239837646484375, 0.2697296142578125, 0.29962158203125, 0.3295135498046875, 0.359405517578125, 0.3892974853515625, 0.419189453125, 0.4490814208984375, 0.478973388671875, 0.5088653564453125, 0.53875732421875, 0.5686492919921875, 0.598541259765625, 0.6284332275390625, 0.6583251953125, 0.6882171630859375, 0.718109130859375, 0.7480010986328125, 0.77789306640625, 0.8077850341796875, 0.837677001953125, 0.8675689697265625, 0.8974609375]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 6.0, 7.0, 13.0, 27.0, 21.0, 49.0, 45.0, 98.0, 160.0, 228.0, 344.0, 539.0, 741.0, 1122.0, 1740.0, 2658.0, 3887.0, 5865.0, 8818.0, 13237.0, 20149.0, 30733.0, 46091.0, 69580.0, 102778.0, 142035.0, 163461.0, 138315.0, 99036.0, 66958.0, 43861.0, 29119.0, 19115.0, 12621.0, 8304.0, 5537.0, 3812.0, 2485.0, 1712.0, 1057.0, 755.0, 468.0, 334.0, 205.0, 158.0, 106.0, 59.0, 44.0, 30.0, 11.0, 13.0, 9.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.065673828125, -0.06351661682128906, -0.061359405517578125, -0.05920219421386719, -0.05704498291015625, -0.05488777160644531, -0.052730560302734375, -0.05057334899902344, -0.0484161376953125, -0.04625892639160156, -0.044101715087890625, -0.04194450378417969, -0.03978729248046875, -0.03763008117675781, -0.035472869873046875, -0.03331565856933594, -0.031158447265625, -0.029001235961914062, -0.026844024658203125, -0.024686813354492188, -0.02252960205078125, -0.020372390747070312, -0.018215179443359375, -0.016057968139648438, -0.0139007568359375, -0.011743545532226562, -0.009586334228515625, -0.0074291229248046875, -0.00527191162109375, -0.0031147003173828125, -0.000957489013671875, 0.0011997222900390625, 0.00335693359375, 0.0055141448974609375, 0.007671356201171875, 0.009828567504882812, 0.01198577880859375, 0.014142990112304688, 0.016300201416015625, 0.018457412719726562, 0.0206146240234375, 0.022771835327148438, 0.024929046630859375, 0.027086257934570312, 0.02924346923828125, 0.03140068054199219, 0.033557891845703125, 0.03571510314941406, 0.037872314453125, 0.04002952575683594, 0.042186737060546875, 0.04434394836425781, 0.04650115966796875, 0.04865837097167969, 0.050815582275390625, 0.05297279357910156, 0.0551300048828125, 0.05728721618652344, 0.059444427490234375, 0.06160163879394531, 0.06375885009765625, 0.06591606140136719, 0.06807327270507812, 0.07023048400878906, 0.0723876953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 6.0, 5.0, 6.0, 6.0, 9.0, 7.0, 8.0, 13.0, 10.0, 14.0, 37.0, 18.0, 34.0, 35.0, 34.0, 34.0, 48.0, 40.0, 40.0, 31.0, 39.0, 1063.0, 30.0, 36.0, 55.0, 51.0, 29.0, 34.0, 27.0, 31.0, 35.0, 34.0, 27.0, 16.0, 21.0, 13.0, 12.0, 8.0, 11.0, 7.0, 4.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7900390625, -0.7651214599609375, -0.740203857421875, -0.7152862548828125, -0.69036865234375, -0.6654510498046875, -0.640533447265625, -0.6156158447265625, -0.5906982421875, -0.5657806396484375, -0.540863037109375, -0.5159454345703125, -0.49102783203125, -0.4661102294921875, -0.441192626953125, -0.4162750244140625, -0.391357421875, -0.3664398193359375, -0.341522216796875, -0.3166046142578125, -0.29168701171875, -0.2667694091796875, -0.241851806640625, -0.2169342041015625, -0.1920166015625, -0.1670989990234375, -0.142181396484375, -0.1172637939453125, -0.09234619140625, -0.0674285888671875, -0.042510986328125, -0.0175933837890625, 0.00732421875, 0.0322418212890625, 0.057159423828125, 0.0820770263671875, 0.10699462890625, 0.1319122314453125, 0.156829833984375, 0.1817474365234375, 0.2066650390625, 0.2315826416015625, 0.256500244140625, 0.2814178466796875, 0.30633544921875, 0.3312530517578125, 0.356170654296875, 0.3810882568359375, 0.406005859375, 0.4309234619140625, 0.455841064453125, 0.4807586669921875, 0.50567626953125, 0.5305938720703125, 0.555511474609375, 0.5804290771484375, 0.6053466796875, 0.6302642822265625, 0.655181884765625, 0.6800994873046875, 0.70501708984375, 0.7299346923828125, 0.754852294921875, 0.7797698974609375, 0.8046875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 8.0, 11.0, 16.0, 37.0, 38.0, 53.0, 74.0, 106.0, 154.0, 207.0, 341.0, 457.0, 744.0, 1138.0, 1808.0, 2530.0, 3892.0, 5928.0, 9098.0, 14204.0, 21869.0, 34102.0, 52790.0, 80177.0, 115253.0, 179690.0, 1174142.0, 129427.0, 92553.0, 62029.0, 40130.0, 25750.0, 16801.0, 10856.0, 7091.0, 4568.0, 3041.0, 2023.0, 1324.0, 883.0, 598.0, 384.0, 277.0, 160.0, 106.0, 95.0, 53.0, 40.0, 20.0, 18.0, 12.0, 6.0, 6.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0], "bins": [-0.042205810546875, -0.04080772399902344, -0.039409637451171875, -0.03801155090332031, -0.03661346435546875, -0.03521537780761719, -0.033817291259765625, -0.03241920471191406, -0.0310211181640625, -0.029623031616210938, -0.028224945068359375, -0.026826858520507812, -0.02542877197265625, -0.024030685424804688, -0.022632598876953125, -0.021234512329101562, -0.01983642578125, -0.018438339233398438, -0.017040252685546875, -0.015642166137695312, -0.01424407958984375, -0.012845993041992188, -0.011447906494140625, -0.010049819946289062, -0.0086517333984375, -0.0072536468505859375, -0.005855560302734375, -0.0044574737548828125, -0.00305938720703125, -0.0016613006591796875, -0.000263214111328125, 0.0011348724365234375, 0.002532958984375, 0.0039310455322265625, 0.005329132080078125, 0.0067272186279296875, 0.00812530517578125, 0.009523391723632812, 0.010921478271484375, 0.012319564819335938, 0.0137176513671875, 0.015115737915039062, 0.016513824462890625, 0.017911911010742188, 0.01930999755859375, 0.020708084106445312, 0.022106170654296875, 0.023504257202148438, 0.02490234375, 0.026300430297851562, 0.027698516845703125, 0.029096603393554688, 0.03049468994140625, 0.03189277648925781, 0.033290863037109375, 0.03468894958496094, 0.0360870361328125, 0.03748512268066406, 0.038883209228515625, 0.04028129577636719, 0.04167938232421875, 0.04307746887207031, 0.044475555419921875, 0.04587364196777344, 0.047271728515625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 9.0, 9.0, 11.0, 9.0, 10.0, 13.0, 19.0, 12.0, 27.0, 34.0, 38.0, 45.0, 79.0, 98.0, 106.0, 119.0, 81.0, 63.0, 43.0, 38.0, 23.0, 20.0, 15.0, 17.0, 6.0, 9.0, 6.0, 10.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0016345977783203125, -0.0015827268362045288, -0.0015308558940887451, -0.0014789849519729614, -0.0014271140098571777, -0.001375243067741394, -0.0013233721256256104, -0.0012715011835098267, -0.001219630241394043, -0.0011677592992782593, -0.0011158883571624756, -0.001064017415046692, -0.0010121464729309082, -0.0009602755308151245, -0.0009084045886993408, -0.0008565336465835571, -0.0008046627044677734, -0.0007527917623519897, -0.0007009208202362061, -0.0006490498781204224, -0.0005971789360046387, -0.000545307993888855, -0.0004934370517730713, -0.0004415661096572876, -0.0003896951675415039, -0.0003378242254257202, -0.0002859532833099365, -0.00023408234119415283, -0.00018221139907836914, -0.00013034045696258545, -7.846951484680176e-05, -2.6598572731018066e-05, 2.5272369384765625e-05, 7.714331150054932e-05, 0.000129014253616333, 0.0001808851957321167, 0.0002327561378479004, 0.0002846270799636841, 0.0003364980220794678, 0.00038836896419525146, 0.00044023990631103516, 0.0004921108484268188, 0.0005439817905426025, 0.0005958527326583862, 0.0006477236747741699, 0.0006995946168899536, 0.0007514655590057373, 0.000803336501121521, 0.0008552074432373047, 0.0009070783853530884, 0.0009589493274688721, 0.0010108202695846558, 0.0010626912117004395, 0.0011145621538162231, 0.0011664330959320068, 0.0012183040380477905, 0.0012701749801635742, 0.001322045922279358, 0.0013739168643951416, 0.0014257878065109253, 0.001477658748626709, 0.0015295296907424927, 0.0015814006328582764, 0.00163327157497406, 0.0016851425170898438]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 1.0, 4.0, 6.0, 3.0, 2.0, 9.0, 7.0, 11.0, 7.0, 7.0, 11.0, 26.0, 21.0, 26.0, 12.0, 28.0, 34.0, 49.0, 56.0, 81.0, 111.0, 190.0, 274.0, 875.0, 31389.0, 1001348.0, 12413.0, 664.0, 273.0, 169.0, 96.0, 55.0, 53.0, 46.0, 30.0, 24.0, 23.0, 21.0, 21.0, 18.0, 12.0, 10.0, 5.0, 6.0, 3.0, 4.0, 9.0, 3.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0], "bins": [-0.026641845703125, -0.025819778442382812, -0.024997711181640625, -0.024175643920898438, -0.02335357666015625, -0.022531509399414062, -0.021709442138671875, -0.020887374877929688, -0.0200653076171875, -0.019243240356445312, -0.018421173095703125, -0.017599105834960938, -0.01677703857421875, -0.015954971313476562, -0.015132904052734375, -0.014310836791992188, -0.01348876953125, -0.012666702270507812, -0.011844635009765625, -0.011022567749023438, -0.01020050048828125, -0.009378433227539062, -0.008556365966796875, -0.0077342987060546875, -0.0069122314453125, -0.0060901641845703125, -0.005268096923828125, -0.0044460296630859375, -0.00362396240234375, -0.0028018951416015625, -0.001979827880859375, -0.0011577606201171875, -0.000335693359375, 0.0004863739013671875, 0.001308441162109375, 0.0021305084228515625, 0.00295257568359375, 0.0037746429443359375, 0.004596710205078125, 0.0054187774658203125, 0.0062408447265625, 0.0070629119873046875, 0.007884979248046875, 0.008707046508789062, 0.00952911376953125, 0.010351181030273438, 0.011173248291015625, 0.011995315551757812, 0.0128173828125, 0.013639450073242188, 0.014461517333984375, 0.015283584594726562, 0.01610565185546875, 0.016927719116210938, 0.017749786376953125, 0.018571853637695312, 0.0193939208984375, 0.020215988159179688, 0.021038055419921875, 0.021860122680664062, 0.02268218994140625, 0.023504257202148438, 0.024326324462890625, 0.025148391723632812, 0.025970458984375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 25.0, 694.0, 281.0, 14.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0355561189353466, -0.034506671130657196, -0.03345722705125809, -0.03240777924656868, -0.03135833516716957, -0.030308887362480164, -0.029259441420435905, -0.028209995478391647, -0.02716054953634739, -0.02611110359430313, -0.025061657652258873, -0.024012211710214615, -0.022962763905525208, -0.0219133198261261, -0.02086387202143669, -0.019814426079392433, -0.018764980137348175, -0.017715534195303917, -0.01666608825325966, -0.015616641379892826, -0.014567195437848568, -0.01351774949580431, -0.012468302622437477, -0.011418856680393219, -0.010369410738348961, -0.009319964796304703, -0.008270518854260445, -0.007221071980893612, -0.006171626038849354, -0.005122180096805096, -0.00407273368909955, -0.003023287281394005, -0.0019738413393497467, -0.0009243951644748449, 0.00012505101040005684, 0.0011744971852749586, 0.0022239433601498604, 0.0032733893021941185, 0.004322835709899664, 0.005372282117605209, 0.0064217280596494675, 0.007471174001693726, 0.008520619943737984, 0.009570066817104816, 0.010619512759149075, 0.011668958701193333, 0.012718405574560165, 0.013767851516604424, 0.014817297458648682, 0.01586674340069294, 0.016916189342737198, 0.017965635284781456, 0.019015081226825714, 0.02006452903151512, 0.02111397497355938, 0.022163420915603638, 0.023212866857647896, 0.024262312799692154, 0.025311758741736412, 0.02636120468378067, 0.027410652488470078, 0.028460096567869186, 0.029509544372558594, 0.030558990314602852, 0.03160843625664711]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 6.0, 5.0, 10.0, 4.0, 7.0, 14.0, 20.0, 14.0, 21.0, 27.0, 37.0, 24.0, 30.0, 31.0, 30.0, 51.0, 38.0, 45.0, 47.0, 36.0, 46.0, 50.0, 39.0, 40.0, 30.0, 24.0, 40.0, 29.0, 38.0, 26.0, 20.0, 21.0, 21.0, 24.0, 16.0, 6.0, 9.0, 14.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0026990771293640137, -0.0026254691183567047, -0.0025518611073493958, -0.002478253096342087, -0.002404645085334778, -0.002331037074327469, -0.00225742906332016, -0.002183821052312851, -0.002110213041305542, -0.002036605030298233, -0.001962997019290924, -0.0018893890082836151, -0.0018157809972763062, -0.0017421729862689972, -0.0016685649752616882, -0.0015949569642543793, -0.0015213489532470703, -0.0014477409422397614, -0.0013741329312324524, -0.0013005249202251434, -0.0012269169092178345, -0.0011533088982105255, -0.0010797008872032166, -0.0010060928761959076, -0.0009324848651885986, -0.0008588768541812897, -0.0007852688431739807, -0.0007116608321666718, -0.0006380528211593628, -0.0005644448101520538, -0.0004908367991447449, -0.0004172287881374359, -0.00034362077713012695, -0.000270012766122818, -0.00019640475511550903, -0.00012279674410820007, -4.918873310089111e-05, 2.4419277906417847e-05, 9.80272889137268e-05, 0.00017163529992103577, 0.0002452433109283447, 0.0003188513219356537, 0.00039245933294296265, 0.0004660673439502716, 0.0005396753549575806, 0.0006132833659648895, 0.0006868913769721985, 0.0007604993879795074, 0.0008341073989868164, 0.0009077154099941254, 0.0009813234210014343, 0.0010549314320087433, 0.0011285394430160522, 0.0012021474540233612, 0.0012757554650306702, 0.0013493634760379791, 0.001422971487045288, 0.001496579498052597, 0.001570187509059906, 0.001643795520067215, 0.001717403531074524, 0.0017910115420818329, 0.0018646195530891418, 0.0019382275640964508, 0.0020118355751037598]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 5.0, 4.0, 5.0, 3.0, 5.0, 8.0, 7.0, 7.0, 12.0, 14.0, 11.0, 20.0, 14.0, 23.0, 25.0, 20.0, 31.0, 28.0, 30.0, 25.0, 34.0, 36.0, 45.0, 28.0, 46.0, 58.0, 38.0, 41.0, 44.0, 26.0, 33.0, 43.0, 19.0, 24.0, 24.0, 31.0, 13.0, 15.0, 26.0, 15.0, 13.0, 5.0, 11.0, 9.0, 10.0, 6.0, 4.0, 5.0, 2.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.0166015625, -0.9866943359375, -0.956787109375, -0.9268798828125, -0.89697265625, -0.8670654296875, -0.837158203125, -0.8072509765625, -0.77734375, -0.7474365234375, -0.717529296875, -0.6876220703125, -0.65771484375, -0.6278076171875, -0.597900390625, -0.5679931640625, -0.5380859375, -0.5081787109375, -0.478271484375, -0.4483642578125, -0.41845703125, -0.3885498046875, -0.358642578125, -0.3287353515625, -0.298828125, -0.2689208984375, -0.239013671875, -0.2091064453125, -0.17919921875, -0.1492919921875, -0.119384765625, -0.0894775390625, -0.0595703125, -0.0296630859375, 0.000244140625, 0.0301513671875, 0.06005859375, 0.0899658203125, 0.119873046875, 0.1497802734375, 0.1796875, 0.2095947265625, 0.239501953125, 0.2694091796875, 0.29931640625, 0.3292236328125, 0.359130859375, 0.3890380859375, 0.4189453125, 0.4488525390625, 0.478759765625, 0.5086669921875, 0.53857421875, 0.5684814453125, 0.598388671875, 0.6282958984375, 0.658203125, 0.6881103515625, 0.718017578125, 0.7479248046875, 0.77783203125, 0.8077392578125, 0.837646484375, 0.8675537109375, 0.8974609375]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 1.0, 8.0, 6.0, 10.0, 26.0, 31.0, 54.0, 63.0, 113.0, 122.0, 191.0, 292.0, 452.0, 664.0, 1083.0, 1761.0, 3202.0, 6280.0, 13292.0, 32305.0, 85168.0, 237595.0, 392205.0, 167447.0, 60894.0, 23496.0, 10226.0, 4832.0, 2559.0, 1450.0, 930.0, 645.0, 372.0, 248.0, 193.0, 115.0, 66.0, 58.0, 43.0, 19.0, 18.0, 11.0, 8.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5234375, -1.480316162109375, -1.43719482421875, -1.394073486328125, -1.3509521484375, -1.307830810546875, -1.26470947265625, -1.221588134765625, -1.178466796875, -1.135345458984375, -1.09222412109375, -1.049102783203125, -1.0059814453125, -0.962860107421875, -0.91973876953125, -0.876617431640625, -0.83349609375, -0.790374755859375, -0.74725341796875, -0.704132080078125, -0.6610107421875, -0.617889404296875, -0.57476806640625, -0.531646728515625, -0.488525390625, -0.445404052734375, -0.40228271484375, -0.359161376953125, -0.3160400390625, -0.272918701171875, -0.22979736328125, -0.186676025390625, -0.1435546875, -0.100433349609375, -0.05731201171875, -0.014190673828125, 0.0289306640625, 0.072052001953125, 0.11517333984375, 0.158294677734375, 0.201416015625, 0.244537353515625, 0.28765869140625, 0.330780029296875, 0.3739013671875, 0.417022705078125, 0.46014404296875, 0.503265380859375, 0.54638671875, 0.589508056640625, 0.63262939453125, 0.675750732421875, 0.7188720703125, 0.761993408203125, 0.80511474609375, 0.848236083984375, 0.891357421875, 0.934478759765625, 0.97760009765625, 1.020721435546875, 1.0638427734375, 1.106964111328125, 1.15008544921875, 1.193206787109375, 1.236328125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 8.0, 5.0, 4.0, 11.0, 17.0, 20.0, 22.0, 23.0, 29.0, 39.0, 45.0, 50.0, 66.0, 68.0, 89.0, 237.0, 1617.0, 206.0, 121.0, 57.0, 49.0, 55.0, 45.0, 29.0, 35.0, 20.0, 24.0, 17.0, 16.0, 7.0, 7.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.310791015625, -4.16455078125, -4.018310546875, -3.8720703125, -3.725830078125, -3.57958984375, -3.433349609375, -3.287109375, -3.140869140625, -2.99462890625, -2.848388671875, -2.7021484375, -2.555908203125, -2.40966796875, -2.263427734375, -2.1171875, -1.970947265625, -1.82470703125, -1.678466796875, -1.5322265625, -1.385986328125, -1.23974609375, -1.093505859375, -0.947265625, -0.801025390625, -0.65478515625, -0.508544921875, -0.3623046875, -0.216064453125, -0.06982421875, 0.076416015625, 0.22265625, 0.368896484375, 0.51513671875, 0.661376953125, 0.8076171875, 0.953857421875, 1.10009765625, 1.246337890625, 1.392578125, 1.538818359375, 1.68505859375, 1.831298828125, 1.9775390625, 2.123779296875, 2.27001953125, 2.416259765625, 2.5625, 2.708740234375, 2.85498046875, 3.001220703125, 3.1474609375, 3.293701171875, 3.43994140625, 3.586181640625, 3.732421875, 3.878662109375, 4.02490234375, 4.171142578125, 4.3173828125, 4.463623046875, 4.60986328125, 4.756103515625, 4.90234375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 0.0, 4.0, 4.0, 3.0, 13.0, 9.0, 14.0, 18.0, 24.0, 29.0, 37.0, 59.0, 62.0, 105.0, 252.0, 822.0, 7294.0, 2385932.0, 745152.0, 4607.0, 677.0, 199.0, 112.0, 72.0, 41.0, 43.0, 28.0, 24.0, 27.0, 14.0, 10.0, 2.0, 9.0, 5.0, 7.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.96875, -10.6546630859375, -10.340576171875, -10.0264892578125, -9.71240234375, -9.3983154296875, -9.084228515625, -8.7701416015625, -8.4560546875, -8.1419677734375, -7.827880859375, -7.5137939453125, -7.19970703125, -6.8856201171875, -6.571533203125, -6.2574462890625, -5.943359375, -5.6292724609375, -5.315185546875, -5.0010986328125, -4.68701171875, -4.3729248046875, -4.058837890625, -3.7447509765625, -3.4306640625, -3.1165771484375, -2.802490234375, -2.4884033203125, -2.17431640625, -1.8602294921875, -1.546142578125, -1.2320556640625, -0.91796875, -0.6038818359375, -0.289794921875, 0.0242919921875, 0.33837890625, 0.6524658203125, 0.966552734375, 1.2806396484375, 1.5947265625, 1.9088134765625, 2.222900390625, 2.5369873046875, 2.85107421875, 3.1651611328125, 3.479248046875, 3.7933349609375, 4.107421875, 4.4215087890625, 4.735595703125, 5.0496826171875, 5.36376953125, 5.6778564453125, 5.991943359375, 6.3060302734375, 6.6201171875, 6.9342041015625, 7.248291015625, 7.5623779296875, 7.87646484375, 8.1905517578125, 8.504638671875, 8.8187255859375, 9.1328125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 20.0, 744.0, 248.0, 4.0, 1.0], "bins": [-95.60693359375, -94.03243255615234, -92.45793151855469, -90.8834228515625, -89.30892181396484, -87.73442077636719, -86.15991973876953, -84.58541870117188, -83.01091766357422, -81.43641662597656, -79.8619155883789, -78.28741455078125, -76.71290588378906, -75.1384048461914, -73.56390380859375, -71.9894027709961, -70.41490173339844, -68.84040069580078, -67.26589965820312, -65.69139099121094, -64.11688995361328, -62.542388916015625, -60.96788787841797, -59.39338684082031, -57.818878173828125, -56.24437713623047, -54.66987228393555, -53.09537124633789, -51.520870208740234, -49.94636535644531, -48.371864318847656, -46.79736328125, -45.222862243652344, -43.64836120605469, -42.073856353759766, -40.49935531616211, -38.92485427856445, -37.35034942626953, -35.775848388671875, -34.20134735107422, -32.62684631347656, -31.052343368530273, -29.477842330932617, -27.903339385986328, -26.328838348388672, -24.754335403442383, -23.179832458496094, -21.605331420898438, -20.03082847595215, -18.45632553100586, -16.881824493408203, -15.307321548461914, -13.732819557189941, -12.158317565917969, -10.58381462097168, -9.009312629699707, -7.434810638427734, -5.860308647155762, -4.285806179046631, -2.7113037109375, -1.1368017196655273, 0.4377002716064453, 2.0122032165527344, 3.586705207824707, 5.16120719909668]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 2.0, 5.0, 5.0, 12.0, 17.0, 9.0, 6.0, 15.0, 16.0, 21.0, 16.0, 24.0, 23.0, 30.0, 32.0, 31.0, 32.0, 39.0, 35.0, 49.0, 31.0, 51.0, 48.0, 36.0, 39.0, 30.0, 29.0, 32.0, 24.0, 31.0, 28.0, 22.0, 22.0, 25.0, 20.0, 22.0, 20.0, 20.0, 12.0, 6.0, 6.0, 5.0, 9.0, 11.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0], "bins": [-11.697769165039062, -11.345898628234863, -10.994028091430664, -10.642156600952148, -10.29028606414795, -9.93841552734375, -9.586544036865234, -9.234673500061035, -8.882802963256836, -8.530932426452637, -8.179061889648438, -7.827190399169922, -7.475319862365723, -7.123449325561523, -6.771578311920166, -6.419707298278809, -6.067836761474609, -5.71596622467041, -5.364095211029053, -5.012224197387695, -4.660353660583496, -4.308483123779297, -3.9566121101379395, -3.604741334915161, -3.252870559692383, -2.9009997844696045, -2.549129009246826, -2.197258234024048, -1.8453874588012695, -1.4935166835784912, -1.141645908355713, -0.7897751331329346, -0.43790531158447266, -0.08603453636169434, 0.265836238861084, 0.6177070140838623, 0.9695777893066406, 1.321448564529419, 1.6733193397521973, 2.0251901149749756, 2.377060890197754, 2.7289316654205322, 3.0808024406433105, 3.432673215866089, 3.784543991088867, 4.136414527893066, 4.488285541534424, 4.840156555175781, 5.1920270919799805, 5.54389762878418, 5.895768642425537, 6.2476396560668945, 6.599510192871094, 6.951380729675293, 7.30325174331665, 7.655122756958008, 8.006993293762207, 8.358863830566406, 8.710735321044922, 9.062605857849121, 9.41447639465332, 9.76634693145752, 10.118217468261719, 10.470088958740234, 10.821959495544434]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 1.0, 5.0, 9.0, 6.0, 12.0, 8.0, 15.0, 17.0, 15.0, 21.0, 14.0, 27.0, 22.0, 33.0, 31.0, 36.0, 24.0, 25.0, 42.0, 38.0, 48.0, 54.0, 44.0, 44.0, 41.0, 39.0, 34.0, 40.0, 19.0, 24.0, 22.0, 29.0, 22.0, 21.0, 26.0, 18.0, 8.0, 7.0, 13.0, 5.0, 9.0, 10.0, 4.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.068359375, -1.0366287231445312, -1.0048980712890625, -0.9731674194335938, -0.941436767578125, -0.9097061157226562, -0.8779754638671875, -0.8462448120117188, -0.81451416015625, -0.7827835083007812, -0.7510528564453125, -0.7193222045898438, -0.687591552734375, -0.6558609008789062, -0.6241302490234375, -0.5923995971679688, -0.5606689453125, -0.5289382934570312, -0.4972076416015625, -0.46547698974609375, -0.433746337890625, -0.40201568603515625, -0.3702850341796875, -0.33855438232421875, -0.30682373046875, -0.27509307861328125, -0.2433624267578125, -0.21163177490234375, -0.179901123046875, -0.14817047119140625, -0.1164398193359375, -0.08470916748046875, -0.052978515625, -0.02124786376953125, 0.0104827880859375, 0.04221343994140625, 0.073944091796875, 0.10567474365234375, 0.1374053955078125, 0.16913604736328125, 0.20086669921875, 0.23259735107421875, 0.2643280029296875, 0.29605865478515625, 0.327789306640625, 0.35951995849609375, 0.3912506103515625, 0.42298126220703125, 0.4547119140625, 0.48644256591796875, 0.5181732177734375, 0.5499038696289062, 0.581634521484375, 0.6133651733398438, 0.6450958251953125, 0.6768264770507812, 0.70855712890625, 0.7402877807617188, 0.7720184326171875, 0.8037490844726562, 0.835479736328125, 0.8672103881835938, 0.8989410400390625, 0.9306716918945312, 0.96240234375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 6.0, 5.0, 7.0, 10.0, 7.0, 13.0, 18.0, 23.0, 22.0, 34.0, 42.0, 49.0, 51.0, 78.0, 130.0, 193.0, 318.0, 592.0, 1274.0, 3284.0, 9744.0, 36060.0, 159802.0, 1068376.0, 2427323.0, 385187.0, 73714.0, 18478.0, 5455.0, 1947.0, 829.0, 407.0, 211.0, 138.0, 107.0, 70.0, 53.0, 34.0, 38.0, 26.0, 24.0, 21.0, 17.0, 14.0, 12.0, 13.0, 6.0, 10.0, 2.0, 4.0, 7.0, 1.0, 1.0], "bins": [-3.80078125, -3.692962646484375, -3.58514404296875, -3.477325439453125, -3.3695068359375, -3.261688232421875, -3.15386962890625, -3.046051025390625, -2.938232421875, -2.830413818359375, -2.72259521484375, -2.614776611328125, -2.5069580078125, -2.399139404296875, -2.29132080078125, -2.183502197265625, -2.07568359375, -1.967864990234375, -1.86004638671875, -1.752227783203125, -1.6444091796875, -1.536590576171875, -1.42877197265625, -1.320953369140625, -1.213134765625, -1.105316162109375, -0.99749755859375, -0.889678955078125, -0.7818603515625, -0.674041748046875, -0.56622314453125, -0.458404541015625, -0.3505859375, -0.242767333984375, -0.13494873046875, -0.027130126953125, 0.0806884765625, 0.188507080078125, 0.29632568359375, 0.404144287109375, 0.511962890625, 0.619781494140625, 0.72760009765625, 0.835418701171875, 0.9432373046875, 1.051055908203125, 1.15887451171875, 1.266693115234375, 1.37451171875, 1.482330322265625, 1.59014892578125, 1.697967529296875, 1.8057861328125, 1.913604736328125, 2.02142333984375, 2.129241943359375, 2.237060546875, 2.344879150390625, 2.45269775390625, 2.560516357421875, 2.6683349609375, 2.776153564453125, 2.88397216796875, 2.991790771484375, 3.099609375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 4.0, 6.0, 8.0, 9.0, 11.0, 19.0, 26.0, 49.0, 64.0, 106.0, 122.0, 202.0, 298.0, 453.0, 618.0, 620.0, 449.0, 341.0, 211.0, 145.0, 103.0, 63.0, 43.0, 24.0, 26.0, 21.0, 12.0, 10.0, 4.0, 5.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7109375, -4.57293701171875, -4.4349365234375, -4.29693603515625, -4.158935546875, -4.02093505859375, -3.8829345703125, -3.74493408203125, -3.60693359375, -3.46893310546875, -3.3309326171875, -3.19293212890625, -3.054931640625, -2.91693115234375, -2.7789306640625, -2.64093017578125, -2.5029296875, -2.36492919921875, -2.2269287109375, -2.08892822265625, -1.950927734375, -1.81292724609375, -1.6749267578125, -1.53692626953125, -1.39892578125, -1.26092529296875, -1.1229248046875, -0.98492431640625, -0.846923828125, -0.70892333984375, -0.5709228515625, -0.43292236328125, -0.294921875, -0.15692138671875, -0.0189208984375, 0.11907958984375, 0.257080078125, 0.39508056640625, 0.5330810546875, 0.67108154296875, 0.80908203125, 0.94708251953125, 1.0850830078125, 1.22308349609375, 1.361083984375, 1.49908447265625, 1.6370849609375, 1.77508544921875, 1.9130859375, 2.05108642578125, 2.1890869140625, 2.32708740234375, 2.465087890625, 2.60308837890625, 2.7410888671875, 2.87908935546875, 3.01708984375, 3.15509033203125, 3.2930908203125, 3.43109130859375, 3.569091796875, 3.70709228515625, 3.8450927734375, 3.98309326171875, 4.12109375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 8.0, 8.0, 14.0, 19.0, 30.0, 56.0, 78.0, 93.0, 169.0, 317.0, 531.0, 1131.0, 2479.0, 7043.0, 25714.0, 121973.0, 697312.0, 2492003.0, 688072.0, 120106.0, 25327.0, 6824.0, 2462.0, 1157.0, 533.0, 302.0, 186.0, 120.0, 72.0, 57.0, 35.0, 12.0, 12.0, 7.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6171875, -5.4388427734375, -5.260498046875, -5.0821533203125, -4.90380859375, -4.7254638671875, -4.547119140625, -4.3687744140625, -4.1904296875, -4.0120849609375, -3.833740234375, -3.6553955078125, -3.47705078125, -3.2987060546875, -3.120361328125, -2.9420166015625, -2.763671875, -2.5853271484375, -2.406982421875, -2.2286376953125, -2.05029296875, -1.8719482421875, -1.693603515625, -1.5152587890625, -1.3369140625, -1.1585693359375, -0.980224609375, -0.8018798828125, -0.62353515625, -0.4451904296875, -0.266845703125, -0.0885009765625, 0.08984375, 0.2681884765625, 0.446533203125, 0.6248779296875, 0.80322265625, 0.9815673828125, 1.159912109375, 1.3382568359375, 1.5166015625, 1.6949462890625, 1.873291015625, 2.0516357421875, 2.22998046875, 2.4083251953125, 2.586669921875, 2.7650146484375, 2.943359375, 3.1217041015625, 3.300048828125, 3.4783935546875, 3.65673828125, 3.8350830078125, 4.013427734375, 4.1917724609375, 4.3701171875, 4.5484619140625, 4.726806640625, 4.9051513671875, 5.08349609375, 5.2618408203125, 5.440185546875, 5.6185302734375, 5.796875]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 11.0, 24.0, 58.0, 145.0, 206.0, 231.0, 142.0, 107.0, 47.0, 24.0, 10.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.17232131958008, -39.153106689453125, -38.133888244628906, -37.11466979980469, -36.095455169677734, -35.07624053955078, -34.05702209472656, -33.037803649902344, -32.01858901977539, -30.999372482299805, -29.98015594482422, -28.960939407348633, -27.941722869873047, -26.92250633239746, -25.903289794921875, -24.88407325744629, -23.864856719970703, -22.845640182495117, -21.82642364501953, -20.807207107543945, -19.78799057006836, -18.768774032592773, -17.749557495117188, -16.7303409576416, -15.711124420166016, -14.69190788269043, -13.672691345214844, -12.653474807739258, -11.634258270263672, -10.615041732788086, -9.5958251953125, -8.576608657836914, -7.5573883056640625, -6.538171768188477, -5.518955230712891, -4.499738693237305, -3.4805221557617188, -2.461305618286133, -1.4420890808105469, -0.42287254333496094, 0.596343994140625, 1.615560531616211, 2.634777069091797, 3.653993606567383, 4.673210144042969, 5.692426681518555, 6.711643218994141, 7.730859756469727, 8.750076293945312, 9.769292831420898, 10.788509368896484, 11.80772590637207, 12.826942443847656, 13.846158981323242, 14.865375518798828, 15.884592056274414, 16.90380859375, 17.923025131225586, 18.942241668701172, 19.961458206176758, 20.980674743652344, 21.99989128112793, 23.019107818603516, 24.0383243560791, 25.057540893554688]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 7.0, 6.0, 10.0, 16.0, 17.0, 15.0, 13.0, 19.0, 21.0, 23.0, 19.0, 22.0, 31.0, 34.0, 39.0, 38.0, 33.0, 48.0, 37.0, 44.0, 63.0, 43.0, 37.0, 32.0, 38.0, 28.0, 29.0, 28.0, 32.0, 22.0, 26.0, 23.0, 18.0, 13.0, 16.0, 12.0, 8.0, 8.0, 7.0, 6.0, 4.0, 2.0, 9.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.92625617980957, -10.576140403747559, -10.226024627685547, -9.875908851623535, -9.525793075561523, -9.175678253173828, -8.825562477111816, -8.475446701049805, -8.125330924987793, -7.775215148925781, -7.4250993728637695, -7.074984073638916, -6.724868297576904, -6.374752521514893, -6.024637222290039, -5.674521446228027, -5.324405670166016, -4.974289894104004, -4.624174118041992, -4.274058818817139, -3.923943042755127, -3.5738272666931152, -3.2237117290496826, -2.87359619140625, -2.5234804153442383, -2.1733646392822266, -1.823249101638794, -1.4731334447860718, -1.1230177879333496, -0.7729021310806274, -0.4227864742279053, -0.07267093658447266, 0.27744483947753906, 0.6275604963302612, 0.9776761531829834, 1.3277918100357056, 1.6779074668884277, 2.0280232429504395, 2.378138780593872, 2.7282543182373047, 3.0783700942993164, 3.428485870361328, 3.7786014080047607, 4.128716945648193, 4.478832721710205, 4.828948497772217, 5.17906379699707, 5.529179573059082, 5.879295349121094, 6.2294111251831055, 6.579526901245117, 6.929642200469971, 7.279757976531982, 7.629873752593994, 7.979989051818848, 8.33010482788086, 8.680220603942871, 9.030336380004883, 9.380452156066895, 9.730567932128906, 10.080682754516602, 10.430798530578613, 10.780914306640625, 11.131030082702637, 11.481145858764648]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 4.0, 6.0, 11.0, 14.0, 10.0, 14.0, 17.0, 18.0, 14.0, 24.0, 24.0, 29.0, 28.0, 37.0, 31.0, 35.0, 31.0, 32.0, 41.0, 33.0, 41.0, 42.0, 42.0, 42.0, 32.0, 28.0, 42.0, 31.0, 21.0, 25.0, 19.0, 29.0, 22.0, 18.0, 15.0, 15.0, 11.0, 11.0, 8.0, 7.0, 10.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.98583984375, -0.9546890258789062, -0.9235382080078125, -0.8923873901367188, -0.861236572265625, -0.8300857543945312, -0.7989349365234375, -0.7677841186523438, -0.73663330078125, -0.7054824829101562, -0.6743316650390625, -0.6431808471679688, -0.612030029296875, -0.5808792114257812, -0.5497283935546875, -0.5185775756835938, -0.4874267578125, -0.45627593994140625, -0.4251251220703125, -0.39397430419921875, -0.362823486328125, -0.33167266845703125, -0.3005218505859375, -0.26937103271484375, -0.23822021484375, -0.20706939697265625, -0.1759185791015625, -0.14476776123046875, -0.113616943359375, -0.08246612548828125, -0.0513153076171875, -0.02016448974609375, 0.010986328125, 0.04213714599609375, 0.0732879638671875, 0.10443878173828125, 0.135589599609375, 0.16674041748046875, 0.1978912353515625, 0.22904205322265625, 0.26019287109375, 0.29134368896484375, 0.3224945068359375, 0.35364532470703125, 0.384796142578125, 0.41594696044921875, 0.4470977783203125, 0.47824859619140625, 0.5093994140625, 0.5405502319335938, 0.5717010498046875, 0.6028518676757812, 0.634002685546875, 0.6651535034179688, 0.6963043212890625, 0.7274551391601562, 0.75860595703125, 0.7897567749023438, 0.8209075927734375, 0.8520584106445312, 0.883209228515625, 0.9143600463867188, 0.9455108642578125, 0.9766616821289062, 1.0078125]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 8.0, 7.0, 21.0, 35.0, 48.0, 94.0, 128.0, 218.0, 326.0, 528.0, 766.0, 1082.0, 1801.0, 2768.0, 4249.0, 6548.0, 10000.0, 16149.0, 25290.0, 40330.0, 64318.0, 99745.0, 145308.0, 176900.0, 153674.0, 108197.0, 69913.0, 43859.0, 27479.0, 17378.0, 11091.0, 7254.0, 4731.0, 2891.0, 1911.0, 1223.0, 728.0, 537.0, 375.0, 216.0, 158.0, 99.0, 67.0, 34.0, 23.0, 20.0, 14.0, 8.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0806884765625, -0.07813453674316406, -0.07558059692382812, -0.07302665710449219, -0.07047271728515625, -0.06791877746582031, -0.06536483764648438, -0.06281089782714844, -0.0602569580078125, -0.05770301818847656, -0.055149078369140625, -0.05259513854980469, -0.05004119873046875, -0.04748725891113281, -0.044933319091796875, -0.04237937927246094, -0.039825439453125, -0.03727149963378906, -0.034717559814453125, -0.03216361999511719, -0.02960968017578125, -0.027055740356445312, -0.024501800537109375, -0.021947860717773438, -0.0193939208984375, -0.016839981079101562, -0.014286041259765625, -0.011732101440429688, -0.00917816162109375, -0.0066242218017578125, -0.004070281982421875, -0.0015163421630859375, 0.00103759765625, 0.0035915374755859375, 0.006145477294921875, 0.008699417114257812, 0.01125335693359375, 0.013807296752929688, 0.016361236572265625, 0.018915176391601562, 0.0214691162109375, 0.024023056030273438, 0.026576995849609375, 0.029130935668945312, 0.03168487548828125, 0.03423881530761719, 0.036792755126953125, 0.03934669494628906, 0.041900634765625, 0.04445457458496094, 0.047008514404296875, 0.04956245422363281, 0.05211639404296875, 0.05467033386230469, 0.057224273681640625, 0.05977821350097656, 0.0623321533203125, 0.06488609313964844, 0.06744003295898438, 0.06999397277832031, 0.07254791259765625, 0.07510185241699219, 0.07765579223632812, 0.08020973205566406, 0.082763671875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 4.0, 6.0, 5.0, 8.0, 6.0, 12.0, 8.0, 10.0, 15.0, 14.0, 25.0, 18.0, 32.0, 21.0, 21.0, 26.0, 38.0, 33.0, 34.0, 35.0, 33.0, 42.0, 1070.0, 46.0, 51.0, 34.0, 41.0, 37.0, 37.0, 34.0, 36.0, 22.0, 24.0, 19.0, 16.0, 23.0, 16.0, 20.0, 13.0, 12.0, 9.0, 6.0, 4.0, 4.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.77197265625, -0.7481689453125, -0.724365234375, -0.7005615234375, -0.6767578125, -0.6529541015625, -0.629150390625, -0.6053466796875, -0.58154296875, -0.5577392578125, -0.533935546875, -0.5101318359375, -0.486328125, -0.4625244140625, -0.438720703125, -0.4149169921875, -0.39111328125, -0.3673095703125, -0.343505859375, -0.3197021484375, -0.2958984375, -0.2720947265625, -0.248291015625, -0.2244873046875, -0.20068359375, -0.1768798828125, -0.153076171875, -0.1292724609375, -0.10546875, -0.0816650390625, -0.057861328125, -0.0340576171875, -0.01025390625, 0.0135498046875, 0.037353515625, 0.0611572265625, 0.0849609375, 0.1087646484375, 0.132568359375, 0.1563720703125, 0.18017578125, 0.2039794921875, 0.227783203125, 0.2515869140625, 0.275390625, 0.2991943359375, 0.322998046875, 0.3468017578125, 0.37060546875, 0.3944091796875, 0.418212890625, 0.4420166015625, 0.4658203125, 0.4896240234375, 0.513427734375, 0.5372314453125, 0.56103515625, 0.5848388671875, 0.608642578125, 0.6324462890625, 0.65625, 0.6800537109375, 0.703857421875, 0.7276611328125, 0.75146484375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 7.0, 6.0, 8.0, 17.0, 13.0, 31.0, 32.0, 42.0, 72.0, 127.0, 173.0, 279.0, 473.0, 638.0, 1038.0, 1734.0, 2716.0, 4296.0, 6860.0, 11252.0, 18413.0, 29463.0, 48269.0, 75629.0, 115118.0, 163579.0, 1210390.0, 141336.0, 97902.0, 63559.0, 39773.0, 24565.0, 14818.0, 9231.0, 5751.0, 3538.0, 2100.0, 1474.0, 821.0, 586.0, 320.0, 229.0, 155.0, 117.0, 67.0, 52.0, 27.0, 16.0, 14.0, 4.0, 8.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.046722412109375, -0.04512786865234375, -0.0435333251953125, -0.04193878173828125, -0.04034423828125, -0.03874969482421875, -0.0371551513671875, -0.03556060791015625, -0.033966064453125, -0.03237152099609375, -0.0307769775390625, -0.02918243408203125, -0.027587890625, -0.02599334716796875, -0.0243988037109375, -0.02280426025390625, -0.021209716796875, -0.01961517333984375, -0.0180206298828125, -0.01642608642578125, -0.01483154296875, -0.01323699951171875, -0.0116424560546875, -0.01004791259765625, -0.008453369140625, -0.00685882568359375, -0.0052642822265625, -0.00366973876953125, -0.0020751953125, -0.00048065185546875, 0.0011138916015625, 0.00270843505859375, 0.004302978515625, 0.00589752197265625, 0.0074920654296875, 0.00908660888671875, 0.01068115234375, 0.01227569580078125, 0.0138702392578125, 0.01546478271484375, 0.017059326171875, 0.01865386962890625, 0.0202484130859375, 0.02184295654296875, 0.0234375, 0.02503204345703125, 0.0266265869140625, 0.02822113037109375, 0.029815673828125, 0.03141021728515625, 0.0330047607421875, 0.03459930419921875, 0.03619384765625, 0.03778839111328125, 0.0393829345703125, 0.04097747802734375, 0.042572021484375, 0.04416656494140625, 0.0457611083984375, 0.04735565185546875, 0.0489501953125, 0.05054473876953125, 0.0521392822265625, 0.05373382568359375, 0.055328369140625]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 8.0, 8.0, 7.0, 4.0, 12.0, 16.0, 18.0, 29.0, 24.0, 25.0, 28.0, 33.0, 34.0, 44.0, 48.0, 59.0, 58.0, 62.0, 51.0, 51.0, 52.0, 42.0, 42.0, 34.0, 41.0, 20.0, 24.0, 24.0, 18.0, 8.0, 12.0, 4.0, 5.0, 8.0, 7.0, 6.0, 6.0, 7.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018863677978515625, -0.0018227100372314453, -0.0017590522766113281, -0.001695394515991211, -0.0016317367553710938, -0.0015680789947509766, -0.0015044212341308594, -0.0014407634735107422, -0.001377105712890625, -0.0013134479522705078, -0.0012497901916503906, -0.0011861324310302734, -0.0011224746704101562, -0.001058816909790039, -0.0009951591491699219, -0.0009315013885498047, -0.0008678436279296875, -0.0008041858673095703, -0.0007405281066894531, -0.0006768703460693359, -0.0006132125854492188, -0.0005495548248291016, -0.0004858970642089844, -0.0004222393035888672, -0.00035858154296875, -0.0002949237823486328, -0.00023126602172851562, -0.00016760826110839844, -0.00010395050048828125, -4.029273986816406e-05, 2.3365020751953125e-05, 8.702278137207031e-05, 0.0001506805419921875, 0.0002143383026123047, 0.0002779960632324219, 0.00034165382385253906, 0.00040531158447265625, 0.00046896934509277344, 0.0005326271057128906, 0.0005962848663330078, 0.000659942626953125, 0.0007236003875732422, 0.0007872581481933594, 0.0008509159088134766, 0.0009145736694335938, 0.000978231430053711, 0.0010418891906738281, 0.0011055469512939453, 0.0011692047119140625, 0.0012328624725341797, 0.0012965202331542969, 0.001360177993774414, 0.0014238357543945312, 0.0014874935150146484, 0.0015511512756347656, 0.0016148090362548828, 0.001678466796875, 0.0017421245574951172, 0.0018057823181152344, 0.0018694400787353516, 0.0019330978393554688, 0.001996755599975586, 0.002060413360595703, 0.0021240711212158203, 0.0021877288818359375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 7.0, 5.0, 7.0, 14.0, 8.0, 8.0, 14.0, 18.0, 17.0, 25.0, 29.0, 45.0, 48.0, 54.0, 72.0, 69.0, 106.0, 132.0, 167.0, 269.0, 694.0, 4104.0, 93970.0, 922944.0, 22472.0, 1832.0, 471.0, 237.0, 131.0, 100.0, 103.0, 62.0, 58.0, 39.0, 30.0, 42.0, 32.0, 21.0, 16.0, 27.0, 12.0, 12.0, 10.0, 6.0, 4.0, 3.0, 3.0, 6.0, 3.0, 11.0, 1.0, 0.0, 1.0], "bins": [-0.034332275390625, -0.03333163261413574, -0.032330989837646484, -0.03133034706115723, -0.03032970428466797, -0.02932906150817871, -0.028328418731689453, -0.027327775955200195, -0.026327133178710938, -0.02532649040222168, -0.024325847625732422, -0.023325204849243164, -0.022324562072753906, -0.02132391929626465, -0.02032327651977539, -0.019322633743286133, -0.018321990966796875, -0.017321348190307617, -0.01632070541381836, -0.015320062637329102, -0.014319419860839844, -0.013318777084350586, -0.012318134307861328, -0.01131749153137207, -0.010316848754882812, -0.009316205978393555, -0.008315563201904297, -0.007314920425415039, -0.006314277648925781, -0.0053136348724365234, -0.004312992095947266, -0.003312349319458008, -0.00231170654296875, -0.0013110637664794922, -0.0003104209899902344, 0.0006902217864990234, 0.0016908645629882812, 0.002691507339477539, 0.003692150115966797, 0.004692792892456055, 0.0056934356689453125, 0.00669407844543457, 0.007694721221923828, 0.008695363998413086, 0.009696006774902344, 0.010696649551391602, 0.01169729232788086, 0.012697935104370117, 0.013698577880859375, 0.014699220657348633, 0.01569986343383789, 0.01670050621032715, 0.017701148986816406, 0.018701791763305664, 0.019702434539794922, 0.02070307731628418, 0.021703720092773438, 0.022704362869262695, 0.023705005645751953, 0.02470564842224121, 0.02570629119873047, 0.026706933975219727, 0.027707576751708984, 0.028708219528198242, 0.0297088623046875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 20.0, 82.0, 599.0, 254.0, 41.0, 11.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048878371715545654, -0.04768109321594238, -0.04648381099104881, -0.04528653249144554, -0.04408925026655197, -0.0428919717669487, -0.04169468954205513, -0.04049741104245186, -0.03930012881755829, -0.03810285031795502, -0.03690556809306145, -0.035708289593458176, -0.034511007368564606, -0.033313728868961334, -0.032116446644067764, -0.030919168144464493, -0.029721887782216072, -0.02852460741996765, -0.02732732705771923, -0.02613004669547081, -0.02493276633322239, -0.02373548597097397, -0.022538207471370697, -0.021340925246477127, -0.020143646746873856, -0.018946366384625435, -0.017749086022377014, -0.016551805660128593, -0.015354525297880173, -0.014157244935631752, -0.012959965504705906, -0.011762685142457485, -0.01056540384888649, -0.00936812348663807, -0.008170843124389648, -0.006973563227802515, -0.005776282865554094, -0.004579002503305674, -0.00338172260671854, -0.0021844422444701195, -0.0009871618822216988, 0.00021011836361140013, 0.001407398609444499, 0.002604678738862276, 0.003801959101110697, 0.0049992394633591175, 0.006196519359946251, 0.007393799722194672, 0.008591080084443092, 0.009788360446691513, 0.010985640808939934, 0.012182921171188354, 0.013380201533436775, 0.014577481895685196, 0.015774760395288467, 0.016972042620182037, 0.01816932111978531, 0.01936660148203373, 0.02056388184428215, 0.02176116220653057, 0.02295844256877899, 0.024155722931027412, 0.025353003293275833, 0.026550281792879105, 0.027747564017772675]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 1.0, 5.0, 8.0, 11.0, 11.0, 10.0, 16.0, 13.0, 18.0, 27.0, 23.0, 23.0, 28.0, 37.0, 32.0, 35.0, 35.0, 35.0, 33.0, 40.0, 43.0, 53.0, 44.0, 45.0, 44.0, 31.0, 29.0, 30.0, 23.0, 30.0, 34.0, 14.0, 22.0, 21.0, 21.0, 14.0, 12.0, 8.0, 15.0, 8.0, 3.0, 11.0, 2.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005053520202636719, -0.00487324595451355, -0.004692971706390381, -0.004512697458267212, -0.004332423210144043, -0.004152148962020874, -0.003971874713897705, -0.003791600465774536, -0.003611326217651367, -0.0034310519695281982, -0.0032507777214050293, -0.0030705034732818604, -0.0028902292251586914, -0.0027099549770355225, -0.0025296807289123535, -0.0023494064807891846, -0.0021691322326660156, -0.0019888579845428467, -0.0018085837364196777, -0.0016283094882965088, -0.0014480352401733398, -0.001267760992050171, -0.001087486743927002, -0.000907212495803833, -0.0007269382476806641, -0.0005466639995574951, -0.00036638975143432617, -0.00018611550331115723, -5.841255187988281e-06, 0.00017443299293518066, 0.0003547072410583496, 0.0005349814891815186, 0.0007152557373046875, 0.0008955299854278564, 0.0010758042335510254, 0.0012560784816741943, 0.0014363527297973633, 0.0016166269779205322, 0.0017969012260437012, 0.00197717547416687, 0.002157449722290039, 0.002337723970413208, 0.002517998218536377, 0.002698272466659546, 0.002878546714782715, 0.003058820962905884, 0.0032390952110290527, 0.0034193694591522217, 0.0035996437072753906, 0.0037799179553985596, 0.0039601922035217285, 0.0041404664516448975, 0.004320740699768066, 0.004501014947891235, 0.004681289196014404, 0.004861563444137573, 0.005041837692260742, 0.005222111940383911, 0.00540238618850708, 0.005582660436630249, 0.005762934684753418, 0.005943208932876587, 0.006123483180999756, 0.006303757429122925, 0.006484031677246094]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 3.0, 6.0, 4.0, 6.0, 11.0, 14.0, 10.0, 14.0, 18.0, 17.0, 15.0, 23.0, 24.0, 30.0, 27.0, 38.0, 30.0, 35.0, 31.0, 32.0, 43.0, 31.0, 42.0, 41.0, 42.0, 43.0, 31.0, 29.0, 41.0, 31.0, 21.0, 25.0, 19.0, 29.0, 22.0, 18.0, 15.0, 15.0, 11.0, 11.0, 8.0, 7.0, 10.0, 6.0, 6.0, 5.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9853515625, -0.9542083740234375, -0.923065185546875, -0.8919219970703125, -0.86077880859375, -0.8296356201171875, -0.798492431640625, -0.7673492431640625, -0.7362060546875, -0.7050628662109375, -0.673919677734375, -0.6427764892578125, -0.61163330078125, -0.5804901123046875, -0.549346923828125, -0.5182037353515625, -0.487060546875, -0.4559173583984375, -0.424774169921875, -0.3936309814453125, -0.36248779296875, -0.3313446044921875, -0.300201416015625, -0.2690582275390625, -0.2379150390625, -0.2067718505859375, -0.175628662109375, -0.1444854736328125, -0.11334228515625, -0.0821990966796875, -0.051055908203125, -0.0199127197265625, 0.01123046875, 0.0423736572265625, 0.073516845703125, 0.1046600341796875, 0.13580322265625, 0.1669464111328125, 0.198089599609375, 0.2292327880859375, 0.2603759765625, 0.2915191650390625, 0.322662353515625, 0.3538055419921875, 0.38494873046875, 0.4160919189453125, 0.447235107421875, 0.4783782958984375, 0.509521484375, 0.5406646728515625, 0.571807861328125, 0.6029510498046875, 0.63409423828125, 0.6652374267578125, 0.696380615234375, 0.7275238037109375, 0.7586669921875, 0.7898101806640625, 0.820953369140625, 0.8520965576171875, 0.88323974609375, 0.9143829345703125, 0.945526123046875, 0.9766693115234375, 1.0078125]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 9.0, 9.0, 6.0, 13.0, 12.0, 24.0, 34.0, 35.0, 54.0, 68.0, 102.0, 158.0, 261.0, 332.0, 566.0, 828.0, 1353.0, 2207.0, 3632.0, 6200.0, 10649.0, 19688.0, 38050.0, 79188.0, 173549.0, 310507.0, 208591.0, 94701.0, 44665.0, 23020.0, 12325.0, 6832.0, 4050.0, 2481.0, 1512.0, 980.0, 640.0, 398.0, 255.0, 175.0, 123.0, 90.0, 57.0, 38.0, 33.0, 23.0, 14.0, 9.0, 2.0, 4.0, 8.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-1.240234375, -1.20220947265625, -1.1641845703125, -1.12615966796875, -1.088134765625, -1.05010986328125, -1.0120849609375, -0.97406005859375, -0.93603515625, -0.89801025390625, -0.8599853515625, -0.82196044921875, -0.783935546875, -0.74591064453125, -0.7078857421875, -0.66986083984375, -0.6318359375, -0.59381103515625, -0.5557861328125, -0.51776123046875, -0.479736328125, -0.44171142578125, -0.4036865234375, -0.36566162109375, -0.32763671875, -0.28961181640625, -0.2515869140625, -0.21356201171875, -0.175537109375, -0.13751220703125, -0.0994873046875, -0.06146240234375, -0.0234375, 0.01458740234375, 0.0526123046875, 0.09063720703125, 0.128662109375, 0.16668701171875, 0.2047119140625, 0.24273681640625, 0.28076171875, 0.31878662109375, 0.3568115234375, 0.39483642578125, 0.432861328125, 0.47088623046875, 0.5089111328125, 0.54693603515625, 0.5849609375, 0.62298583984375, 0.6610107421875, 0.69903564453125, 0.737060546875, 0.77508544921875, 0.8131103515625, 0.85113525390625, 0.88916015625, 0.92718505859375, 0.9652099609375, 1.00323486328125, 1.041259765625, 1.07928466796875, 1.1173095703125, 1.15533447265625, 1.193359375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 6.0, 5.0, 6.0, 9.0, 8.0, 13.0, 12.0, 12.0, 22.0, 13.0, 20.0, 31.0, 28.0, 48.0, 43.0, 61.0, 78.0, 147.0, 259.0, 1440.0, 226.0, 131.0, 68.0, 65.0, 39.0, 46.0, 28.0, 35.0, 38.0, 25.0, 17.0, 18.0, 10.0, 14.0, 13.0, 6.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-5.04296875, -4.904296875, -4.765625, -4.626953125, -4.48828125, -4.349609375, -4.2109375, -4.072265625, -3.93359375, -3.794921875, -3.65625, -3.517578125, -3.37890625, -3.240234375, -3.1015625, -2.962890625, -2.82421875, -2.685546875, -2.546875, -2.408203125, -2.26953125, -2.130859375, -1.9921875, -1.853515625, -1.71484375, -1.576171875, -1.4375, -1.298828125, -1.16015625, -1.021484375, -0.8828125, -0.744140625, -0.60546875, -0.466796875, -0.328125, -0.189453125, -0.05078125, 0.087890625, 0.2265625, 0.365234375, 0.50390625, 0.642578125, 0.78125, 0.919921875, 1.05859375, 1.197265625, 1.3359375, 1.474609375, 1.61328125, 1.751953125, 1.890625, 2.029296875, 2.16796875, 2.306640625, 2.4453125, 2.583984375, 2.72265625, 2.861328125, 3.0, 3.138671875, 3.27734375, 3.416015625, 3.5546875, 3.693359375, 3.83203125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 14.0, 12.0, 14.0, 13.0, 15.0, 29.0, 30.0, 48.0, 50.0, 91.0, 161.0, 274.0, 651.0, 2510.0, 18471.0, 418680.0, 2608759.0, 86741.0, 6818.0, 1276.0, 470.0, 210.0, 116.0, 62.0, 35.0, 28.0, 27.0, 26.0, 15.0, 18.0, 10.0, 11.0, 4.0, 4.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.87890625, -5.65521240234375, -5.4315185546875, -5.20782470703125, -4.984130859375, -4.76043701171875, -4.5367431640625, -4.31304931640625, -4.08935546875, -3.86566162109375, -3.6419677734375, -3.41827392578125, -3.194580078125, -2.97088623046875, -2.7471923828125, -2.52349853515625, -2.2998046875, -2.07611083984375, -1.8524169921875, -1.62872314453125, -1.405029296875, -1.18133544921875, -0.9576416015625, -0.73394775390625, -0.51025390625, -0.28656005859375, -0.0628662109375, 0.16082763671875, 0.384521484375, 0.60821533203125, 0.8319091796875, 1.05560302734375, 1.279296875, 1.50299072265625, 1.7266845703125, 1.95037841796875, 2.174072265625, 2.39776611328125, 2.6214599609375, 2.84515380859375, 3.06884765625, 3.29254150390625, 3.5162353515625, 3.73992919921875, 3.963623046875, 4.18731689453125, 4.4110107421875, 4.63470458984375, 4.8583984375, 5.08209228515625, 5.3057861328125, 5.52947998046875, 5.753173828125, 5.97686767578125, 6.2005615234375, 6.42425537109375, 6.64794921875, 6.87164306640625, 7.0953369140625, 7.31903076171875, 7.542724609375, 7.76641845703125, 7.9901123046875, 8.21380615234375, 8.4375]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [17.0, 75.0, 252.0, 355.0, 240.0, 62.0, 14.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6077628135681152, -1.8268611431121826, -1.0459595918655396, -0.2650580406188965, 0.5158436298370361, 1.2967453002929688, 2.0776467323303223, 2.858548641204834, 3.6394500732421875, 4.420351505279541, 5.201253414154053, 5.982154846191406, 6.763056755065918, 7.5439581871032715, 8.324859619140625, 9.105761528015137, 9.886663436889648, 10.66756534576416, 11.448466300964355, 12.229368209838867, 13.010270118713379, 13.79117202758789, 14.572072982788086, 15.352974891662598, 16.13387680053711, 16.914777755737305, 17.695680618286133, 18.476581573486328, 19.257482528686523, 20.03838539123535, 20.819286346435547, 21.600189208984375, 22.38109016418457, 23.161991119384766, 23.942893981933594, 24.72379493713379, 25.504695892333984, 26.285598754882812, 27.066499710083008, 27.847400665283203, 28.62830352783203, 29.409204483032227, 30.190107345581055, 30.97100830078125, 31.751909255981445, 32.53281021118164, 33.31371307373047, 34.0946159362793, 34.87551498413086, 35.65641784667969, 36.43731689453125, 37.21821975708008, 37.999122619628906, 38.78002166748047, 39.5609245300293, 40.341827392578125, 41.12273025512695, 41.90363311767578, 42.684532165527344, 43.46543502807617, 44.246337890625, 45.02723693847656, 45.80813980102539, 46.58904266357422, 47.36994171142578]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 5.0, 9.0, 8.0, 9.0, 12.0, 14.0, 15.0, 21.0, 22.0, 27.0, 18.0, 20.0, 31.0, 31.0, 19.0, 40.0, 30.0, 35.0, 52.0, 46.0, 40.0, 35.0, 45.0, 41.0, 33.0, 35.0, 39.0, 33.0, 36.0, 31.0, 19.0, 18.0, 14.0, 12.0, 12.0, 19.0, 15.0, 20.0, 8.0, 8.0, 6.0, 8.0, 3.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0], "bins": [-13.119026184082031, -12.737293243408203, -12.355560302734375, -11.973828315734863, -11.592095375061035, -11.210362434387207, -10.828630447387695, -10.446897506713867, -10.065164566040039, -9.683431625366211, -9.301698684692383, -8.919966697692871, -8.538233757019043, -8.156500816345215, -7.774768352508545, -7.393035888671875, -7.011302947998047, -6.629570007324219, -6.247837543487549, -5.866105079650879, -5.484372138977051, -5.102639198303223, -4.720906734466553, -4.339174270629883, -3.9574413299560547, -3.5757086277008057, -3.1939759254455566, -2.8122432231903076, -2.4305105209350586, -2.0487778186798096, -1.6670451164245605, -1.2853124141693115, -0.9035806655883789, -0.5218479633331299, -0.14011526107788086, 0.24161744117736816, 0.6233501434326172, 1.0050828456878662, 1.3868155479431152, 1.7685482501983643, 2.1502809524536133, 2.5320136547088623, 2.9137463569641113, 3.2954790592193604, 3.6772117614746094, 4.0589447021484375, 4.440677165985107, 4.822409629821777, 5.2041425704956055, 5.585875511169434, 5.9676079750061035, 6.349340438842773, 6.731073379516602, 7.11280632019043, 7.4945387840271, 7.8762712478637695, 8.258004188537598, 8.639737129211426, 9.021469116210938, 9.403202056884766, 9.784934997558594, 10.166667938232422, 10.54840087890625, 10.930132865905762, 11.31186580657959]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 7.0, 10.0, 6.0, 12.0, 12.0, 12.0, 20.0, 15.0, 19.0, 31.0, 28.0, 20.0, 33.0, 36.0, 27.0, 34.0, 28.0, 28.0, 40.0, 39.0, 39.0, 35.0, 54.0, 39.0, 35.0, 37.0, 33.0, 27.0, 22.0, 32.0, 20.0, 28.0, 14.0, 22.0, 13.0, 7.0, 14.0, 13.0, 8.0, 12.0, 8.0, 8.0, 6.0, 4.0, 1.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.0693359375, -1.0366058349609375, -1.003875732421875, -0.9711456298828125, -0.93841552734375, -0.9056854248046875, -0.872955322265625, -0.8402252197265625, -0.8074951171875, -0.7747650146484375, -0.742034912109375, -0.7093048095703125, -0.67657470703125, -0.6438446044921875, -0.611114501953125, -0.5783843994140625, -0.545654296875, -0.5129241943359375, -0.480194091796875, -0.4474639892578125, -0.41473388671875, -0.3820037841796875, -0.349273681640625, -0.3165435791015625, -0.2838134765625, -0.2510833740234375, -0.218353271484375, -0.1856231689453125, -0.15289306640625, -0.1201629638671875, -0.087432861328125, -0.0547027587890625, -0.02197265625, 0.0107574462890625, 0.043487548828125, 0.0762176513671875, 0.10894775390625, 0.1416778564453125, 0.174407958984375, 0.2071380615234375, 0.2398681640625, 0.2725982666015625, 0.305328369140625, 0.3380584716796875, 0.37078857421875, 0.4035186767578125, 0.436248779296875, 0.4689788818359375, 0.501708984375, 0.5344390869140625, 0.567169189453125, 0.5998992919921875, 0.63262939453125, 0.6653594970703125, 0.698089599609375, 0.7308197021484375, 0.7635498046875, 0.7962799072265625, 0.829010009765625, 0.8617401123046875, 0.89447021484375, 0.9272003173828125, 0.959930419921875, 0.9926605224609375, 1.025390625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 8.0, 7.0, 8.0, 9.0, 17.0, 15.0, 26.0, 28.0, 33.0, 39.0, 44.0, 72.0, 131.0, 194.0, 383.0, 806.0, 2216.0, 6713.0, 25267.0, 116724.0, 791920.0, 2635080.0, 503803.0, 83347.0, 18822.0, 5104.0, 1812.0, 716.0, 336.0, 164.0, 116.0, 69.0, 71.0, 39.0, 34.0, 24.0, 20.0, 15.0, 7.0, 13.0, 8.0, 9.0, 5.0, 4.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.765625, -3.649383544921875, -3.53314208984375, -3.416900634765625, -3.3006591796875, -3.184417724609375, -3.06817626953125, -2.951934814453125, -2.835693359375, -2.719451904296875, -2.60321044921875, -2.486968994140625, -2.3707275390625, -2.254486083984375, -2.13824462890625, -2.022003173828125, -1.90576171875, -1.789520263671875, -1.67327880859375, -1.557037353515625, -1.4407958984375, -1.324554443359375, -1.20831298828125, -1.092071533203125, -0.975830078125, -0.859588623046875, -0.74334716796875, -0.627105712890625, -0.5108642578125, -0.394622802734375, -0.27838134765625, -0.162139892578125, -0.0458984375, 0.070343017578125, 0.18658447265625, 0.302825927734375, 0.4190673828125, 0.535308837890625, 0.65155029296875, 0.767791748046875, 0.884033203125, 1.000274658203125, 1.11651611328125, 1.232757568359375, 1.3489990234375, 1.465240478515625, 1.58148193359375, 1.697723388671875, 1.81396484375, 1.930206298828125, 2.04644775390625, 2.162689208984375, 2.2789306640625, 2.395172119140625, 2.51141357421875, 2.627655029296875, 2.743896484375, 2.860137939453125, 2.97637939453125, 3.092620849609375, 3.2088623046875, 3.325103759765625, 3.44134521484375, 3.557586669921875, 3.673828125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 7.0, 5.0, 7.0, 7.0, 12.0, 18.0, 15.0, 35.0, 40.0, 60.0, 98.0, 135.0, 170.0, 283.0, 386.0, 532.0, 625.0, 504.0, 369.0, 251.0, 167.0, 122.0, 65.0, 46.0, 39.0, 33.0, 18.0, 8.0, 10.0, 3.0, 8.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1875, -4.0498046875, -3.912109375, -3.7744140625, -3.63671875, -3.4990234375, -3.361328125, -3.2236328125, -3.0859375, -2.9482421875, -2.810546875, -2.6728515625, -2.53515625, -2.3974609375, -2.259765625, -2.1220703125, -1.984375, -1.8466796875, -1.708984375, -1.5712890625, -1.43359375, -1.2958984375, -1.158203125, -1.0205078125, -0.8828125, -0.7451171875, -0.607421875, -0.4697265625, -0.33203125, -0.1943359375, -0.056640625, 0.0810546875, 0.21875, 0.3564453125, 0.494140625, 0.6318359375, 0.76953125, 0.9072265625, 1.044921875, 1.1826171875, 1.3203125, 1.4580078125, 1.595703125, 1.7333984375, 1.87109375, 2.0087890625, 2.146484375, 2.2841796875, 2.421875, 2.5595703125, 2.697265625, 2.8349609375, 2.97265625, 3.1103515625, 3.248046875, 3.3857421875, 3.5234375, 3.6611328125, 3.798828125, 3.9365234375, 4.07421875, 4.2119140625, 4.349609375, 4.4873046875, 4.625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 7.0, 8.0, 8.0, 23.0, 39.0, 57.0, 99.0, 175.0, 419.0, 953.0, 3091.0, 11980.0, 75803.0, 706173.0, 2855303.0, 472989.0, 54143.0, 8936.0, 2433.0, 833.0, 374.0, 169.0, 96.0, 53.0, 38.0, 25.0, 15.0, 9.0, 11.0, 10.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.0703125, -7.82879638671875, -7.5872802734375, -7.34576416015625, -7.104248046875, -6.86273193359375, -6.6212158203125, -6.37969970703125, -6.13818359375, -5.89666748046875, -5.6551513671875, -5.41363525390625, -5.172119140625, -4.93060302734375, -4.6890869140625, -4.44757080078125, -4.2060546875, -3.96453857421875, -3.7230224609375, -3.48150634765625, -3.239990234375, -2.99847412109375, -2.7569580078125, -2.51544189453125, -2.27392578125, -2.03240966796875, -1.7908935546875, -1.54937744140625, -1.307861328125, -1.06634521484375, -0.8248291015625, -0.58331298828125, -0.341796875, -0.10028076171875, 0.1412353515625, 0.38275146484375, 0.624267578125, 0.86578369140625, 1.1072998046875, 1.34881591796875, 1.59033203125, 1.83184814453125, 2.0733642578125, 2.31488037109375, 2.556396484375, 2.79791259765625, 3.0394287109375, 3.28094482421875, 3.5224609375, 3.76397705078125, 4.0054931640625, 4.24700927734375, 4.488525390625, 4.73004150390625, 4.9715576171875, 5.21307373046875, 5.45458984375, 5.69610595703125, 5.9376220703125, 6.17913818359375, 6.420654296875, 6.66217041015625, 6.9036865234375, 7.14520263671875, 7.38671875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 6.0, 5.0, 7.0, 6.0, 8.0, 13.0, 28.0, 20.0, 22.0, 35.0, 30.0, 49.0, 53.0, 73.0, 61.0, 83.0, 75.0, 79.0, 66.0, 56.0, 54.0, 29.0, 30.0, 27.0, 32.0, 18.0, 10.0, 8.0, 16.0, 5.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.869624137878418, -8.473861694335938, -8.07809829711914, -7.68233585357666, -7.2865729331970215, -6.890810012817383, -6.495047569274902, -6.099284648895264, -5.703521728515625, -5.307758808135986, -4.911995887756348, -4.516233444213867, -4.1204705238342285, -3.72470760345459, -3.3289449214935303, -2.9331822395324707, -2.537419319152832, -2.1416563987731934, -1.7458937168121338, -1.3501309156417847, -0.9543681144714355, -0.5586053133010864, -0.1628425121307373, 0.23292016983032227, 0.6286830902099609, 1.02444589138031, 1.4202086925506592, 1.8159714937210083, 2.2117342948913574, 2.607497215270996, 3.0032598972320557, 3.3990225791931152, 3.7947845458984375, 4.190547466278076, 4.586310386657715, 4.982072830200195, 5.377835750579834, 5.773598670959473, 6.169361114501953, 6.565124034881592, 6.9608869552612305, 7.356649875640869, 7.752412796020508, 8.148175239562988, 8.543937683105469, 8.939701080322266, 9.335463523864746, 9.731225967407227, 10.126989364624023, 10.522751808166504, 10.9185152053833, 11.314277648925781, 11.710041046142578, 12.105803489685059, 12.501565933227539, 12.897329330444336, 13.293091773986816, 13.688854217529297, 14.084617614746094, 14.480380058288574, 14.876142501831055, 15.271905899047852, 15.667668342590332, 16.063430786132812, 16.45919418334961]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 3.0, 5.0, 6.0, 5.0, 6.0, 8.0, 7.0, 12.0, 7.0, 11.0, 17.0, 22.0, 27.0, 35.0, 21.0, 37.0, 27.0, 34.0, 42.0, 33.0, 41.0, 39.0, 47.0, 36.0, 36.0, 46.0, 50.0, 42.0, 39.0, 35.0, 31.0, 31.0, 25.0, 22.0, 24.0, 13.0, 13.0, 11.0, 10.0, 13.0, 10.0, 8.0, 3.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-12.116527557373047, -11.737661361694336, -11.358794212341309, -10.979928016662598, -10.60106086730957, -10.22219467163086, -9.843328475952148, -9.464461326599121, -9.085594177246094, -8.706727981567383, -8.327860832214355, -7.9489946365356445, -7.570127487182617, -7.191261291503906, -6.812394618988037, -6.433527946472168, -6.054661750793457, -5.675795078277588, -5.296928405761719, -4.918062210083008, -4.5391950607299805, -4.1603288650512695, -3.7814621925354004, -3.4025955200195312, -3.023728847503662, -2.644862174987793, -2.265995502471924, -1.8871290683746338, -1.5082623958587646, -1.1293957233428955, -0.7505292892456055, -0.37166261672973633, 0.0072040557861328125, 0.3860706686973572, 0.7649372816085815, 1.1438038349151611, 1.5226705074310303, 1.9015371799468994, 2.2804036140441895, 2.6592702865600586, 3.0381369590759277, 3.417003631591797, 3.795870304107666, 4.174736976623535, 4.553603172302246, 4.932470321655273, 5.311336517333984, 5.6902031898498535, 6.069069862365723, 6.447936534881592, 6.826803207397461, 7.205669403076172, 7.584536552429199, 7.96340274810791, 8.342269897460938, 8.721136093139648, 9.10000228881836, 9.47886848449707, 9.857735633850098, 10.236601829528809, 10.615468978881836, 10.994335174560547, 11.373201370239258, 11.752068519592285, 12.130935668945312]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 3.0, 10.0, 9.0, 15.0, 10.0, 15.0, 13.0, 15.0, 18.0, 25.0, 26.0, 29.0, 37.0, 24.0, 35.0, 38.0, 40.0, 51.0, 36.0, 27.0, 52.0, 50.0, 36.0, 38.0, 37.0, 32.0, 30.0, 29.0, 32.0, 24.0, 29.0, 18.0, 23.0, 25.0, 15.0, 10.0, 3.0, 4.0, 5.0, 3.0, 6.0, 11.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1552734375, -1.119354248046875, -1.08343505859375, -1.047515869140625, -1.0115966796875, -0.975677490234375, -0.93975830078125, -0.903839111328125, -0.867919921875, -0.832000732421875, -0.79608154296875, -0.760162353515625, -0.7242431640625, -0.688323974609375, -0.65240478515625, -0.616485595703125, -0.58056640625, -0.544647216796875, -0.50872802734375, -0.472808837890625, -0.4368896484375, -0.400970458984375, -0.36505126953125, -0.329132080078125, -0.293212890625, -0.257293701171875, -0.22137451171875, -0.185455322265625, -0.1495361328125, -0.113616943359375, -0.07769775390625, -0.041778564453125, -0.005859375, 0.030059814453125, 0.06597900390625, 0.101898193359375, 0.1378173828125, 0.173736572265625, 0.20965576171875, 0.245574951171875, 0.281494140625, 0.317413330078125, 0.35333251953125, 0.389251708984375, 0.4251708984375, 0.461090087890625, 0.49700927734375, 0.532928466796875, 0.56884765625, 0.604766845703125, 0.64068603515625, 0.676605224609375, 0.7125244140625, 0.748443603515625, 0.78436279296875, 0.820281982421875, 0.856201171875, 0.892120361328125, 0.92803955078125, 0.963958740234375, 0.9998779296875, 1.035797119140625, 1.07171630859375, 1.107635498046875, 1.1435546875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 7.0, 1.0, 5.0, 6.0, 14.0, 23.0, 28.0, 34.0, 39.0, 67.0, 108.0, 163.0, 245.0, 380.0, 523.0, 803.0, 1129.0, 1841.0, 2972.0, 4561.0, 6848.0, 11113.0, 17322.0, 27406.0, 43353.0, 67091.0, 100610.0, 141318.0, 168710.0, 146163.0, 106903.0, 71724.0, 46104.0, 29291.0, 18993.0, 11734.0, 7266.0, 4773.0, 3099.0, 1952.0, 1247.0, 855.0, 585.0, 374.0, 277.0, 175.0, 122.0, 70.0, 43.0, 28.0, 34.0, 16.0, 4.0, 5.0, 6.0, 2.0, 2.0, 2.0], "bins": [-0.0938720703125, -0.0911569595336914, -0.08844184875488281, -0.08572673797607422, -0.08301162719726562, -0.08029651641845703, -0.07758140563964844, -0.07486629486083984, -0.07215118408203125, -0.06943607330322266, -0.06672096252441406, -0.06400585174560547, -0.061290740966796875, -0.05857563018798828, -0.05586051940917969, -0.053145408630371094, -0.0504302978515625, -0.047715187072753906, -0.04500007629394531, -0.04228496551513672, -0.039569854736328125, -0.03685474395751953, -0.03413963317871094, -0.031424522399902344, -0.02870941162109375, -0.025994300842285156, -0.023279190063476562, -0.02056407928466797, -0.017848968505859375, -0.015133857727050781, -0.012418746948242188, -0.009703636169433594, -0.006988525390625, -0.004273414611816406, -0.0015583038330078125, 0.0011568069458007812, 0.003871917724609375, 0.006587028503417969, 0.009302139282226562, 0.012017250061035156, 0.01473236083984375, 0.017447471618652344, 0.020162582397460938, 0.02287769317626953, 0.025592803955078125, 0.02830791473388672, 0.031023025512695312, 0.033738136291503906, 0.0364532470703125, 0.039168357849121094, 0.04188346862792969, 0.04459857940673828, 0.047313690185546875, 0.05002880096435547, 0.05274391174316406, 0.055459022521972656, 0.05817413330078125, 0.060889244079589844, 0.06360435485839844, 0.06631946563720703, 0.06903457641601562, 0.07174968719482422, 0.07446479797363281, 0.0771799087524414, 0.07989501953125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 7.0, 3.0, 8.0, 11.0, 10.0, 7.0, 14.0, 12.0, 12.0, 13.0, 20.0, 18.0, 26.0, 31.0, 25.0, 22.0, 23.0, 26.0, 34.0, 27.0, 34.0, 28.0, 38.0, 43.0, 1056.0, 32.0, 32.0, 47.0, 33.0, 36.0, 34.0, 27.0, 33.0, 21.0, 21.0, 20.0, 18.0, 23.0, 18.0, 20.0, 14.0, 6.0, 10.0, 7.0, 12.0, 7.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7412109375, -0.7174911499023438, -0.6937713623046875, -0.6700515747070312, -0.646331787109375, -0.6226119995117188, -0.5988922119140625, -0.5751724243164062, -0.55145263671875, -0.5277328491210938, -0.5040130615234375, -0.48029327392578125, -0.456573486328125, -0.43285369873046875, -0.4091339111328125, -0.38541412353515625, -0.3616943359375, -0.33797454833984375, -0.3142547607421875, -0.29053497314453125, -0.266815185546875, -0.24309539794921875, -0.2193756103515625, -0.19565582275390625, -0.17193603515625, -0.14821624755859375, -0.1244964599609375, -0.10077667236328125, -0.077056884765625, -0.05333709716796875, -0.0296173095703125, -0.00589752197265625, 0.017822265625, 0.04154205322265625, 0.0652618408203125, 0.08898162841796875, 0.112701416015625, 0.13642120361328125, 0.1601409912109375, 0.18386077880859375, 0.20758056640625, 0.23130035400390625, 0.2550201416015625, 0.27873992919921875, 0.302459716796875, 0.32617950439453125, 0.3498992919921875, 0.37361907958984375, 0.3973388671875, 0.42105865478515625, 0.4447784423828125, 0.46849822998046875, 0.492218017578125, 0.5159378051757812, 0.5396575927734375, 0.5633773803710938, 0.58709716796875, 0.6108169555664062, 0.6345367431640625, 0.6582565307617188, 0.681976318359375, 0.7056961059570312, 0.7294158935546875, 0.7531356811523438, 0.77685546875]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 6.0, 7.0, 9.0, 21.0, 30.0, 37.0, 43.0, 66.0, 96.0, 162.0, 262.0, 400.0, 635.0, 1048.0, 1617.0, 2569.0, 4066.0, 6327.0, 10150.0, 16011.0, 25562.0, 40542.0, 62877.0, 95624.0, 135794.0, 1198525.0, 165909.0, 114583.0, 77894.0, 49861.0, 31920.0, 20178.0, 12381.0, 8037.0, 5219.0, 3190.0, 2068.0, 1232.0, 796.0, 473.0, 329.0, 186.0, 132.0, 93.0, 49.0, 52.0, 26.0, 14.0, 13.0, 7.0, 8.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.053680419921875, -0.05198955535888672, -0.05029869079589844, -0.048607826232910156, -0.046916961669921875, -0.045226097106933594, -0.04353523254394531, -0.04184436798095703, -0.04015350341796875, -0.03846263885498047, -0.03677177429199219, -0.035080909729003906, -0.033390045166015625, -0.031699180603027344, -0.030008316040039062, -0.02831745147705078, -0.0266265869140625, -0.02493572235107422, -0.023244857788085938, -0.021553993225097656, -0.019863128662109375, -0.018172264099121094, -0.016481399536132812, -0.014790534973144531, -0.01309967041015625, -0.011408805847167969, -0.009717941284179688, -0.008027076721191406, -0.006336212158203125, -0.004645347595214844, -0.0029544830322265625, -0.0012636184692382812, 0.00042724609375, 0.0021181106567382812, 0.0038089752197265625, 0.005499839782714844, 0.007190704345703125, 0.008881568908691406, 0.010572433471679688, 0.012263298034667969, 0.01395416259765625, 0.01564502716064453, 0.017335891723632812, 0.019026756286621094, 0.020717620849609375, 0.022408485412597656, 0.024099349975585938, 0.02579021453857422, 0.0274810791015625, 0.02917194366455078, 0.030862808227539062, 0.032553672790527344, 0.034244537353515625, 0.035935401916503906, 0.03762626647949219, 0.03931713104248047, 0.04100799560546875, 0.04269886016845703, 0.04438972473144531, 0.046080589294433594, 0.047771453857421875, 0.049462318420410156, 0.05115318298339844, 0.05284404754638672, 0.054534912109375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 2.0, 1.0, 8.0, 3.0, 8.0, 6.0, 5.0, 8.0, 10.0, 12.0, 15.0, 21.0, 27.0, 41.0, 56.0, 80.0, 89.0, 119.0, 100.0, 93.0, 66.0, 58.0, 34.0, 38.0, 24.0, 14.0, 9.0, 17.0, 7.0, 7.0, 4.0, 4.0, 0.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00324249267578125, -0.0031303763389587402, -0.0030182600021362305, -0.0029061436653137207, -0.002794027328491211, -0.002681910991668701, -0.0025697946548461914, -0.0024576783180236816, -0.002345561981201172, -0.002233445644378662, -0.0021213293075561523, -0.0020092129707336426, -0.0018970966339111328, -0.001784980297088623, -0.0016728639602661133, -0.0015607476234436035, -0.0014486312866210938, -0.001336514949798584, -0.0012243986129760742, -0.0011122822761535645, -0.0010001659393310547, -0.0008880496025085449, -0.0007759332656860352, -0.0006638169288635254, -0.0005517005920410156, -0.00043958425521850586, -0.0003274679183959961, -0.00021535158157348633, -0.00010323524475097656, 8.881092071533203e-06, 0.00012099742889404297, 0.00023311376571655273, 0.0003452301025390625, 0.00045734643936157227, 0.000569462776184082, 0.0006815791130065918, 0.0007936954498291016, 0.0009058117866516113, 0.001017928123474121, 0.0011300444602966309, 0.0012421607971191406, 0.0013542771339416504, 0.0014663934707641602, 0.00157850980758667, 0.0016906261444091797, 0.0018027424812316895, 0.0019148588180541992, 0.002026975154876709, 0.0021390914916992188, 0.0022512078285217285, 0.0023633241653442383, 0.002475440502166748, 0.002587556838989258, 0.0026996731758117676, 0.0028117895126342773, 0.002923905849456787, 0.003036022186279297, 0.0031481385231018066, 0.0032602548599243164, 0.003372371196746826, 0.003484487533569336, 0.0035966038703918457, 0.0037087202072143555, 0.0038208365440368652, 0.003932952880859375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 2.0, 7.0, 6.0, 10.0, 17.0, 27.0, 25.0, 30.0, 48.0, 60.0, 89.0, 86.0, 158.0, 369.0, 1695.0, 89175.0, 946201.0, 9094.0, 681.0, 262.0, 149.0, 87.0, 60.0, 44.0, 25.0, 26.0, 24.0, 16.0, 17.0, 9.0, 9.0, 9.0, 11.0, 4.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.062103271484375, -0.060341835021972656, -0.05858039855957031, -0.05681896209716797, -0.055057525634765625, -0.05329608917236328, -0.05153465270996094, -0.049773216247558594, -0.04801177978515625, -0.046250343322753906, -0.04448890686035156, -0.04272747039794922, -0.040966033935546875, -0.03920459747314453, -0.03744316101074219, -0.035681724548339844, -0.0339202880859375, -0.032158851623535156, -0.030397415161132812, -0.02863597869873047, -0.026874542236328125, -0.02511310577392578, -0.023351669311523438, -0.021590232849121094, -0.01982879638671875, -0.018067359924316406, -0.016305923461914062, -0.014544486999511719, -0.012783050537109375, -0.011021614074707031, -0.009260177612304688, -0.007498741149902344, -0.0057373046875, -0.003975868225097656, -0.0022144317626953125, -0.00045299530029296875, 0.001308441162109375, 0.0030698776245117188, 0.0048313140869140625, 0.006592750549316406, 0.00835418701171875, 0.010115623474121094, 0.011877059936523438, 0.013638496398925781, 0.015399932861328125, 0.01716136932373047, 0.018922805786132812, 0.020684242248535156, 0.0224456787109375, 0.024207115173339844, 0.025968551635742188, 0.02772998809814453, 0.029491424560546875, 0.03125286102294922, 0.03301429748535156, 0.034775733947753906, 0.03653717041015625, 0.038298606872558594, 0.04006004333496094, 0.04182147979736328, 0.043582916259765625, 0.04534435272216797, 0.04710578918457031, 0.048867225646972656, 0.050628662109375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 11.0, 27.0, 70.0, 358.0, 430.0, 73.0, 28.0, 10.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037182606756687164, -0.03598521649837494, -0.03478782996535301, -0.03359043970704079, -0.03239304944872856, -0.031195661053061485, -0.02999827265739441, -0.028800882399082184, -0.027603494003415108, -0.02640610560774803, -0.025208715349435806, -0.02401132695376873, -0.022813938558101654, -0.02161654829978943, -0.020419159904122353, -0.019221771508455276, -0.01802438125014305, -0.016826992854475975, -0.01562960259616375, -0.014432214200496674, -0.013234824873507023, -0.012037435546517372, -0.010840047150850296, -0.009642657823860645, -0.008445268496870995, -0.007247879169881344, -0.00605049030855298, -0.004853101447224617, -0.0036557121202349663, -0.0024583227932453156, -0.0012609339319169521, -6.354507058858871e-05, 0.001133844256401062, 0.002331233350560069, 0.003528622444719076, 0.00472601130604744, 0.00592340063303709, 0.007120789960026741, 0.008318178355693817, 0.009515567682683468, 0.010712957009673119, 0.01191034633666277, 0.01310773566365242, 0.014305124059319496, 0.015502513386309147, 0.016699902713298798, 0.017897291108965874, 0.01909467950463295, 0.020292069762945175, 0.02148945815861225, 0.022686848416924477, 0.023884236812591553, 0.025081627070903778, 0.026279015466570854, 0.02747640386223793, 0.028673794120550156, 0.029871182516217232, 0.031068570911884308, 0.03226596117019653, 0.03346335142850876, 0.034660737961530685, 0.03585812821984291, 0.037055518478155136, 0.03825290501117706, 0.03945029526948929]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 8.0, 4.0, 7.0, 8.0, 15.0, 8.0, 20.0, 25.0, 14.0, 24.0, 26.0, 17.0, 33.0, 34.0, 33.0, 27.0, 31.0, 32.0, 47.0, 29.0, 36.0, 45.0, 49.0, 40.0, 26.0, 42.0, 32.0, 46.0, 30.0, 31.0, 19.0, 26.0, 22.0, 21.0, 8.0, 18.0, 18.0, 9.0, 8.0, 10.0, 9.0, 6.0, 4.0, 3.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.006825387477874756, -0.006605923175811768, -0.006386458873748779, -0.006166994571685791, -0.005947530269622803, -0.0057280659675598145, -0.005508601665496826, -0.005289137363433838, -0.00506967306137085, -0.004850208759307861, -0.004630744457244873, -0.004411280155181885, -0.0041918158531188965, -0.003972351551055908, -0.00375288724899292, -0.0035334229469299316, -0.0033139586448669434, -0.003094494342803955, -0.002875030040740967, -0.0026555657386779785, -0.0024361014366149902, -0.002216637134552002, -0.0019971728324890137, -0.0017777085304260254, -0.0015582442283630371, -0.0013387799263000488, -0.0011193156242370605, -0.0008998513221740723, -0.000680387020111084, -0.0004609227180480957, -0.00024145841598510742, -2.199411392211914e-05, 0.00019747018814086914, 0.0004169344902038574, 0.0006363987922668457, 0.000855863094329834, 0.0010753273963928223, 0.0012947916984558105, 0.0015142560005187988, 0.0017337203025817871, 0.0019531846046447754, 0.0021726489067077637, 0.002392113208770752, 0.0026115775108337402, 0.0028310418128967285, 0.003050506114959717, 0.003269970417022705, 0.0034894347190856934, 0.0037088990211486816, 0.00392836332321167, 0.004147827625274658, 0.0043672919273376465, 0.004586756229400635, 0.004806220531463623, 0.005025684833526611, 0.0052451491355896, 0.005464613437652588, 0.005684077739715576, 0.0059035420417785645, 0.006123006343841553, 0.006342470645904541, 0.006561934947967529, 0.006781399250030518, 0.007000863552093506, 0.007220327854156494]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 2.0, 4.0, 3.0, 10.0, 9.0, 15.0, 10.0, 15.0, 13.0, 15.0, 18.0, 25.0, 26.0, 28.0, 38.0, 25.0, 34.0, 38.0, 40.0, 51.0, 36.0, 27.0, 52.0, 50.0, 36.0, 38.0, 37.0, 32.0, 31.0, 28.0, 32.0, 24.0, 29.0, 18.0, 23.0, 25.0, 15.0, 10.0, 3.0, 4.0, 5.0, 3.0, 6.0, 11.0, 4.0, 2.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1552734375, -1.119354248046875, -1.08343505859375, -1.047515869140625, -1.0115966796875, -0.975677490234375, -0.93975830078125, -0.903839111328125, -0.867919921875, -0.832000732421875, -0.79608154296875, -0.760162353515625, -0.7242431640625, -0.688323974609375, -0.65240478515625, -0.616485595703125, -0.58056640625, -0.544647216796875, -0.50872802734375, -0.472808837890625, -0.4368896484375, -0.400970458984375, -0.36505126953125, -0.329132080078125, -0.293212890625, -0.257293701171875, -0.22137451171875, -0.185455322265625, -0.1495361328125, -0.113616943359375, -0.07769775390625, -0.041778564453125, -0.005859375, 0.030059814453125, 0.06597900390625, 0.101898193359375, 0.1378173828125, 0.173736572265625, 0.20965576171875, 0.245574951171875, 0.281494140625, 0.317413330078125, 0.35333251953125, 0.389251708984375, 0.4251708984375, 0.461090087890625, 0.49700927734375, 0.532928466796875, 0.56884765625, 0.604766845703125, 0.64068603515625, 0.676605224609375, 0.7125244140625, 0.748443603515625, 0.78436279296875, 0.820281982421875, 0.856201171875, 0.892120361328125, 0.92803955078125, 0.963958740234375, 0.9998779296875, 1.035797119140625, 1.07171630859375, 1.107635498046875, 1.1435546875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 5.0, 7.0, 3.0, 15.0, 21.0, 19.0, 33.0, 33.0, 52.0, 62.0, 112.0, 157.0, 229.0, 330.0, 532.0, 840.0, 1420.0, 2455.0, 4395.0, 8291.0, 15832.0, 32785.0, 74263.0, 181509.0, 338707.0, 218130.0, 89325.0, 39004.0, 18811.0, 9310.0, 4887.0, 2727.0, 1522.0, 962.0, 563.0, 361.0, 259.0, 164.0, 112.0, 86.0, 62.0, 37.0, 27.0, 32.0, 15.0, 17.0, 12.0, 6.0, 10.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2939453125, -1.2530059814453125, -1.212066650390625, -1.1711273193359375, -1.13018798828125, -1.0892486572265625, -1.048309326171875, -1.0073699951171875, -0.9664306640625, -0.9254913330078125, -0.884552001953125, -0.8436126708984375, -0.80267333984375, -0.7617340087890625, -0.720794677734375, -0.6798553466796875, -0.638916015625, -0.5979766845703125, -0.557037353515625, -0.5160980224609375, -0.47515869140625, -0.4342193603515625, -0.393280029296875, -0.3523406982421875, -0.3114013671875, -0.2704620361328125, -0.229522705078125, -0.1885833740234375, -0.14764404296875, -0.1067047119140625, -0.065765380859375, -0.0248260498046875, 0.01611328125, 0.0570526123046875, 0.097991943359375, 0.1389312744140625, 0.17987060546875, 0.2208099365234375, 0.261749267578125, 0.3026885986328125, 0.3436279296875, 0.3845672607421875, 0.425506591796875, 0.4664459228515625, 0.50738525390625, 0.5483245849609375, 0.589263916015625, 0.6302032470703125, 0.671142578125, 0.7120819091796875, 0.753021240234375, 0.7939605712890625, 0.83489990234375, 0.8758392333984375, 0.916778564453125, 0.9577178955078125, 0.9986572265625, 1.0395965576171875, 1.080535888671875, 1.1214752197265625, 1.16241455078125, 1.2033538818359375, 1.244293212890625, 1.2852325439453125, 1.326171875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 4.0, 8.0, 7.0, 10.0, 16.0, 19.0, 26.0, 26.0, 42.0, 34.0, 53.0, 62.0, 80.0, 130.0, 386.0, 1567.0, 133.0, 88.0, 65.0, 54.0, 46.0, 47.0, 34.0, 26.0, 18.0, 18.0, 16.0, 11.0, 9.0, 3.0, 4.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.29296875, -6.10845947265625, -5.9239501953125, -5.73944091796875, -5.554931640625, -5.37042236328125, -5.1859130859375, -5.00140380859375, -4.81689453125, -4.63238525390625, -4.4478759765625, -4.26336669921875, -4.078857421875, -3.89434814453125, -3.7098388671875, -3.52532958984375, -3.3408203125, -3.15631103515625, -2.9718017578125, -2.78729248046875, -2.602783203125, -2.41827392578125, -2.2337646484375, -2.04925537109375, -1.86474609375, -1.68023681640625, -1.4957275390625, -1.31121826171875, -1.126708984375, -0.94219970703125, -0.7576904296875, -0.57318115234375, -0.388671875, -0.20416259765625, -0.0196533203125, 0.16485595703125, 0.349365234375, 0.53387451171875, 0.7183837890625, 0.90289306640625, 1.08740234375, 1.27191162109375, 1.4564208984375, 1.64093017578125, 1.825439453125, 2.00994873046875, 2.1944580078125, 2.37896728515625, 2.5634765625, 2.74798583984375, 2.9324951171875, 3.11700439453125, 3.301513671875, 3.48602294921875, 3.6705322265625, 3.85504150390625, 4.03955078125, 4.22406005859375, 4.4085693359375, 4.59307861328125, 4.777587890625, 4.96209716796875, 5.1466064453125, 5.33111572265625, 5.515625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 1.0, 3.0, 3.0, 7.0, 11.0, 10.0, 17.0, 23.0, 36.0, 38.0, 64.0, 86.0, 121.0, 204.0, 518.0, 1681.0, 7846.0, 92898.0, 2852792.0, 174758.0, 11146.0, 2128.0, 604.0, 287.0, 139.0, 69.0, 52.0, 35.0, 33.0, 18.0, 22.0, 20.0, 14.0, 5.0, 2.0, 2.0, 8.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-6.3046875, -6.076171875, -5.84765625, -5.619140625, -5.390625, -5.162109375, -4.93359375, -4.705078125, -4.4765625, -4.248046875, -4.01953125, -3.791015625, -3.5625, -3.333984375, -3.10546875, -2.876953125, -2.6484375, -2.419921875, -2.19140625, -1.962890625, -1.734375, -1.505859375, -1.27734375, -1.048828125, -0.8203125, -0.591796875, -0.36328125, -0.134765625, 0.09375, 0.322265625, 0.55078125, 0.779296875, 1.0078125, 1.236328125, 1.46484375, 1.693359375, 1.921875, 2.150390625, 2.37890625, 2.607421875, 2.8359375, 3.064453125, 3.29296875, 3.521484375, 3.75, 3.978515625, 4.20703125, 4.435546875, 4.6640625, 4.892578125, 5.12109375, 5.349609375, 5.578125, 5.806640625, 6.03515625, 6.263671875, 6.4921875, 6.720703125, 6.94921875, 7.177734375, 7.40625, 7.634765625, 7.86328125, 8.091796875, 8.3203125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [21.0, 789.0, 204.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.155524730682373, -1.7681946754455566, 0.6191353797912598, 3.006465435028076, 5.393795490264893, 7.781125545501709, 10.168455123901367, 12.5557861328125, 14.943115234375, 17.3304443359375, 19.717775344848633, 22.105106353759766, 24.492435455322266, 26.879764556884766, 29.2670955657959, 31.65442657470703, 34.04175567626953, 36.42908477783203, 38.81641387939453, 41.2037467956543, 43.5910758972168, 45.9784049987793, 48.36573791503906, 50.75306701660156, 53.14039611816406, 55.52772521972656, 57.91505432128906, 60.30238723754883, 62.68971633911133, 65.0770492553711, 67.4643783569336, 69.8517074584961, 72.23904418945312, 74.62637329101562, 77.01370239257812, 79.40103149414062, 81.78836059570312, 84.17569732666016, 86.56302642822266, 88.95035552978516, 91.33768463134766, 93.72501373291016, 96.11234283447266, 98.49967193603516, 100.88700866699219, 103.27433776855469, 105.66166687011719, 108.04899597167969, 110.43632507324219, 112.82365417480469, 115.21098327636719, 117.59831237792969, 119.98564147949219, 122.37297821044922, 124.76030731201172, 127.14763641357422, 129.53497314453125, 131.92230224609375, 134.30963134765625, 136.69696044921875, 139.08428955078125, 141.47161865234375, 143.85894775390625, 146.24627685546875, 148.63360595703125]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 5.0, 6.0, 10.0, 14.0, 11.0, 29.0, 20.0, 17.0, 19.0, 13.0, 26.0, 30.0, 25.0, 29.0, 32.0, 33.0, 42.0, 37.0, 36.0, 35.0, 54.0, 50.0, 42.0, 42.0, 35.0, 42.0, 32.0, 32.0, 33.0, 26.0, 24.0, 22.0, 22.0, 11.0, 14.0, 11.0, 7.0, 12.0, 10.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.868556022644043, -13.431768417358398, -12.994980812072754, -12.55819320678711, -12.121405601501465, -11.68461799621582, -11.247830390930176, -10.811042785644531, -10.374255180358887, -9.937467575073242, -9.500679969787598, -9.063892364501953, -8.627104759216309, -8.190317153930664, -7.7535295486450195, -7.316741943359375, -6.8799543380737305, -6.443166732788086, -6.006379127502441, -5.569591522216797, -5.132803916931152, -4.696016311645508, -4.259228706359863, -3.8224411010742188, -3.385653495788574, -2.9488658905029297, -2.512078285217285, -2.0752906799316406, -1.638503074645996, -1.2017154693603516, -0.764927864074707, -0.3281402587890625, 0.10864734649658203, 0.5454349517822266, 0.9822225570678711, 1.4190101623535156, 1.8557977676391602, 2.2925853729248047, 2.729372978210449, 3.1661605834960938, 3.6029481887817383, 4.039735794067383, 4.476523399353027, 4.913311004638672, 5.350098609924316, 5.786886215209961, 6.2236738204956055, 6.66046142578125, 7.0972490310668945, 7.534036636352539, 7.970824241638184, 8.407611846923828, 8.844399452209473, 9.281187057495117, 9.717974662780762, 10.154762268066406, 10.59154987335205, 11.028337478637695, 11.46512508392334, 11.901912689208984, 12.338700294494629, 12.775487899780273, 13.212275505065918, 13.649063110351562, 14.085850715637207]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 9.0, 6.0, 11.0, 14.0, 8.0, 12.0, 15.0, 20.0, 13.0, 20.0, 23.0, 35.0, 31.0, 35.0, 36.0, 29.0, 46.0, 38.0, 39.0, 43.0, 37.0, 51.0, 39.0, 42.0, 22.0, 31.0, 42.0, 28.0, 33.0, 30.0, 24.0, 25.0, 17.0, 16.0, 17.0, 10.0, 10.0, 6.0, 6.0, 5.0, 5.0, 8.0, 5.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.232421875, -1.1954803466796875, -1.158538818359375, -1.1215972900390625, -1.08465576171875, -1.0477142333984375, -1.010772705078125, -0.9738311767578125, -0.9368896484375, -0.8999481201171875, -0.863006591796875, -0.8260650634765625, -0.78912353515625, -0.7521820068359375, -0.715240478515625, -0.6782989501953125, -0.641357421875, -0.6044158935546875, -0.567474365234375, -0.5305328369140625, -0.49359130859375, -0.4566497802734375, -0.419708251953125, -0.3827667236328125, -0.3458251953125, -0.3088836669921875, -0.271942138671875, -0.2350006103515625, -0.19805908203125, -0.1611175537109375, -0.124176025390625, -0.0872344970703125, -0.05029296875, -0.0133514404296875, 0.023590087890625, 0.0605316162109375, 0.09747314453125, 0.1344146728515625, 0.171356201171875, 0.2082977294921875, 0.2452392578125, 0.2821807861328125, 0.319122314453125, 0.3560638427734375, 0.39300537109375, 0.4299468994140625, 0.466888427734375, 0.5038299560546875, 0.540771484375, 0.5777130126953125, 0.614654541015625, 0.6515960693359375, 0.68853759765625, 0.7254791259765625, 0.762420654296875, 0.7993621826171875, 0.8363037109375, 0.8732452392578125, 0.910186767578125, 0.9471282958984375, 0.98406982421875, 1.0210113525390625, 1.057952880859375, 1.0948944091796875, 1.1318359375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 6.0, 5.0, 6.0, 6.0, 13.0, 7.0, 24.0, 25.0, 34.0, 33.0, 49.0, 67.0, 130.0, 200.0, 303.0, 652.0, 1250.0, 2539.0, 5487.0, 12455.0, 30127.0, 80416.0, 243410.0, 896982.0, 1880939.0, 724016.0, 200367.0, 67989.0, 26080.0, 11016.0, 4837.0, 2232.0, 1116.0, 558.0, 310.0, 198.0, 113.0, 89.0, 60.0, 34.0, 32.0, 20.0, 12.0, 8.0, 13.0, 8.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.08203125, -2.011260986328125, -1.94049072265625, -1.869720458984375, -1.7989501953125, -1.728179931640625, -1.65740966796875, -1.586639404296875, -1.515869140625, -1.445098876953125, -1.37432861328125, -1.303558349609375, -1.2327880859375, -1.162017822265625, -1.09124755859375, -1.020477294921875, -0.94970703125, -0.878936767578125, -0.80816650390625, -0.737396240234375, -0.6666259765625, -0.595855712890625, -0.52508544921875, -0.454315185546875, -0.383544921875, -0.312774658203125, -0.24200439453125, -0.171234130859375, -0.1004638671875, -0.029693603515625, 0.04107666015625, 0.111846923828125, 0.1826171875, 0.253387451171875, 0.32415771484375, 0.394927978515625, 0.4656982421875, 0.536468505859375, 0.60723876953125, 0.678009033203125, 0.748779296875, 0.819549560546875, 0.89031982421875, 0.961090087890625, 1.0318603515625, 1.102630615234375, 1.17340087890625, 1.244171142578125, 1.31494140625, 1.385711669921875, 1.45648193359375, 1.527252197265625, 1.5980224609375, 1.668792724609375, 1.73956298828125, 1.810333251953125, 1.881103515625, 1.951873779296875, 2.02264404296875, 2.093414306640625, 2.1641845703125, 2.234954833984375, 2.30572509765625, 2.376495361328125, 2.447265625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 3.0, 5.0, 6.0, 6.0, 11.0, 22.0, 25.0, 42.0, 55.0, 71.0, 98.0, 152.0, 210.0, 350.0, 431.0, 577.0, 548.0, 439.0, 325.0, 225.0, 122.0, 106.0, 61.0, 62.0, 34.0, 25.0, 19.0, 10.0, 6.0, 12.0, 3.0, 3.0, 4.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.36328125, -4.230712890625, -4.09814453125, -3.965576171875, -3.8330078125, -3.700439453125, -3.56787109375, -3.435302734375, -3.302734375, -3.170166015625, -3.03759765625, -2.905029296875, -2.7724609375, -2.639892578125, -2.50732421875, -2.374755859375, -2.2421875, -2.109619140625, -1.97705078125, -1.844482421875, -1.7119140625, -1.579345703125, -1.44677734375, -1.314208984375, -1.181640625, -1.049072265625, -0.91650390625, -0.783935546875, -0.6513671875, -0.518798828125, -0.38623046875, -0.253662109375, -0.12109375, 0.011474609375, 0.14404296875, 0.276611328125, 0.4091796875, 0.541748046875, 0.67431640625, 0.806884765625, 0.939453125, 1.072021484375, 1.20458984375, 1.337158203125, 1.4697265625, 1.602294921875, 1.73486328125, 1.867431640625, 2.0, 2.132568359375, 2.26513671875, 2.397705078125, 2.5302734375, 2.662841796875, 2.79541015625, 2.927978515625, 3.060546875, 3.193115234375, 3.32568359375, 3.458251953125, 3.5908203125, 3.723388671875, 3.85595703125, 3.988525390625, 4.12109375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 6.0, 10.0, 16.0, 30.0, 37.0, 51.0, 80.0, 150.0, 269.0, 506.0, 1043.0, 2143.0, 5984.0, 20100.0, 86269.0, 450249.0, 2219132.0, 1145578.0, 202471.0, 42443.0, 10959.0, 3588.0, 1524.0, 720.0, 384.0, 212.0, 136.0, 65.0, 47.0, 23.0, 13.0, 11.0, 9.0, 7.0, 4.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-5.94140625, -5.76544189453125, -5.5894775390625, -5.41351318359375, -5.237548828125, -5.06158447265625, -4.8856201171875, -4.70965576171875, -4.53369140625, -4.35772705078125, -4.1817626953125, -4.00579833984375, -3.829833984375, -3.65386962890625, -3.4779052734375, -3.30194091796875, -3.1259765625, -2.95001220703125, -2.7740478515625, -2.59808349609375, -2.422119140625, -2.24615478515625, -2.0701904296875, -1.89422607421875, -1.71826171875, -1.54229736328125, -1.3663330078125, -1.19036865234375, -1.014404296875, -0.83843994140625, -0.6624755859375, -0.48651123046875, -0.310546875, -0.13458251953125, 0.0413818359375, 0.21734619140625, 0.393310546875, 0.56927490234375, 0.7452392578125, 0.92120361328125, 1.09716796875, 1.27313232421875, 1.4490966796875, 1.62506103515625, 1.801025390625, 1.97698974609375, 2.1529541015625, 2.32891845703125, 2.5048828125, 2.68084716796875, 2.8568115234375, 3.03277587890625, 3.208740234375, 3.38470458984375, 3.5606689453125, 3.73663330078125, 3.91259765625, 4.08856201171875, 4.2645263671875, 4.44049072265625, 4.616455078125, 4.79241943359375, 4.9683837890625, 5.14434814453125, 5.3203125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 28.0, 121.0, 284.0, 334.0, 181.0, 56.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.04283905029297, -85.95830535888672, -83.873779296875, -81.78924560546875, -79.70471954345703, -77.62018585205078, -75.53565979003906, -73.45112609863281, -71.36659240722656, -69.28205871582031, -67.1975326538086, -65.11299896240234, -63.028472900390625, -60.943939208984375, -58.85940933227539, -56.774879455566406, -54.69035339355469, -52.6058235168457, -50.52129364013672, -48.436763763427734, -46.35223388671875, -44.2677001953125, -42.183170318603516, -40.09864044189453, -38.01411056518555, -35.92958068847656, -33.84505081176758, -31.76051902770996, -29.675989151000977, -27.591459274291992, -25.506927490234375, -23.42239761352539, -21.337871551513672, -19.253341674804688, -17.168811798095703, -15.084280014038086, -12.999750137329102, -10.915220260620117, -8.830689430236816, -6.746158599853516, -4.661628723144531, -2.5770983695983887, -0.4925680160522461, 1.5919623374938965, 3.676492691040039, 5.761022567749023, 7.845553398132324, 9.930084228515625, 12.01461410522461, 14.099143981933594, 16.183673858642578, 18.268205642700195, 20.35273551940918, 22.437265396118164, 24.52179718017578, 26.606327056884766, 28.69085693359375, 30.775386810302734, 32.85991668701172, 34.9444465637207, 37.02897644042969, 39.11351013183594, 41.19804000854492, 43.282569885253906, 45.36709976196289]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 8.0, 5.0, 6.0, 5.0, 10.0, 13.0, 14.0, 15.0, 13.0, 21.0, 29.0, 31.0, 33.0, 44.0, 38.0, 33.0, 35.0, 36.0, 45.0, 51.0, 43.0, 46.0, 36.0, 40.0, 37.0, 34.0, 43.0, 26.0, 33.0, 35.0, 20.0, 24.0, 21.0, 17.0, 13.0, 9.0, 7.0, 6.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.617027282714844, -12.220959663391113, -11.824891090393066, -11.428823471069336, -11.032754898071289, -10.636687278747559, -10.240619659423828, -9.844551086425781, -9.448482513427734, -9.052414894104004, -8.656346321105957, -8.260278701782227, -7.86421012878418, -7.468142509460449, -7.0720744132995605, -6.676006317138672, -6.279938697814941, -5.883870601654053, -5.487802505493164, -5.091734886169434, -4.695666313171387, -4.299598693847656, -3.9035305976867676, -3.507462501525879, -3.1113944053649902, -2.7153263092041016, -2.319258213043213, -1.9231903553009033, -1.5271222591400146, -1.131054162979126, -0.7349863052368164, -0.33891820907592773, 0.05714988708496094, 0.45321792364120483, 0.8492859601974487, 1.2453539371490479, 1.6414220333099365, 2.037490129470825, 2.4335579872131348, 2.8296260833740234, 3.225694179534912, 3.621762275695801, 4.0178303718566895, 4.413898468017578, 4.809966087341309, 5.2060346603393555, 5.602102279663086, 5.998170375823975, 6.394238471984863, 6.790306568145752, 7.186374664306641, 7.582442283630371, 7.978510856628418, 8.374578475952148, 8.770647048950195, 9.166714668273926, 9.562782287597656, 9.958849906921387, 10.354918479919434, 10.750986099243164, 11.147054672241211, 11.543122291564941, 11.939189910888672, 12.335258483886719, 12.731327056884766]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 6.0, 14.0, 11.0, 12.0, 21.0, 16.0, 10.0, 14.0, 21.0, 32.0, 40.0, 28.0, 26.0, 44.0, 37.0, 30.0, 32.0, 40.0, 35.0, 43.0, 40.0, 36.0, 32.0, 27.0, 38.0, 30.0, 26.0, 26.0, 27.0, 36.0, 31.0, 18.0, 14.0, 22.0, 15.0, 11.0, 9.0, 5.0, 6.0, 5.0, 7.0, 6.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1552734375, -1.1186676025390625, -1.082061767578125, -1.0454559326171875, -1.00885009765625, -0.9722442626953125, -0.935638427734375, -0.8990325927734375, -0.8624267578125, -0.8258209228515625, -0.789215087890625, -0.7526092529296875, -0.71600341796875, -0.6793975830078125, -0.642791748046875, -0.6061859130859375, -0.569580078125, -0.5329742431640625, -0.496368408203125, -0.4597625732421875, -0.42315673828125, -0.3865509033203125, -0.349945068359375, -0.3133392333984375, -0.2767333984375, -0.2401275634765625, -0.203521728515625, -0.1669158935546875, -0.13031005859375, -0.0937042236328125, -0.057098388671875, -0.0204925537109375, 0.01611328125, 0.0527191162109375, 0.089324951171875, 0.1259307861328125, 0.16253662109375, 0.1991424560546875, 0.235748291015625, 0.2723541259765625, 0.3089599609375, 0.3455657958984375, 0.382171630859375, 0.4187774658203125, 0.45538330078125, 0.4919891357421875, 0.528594970703125, 0.5652008056640625, 0.601806640625, 0.6384124755859375, 0.675018310546875, 0.7116241455078125, 0.74822998046875, 0.7848358154296875, 0.821441650390625, 0.8580474853515625, 0.8946533203125, 0.9312591552734375, 0.967864990234375, 1.0044708251953125, 1.04107666015625, 1.0776824951171875, 1.114288330078125, 1.1508941650390625, 1.1875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 7.0, 7.0, 8.0, 10.0, 22.0, 32.0, 37.0, 75.0, 101.0, 150.0, 216.0, 313.0, 451.0, 697.0, 1006.0, 1475.0, 2137.0, 3391.0, 5176.0, 7913.0, 12209.0, 18561.0, 28786.0, 43800.0, 64833.0, 94977.0, 131749.0, 157519.0, 143268.0, 108237.0, 74855.0, 50237.0, 33254.0, 21744.0, 14405.0, 9232.0, 6043.0, 3895.0, 2480.0, 1711.0, 1133.0, 753.0, 513.0, 368.0, 260.0, 201.0, 98.0, 78.0, 43.0, 45.0, 20.0, 11.0, 12.0, 3.0, 6.0, 3.0, 0.0, 3.0], "bins": [-0.09307861328125, -0.09031486511230469, -0.08755111694335938, -0.08478736877441406, -0.08202362060546875, -0.07925987243652344, -0.07649612426757812, -0.07373237609863281, -0.0709686279296875, -0.06820487976074219, -0.06544113159179688, -0.06267738342285156, -0.05991363525390625, -0.05714988708496094, -0.054386138916015625, -0.05162239074707031, -0.048858642578125, -0.04609489440917969, -0.043331146240234375, -0.04056739807128906, -0.03780364990234375, -0.03503990173339844, -0.032276153564453125, -0.029512405395507812, -0.0267486572265625, -0.023984909057617188, -0.021221160888671875, -0.018457412719726562, -0.01569366455078125, -0.012929916381835938, -0.010166168212890625, -0.0074024200439453125, -0.004638671875, -0.0018749237060546875, 0.000888824462890625, 0.0036525726318359375, 0.00641632080078125, 0.009180068969726562, 0.011943817138671875, 0.014707565307617188, 0.0174713134765625, 0.020235061645507812, 0.022998809814453125, 0.025762557983398438, 0.02852630615234375, 0.03129005432128906, 0.034053802490234375, 0.03681755065917969, 0.039581298828125, 0.04234504699707031, 0.045108795166015625, 0.04787254333496094, 0.05063629150390625, 0.05340003967285156, 0.056163787841796875, 0.05892753601074219, 0.0616912841796875, 0.06445503234863281, 0.06721878051757812, 0.06998252868652344, 0.07274627685546875, 0.07551002502441406, 0.07827377319335938, 0.08103752136230469, 0.08380126953125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 5.0, 5.0, 14.0, 14.0, 12.0, 12.0, 15.0, 15.0, 25.0, 17.0, 32.0, 31.0, 29.0, 29.0, 37.0, 31.0, 31.0, 43.0, 44.0, 34.0, 1075.0, 38.0, 36.0, 41.0, 56.0, 28.0, 35.0, 40.0, 19.0, 21.0, 26.0, 15.0, 19.0, 13.0, 17.0, 9.0, 12.0, 10.0, 10.0, 8.0, 6.0, 5.0, 5.0, 0.0, 2.0, 3.0, 1.0, 4.0], "bins": [-1.013671875, -0.9856491088867188, -0.9576263427734375, -0.9296035766601562, -0.901580810546875, -0.8735580444335938, -0.8455352783203125, -0.8175125122070312, -0.78948974609375, -0.7614669799804688, -0.7334442138671875, -0.7054214477539062, -0.677398681640625, -0.6493759155273438, -0.6213531494140625, -0.5933303833007812, -0.5653076171875, -0.5372848510742188, -0.5092620849609375, -0.48123931884765625, -0.453216552734375, -0.42519378662109375, -0.3971710205078125, -0.36914825439453125, -0.34112548828125, -0.31310272216796875, -0.2850799560546875, -0.25705718994140625, -0.229034423828125, -0.20101165771484375, -0.1729888916015625, -0.14496612548828125, -0.116943359375, -0.08892059326171875, -0.0608978271484375, -0.03287506103515625, -0.004852294921875, 0.02317047119140625, 0.0511932373046875, 0.07921600341796875, 0.10723876953125, 0.13526153564453125, 0.1632843017578125, 0.19130706787109375, 0.219329833984375, 0.24735260009765625, 0.2753753662109375, 0.30339813232421875, 0.3314208984375, 0.35944366455078125, 0.3874664306640625, 0.41548919677734375, 0.443511962890625, 0.47153472900390625, 0.4995574951171875, 0.5275802612304688, 0.55560302734375, 0.5836257934570312, 0.6116485595703125, 0.6396713256835938, 0.667694091796875, 0.6957168579101562, 0.7237396240234375, 0.7517623901367188, 0.77978515625]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 8.0, 16.0, 23.0, 23.0, 41.0, 65.0, 101.0, 151.0, 227.0, 343.0, 611.0, 916.0, 1551.0, 2403.0, 3940.0, 6231.0, 10136.0, 16584.0, 27184.0, 44223.0, 71226.0, 109997.0, 158167.0, 1220659.0, 148506.0, 102156.0, 65858.0, 40435.0, 25075.0, 15224.0, 9535.0, 5921.0, 3627.0, 2242.0, 1426.0, 890.0, 523.0, 327.0, 183.0, 135.0, 78.0, 54.0, 41.0, 24.0, 14.0, 17.0, 6.0, 9.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.069091796875, -0.06708383560180664, -0.06507587432861328, -0.06306791305541992, -0.06105995178222656, -0.0590519905090332, -0.057044029235839844, -0.055036067962646484, -0.053028106689453125, -0.051020145416259766, -0.049012184143066406, -0.04700422286987305, -0.04499626159667969, -0.04298830032348633, -0.04098033905029297, -0.03897237777709961, -0.03696441650390625, -0.03495645523071289, -0.03294849395751953, -0.030940532684326172, -0.028932571411132812, -0.026924610137939453, -0.024916648864746094, -0.022908687591552734, -0.020900726318359375, -0.018892765045166016, -0.016884803771972656, -0.014876842498779297, -0.012868881225585938, -0.010860919952392578, -0.008852958679199219, -0.006844997406005859, -0.0048370361328125, -0.0028290748596191406, -0.0008211135864257812, 0.0011868476867675781, 0.0031948089599609375, 0.005202770233154297, 0.007210731506347656, 0.009218692779541016, 0.011226654052734375, 0.013234615325927734, 0.015242576599121094, 0.017250537872314453, 0.019258499145507812, 0.021266460418701172, 0.02327442169189453, 0.02528238296508789, 0.02729034423828125, 0.02929830551147461, 0.03130626678466797, 0.03331422805786133, 0.03532218933105469, 0.03733015060424805, 0.039338111877441406, 0.041346073150634766, 0.043354034423828125, 0.045361995697021484, 0.047369956970214844, 0.0493779182434082, 0.05138587951660156, 0.05339384078979492, 0.05540180206298828, 0.05740976333618164, 0.059417724609375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 6.0, 1.0, 4.0, 3.0, 2.0, 4.0, 3.0, 6.0, 4.0, 14.0, 8.0, 12.0, 9.0, 15.0, 12.0, 26.0, 15.0, 41.0, 74.0, 98.0, 161.0, 150.0, 104.0, 39.0, 21.0, 32.0, 24.0, 6.0, 18.0, 18.0, 15.0, 16.0, 6.0, 5.0, 0.0, 7.0, 4.0, 3.0, 6.0, 5.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0033130645751953125, -0.003214806318283081, -0.0031165480613708496, -0.003018289804458618, -0.0029200315475463867, -0.0028217732906341553, -0.002723515033721924, -0.0026252567768096924, -0.002526998519897461, -0.0024287402629852295, -0.002330482006072998, -0.0022322237491607666, -0.002133965492248535, -0.0020357072353363037, -0.0019374489784240723, -0.0018391907215118408, -0.0017409324645996094, -0.001642674207687378, -0.0015444159507751465, -0.001446157693862915, -0.0013478994369506836, -0.0012496411800384521, -0.0011513829231262207, -0.0010531246662139893, -0.0009548664093017578, -0.0008566081523895264, -0.0007583498954772949, -0.0006600916385650635, -0.000561833381652832, -0.0004635751247406006, -0.00036531686782836914, -0.0002670586109161377, -0.00016880035400390625, -7.05420970916748e-05, 2.771615982055664e-05, 0.00012597441673278809, 0.00022423267364501953, 0.000322490930557251, 0.0004207491874694824, 0.0005190074443817139, 0.0006172657012939453, 0.0007155239582061768, 0.0008137822151184082, 0.0009120404720306396, 0.001010298728942871, 0.0011085569858551025, 0.001206815242767334, 0.0013050734996795654, 0.0014033317565917969, 0.0015015900135040283, 0.0015998482704162598, 0.0016981065273284912, 0.0017963647842407227, 0.001894623041152954, 0.0019928812980651855, 0.002091139554977417, 0.0021893978118896484, 0.00228765606880188, 0.0023859143257141113, 0.0024841725826263428, 0.0025824308395385742, 0.0026806890964508057, 0.002778947353363037, 0.0028772056102752686, 0.0029754638671875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 9.0, 9.0, 6.0, 13.0, 7.0, 12.0, 18.0, 18.0, 19.0, 31.0, 31.0, 18.0, 43.0, 49.0, 53.0, 88.0, 144.0, 421.0, 1412.0, 8678.0, 202613.0, 812847.0, 18516.0, 2262.0, 542.0, 221.0, 101.0, 79.0, 49.0, 41.0, 30.0, 32.0, 14.0, 22.0, 16.0, 20.0, 17.0, 9.0, 9.0, 7.0, 10.0, 2.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.042327880859375, -0.040924072265625, -0.039520263671875, -0.038116455078125, -0.036712646484375, -0.035308837890625, -0.033905029296875, -0.032501220703125, -0.031097412109375, -0.029693603515625, -0.028289794921875, -0.026885986328125, -0.025482177734375, -0.024078369140625, -0.022674560546875, -0.021270751953125, -0.019866943359375, -0.018463134765625, -0.017059326171875, -0.015655517578125, -0.014251708984375, -0.012847900390625, -0.011444091796875, -0.010040283203125, -0.008636474609375, -0.007232666015625, -0.005828857421875, -0.004425048828125, -0.003021240234375, -0.001617431640625, -0.000213623046875, 0.001190185546875, 0.002593994140625, 0.003997802734375, 0.005401611328125, 0.006805419921875, 0.008209228515625, 0.009613037109375, 0.011016845703125, 0.012420654296875, 0.013824462890625, 0.015228271484375, 0.016632080078125, 0.018035888671875, 0.019439697265625, 0.020843505859375, 0.022247314453125, 0.023651123046875, 0.025054931640625, 0.026458740234375, 0.027862548828125, 0.029266357421875, 0.030670166015625, 0.032073974609375, 0.033477783203125, 0.034881591796875, 0.036285400390625, 0.037689208984375, 0.039093017578125, 0.040496826171875, 0.041900634765625, 0.043304443359375, 0.044708251953125, 0.046112060546875, 0.047515869140625]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 12.0, 12.0, 19.0, 39.0, 43.0, 73.0, 163.0, 272.0, 142.0, 79.0, 42.0, 33.0, 22.0, 11.0, 8.0, 7.0, 10.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01952221989631653, -0.019002266228199005, -0.018482312560081482, -0.01796235889196396, -0.017442405223846436, -0.016922451555728912, -0.01640249788761139, -0.015882546082139015, -0.015362592414021492, -0.014842638745903969, -0.014322685077786446, -0.013802731409668922, -0.013282778672873974, -0.01276282500475645, -0.012242871336638927, -0.011722917668521404, -0.011202964000403881, -0.010683010332286358, -0.010163056664168835, -0.009643103927373886, -0.009123150259256363, -0.00860319659113884, -0.008083242923021317, -0.007563289254903793, -0.0070433360524475574, -0.006523382384330034, -0.006003429181873798, -0.005483475513756275, -0.004963521845638752, -0.004443568643182516, -0.003923614975064993, -0.0034036615397781134, -0.002883707173168659, -0.0023637537378817797, -0.0018438001861795783, -0.001323846634477377, -0.0008038931991904974, -0.00028393976390361786, 0.00023601390421390533, 0.0007559673395007849, 0.0012759207747876644, 0.001795874210074544, 0.0023158276453614235, 0.0028357813134789467, 0.0033557347487658262, 0.0038756881840527058, 0.004395641852170229, 0.004915595054626465, 0.005435548722743988, 0.005955502390861511, 0.006475455593317747, 0.00699540926143527, 0.007515362463891506, 0.00803531613200903, 0.008555269800126553, 0.009075223468244076, 0.009595176205039024, 0.010115129873156548, 0.01063508354127407, 0.011155037209391594, 0.011674989946186543, 0.012194943614304066, 0.012714897282421589, 0.013234850950539112, 0.013754804618656635]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 4.0, 8.0, 12.0, 11.0, 14.0, 19.0, 15.0, 23.0, 19.0, 31.0, 17.0, 26.0, 33.0, 28.0, 29.0, 37.0, 38.0, 31.0, 36.0, 47.0, 33.0, 33.0, 33.0, 29.0, 42.0, 35.0, 30.0, 28.0, 26.0, 29.0, 27.0, 24.0, 21.0, 17.0, 8.0, 18.0, 22.0, 13.0, 15.0, 8.0, 9.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.005797326564788818, -0.005614700727164745, -0.005432074889540672, -0.005249449051916599, -0.005066823214292526, -0.004884197376668453, -0.00470157153904438, -0.004518945701420307, -0.004336319863796234, -0.004153694026172161, -0.003971068188548088, -0.003788442350924015, -0.003605816513299942, -0.003423190675675869, -0.003240564838051796, -0.003057939000427723, -0.00287531316280365, -0.002692687325179577, -0.002510061487555504, -0.002327435649931431, -0.002144809812307358, -0.0019621839746832848, -0.0017795581370592117, -0.0015969322994351387, -0.0014143064618110657, -0.0012316806241869926, -0.0010490547865629196, -0.0008664289489388466, -0.0006838031113147736, -0.0005011772736907005, -0.0003185514360666275, -0.00013592559844255447, 4.6700239181518555e-05, 0.00022932607680559158, 0.0004119519144296646, 0.0005945777520537376, 0.0007772035896778107, 0.0009598294273018837, 0.0011424552649259567, 0.0013250811025500298, 0.0015077069401741028, 0.0016903327777981758, 0.0018729586154222488, 0.002055584453046322, 0.002238210290670395, 0.002420836128294468, 0.002603461965918541, 0.002786087803542614, 0.002968713641166687, 0.00315133947879076, 0.003333965316414833, 0.003516591154038906, 0.003699216991662979, 0.003881842829287052, 0.004064468666911125, 0.004247094504535198, 0.004429720342159271, 0.004612346179783344, 0.004794972017407417, 0.00497759785503149, 0.005160223692655563, 0.005342849530279636, 0.005525475367903709, 0.0057081012055277824, 0.0058907270431518555]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 6.0, 14.0, 11.0, 11.0, 21.0, 16.0, 11.0, 14.0, 21.0, 32.0, 40.0, 28.0, 26.0, 44.0, 36.0, 31.0, 32.0, 40.0, 34.0, 44.0, 40.0, 36.0, 31.0, 27.0, 39.0, 30.0, 25.0, 27.0, 27.0, 36.0, 30.0, 19.0, 14.0, 22.0, 15.0, 11.0, 9.0, 5.0, 5.0, 6.0, 7.0, 6.0, 3.0, 2.0, 1.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1552734375, -1.118682861328125, -1.08209228515625, -1.045501708984375, -1.0089111328125, -0.972320556640625, -0.93572998046875, -0.899139404296875, -0.862548828125, -0.825958251953125, -0.78936767578125, -0.752777099609375, -0.7161865234375, -0.679595947265625, -0.64300537109375, -0.606414794921875, -0.56982421875, -0.533233642578125, -0.49664306640625, -0.460052490234375, -0.4234619140625, -0.386871337890625, -0.35028076171875, -0.313690185546875, -0.277099609375, -0.240509033203125, -0.20391845703125, -0.167327880859375, -0.1307373046875, -0.094146728515625, -0.05755615234375, -0.020965576171875, 0.015625, 0.052215576171875, 0.08880615234375, 0.125396728515625, 0.1619873046875, 0.198577880859375, 0.23516845703125, 0.271759033203125, 0.308349609375, 0.344940185546875, 0.38153076171875, 0.418121337890625, 0.4547119140625, 0.491302490234375, 0.52789306640625, 0.564483642578125, 0.60107421875, 0.637664794921875, 0.67425537109375, 0.710845947265625, 0.7474365234375, 0.784027099609375, 0.82061767578125, 0.857208251953125, 0.893798828125, 0.930389404296875, 0.96697998046875, 1.003570556640625, 1.0401611328125, 1.076751708984375, 1.11334228515625, 1.149932861328125, 1.1865234375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 11.0, 11.0, 16.0, 20.0, 33.0, 55.0, 87.0, 145.0, 195.0, 257.0, 475.0, 684.0, 1125.0, 1701.0, 2740.0, 4426.0, 7175.0, 11712.0, 19501.0, 32239.0, 54086.0, 88023.0, 139299.0, 189084.0, 177735.0, 122678.0, 76685.0, 46351.0, 28394.0, 16834.0, 10110.0, 6230.0, 3859.0, 2456.0, 1501.0, 939.0, 598.0, 397.0, 242.0, 135.0, 94.0, 75.0, 44.0, 26.0, 26.0, 11.0, 9.0, 10.0, 8.0, 6.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.84619140625, -0.8178482055664062, -0.7895050048828125, -0.7611618041992188, -0.732818603515625, -0.7044754028320312, -0.6761322021484375, -0.6477890014648438, -0.61944580078125, -0.5911026000976562, -0.5627593994140625, -0.5344161987304688, -0.506072998046875, -0.47772979736328125, -0.4493865966796875, -0.42104339599609375, -0.3927001953125, -0.36435699462890625, -0.3360137939453125, -0.30767059326171875, -0.279327392578125, -0.25098419189453125, -0.2226409912109375, -0.19429779052734375, -0.16595458984375, -0.13761138916015625, -0.1092681884765625, -0.08092498779296875, -0.052581787109375, -0.02423858642578125, 0.0041046142578125, 0.03244781494140625, 0.060791015625, 0.08913421630859375, 0.1174774169921875, 0.14582061767578125, 0.174163818359375, 0.20250701904296875, 0.2308502197265625, 0.25919342041015625, 0.28753662109375, 0.31587982177734375, 0.3442230224609375, 0.37256622314453125, 0.400909423828125, 0.42925262451171875, 0.4575958251953125, 0.48593902587890625, 0.5142822265625, 0.5426254272460938, 0.5709686279296875, 0.5993118286132812, 0.627655029296875, 0.6559982299804688, 0.6843414306640625, 0.7126846313476562, 0.74102783203125, 0.7693710327148438, 0.7977142333984375, 0.8260574340820312, 0.854400634765625, 0.8827438354492188, 0.9110870361328125, 0.9394302368164062, 0.9677734375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 1.0, 3.0, 5.0, 12.0, 7.0, 7.0, 12.0, 12.0, 16.0, 12.0, 22.0, 21.0, 29.0, 38.0, 37.0, 37.0, 57.0, 62.0, 87.0, 128.0, 284.0, 1401.0, 217.0, 112.0, 65.0, 60.0, 50.0, 37.0, 28.0, 25.0, 21.0, 21.0, 26.0, 21.0, 27.0, 9.0, 8.0, 3.0, 9.0, 9.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 1.0], "bins": [-5.44921875, -5.29931640625, -5.1494140625, -4.99951171875, -4.849609375, -4.69970703125, -4.5498046875, -4.39990234375, -4.25, -4.10009765625, -3.9501953125, -3.80029296875, -3.650390625, -3.50048828125, -3.3505859375, -3.20068359375, -3.05078125, -2.90087890625, -2.7509765625, -2.60107421875, -2.451171875, -2.30126953125, -2.1513671875, -2.00146484375, -1.8515625, -1.70166015625, -1.5517578125, -1.40185546875, -1.251953125, -1.10205078125, -0.9521484375, -0.80224609375, -0.65234375, -0.50244140625, -0.3525390625, -0.20263671875, -0.052734375, 0.09716796875, 0.2470703125, 0.39697265625, 0.546875, 0.69677734375, 0.8466796875, 0.99658203125, 1.146484375, 1.29638671875, 1.4462890625, 1.59619140625, 1.74609375, 1.89599609375, 2.0458984375, 2.19580078125, 2.345703125, 2.49560546875, 2.6455078125, 2.79541015625, 2.9453125, 3.09521484375, 3.2451171875, 3.39501953125, 3.544921875, 3.69482421875, 3.8447265625, 3.99462890625, 4.14453125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 2.0, 6.0, 11.0, 12.0, 9.0, 26.0, 22.0, 29.0, 45.0, 57.0, 72.0, 94.0, 249.0, 471.0, 1025.0, 3278.0, 26076.0, 987918.0, 2074958.0, 44530.0, 4338.0, 1237.0, 493.0, 280.0, 138.0, 108.0, 65.0, 38.0, 22.0, 17.0, 20.0, 15.0, 9.0, 11.0, 3.0, 7.0, 2.0, 0.0, 9.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5234375, -7.2734375, -7.0234375, -6.7734375, -6.5234375, -6.2734375, -6.0234375, -5.7734375, -5.5234375, -5.2734375, -5.0234375, -4.7734375, -4.5234375, -4.2734375, -4.0234375, -3.7734375, -3.5234375, -3.2734375, -3.0234375, -2.7734375, -2.5234375, -2.2734375, -2.0234375, -1.7734375, -1.5234375, -1.2734375, -1.0234375, -0.7734375, -0.5234375, -0.2734375, -0.0234375, 0.2265625, 0.4765625, 0.7265625, 0.9765625, 1.2265625, 1.4765625, 1.7265625, 1.9765625, 2.2265625, 2.4765625, 2.7265625, 2.9765625, 3.2265625, 3.4765625, 3.7265625, 3.9765625, 4.2265625, 4.4765625, 4.7265625, 4.9765625, 5.2265625, 5.4765625, 5.7265625, 5.9765625, 6.2265625, 6.4765625, 6.7265625, 6.9765625, 7.2265625, 7.4765625, 7.7265625, 7.9765625, 8.2265625, 8.4765625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [6.0, 4.0, 26.0, 110.0, 251.0, 358.0, 197.0, 57.0, 10.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.952155590057373, -4.00191068649292, -3.051665782928467, -2.1014206409454346, -1.1511757373809814, -0.20093059539794922, 0.7493143081665039, 1.699559211730957, 2.64980411529541, 3.6000490188598633, 4.550293922424316, 5.5005388259887695, 6.450783729553223, 7.401029109954834, 8.351274490356445, 9.301519393920898, 10.251764297485352, 11.202009201049805, 12.152254104614258, 13.102499008178711, 14.052743911743164, 15.002988815307617, 15.95323371887207, 16.903478622436523, 17.853723526000977, 18.80396842956543, 19.754213333129883, 20.704458236694336, 21.65470314025879, 22.604948043823242, 23.555192947387695, 24.50543785095215, 25.4556827545166, 26.405927658081055, 27.356172561645508, 28.30641746520996, 29.256662368774414, 30.206907272338867, 31.15715217590332, 32.107398986816406, 33.05764389038086, 34.00788879394531, 34.958133697509766, 35.90837860107422, 36.85862350463867, 37.808868408203125, 38.75911331176758, 39.70935821533203, 40.659603118896484, 41.60984802246094, 42.56009292602539, 43.510337829589844, 44.4605827331543, 45.41082763671875, 46.3610725402832, 47.311317443847656, 48.26156234741211, 49.21180725097656, 50.162052154541016, 51.11229705810547, 52.06254196166992, 53.012786865234375, 53.96303176879883, 54.91327667236328, 55.863521575927734]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 5.0, 3.0, 3.0, 11.0, 8.0, 14.0, 13.0, 11.0, 10.0, 17.0, 29.0, 21.0, 23.0, 30.0, 31.0, 34.0, 46.0, 32.0, 43.0, 42.0, 41.0, 55.0, 44.0, 44.0, 47.0, 37.0, 30.0, 32.0, 30.0, 32.0, 27.0, 29.0, 31.0, 23.0, 11.0, 11.0, 19.0, 13.0, 10.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.284618377685547, -16.785127639770508, -16.285634994506836, -15.786144256591797, -15.286653518676758, -14.787161827087402, -14.287670135498047, -13.788179397583008, -13.288687705993652, -12.789196014404297, -12.289705276489258, -11.790213584899902, -11.290721893310547, -10.791231155395508, -10.291739463806152, -9.792247772216797, -9.292757034301758, -8.793265342712402, -8.293774604797363, -7.794282913208008, -7.2947916984558105, -6.795300483703613, -6.295808792114258, -5.7963175773620605, -5.296826362609863, -4.797335147857666, -4.297843933105469, -3.7983522415161133, -3.298861026763916, -2.7993698120117188, -2.2998783588409424, -1.800386905670166, -1.3008947372436523, -0.8014034032821655, -0.3019120693206787, 0.1975792646408081, 0.6970705986022949, 1.1965618133544922, 1.6960532665252686, 2.195544719696045, 2.695035934448242, 3.1945271492004395, 3.694018602371216, 4.193510055541992, 4.6930012702941895, 5.192492485046387, 5.691984176635742, 6.1914753913879395, 6.690966606140137, 7.190457820892334, 7.689949035644531, 8.189440727233887, 8.688932418823242, 9.188423156738281, 9.687914848327637, 10.187406539916992, 10.686897277832031, 11.186388969421387, 11.685879707336426, 12.185371398925781, 12.68486213684082, 13.184353828430176, 13.683845520019531, 14.18333625793457, 14.682827949523926]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 4.0, 6.0, 10.0, 11.0, 13.0, 6.0, 13.0, 15.0, 17.0, 34.0, 20.0, 21.0, 28.0, 35.0, 41.0, 36.0, 31.0, 32.0, 46.0, 33.0, 35.0, 32.0, 33.0, 36.0, 46.0, 33.0, 27.0, 32.0, 41.0, 27.0, 23.0, 31.0, 20.0, 27.0, 12.0, 11.0, 18.0, 15.0, 7.0, 13.0, 10.0, 5.0, 6.0, 3.0, 1.0, 3.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.2314453125, -1.192413330078125, -1.15338134765625, -1.114349365234375, -1.0753173828125, -1.036285400390625, -0.99725341796875, -0.958221435546875, -0.919189453125, -0.880157470703125, -0.84112548828125, -0.802093505859375, -0.7630615234375, -0.724029541015625, -0.68499755859375, -0.645965576171875, -0.60693359375, -0.567901611328125, -0.52886962890625, -0.489837646484375, -0.4508056640625, -0.411773681640625, -0.37274169921875, -0.333709716796875, -0.294677734375, -0.255645751953125, -0.21661376953125, -0.177581787109375, -0.1385498046875, -0.099517822265625, -0.06048583984375, -0.021453857421875, 0.017578125, 0.056610107421875, 0.09564208984375, 0.134674072265625, 0.1737060546875, 0.212738037109375, 0.25177001953125, 0.290802001953125, 0.329833984375, 0.368865966796875, 0.40789794921875, 0.446929931640625, 0.4859619140625, 0.524993896484375, 0.56402587890625, 0.603057861328125, 0.64208984375, 0.681121826171875, 0.72015380859375, 0.759185791015625, 0.7982177734375, 0.837249755859375, 0.87628173828125, 0.915313720703125, 0.954345703125, 0.993377685546875, 1.03240966796875, 1.071441650390625, 1.1104736328125, 1.149505615234375, 1.18853759765625, 1.227569580078125, 1.2666015625]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 7.0, 8.0, 9.0, 15.0, 22.0, 26.0, 38.0, 59.0, 95.0, 100.0, 237.0, 431.0, 919.0, 2016.0, 5173.0, 14597.0, 43650.0, 145392.0, 595259.0, 1977524.0, 1064136.0, 241184.0, 68043.0, 21998.0, 7764.0, 2915.0, 1219.0, 595.0, 293.0, 191.0, 121.0, 77.0, 44.0, 31.0, 27.0, 15.0, 11.0, 12.0, 8.0, 9.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.576171875, -2.489410400390625, -2.40264892578125, -2.315887451171875, -2.2291259765625, -2.142364501953125, -2.05560302734375, -1.968841552734375, -1.882080078125, -1.795318603515625, -1.70855712890625, -1.621795654296875, -1.5350341796875, -1.448272705078125, -1.36151123046875, -1.274749755859375, -1.18798828125, -1.101226806640625, -1.01446533203125, -0.927703857421875, -0.8409423828125, -0.754180908203125, -0.66741943359375, -0.580657958984375, -0.493896484375, -0.407135009765625, -0.32037353515625, -0.233612060546875, -0.1468505859375, -0.060089111328125, 0.02667236328125, 0.113433837890625, 0.2001953125, 0.286956787109375, 0.37371826171875, 0.460479736328125, 0.5472412109375, 0.634002685546875, 0.72076416015625, 0.807525634765625, 0.894287109375, 0.981048583984375, 1.06781005859375, 1.154571533203125, 1.2413330078125, 1.328094482421875, 1.41485595703125, 1.501617431640625, 1.58837890625, 1.675140380859375, 1.76190185546875, 1.848663330078125, 1.9354248046875, 2.022186279296875, 2.10894775390625, 2.195709228515625, 2.282470703125, 2.369232177734375, 2.45599365234375, 2.542755126953125, 2.6295166015625, 2.716278076171875, 2.80303955078125, 2.889801025390625, 2.9765625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 14.0, 24.0, 40.0, 52.0, 89.0, 182.0, 338.0, 566.0, 848.0, 812.0, 467.0, 289.0, 159.0, 85.0, 45.0, 30.0, 17.0, 5.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.828125, -7.6033935546875, -7.378662109375, -7.1539306640625, -6.92919921875, -6.7044677734375, -6.479736328125, -6.2550048828125, -6.0302734375, -5.8055419921875, -5.580810546875, -5.3560791015625, -5.13134765625, -4.9066162109375, -4.681884765625, -4.4571533203125, -4.232421875, -4.0076904296875, -3.782958984375, -3.5582275390625, -3.33349609375, -3.1087646484375, -2.884033203125, -2.6593017578125, -2.4345703125, -2.2098388671875, -1.985107421875, -1.7603759765625, -1.53564453125, -1.3109130859375, -1.086181640625, -0.8614501953125, -0.63671875, -0.4119873046875, -0.187255859375, 0.0374755859375, 0.26220703125, 0.4869384765625, 0.711669921875, 0.9364013671875, 1.1611328125, 1.3858642578125, 1.610595703125, 1.8353271484375, 2.06005859375, 2.2847900390625, 2.509521484375, 2.7342529296875, 2.958984375, 3.1837158203125, 3.408447265625, 3.6331787109375, 3.85791015625, 4.0826416015625, 4.307373046875, 4.5321044921875, 4.7568359375, 4.9815673828125, 5.206298828125, 5.4310302734375, 5.65576171875, 5.8804931640625, 6.105224609375, 6.3299560546875, 6.5546875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 8.0, 17.0, 22.0, 34.0, 69.0, 139.0, 263.0, 595.0, 1561.0, 6173.0, 45958.0, 637469.0, 3092792.0, 372967.0, 29487.0, 4492.0, 1244.0, 496.0, 231.0, 108.0, 58.0, 47.0, 22.0, 14.0, 4.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9296875, -8.635986328125, -8.34228515625, -8.048583984375, -7.7548828125, -7.461181640625, -7.16748046875, -6.873779296875, -6.580078125, -6.286376953125, -5.99267578125, -5.698974609375, -5.4052734375, -5.111572265625, -4.81787109375, -4.524169921875, -4.23046875, -3.936767578125, -3.64306640625, -3.349365234375, -3.0556640625, -2.761962890625, -2.46826171875, -2.174560546875, -1.880859375, -1.587158203125, -1.29345703125, -0.999755859375, -0.7060546875, -0.412353515625, -0.11865234375, 0.175048828125, 0.46875, 0.762451171875, 1.05615234375, 1.349853515625, 1.6435546875, 1.937255859375, 2.23095703125, 2.524658203125, 2.818359375, 3.112060546875, 3.40576171875, 3.699462890625, 3.9931640625, 4.286865234375, 4.58056640625, 4.874267578125, 5.16796875, 5.461669921875, 5.75537109375, 6.049072265625, 6.3427734375, 6.636474609375, 6.93017578125, 7.223876953125, 7.517578125, 7.811279296875, 8.10498046875, 8.398681640625, 8.6923828125, 8.986083984375, 9.27978515625, 9.573486328125, 9.8671875]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 11.0, 27.0, 54.0, 79.0, 129.0, 167.0, 164.0, 124.0, 116.0, 68.0, 31.0, 21.0, 9.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.20561218261719, -37.1865348815918, -36.16745376586914, -35.14837646484375, -34.129295349121094, -33.1102180480957, -32.09114074707031, -31.07206153869629, -30.052982330322266, -29.033903121948242, -28.01482391357422, -26.995746612548828, -25.976667404174805, -24.95758819580078, -23.93851089477539, -22.919431686401367, -21.900352478027344, -20.88127326965332, -19.862194061279297, -18.843116760253906, -17.824037551879883, -16.80495834350586, -15.785880088806152, -14.766801834106445, -13.747722625732422, -12.728643417358398, -11.709565162658691, -10.690486907958984, -9.671407699584961, -8.652328491210938, -7.6332502365112305, -6.614171504974365, -5.595096588134766, -4.5760178565979, -3.556939125061035, -2.53786039352417, -1.5187816619873047, -0.49970293045043945, 0.5193758010864258, 1.538454532623291, 2.5575332641601562, 3.5766119956970215, 4.595690727233887, 5.614769458770752, 6.633848190307617, 7.652926921844482, 8.672005653381348, 9.691083908081055, 10.710163116455078, 11.729242324829102, 12.748320579528809, 13.767398834228516, 14.786478042602539, 15.805557250976562, 16.824634552001953, 17.843713760375977, 18.86279296875, 19.881872177124023, 20.900951385498047, 21.920028686523438, 22.93910789489746, 23.958187103271484, 24.977264404296875, 25.9963436126709, 27.015422821044922]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 0.0, 6.0, 6.0, 10.0, 8.0, 11.0, 14.0, 10.0, 14.0, 15.0, 21.0, 25.0, 28.0, 34.0, 27.0, 40.0, 42.0, 41.0, 34.0, 38.0, 27.0, 47.0, 46.0, 39.0, 32.0, 39.0, 33.0, 37.0, 33.0, 29.0, 30.0, 28.0, 29.0, 15.0, 17.0, 22.0, 17.0, 10.0, 10.0, 9.0, 7.0, 13.0, 4.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.176565170288086, -12.760970115661621, -12.345376014709473, -11.929780960083008, -11.514185905456543, -11.098590850830078, -10.68299674987793, -10.267401695251465, -9.851806640625, -9.436211585998535, -9.020617485046387, -8.605022430419922, -8.189427375793457, -7.77383279800415, -7.358238220214844, -6.942643165588379, -6.527048587799072, -6.111454010009766, -5.695858955383301, -5.280264377593994, -4.864669322967529, -4.449074745178223, -4.033479690551758, -3.617885112762451, -3.2022902965545654, -2.7866954803466797, -2.371100664138794, -1.9555059671401978, -1.539911150932312, -1.1243164539337158, -0.7087216377258301, -0.29312682151794434, 0.1224679946899414, 0.5380628108978271, 0.9536575675010681, 1.369252324104309, 1.7848471403121948, 2.200441837310791, 2.6160366535186768, 3.0316314697265625, 3.4472262859344482, 3.862821102142334, 4.278415679931641, 4.6940107345581055, 5.109605312347412, 5.525199890136719, 5.940794944763184, 6.356389999389648, 6.771984577178955, 7.187579154968262, 7.603174209594727, 8.018769264221191, 8.43436336517334, 8.849958419799805, 9.26555347442627, 9.681148529052734, 10.096742630004883, 10.512337684631348, 10.927931785583496, 11.343526840209961, 11.759121894836426, 12.17471694946289, 12.590311050415039, 13.005906105041504, 13.421501159667969]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 3.0, 11.0, 13.0, 7.0, 13.0, 8.0, 15.0, 15.0, 18.0, 25.0, 21.0, 35.0, 36.0, 37.0, 25.0, 34.0, 32.0, 39.0, 44.0, 40.0, 25.0, 39.0, 42.0, 35.0, 45.0, 28.0, 34.0, 34.0, 22.0, 32.0, 30.0, 17.0, 18.0, 24.0, 19.0, 17.0, 12.0, 12.0, 8.0, 3.0, 5.0, 6.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1806640625, -1.139617919921875, -1.09857177734375, -1.057525634765625, -1.0164794921875, -0.975433349609375, -0.93438720703125, -0.893341064453125, -0.852294921875, -0.811248779296875, -0.77020263671875, -0.729156494140625, -0.6881103515625, -0.647064208984375, -0.60601806640625, -0.564971923828125, -0.52392578125, -0.482879638671875, -0.44183349609375, -0.400787353515625, -0.3597412109375, -0.318695068359375, -0.27764892578125, -0.236602783203125, -0.195556640625, -0.154510498046875, -0.11346435546875, -0.072418212890625, -0.0313720703125, 0.009674072265625, 0.05072021484375, 0.091766357421875, 0.1328125, 0.173858642578125, 0.21490478515625, 0.255950927734375, 0.2969970703125, 0.338043212890625, 0.37908935546875, 0.420135498046875, 0.461181640625, 0.502227783203125, 0.54327392578125, 0.584320068359375, 0.6253662109375, 0.666412353515625, 0.70745849609375, 0.748504638671875, 0.78955078125, 0.830596923828125, 0.87164306640625, 0.912689208984375, 0.9537353515625, 0.994781494140625, 1.03582763671875, 1.076873779296875, 1.117919921875, 1.158966064453125, 1.20001220703125, 1.241058349609375, 1.2821044921875, 1.323150634765625, 1.36419677734375, 1.405242919921875, 1.4462890625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 5.0, 2.0, 9.0, 13.0, 13.0, 11.0, 15.0, 34.0, 55.0, 68.0, 83.0, 137.0, 198.0, 282.0, 402.0, 607.0, 859.0, 1330.0, 2082.0, 3127.0, 4957.0, 7756.0, 12695.0, 20088.0, 32821.0, 53202.0, 85959.0, 131749.0, 179452.0, 173933.0, 124286.0, 80305.0, 50323.0, 30606.0, 18585.0, 11773.0, 7376.0, 4603.0, 2929.0, 1897.0, 1266.0, 893.0, 519.0, 350.0, 275.0, 162.0, 127.0, 112.0, 55.0, 46.0, 42.0, 22.0, 20.0, 13.0, 9.0, 11.0, 10.0, 9.0, 1.0, 1.0, 1.0], "bins": [-0.13671875, -0.13243675231933594, -0.12815475463867188, -0.12387275695800781, -0.11959075927734375, -0.11530876159667969, -0.11102676391601562, -0.10674476623535156, -0.1024627685546875, -0.09818077087402344, -0.09389877319335938, -0.08961677551269531, -0.08533477783203125, -0.08105278015136719, -0.07677078247070312, -0.07248878479003906, -0.068206787109375, -0.06392478942871094, -0.059642791748046875, -0.05536079406738281, -0.05107879638671875, -0.04679679870605469, -0.042514801025390625, -0.03823280334472656, -0.0339508056640625, -0.029668807983398438, -0.025386810302734375, -0.021104812622070312, -0.01682281494140625, -0.012540817260742188, -0.008258819580078125, -0.0039768218994140625, 0.00030517578125, 0.0045871734619140625, 0.008869171142578125, 0.013151168823242188, 0.01743316650390625, 0.021715164184570312, 0.025997161865234375, 0.030279159545898438, 0.0345611572265625, 0.03884315490722656, 0.043125152587890625, 0.04740715026855469, 0.05168914794921875, 0.05597114562988281, 0.060253143310546875, 0.06453514099121094, 0.068817138671875, 0.07309913635253906, 0.07738113403320312, 0.08166313171386719, 0.08594512939453125, 0.09022712707519531, 0.09450912475585938, 0.09879112243652344, 0.1030731201171875, 0.10735511779785156, 0.11163711547851562, 0.11591911315917969, 0.12020111083984375, 0.12448310852050781, 0.12876510620117188, 0.13304710388183594, 0.1373291015625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 4.0, 5.0, 12.0, 5.0, 10.0, 10.0, 11.0, 8.0, 26.0, 18.0, 27.0, 20.0, 34.0, 33.0, 35.0, 36.0, 37.0, 37.0, 39.0, 46.0, 1071.0, 41.0, 54.0, 50.0, 45.0, 36.0, 43.0, 44.0, 25.0, 25.0, 21.0, 25.0, 19.0, 24.0, 19.0, 14.0, 11.0, 2.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0888671875, -1.0532379150390625, -1.017608642578125, -0.9819793701171875, -0.94635009765625, -0.9107208251953125, -0.875091552734375, -0.8394622802734375, -0.8038330078125, -0.7682037353515625, -0.732574462890625, -0.6969451904296875, -0.66131591796875, -0.6256866455078125, -0.590057373046875, -0.5544281005859375, -0.518798828125, -0.4831695556640625, -0.447540283203125, -0.4119110107421875, -0.37628173828125, -0.3406524658203125, -0.305023193359375, -0.2693939208984375, -0.2337646484375, -0.1981353759765625, -0.162506103515625, -0.1268768310546875, -0.09124755859375, -0.0556182861328125, -0.019989013671875, 0.0156402587890625, 0.05126953125, 0.0868988037109375, 0.122528076171875, 0.1581573486328125, 0.19378662109375, 0.2294158935546875, 0.265045166015625, 0.3006744384765625, 0.3363037109375, 0.3719329833984375, 0.407562255859375, 0.4431915283203125, 0.47882080078125, 0.5144500732421875, 0.550079345703125, 0.5857086181640625, 0.621337890625, 0.6569671630859375, 0.692596435546875, 0.7282257080078125, 0.76385498046875, 0.7994842529296875, 0.835113525390625, 0.8707427978515625, 0.9063720703125, 0.9420013427734375, 0.977630615234375, 1.0132598876953125, 1.04888916015625, 1.0845184326171875, 1.120147705078125, 1.1557769775390625, 1.19140625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 12.0, 9.0, 17.0, 32.0, 38.0, 61.0, 68.0, 109.0, 177.0, 270.0, 377.0, 604.0, 963.0, 1539.0, 2427.0, 3764.0, 6181.0, 9449.0, 15307.0, 24878.0, 41081.0, 66590.0, 106854.0, 167550.0, 1213898.0, 161756.0, 103429.0, 65203.0, 39842.0, 24228.0, 14968.0, 9576.0, 5831.0, 3525.0, 2330.0, 1493.0, 952.0, 614.0, 405.0, 245.0, 157.0, 111.0, 73.0, 50.0, 31.0, 30.0, 12.0, 8.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0784912109375, -0.07599735260009766, -0.07350349426269531, -0.07100963592529297, -0.06851577758789062, -0.06602191925048828, -0.06352806091308594, -0.061034202575683594, -0.05854034423828125, -0.056046485900878906, -0.05355262756347656, -0.05105876922607422, -0.048564910888671875, -0.04607105255126953, -0.04357719421386719, -0.041083335876464844, -0.0385894775390625, -0.036095619201660156, -0.03360176086425781, -0.03110790252685547, -0.028614044189453125, -0.02612018585205078, -0.023626327514648438, -0.021132469177246094, -0.01863861083984375, -0.016144752502441406, -0.013650894165039062, -0.011157035827636719, -0.008663177490234375, -0.006169319152832031, -0.0036754608154296875, -0.0011816024780273438, 0.001312255859375, 0.0038061141967773438, 0.0062999725341796875, 0.008793830871582031, 0.011287689208984375, 0.013781547546386719, 0.016275405883789062, 0.018769264221191406, 0.02126312255859375, 0.023756980895996094, 0.026250839233398438, 0.02874469757080078, 0.031238555908203125, 0.03373241424560547, 0.03622627258300781, 0.038720130920410156, 0.0412139892578125, 0.043707847595214844, 0.04620170593261719, 0.04869556427001953, 0.051189422607421875, 0.05368328094482422, 0.05617713928222656, 0.058670997619628906, 0.06116485595703125, 0.0636587142944336, 0.06615257263183594, 0.06864643096923828, 0.07114028930664062, 0.07363414764404297, 0.07612800598144531, 0.07862186431884766, 0.08111572265625]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 10.0, 10.0, 7.0, 9.0, 11.0, 11.0, 12.0, 14.0, 16.0, 22.0, 29.0, 32.0, 33.0, 59.0, 70.0, 113.0, 120.0, 81.0, 67.0, 52.0, 38.0, 18.0, 20.0, 17.0, 19.0, 21.0, 15.0, 11.0, 16.0, 5.0, 9.0, 4.0, 2.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.0071563720703125, -0.006940722465515137, -0.0067250728607177734, -0.00650942325592041, -0.006293773651123047, -0.006078124046325684, -0.00586247444152832, -0.005646824836730957, -0.005431175231933594, -0.0052155256271362305, -0.004999876022338867, -0.004784226417541504, -0.004568576812744141, -0.004352927207946777, -0.004137277603149414, -0.003921627998352051, -0.0037059783935546875, -0.0034903287887573242, -0.003274679183959961, -0.0030590295791625977, -0.0028433799743652344, -0.002627730369567871, -0.002412080764770508, -0.0021964311599731445, -0.0019807815551757812, -0.001765131950378418, -0.0015494823455810547, -0.0013338327407836914, -0.0011181831359863281, -0.0009025335311889648, -0.0006868839263916016, -0.0004712343215942383, -0.000255584716796875, -3.993511199951172e-05, 0.00017571449279785156, 0.00039136409759521484, 0.0006070137023925781, 0.0008226633071899414, 0.0010383129119873047, 0.001253962516784668, 0.0014696121215820312, 0.0016852617263793945, 0.0019009113311767578, 0.002116560935974121, 0.0023322105407714844, 0.0025478601455688477, 0.002763509750366211, 0.0029791593551635742, 0.0031948089599609375, 0.0034104585647583008, 0.003626108169555664, 0.0038417577743530273, 0.004057407379150391, 0.004273056983947754, 0.004488706588745117, 0.0047043561935424805, 0.004920005798339844, 0.005135655403137207, 0.00535130500793457, 0.005566954612731934, 0.005782604217529297, 0.00599825382232666, 0.0062139034271240234, 0.006429553031921387, 0.00664520263671875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 6.0, 12.0, 12.0, 18.0, 24.0, 38.0, 49.0, 65.0, 92.0, 135.0, 259.0, 817.0, 3681.0, 23527.0, 756168.0, 245328.0, 14547.0, 2450.0, 668.0, 273.0, 112.0, 64.0, 41.0, 35.0, 27.0, 23.0, 18.0, 12.0, 12.0, 11.0, 8.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1268310546875, -0.12272453308105469, -0.11861801147460938, -0.11451148986816406, -0.11040496826171875, -0.10629844665527344, -0.10219192504882812, -0.09808540344238281, -0.0939788818359375, -0.08987236022949219, -0.08576583862304688, -0.08165931701660156, -0.07755279541015625, -0.07344627380371094, -0.06933975219726562, -0.06523323059082031, -0.061126708984375, -0.05702018737792969, -0.052913665771484375, -0.04880714416503906, -0.04470062255859375, -0.04059410095214844, -0.036487579345703125, -0.03238105773925781, -0.0282745361328125, -0.024168014526367188, -0.020061492919921875, -0.015954971313476562, -0.01184844970703125, -0.0077419281005859375, -0.003635406494140625, 0.0004711151123046875, 0.00457763671875, 0.008684158325195312, 0.012790679931640625, 0.016897201538085938, 0.02100372314453125, 0.025110244750976562, 0.029216766357421875, 0.03332328796386719, 0.0374298095703125, 0.04153633117675781, 0.045642852783203125, 0.04974937438964844, 0.05385589599609375, 0.05796241760253906, 0.062068939208984375, 0.06617546081542969, 0.070281982421875, 0.07438850402832031, 0.07849502563476562, 0.08260154724121094, 0.08670806884765625, 0.09081459045410156, 0.09492111206054688, 0.09902763366699219, 0.1031341552734375, 0.10724067687988281, 0.11134719848632812, 0.11545372009277344, 0.11956024169921875, 0.12366676330566406, 0.12777328491210938, 0.1318798065185547, 0.135986328125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 4.0, 2.0, 4.0, 2.0, 7.0, 7.0, 17.0, 33.0, 52.0, 131.0, 295.0, 207.0, 111.0, 47.0, 33.0, 21.0, 13.0, 8.0, 5.0, 6.0, 2.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034836478531360626, -0.032118216156959534, -0.02939995564520359, -0.026681695133447647, -0.023963432759046555, -0.021245170384645462, -0.01852690987288952, -0.015808649361133575, -0.013090386986732483, -0.010372125543653965, -0.007653864100575447, -0.004935602657496929, -0.0022173412144184113, 0.0005009202286601067, 0.0032191816717386246, 0.005937442183494568, 0.00865570455789566, 0.011373966000974178, 0.014092227444052696, 0.01681048795580864, 0.019528750330209732, 0.022247012704610825, 0.024965273216366768, 0.02768353372812271, 0.030401796102523804, 0.033120058476924896, 0.03583832085132599, 0.03855657950043678, 0.041274841874837875, 0.04399310424923897, 0.04671136289834976, 0.049429625272750854, 0.05214788019657135, 0.05486614257097244, 0.057584404945373535, 0.06030266359448433, 0.06302092969417572, 0.06573918461799622, 0.06845744699239731, 0.0711757093667984, 0.0738939717411995, 0.07661223411560059, 0.07933049649000168, 0.08204875886440277, 0.08476701378822327, 0.08748527616262436, 0.09020353853702545, 0.09292180091142654, 0.09564006328582764, 0.09835832566022873, 0.10107658803462982, 0.10379485040903091, 0.106513112783432, 0.1092313677072525, 0.1119496300816536, 0.11466789245605469, 0.11738615483045578, 0.12010441720485687, 0.12282267957925797, 0.12554094195365906, 0.12825919687747955, 0.13097746670246124, 0.13369572162628174, 0.13641399145126343, 0.13913224637508392]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 3.0, 8.0, 5.0, 7.0, 14.0, 10.0, 16.0, 12.0, 19.0, 31.0, 25.0, 23.0, 26.0, 42.0, 29.0, 30.0, 42.0, 31.0, 39.0, 43.0, 34.0, 29.0, 39.0, 31.0, 36.0, 32.0, 38.0, 37.0, 26.0, 28.0, 24.0, 24.0, 20.0, 18.0, 24.0, 10.0, 14.0, 13.0, 11.0, 10.0, 5.0, 12.0, 8.0, 3.0, 4.0, 1.0, 7.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.017328619956970215, -0.016740141436457634, -0.016151662915945053, -0.015563184395432472, -0.014974705874919891, -0.01438622735440731, -0.01379774883389473, -0.013209270313382149, -0.012620791792869568, -0.012032313272356987, -0.011443834751844406, -0.010855356231331825, -0.010266877710819244, -0.009678399190306664, -0.009089920669794083, -0.008501442149281502, -0.007912963628768921, -0.00732448510825634, -0.006736006587743759, -0.006147528067231178, -0.005559049546718597, -0.0049705710262060165, -0.004382092505693436, -0.003793613985180855, -0.003205135464668274, -0.002616656944155693, -0.002028178423643112, -0.0014396999031305313, -0.0008512213826179504, -0.00026274286210536957, 0.0003257356584072113, 0.0009142141789197922, 0.001502692699432373, 0.002091171219944954, 0.002679649740457535, 0.0032681282609701157, 0.0038566067814826965, 0.004445085301995277, 0.005033563822507858, 0.005622042343020439, 0.00621052086353302, 0.006798999384045601, 0.007387477904558182, 0.007975956425070763, 0.008564434945583344, 0.009152913466095924, 0.009741391986608505, 0.010329870507121086, 0.010918349027633667, 0.011506827548146248, 0.012095306068658829, 0.01268378458917141, 0.01327226310968399, 0.013860741630196571, 0.014449220150709152, 0.015037698671221733, 0.015626177191734314, 0.016214655712246895, 0.016803134232759476, 0.017391612753272057, 0.017980091273784637, 0.01856856979429722, 0.0191570483148098, 0.01974552683532238, 0.02033400535583496]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 3.0, 3.0, 10.0, 14.0, 7.0, 13.0, 8.0, 15.0, 16.0, 17.0, 25.0, 21.0, 35.0, 36.0, 37.0, 24.0, 35.0, 32.0, 37.0, 46.0, 39.0, 26.0, 38.0, 43.0, 34.0, 45.0, 29.0, 34.0, 34.0, 22.0, 32.0, 29.0, 18.0, 17.0, 25.0, 19.0, 17.0, 12.0, 12.0, 8.0, 3.0, 5.0, 6.0, 9.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1806640625, -1.1396331787109375, -1.098602294921875, -1.0575714111328125, -1.01654052734375, -0.9755096435546875, -0.934478759765625, -0.8934478759765625, -0.8524169921875, -0.8113861083984375, -0.770355224609375, -0.7293243408203125, -0.68829345703125, -0.6472625732421875, -0.606231689453125, -0.5652008056640625, -0.524169921875, -0.4831390380859375, -0.442108154296875, -0.4010772705078125, -0.36004638671875, -0.3190155029296875, -0.277984619140625, -0.2369537353515625, -0.1959228515625, -0.1548919677734375, -0.113861083984375, -0.0728302001953125, -0.03179931640625, 0.0092315673828125, 0.050262451171875, 0.0912933349609375, 0.13232421875, 0.1733551025390625, 0.214385986328125, 0.2554168701171875, 0.29644775390625, 0.3374786376953125, 0.378509521484375, 0.4195404052734375, 0.4605712890625, 0.5016021728515625, 0.542633056640625, 0.5836639404296875, 0.62469482421875, 0.6657257080078125, 0.706756591796875, 0.7477874755859375, 0.788818359375, 0.8298492431640625, 0.870880126953125, 0.9119110107421875, 0.95294189453125, 0.9939727783203125, 1.035003662109375, 1.0760345458984375, 1.1170654296875, 1.1580963134765625, 1.199127197265625, 1.2401580810546875, 1.28118896484375, 1.3222198486328125, 1.363250732421875, 1.4042816162109375, 1.4453125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 8.0, 8.0, 8.0, 12.0, 17.0, 24.0, 36.0, 59.0, 81.0, 147.0, 238.0, 411.0, 716.0, 1334.0, 2375.0, 4539.0, 8842.0, 17584.0, 35992.0, 79117.0, 200483.0, 405980.0, 161728.0, 66539.0, 30921.0, 14847.0, 7736.0, 4008.0, 2060.0, 1096.0, 675.0, 359.0, 204.0, 140.0, 69.0, 44.0, 33.0, 22.0, 13.0, 12.0, 4.0, 6.0, 6.0, 5.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-2.595703125, -2.520233154296875, -2.44476318359375, -2.369293212890625, -2.2938232421875, -2.218353271484375, -2.14288330078125, -2.067413330078125, -1.991943359375, -1.916473388671875, -1.84100341796875, -1.765533447265625, -1.6900634765625, -1.614593505859375, -1.53912353515625, -1.463653564453125, -1.38818359375, -1.312713623046875, -1.23724365234375, -1.161773681640625, -1.0863037109375, -1.010833740234375, -0.93536376953125, -0.859893798828125, -0.784423828125, -0.708953857421875, -0.63348388671875, -0.558013916015625, -0.4825439453125, -0.407073974609375, -0.33160400390625, -0.256134033203125, -0.1806640625, -0.105194091796875, -0.02972412109375, 0.045745849609375, 0.1212158203125, 0.196685791015625, 0.27215576171875, 0.347625732421875, 0.423095703125, 0.498565673828125, 0.57403564453125, 0.649505615234375, 0.7249755859375, 0.800445556640625, 0.87591552734375, 0.951385498046875, 1.02685546875, 1.102325439453125, 1.17779541015625, 1.253265380859375, 1.3287353515625, 1.404205322265625, 1.47967529296875, 1.555145263671875, 1.630615234375, 1.706085205078125, 1.78155517578125, 1.857025146484375, 1.9324951171875, 2.007965087890625, 2.08343505859375, 2.158905029296875, 2.234375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 6.0, 8.0, 12.0, 9.0, 10.0, 10.0, 17.0, 15.0, 33.0, 33.0, 35.0, 30.0, 37.0, 64.0, 58.0, 111.0, 135.0, 274.0, 1394.0, 205.0, 109.0, 66.0, 60.0, 39.0, 38.0, 36.0, 26.0, 30.0, 19.0, 30.0, 20.0, 10.0, 11.0, 11.0, 7.0, 6.0, 8.0, 8.0, 3.0, 5.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.55078125, -5.38397216796875, -5.2171630859375, -5.05035400390625, -4.883544921875, -4.71673583984375, -4.5499267578125, -4.38311767578125, -4.21630859375, -4.04949951171875, -3.8826904296875, -3.71588134765625, -3.549072265625, -3.38226318359375, -3.2154541015625, -3.04864501953125, -2.8818359375, -2.71502685546875, -2.5482177734375, -2.38140869140625, -2.214599609375, -2.04779052734375, -1.8809814453125, -1.71417236328125, -1.54736328125, -1.38055419921875, -1.2137451171875, -1.04693603515625, -0.880126953125, -0.71331787109375, -0.5465087890625, -0.37969970703125, -0.212890625, -0.04608154296875, 0.1207275390625, 0.28753662109375, 0.454345703125, 0.62115478515625, 0.7879638671875, 0.95477294921875, 1.12158203125, 1.28839111328125, 1.4552001953125, 1.62200927734375, 1.788818359375, 1.95562744140625, 2.1224365234375, 2.28924560546875, 2.4560546875, 2.62286376953125, 2.7896728515625, 2.95648193359375, 3.123291015625, 3.29010009765625, 3.4569091796875, 3.62371826171875, 3.79052734375, 3.95733642578125, 4.1241455078125, 4.29095458984375, 4.457763671875, 4.62457275390625, 4.7913818359375, 4.95819091796875, 5.125]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 8.0, 2.0, 14.0, 9.0, 9.0, 14.0, 16.0, 17.0, 27.0, 39.0, 36.0, 65.0, 110.0, 154.0, 198.0, 404.0, 1093.0, 4109.0, 30311.0, 582820.0, 2422330.0, 91528.0, 9078.0, 1853.0, 617.0, 271.0, 147.0, 114.0, 79.0, 50.0, 35.0, 32.0, 21.0, 23.0, 14.0, 18.0, 17.0, 8.0, 3.0, 7.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.2109375, -7.929931640625, -7.64892578125, -7.367919921875, -7.0869140625, -6.805908203125, -6.52490234375, -6.243896484375, -5.962890625, -5.681884765625, -5.40087890625, -5.119873046875, -4.8388671875, -4.557861328125, -4.27685546875, -3.995849609375, -3.71484375, -3.433837890625, -3.15283203125, -2.871826171875, -2.5908203125, -2.309814453125, -2.02880859375, -1.747802734375, -1.466796875, -1.185791015625, -0.90478515625, -0.623779296875, -0.3427734375, -0.061767578125, 0.21923828125, 0.500244140625, 0.78125, 1.062255859375, 1.34326171875, 1.624267578125, 1.9052734375, 2.186279296875, 2.46728515625, 2.748291015625, 3.029296875, 3.310302734375, 3.59130859375, 3.872314453125, 4.1533203125, 4.434326171875, 4.71533203125, 4.996337890625, 5.27734375, 5.558349609375, 5.83935546875, 6.120361328125, 6.4013671875, 6.682373046875, 6.96337890625, 7.244384765625, 7.525390625, 7.806396484375, 8.08740234375, 8.368408203125, 8.6494140625, 8.930419921875, 9.21142578125, 9.492431640625, 9.7734375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 14.0, 40.0, 101.0, 228.0, 260.0, 206.0, 101.0, 47.0, 9.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.9103498458862305, -5.981358528137207, -5.052367210388184, -4.123375415802002, -3.1943840980529785, -2.265392780303955, -1.3364009857177734, -0.40740966796875, 0.5215816497802734, 1.4505730867385864, 2.3795645236968994, 3.308556079864502, 4.237547397613525, 5.166538715362549, 6.0955305099487305, 7.024521827697754, 7.953513145446777, 8.8825044631958, 9.811495780944824, 10.740488052368164, 11.669479370117188, 12.598470687866211, 13.527462005615234, 14.456453323364258, 15.385444641113281, 16.314435958862305, 17.243427276611328, 18.17241859436035, 19.101409912109375, 20.0304012298584, 20.959392547607422, 21.888385772705078, 22.81737518310547, 23.746366500854492, 24.675357818603516, 25.60434913635254, 26.533340454101562, 27.462331771850586, 28.39132308959961, 29.320316314697266, 30.249305725097656, 31.17829704284668, 32.1072883605957, 33.03628158569336, 33.96527099609375, 34.894264221191406, 35.8232536315918, 36.75224685668945, 37.681236267089844, 38.6102294921875, 39.53921890258789, 40.46821212768555, 41.39720153808594, 42.326194763183594, 43.255184173583984, 44.18417739868164, 45.1131706237793, 46.04216384887695, 46.971153259277344, 47.900146484375, 48.82913589477539, 49.75812911987305, 50.68711853027344, 51.616111755371094, 52.545101165771484]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 3.0, 4.0, 3.0, 3.0, 5.0, 5.0, 12.0, 9.0, 10.0, 16.0, 11.0, 16.0, 27.0, 15.0, 15.0, 27.0, 27.0, 28.0, 25.0, 37.0, 33.0, 40.0, 46.0, 31.0, 43.0, 40.0, 32.0, 54.0, 44.0, 30.0, 40.0, 32.0, 23.0, 30.0, 30.0, 24.0, 16.0, 19.0, 14.0, 9.0, 19.0, 15.0, 13.0, 5.0, 6.0, 5.0, 8.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 2.0], "bins": [-14.890142440795898, -14.454320907592773, -14.018499374389648, -13.582677841186523, -13.146855354309082, -12.711033821105957, -12.275212287902832, -11.839390754699707, -11.403568267822266, -10.96774673461914, -10.531925201416016, -10.09610366821289, -9.66028118133545, -9.224459648132324, -8.7886381149292, -8.352816581726074, -7.916995048522949, -7.481173515319824, -7.045351505279541, -6.609529972076416, -6.173707962036133, -5.737886428833008, -5.302064895629883, -4.866243362426758, -4.430421352386475, -3.9945995807647705, -3.5587778091430664, -3.1229562759399414, -2.6871345043182373, -2.251312732696533, -1.8154911994934082, -1.379669427871704, -0.9438486099243164, -0.5080268979072571, -0.07220518589019775, 0.3636164665222168, 0.7994382381439209, 1.235260009765625, 1.67108154296875, 2.106903314590454, 2.542725086212158, 2.9785468578338623, 3.4143686294555664, 3.8501901626586914, 4.286011695861816, 4.7218337059021, 5.157655239105225, 5.593477249145508, 6.029298782348633, 6.465120315551758, 6.900942325592041, 7.336763858795166, 7.772585868835449, 8.208407402038574, 8.6442289352417, 9.080050468444824, 9.515872955322266, 9.95169448852539, 10.387516021728516, 10.82333755493164, 11.259160041809082, 11.694981575012207, 12.130803108215332, 12.566624641418457, 13.002446174621582]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 4.0, 3.0, 5.0, 11.0, 4.0, 11.0, 13.0, 11.0, 11.0, 13.0, 16.0, 15.0, 22.0, 25.0, 32.0, 35.0, 27.0, 40.0, 23.0, 44.0, 43.0, 34.0, 28.0, 47.0, 40.0, 35.0, 27.0, 30.0, 43.0, 30.0, 30.0, 31.0, 25.0, 25.0, 21.0, 23.0, 17.0, 21.0, 18.0, 13.0, 11.0, 12.0, 10.0, 4.0, 9.0, 6.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.3671875, -1.3243865966796875, -1.281585693359375, -1.2387847900390625, -1.19598388671875, -1.1531829833984375, -1.110382080078125, -1.0675811767578125, -1.0247802734375, -0.9819793701171875, -0.939178466796875, -0.8963775634765625, -0.85357666015625, -0.8107757568359375, -0.767974853515625, -0.7251739501953125, -0.682373046875, -0.6395721435546875, -0.596771240234375, -0.5539703369140625, -0.51116943359375, -0.4683685302734375, -0.425567626953125, -0.3827667236328125, -0.3399658203125, -0.2971649169921875, -0.254364013671875, -0.2115631103515625, -0.16876220703125, -0.1259613037109375, -0.083160400390625, -0.0403594970703125, 0.00244140625, 0.0452423095703125, 0.088043212890625, 0.1308441162109375, 0.17364501953125, 0.2164459228515625, 0.259246826171875, 0.3020477294921875, 0.3448486328125, 0.3876495361328125, 0.430450439453125, 0.4732513427734375, 0.51605224609375, 0.5588531494140625, 0.601654052734375, 0.6444549560546875, 0.687255859375, 0.7300567626953125, 0.772857666015625, 0.8156585693359375, 0.85845947265625, 0.9012603759765625, 0.944061279296875, 0.9868621826171875, 1.0296630859375, 1.0724639892578125, 1.115264892578125, 1.1580657958984375, 1.20086669921875, 1.2436676025390625, 1.286468505859375, 1.3292694091796875, 1.3720703125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 6.0, 8.0, 6.0, 9.0, 27.0, 35.0, 29.0, 45.0, 99.0, 128.0, 193.0, 329.0, 572.0, 870.0, 1653.0, 3000.0, 5962.0, 11430.0, 23190.0, 48060.0, 103945.0, 239949.0, 586159.0, 1214676.0, 1095519.0, 487340.0, 201003.0, 87982.0, 40733.0, 19735.0, 9971.0, 5036.0, 2709.0, 1590.0, 925.0, 480.0, 307.0, 188.0, 137.0, 87.0, 49.0, 37.0, 27.0, 21.0, 17.0, 8.0, 3.0, 3.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.8134765625, -1.756622314453125, -1.69976806640625, -1.642913818359375, -1.5860595703125, -1.529205322265625, -1.47235107421875, -1.415496826171875, -1.358642578125, -1.301788330078125, -1.24493408203125, -1.188079833984375, -1.1312255859375, -1.074371337890625, -1.01751708984375, -0.960662841796875, -0.90380859375, -0.846954345703125, -0.79010009765625, -0.733245849609375, -0.6763916015625, -0.619537353515625, -0.56268310546875, -0.505828857421875, -0.448974609375, -0.392120361328125, -0.33526611328125, -0.278411865234375, -0.2215576171875, -0.164703369140625, -0.10784912109375, -0.050994873046875, 0.005859375, 0.062713623046875, 0.11956787109375, 0.176422119140625, 0.2332763671875, 0.290130615234375, 0.34698486328125, 0.403839111328125, 0.460693359375, 0.517547607421875, 0.57440185546875, 0.631256103515625, 0.6881103515625, 0.744964599609375, 0.80181884765625, 0.858673095703125, 0.91552734375, 0.972381591796875, 1.02923583984375, 1.086090087890625, 1.1429443359375, 1.199798583984375, 1.25665283203125, 1.313507080078125, 1.370361328125, 1.427215576171875, 1.48406982421875, 1.540924072265625, 1.5977783203125, 1.654632568359375, 1.71148681640625, 1.768341064453125, 1.8251953125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 10.0, 6.0, 8.0, 19.0, 23.0, 23.0, 51.0, 60.0, 99.0, 116.0, 196.0, 242.0, 390.0, 488.0, 597.0, 481.0, 347.0, 269.0, 203.0, 151.0, 89.0, 62.0, 52.0, 26.0, 23.0, 14.0, 9.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.6640625, -5.50848388671875, -5.3529052734375, -5.19732666015625, -5.041748046875, -4.88616943359375, -4.7305908203125, -4.57501220703125, -4.41943359375, -4.26385498046875, -4.1082763671875, -3.95269775390625, -3.797119140625, -3.64154052734375, -3.4859619140625, -3.33038330078125, -3.1748046875, -3.01922607421875, -2.8636474609375, -2.70806884765625, -2.552490234375, -2.39691162109375, -2.2413330078125, -2.08575439453125, -1.93017578125, -1.77459716796875, -1.6190185546875, -1.46343994140625, -1.307861328125, -1.15228271484375, -0.9967041015625, -0.84112548828125, -0.685546875, -0.52996826171875, -0.3743896484375, -0.21881103515625, -0.063232421875, 0.09234619140625, 0.2479248046875, 0.40350341796875, 0.55908203125, 0.71466064453125, 0.8702392578125, 1.02581787109375, 1.181396484375, 1.33697509765625, 1.4925537109375, 1.64813232421875, 1.8037109375, 1.95928955078125, 2.1148681640625, 2.27044677734375, 2.426025390625, 2.58160400390625, 2.7371826171875, 2.89276123046875, 3.04833984375, 3.20391845703125, 3.3594970703125, 3.51507568359375, 3.670654296875, 3.82623291015625, 3.9818115234375, 4.13739013671875, 4.29296875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 4.0, 3.0, 6.0, 10.0, 27.0, 31.0, 48.0, 54.0, 95.0, 173.0, 322.0, 623.0, 1398.0, 3930.0, 12583.0, 50474.0, 235518.0, 1173348.0, 2082231.0, 497544.0, 102296.0, 23022.0, 6437.0, 2159.0, 951.0, 422.0, 224.0, 126.0, 64.0, 56.0, 35.0, 29.0, 15.0, 11.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6640625, -4.48626708984375, -4.3084716796875, -4.13067626953125, -3.952880859375, -3.77508544921875, -3.5972900390625, -3.41949462890625, -3.24169921875, -3.06390380859375, -2.8861083984375, -2.70831298828125, -2.530517578125, -2.35272216796875, -2.1749267578125, -1.99713134765625, -1.8193359375, -1.64154052734375, -1.4637451171875, -1.28594970703125, -1.108154296875, -0.93035888671875, -0.7525634765625, -0.57476806640625, -0.39697265625, -0.21917724609375, -0.0413818359375, 0.13641357421875, 0.314208984375, 0.49200439453125, 0.6697998046875, 0.84759521484375, 1.025390625, 1.20318603515625, 1.3809814453125, 1.55877685546875, 1.736572265625, 1.91436767578125, 2.0921630859375, 2.26995849609375, 2.44775390625, 2.62554931640625, 2.8033447265625, 2.98114013671875, 3.158935546875, 3.33673095703125, 3.5145263671875, 3.69232177734375, 3.8701171875, 4.04791259765625, 4.2257080078125, 4.40350341796875, 4.581298828125, 4.75909423828125, 4.9368896484375, 5.11468505859375, 5.29248046875, 5.47027587890625, 5.6480712890625, 5.82586669921875, 6.003662109375, 6.18145751953125, 6.3592529296875, 6.53704833984375, 6.71484375]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 10.0, 19.0, 27.0, 52.0, 56.0, 82.0, 105.0, 122.0, 115.0, 117.0, 110.0, 69.0, 50.0, 43.0, 11.0, 10.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.524375915527344, -23.683923721313477, -22.843473434448242, -22.003021240234375, -21.16257095336914, -20.322118759155273, -19.481666564941406, -18.641216278076172, -17.800764083862305, -16.960311889648438, -16.119861602783203, -15.279409408569336, -14.438958168029785, -13.598506927490234, -12.758054733276367, -11.917603492736816, -11.077152252197266, -10.236701011657715, -9.396249771118164, -8.555797576904297, -7.715346336364746, -6.874895095825195, -6.034443378448486, -5.193991661071777, -4.353540420532227, -3.5130889415740967, -2.672637462615967, -1.832185983657837, -0.991734504699707, -0.15128326416015625, 0.6891684532165527, 1.5296201705932617, 2.3700714111328125, 3.2105228900909424, 4.050974369049072, 4.891426086425781, 5.731877326965332, 6.572328567504883, 7.412780284881592, 8.2532320022583, 9.093683242797852, 9.934134483337402, 10.774585723876953, 11.61503791809082, 12.455489158630371, 13.295940399169922, 14.136392593383789, 14.97684383392334, 15.81729507446289, 16.657747268676758, 17.498197555541992, 18.33864974975586, 19.179100036621094, 20.01955223083496, 20.860004425048828, 21.700454711914062, 22.54090690612793, 23.381359100341797, 24.22180938720703, 25.0622615814209, 25.902713775634766, 26.7431640625, 27.583616256713867, 28.424068450927734, 29.26451873779297]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 5.0, 10.0, 6.0, 13.0, 12.0, 16.0, 12.0, 16.0, 18.0, 29.0, 38.0, 37.0, 36.0, 34.0, 54.0, 44.0, 41.0, 40.0, 54.0, 56.0, 45.0, 32.0, 46.0, 36.0, 34.0, 28.0, 47.0, 23.0, 19.0, 21.0, 18.0, 20.0, 9.0, 11.0, 7.0, 6.0, 6.0, 2.0, 6.0, 4.0, 5.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.654029846191406, -16.171327590942383, -15.688624382019043, -15.205921173095703, -14.72321891784668, -14.24051570892334, -13.7578125, -13.275110244750977, -12.792407035827637, -12.309703826904297, -11.827001571655273, -11.344298362731934, -10.861595153808594, -10.37889289855957, -9.89618968963623, -9.41348648071289, -8.930784225463867, -8.448081016540527, -7.965378761291504, -7.482675552368164, -6.999972820281982, -6.517270088195801, -6.034566879272461, -5.551864147186279, -5.069161415100098, -4.586458683013916, -4.103755950927734, -3.6210527420043945, -3.138350009918213, -2.6556472778320312, -2.1729443073272705, -1.6902413368225098, -1.2075386047363281, -0.7248357534408569, -0.24213290214538574, 0.24056994915008545, 0.7232728004455566, 1.2059755325317383, 1.688678503036499, 2.1713814735412598, 2.6540842056274414, 3.136786937713623, 3.619489908218384, 4.1021928787231445, 4.584895610809326, 5.067598342895508, 5.550301551818848, 6.033004283905029, 6.515707015991211, 6.998409748077393, 7.481112480163574, 7.963815689086914, 8.446517944335938, 8.929221153259277, 9.411924362182617, 9.89462661743164, 10.37732982635498, 10.86003303527832, 11.342735290527344, 11.825438499450684, 12.308141708374023, 12.790843963623047, 13.273547172546387, 13.756250381469727, 14.23895263671875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 6.0, 7.0, 10.0, 10.0, 5.0, 12.0, 8.0, 9.0, 15.0, 14.0, 17.0, 23.0, 24.0, 33.0, 29.0, 16.0, 32.0, 32.0, 44.0, 31.0, 46.0, 37.0, 43.0, 32.0, 40.0, 34.0, 37.0, 31.0, 26.0, 24.0, 30.0, 42.0, 26.0, 20.0, 24.0, 25.0, 15.0, 10.0, 11.0, 15.0, 8.0, 10.0, 9.0, 9.0, 3.0, 4.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.4609375, -1.416656494140625, -1.37237548828125, -1.328094482421875, -1.2838134765625, -1.239532470703125, -1.19525146484375, -1.150970458984375, -1.106689453125, -1.062408447265625, -1.01812744140625, -0.973846435546875, -0.9295654296875, -0.885284423828125, -0.84100341796875, -0.796722412109375, -0.75244140625, -0.708160400390625, -0.66387939453125, -0.619598388671875, -0.5753173828125, -0.531036376953125, -0.48675537109375, -0.442474365234375, -0.398193359375, -0.353912353515625, -0.30963134765625, -0.265350341796875, -0.2210693359375, -0.176788330078125, -0.13250732421875, -0.088226318359375, -0.0439453125, 0.000335693359375, 0.04461669921875, 0.088897705078125, 0.1331787109375, 0.177459716796875, 0.22174072265625, 0.266021728515625, 0.310302734375, 0.354583740234375, 0.39886474609375, 0.443145751953125, 0.4874267578125, 0.531707763671875, 0.57598876953125, 0.620269775390625, 0.66455078125, 0.708831787109375, 0.75311279296875, 0.797393798828125, 0.8416748046875, 0.885955810546875, 0.93023681640625, 0.974517822265625, 1.018798828125, 1.063079833984375, 1.10736083984375, 1.151641845703125, 1.1959228515625, 1.240203857421875, 1.28448486328125, 1.328765869140625, 1.373046875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 6.0, 5.0, 4.0, 7.0, 10.0, 16.0, 18.0, 32.0, 42.0, 74.0, 133.0, 187.0, 285.0, 394.0, 633.0, 987.0, 1543.0, 2430.0, 4013.0, 6491.0, 10495.0, 17476.0, 28885.0, 48352.0, 79686.0, 127523.0, 180728.0, 185627.0, 134953.0, 86059.0, 52034.0, 31216.0, 18531.0, 11236.0, 6925.0, 4203.0, 2644.0, 1700.0, 1035.0, 661.0, 438.0, 298.0, 177.0, 113.0, 86.0, 57.0, 38.0, 25.0, 22.0, 7.0, 8.0, 8.0, 1.0, 4.0, 2.0, 0.0, 4.0], "bins": [-0.17578125, -0.1706218719482422, -0.16546249389648438, -0.16030311584472656, -0.15514373779296875, -0.14998435974121094, -0.14482498168945312, -0.1396656036376953, -0.1345062255859375, -0.1293468475341797, -0.12418746948242188, -0.11902809143066406, -0.11386871337890625, -0.10870933532714844, -0.10354995727539062, -0.09839057922363281, -0.093231201171875, -0.08807182312011719, -0.08291244506835938, -0.07775306701660156, -0.07259368896484375, -0.06743431091308594, -0.062274932861328125, -0.05711555480957031, -0.0519561767578125, -0.04679679870605469, -0.041637420654296875, -0.03647804260253906, -0.03131866455078125, -0.026159286499023438, -0.020999908447265625, -0.015840530395507812, -0.01068115234375, -0.0055217742919921875, -0.000362396240234375, 0.0047969818115234375, 0.00995635986328125, 0.015115737915039062, 0.020275115966796875, 0.025434494018554688, 0.0305938720703125, 0.03575325012207031, 0.040912628173828125, 0.04607200622558594, 0.05123138427734375, 0.05639076232910156, 0.061550140380859375, 0.06670951843261719, 0.071868896484375, 0.07702827453613281, 0.08218765258789062, 0.08734703063964844, 0.09250640869140625, 0.09766578674316406, 0.10282516479492188, 0.10798454284667969, 0.1131439208984375, 0.11830329895019531, 0.12346267700195312, 0.12862205505371094, 0.13378143310546875, 0.13894081115722656, 0.14410018920898438, 0.1492595672607422, 0.1544189453125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 6.0, 3.0, 8.0, 10.0, 10.0, 9.0, 8.0, 15.0, 12.0, 16.0, 29.0, 15.0, 22.0, 24.0, 27.0, 31.0, 36.0, 29.0, 41.0, 36.0, 41.0, 42.0, 1064.0, 39.0, 39.0, 42.0, 49.0, 37.0, 32.0, 26.0, 28.0, 36.0, 24.0, 25.0, 18.0, 13.0, 9.0, 16.0, 16.0, 7.0, 6.0, 9.0, 12.0, 0.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.12890625, -1.0932769775390625, -1.057647705078125, -1.0220184326171875, -0.98638916015625, -0.9507598876953125, -0.915130615234375, -0.8795013427734375, -0.8438720703125, -0.8082427978515625, -0.772613525390625, -0.7369842529296875, -0.70135498046875, -0.6657257080078125, -0.630096435546875, -0.5944671630859375, -0.558837890625, -0.5232086181640625, -0.487579345703125, -0.4519500732421875, -0.41632080078125, -0.3806915283203125, -0.345062255859375, -0.3094329833984375, -0.2738037109375, -0.2381744384765625, -0.202545166015625, -0.1669158935546875, -0.13128662109375, -0.0956573486328125, -0.060028076171875, -0.0243988037109375, 0.01123046875, 0.0468597412109375, 0.082489013671875, 0.1181182861328125, 0.15374755859375, 0.1893768310546875, 0.225006103515625, 0.2606353759765625, 0.2962646484375, 0.3318939208984375, 0.367523193359375, 0.4031524658203125, 0.43878173828125, 0.4744110107421875, 0.510040283203125, 0.5456695556640625, 0.581298828125, 0.6169281005859375, 0.652557373046875, 0.6881866455078125, 0.72381591796875, 0.7594451904296875, 0.795074462890625, 0.8307037353515625, 0.8663330078125, 0.9019622802734375, 0.937591552734375, 0.9732208251953125, 1.00885009765625, 1.0444793701171875, 1.080108642578125, 1.1157379150390625, 1.1513671875]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 3.0, 8.0, 15.0, 21.0, 21.0, 37.0, 44.0, 76.0, 112.0, 151.0, 236.0, 345.0, 576.0, 819.0, 1246.0, 1936.0, 2947.0, 4614.0, 7014.0, 11131.0, 17581.0, 27427.0, 43005.0, 66578.0, 99643.0, 152050.0, 1168221.0, 176567.0, 109347.0, 72798.0, 47808.0, 30689.0, 19342.0, 12377.0, 7809.0, 5000.0, 3297.0, 2165.0, 1289.0, 939.0, 594.0, 408.0, 274.0, 191.0, 127.0, 85.0, 65.0, 41.0, 24.0, 16.0, 11.0, 5.0, 7.0, 1.0, 3.0, 4.0, 1.0], "bins": [-0.08245849609375, -0.08000469207763672, -0.07755088806152344, -0.07509708404541016, -0.07264328002929688, -0.0701894760131836, -0.06773567199707031, -0.06528186798095703, -0.06282806396484375, -0.06037425994873047, -0.05792045593261719, -0.055466651916503906, -0.053012847900390625, -0.050559043884277344, -0.04810523986816406, -0.04565143585205078, -0.0431976318359375, -0.04074382781982422, -0.03829002380371094, -0.035836219787597656, -0.033382415771484375, -0.030928611755371094, -0.028474807739257812, -0.02602100372314453, -0.02356719970703125, -0.02111339569091797, -0.018659591674804688, -0.016205787658691406, -0.013751983642578125, -0.011298179626464844, -0.008844375610351562, -0.006390571594238281, -0.003936767578125, -0.0014829635620117188, 0.0009708404541015625, 0.0034246444702148438, 0.005878448486328125, 0.008332252502441406, 0.010786056518554688, 0.013239860534667969, 0.01569366455078125, 0.01814746856689453, 0.020601272583007812, 0.023055076599121094, 0.025508880615234375, 0.027962684631347656, 0.030416488647460938, 0.03287029266357422, 0.0353240966796875, 0.03777790069580078, 0.04023170471191406, 0.042685508728027344, 0.045139312744140625, 0.047593116760253906, 0.05004692077636719, 0.05250072479248047, 0.05495452880859375, 0.05740833282470703, 0.05986213684082031, 0.062315940856933594, 0.06476974487304688, 0.06722354888916016, 0.06967735290527344, 0.07213115692138672, 0.0745849609375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 7.0, 6.0, 8.0, 8.0, 2.0, 6.0, 7.0, 2.0, 10.0, 14.0, 17.0, 22.0, 21.0, 21.0, 31.0, 34.0, 57.0, 93.0, 121.0, 147.0, 89.0, 67.0, 40.0, 38.0, 26.0, 18.0, 12.0, 16.0, 11.0, 8.0, 4.0, 7.0, 5.0, 6.0, 4.0, 3.0, 5.0, 4.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0203857421875, -0.019821643829345703, -0.019257545471191406, -0.01869344711303711, -0.018129348754882812, -0.017565250396728516, -0.01700115203857422, -0.016437053680419922, -0.015872955322265625, -0.015308856964111328, -0.014744758605957031, -0.014180660247802734, -0.013616561889648438, -0.01305246353149414, -0.012488365173339844, -0.011924266815185547, -0.01136016845703125, -0.010796070098876953, -0.010231971740722656, -0.00966787338256836, -0.009103775024414062, -0.008539676666259766, -0.007975578308105469, -0.007411479949951172, -0.006847381591796875, -0.006283283233642578, -0.005719184875488281, -0.005155086517333984, -0.0045909881591796875, -0.004026889801025391, -0.0034627914428710938, -0.002898693084716797, -0.0023345947265625, -0.0017704963684082031, -0.0012063980102539062, -0.0006422996520996094, -7.82012939453125e-05, 0.0004858970642089844, 0.0010499954223632812, 0.0016140937805175781, 0.002178192138671875, 0.002742290496826172, 0.0033063888549804688, 0.0038704872131347656, 0.0044345855712890625, 0.004998683929443359, 0.005562782287597656, 0.006126880645751953, 0.00669097900390625, 0.007255077362060547, 0.007819175720214844, 0.00838327407836914, 0.008947372436523438, 0.009511470794677734, 0.010075569152832031, 0.010639667510986328, 0.011203765869140625, 0.011767864227294922, 0.012331962585449219, 0.012896060943603516, 0.013460159301757812, 0.01402425765991211, 0.014588356018066406, 0.015152454376220703, 0.015716552734375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 5.0, 7.0, 4.0, 5.0, 3.0, 11.0, 8.0, 11.0, 13.0, 26.0, 40.0, 50.0, 64.0, 90.0, 137.0, 222.0, 534.0, 3868.0, 102693.0, 927246.0, 11745.0, 988.0, 253.0, 162.0, 102.0, 76.0, 50.0, 42.0, 19.0, 23.0, 5.0, 12.0, 8.0, 3.0, 6.0, 9.0, 7.0, 3.0, 5.0, 3.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27490234375, -0.2651557922363281, -0.25540924072265625, -0.24566268920898438, -0.2359161376953125, -0.22616958618164062, -0.21642303466796875, -0.20667648315429688, -0.196929931640625, -0.18718338012695312, -0.17743682861328125, -0.16769027709960938, -0.1579437255859375, -0.14819717407226562, -0.13845062255859375, -0.12870407104492188, -0.11895751953125, -0.10921096801757812, -0.09946441650390625, -0.08971786499023438, -0.0799713134765625, -0.07022476196289062, -0.06047821044921875, -0.050731658935546875, -0.040985107421875, -0.031238555908203125, -0.02149200439453125, -0.011745452880859375, -0.0019989013671875, 0.007747650146484375, 0.01749420166015625, 0.027240753173828125, 0.0369873046875, 0.046733856201171875, 0.05648040771484375, 0.06622695922851562, 0.0759735107421875, 0.08572006225585938, 0.09546661376953125, 0.10521316528320312, 0.114959716796875, 0.12470626831054688, 0.13445281982421875, 0.14419937133789062, 0.1539459228515625, 0.16369247436523438, 0.17343902587890625, 0.18318557739257812, 0.19293212890625, 0.20267868041992188, 0.21242523193359375, 0.22217178344726562, 0.2319183349609375, 0.24166488647460938, 0.25141143798828125, 0.2611579895019531, 0.270904541015625, 0.2806510925292969, 0.29039764404296875, 0.3001441955566406, 0.3098907470703125, 0.3196372985839844, 0.32938385009765625, 0.3391304016113281, 0.348876953125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 4.0, 13.0, 26.0, 40.0, 112.0, 311.0, 283.0, 103.0, 48.0, 27.0, 11.0, 8.0, 7.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07367777824401855, -0.06875813007354736, -0.06383848935365677, -0.05891884118318558, -0.053999193012714386, -0.04907954856753349, -0.0441599041223526, -0.03924025595188141, -0.034320611506700516, -0.029400965198874474, -0.02448131889104843, -0.01956167444586754, -0.014642028138041496, -0.009722381830215454, -0.004802737385034561, 0.00011691078543663025, 0.005036555230617523, 0.009956201538443565, 0.014875846914947033, 0.0197954922914505, 0.024715138599276543, 0.029634784907102585, 0.03455442935228348, 0.03947407752275467, 0.04439372196793556, 0.049313366413116455, 0.054233014583587646, 0.05915265902876854, 0.06407230347394943, 0.06899195164442062, 0.07391159236431122, 0.07883124053478241, 0.0837508887052536, 0.08867053687572479, 0.09359017759561539, 0.09850982576608658, 0.10342947393655777, 0.10834911465644836, 0.11326876282691956, 0.11818841099739075, 0.12310805916786194, 0.12802770733833313, 0.13294735550880432, 0.1378670036792755, 0.1427866369485855, 0.1477062851190567, 0.1526259332895279, 0.15754558145999908, 0.16246521472930908, 0.16738486289978027, 0.17230451107025146, 0.17722415924072266, 0.18214379251003265, 0.18706344068050385, 0.19198308885097504, 0.19690273702144623, 0.20182238519191742, 0.2067420333623886, 0.2116616815328598, 0.2165813148021698, 0.221500962972641, 0.22642061114311218, 0.23134025931358337, 0.23625990748405457, 0.24117955565452576]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 4.0, 8.0, 5.0, 12.0, 4.0, 8.0, 22.0, 13.0, 22.0, 22.0, 18.0, 34.0, 35.0, 25.0, 30.0, 40.0, 34.0, 25.0, 26.0, 42.0, 37.0, 42.0, 33.0, 33.0, 32.0, 38.0, 43.0, 28.0, 29.0, 30.0, 29.0, 17.0, 27.0, 16.0, 21.0, 11.0, 15.0, 15.0, 16.0, 12.0, 18.0, 6.0, 4.0, 2.0, 9.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.043266475200653076, -0.04177241027355194, -0.040278345346450806, -0.03878428041934967, -0.037290215492248535, -0.0357961505651474, -0.034302085638046265, -0.03280802071094513, -0.031313955783843994, -0.02981989085674286, -0.028325825929641724, -0.02683176100254059, -0.025337696075439453, -0.023843631148338318, -0.022349566221237183, -0.020855501294136047, -0.019361436367034912, -0.017867371439933777, -0.01637330651283264, -0.014879241585731506, -0.013385176658630371, -0.011891111731529236, -0.0103970468044281, -0.008902981877326965, -0.00740891695022583, -0.005914852023124695, -0.00442078709602356, -0.0029267221689224243, -0.001432657241821289, 6.140768527984619e-05, 0.0015554726123809814, 0.0030495375394821167, 0.004543602466583252, 0.006037667393684387, 0.0075317323207855225, 0.009025797247886658, 0.010519862174987793, 0.012013927102088928, 0.013507992029190063, 0.015002056956291199, 0.016496121883392334, 0.01799018681049347, 0.019484251737594604, 0.02097831666469574, 0.022472381591796875, 0.02396644651889801, 0.025460511445999146, 0.02695457637310028, 0.028448641300201416, 0.02994270622730255, 0.031436771154403687, 0.03293083608150482, 0.03442490100860596, 0.03591896593570709, 0.03741303086280823, 0.03890709578990936, 0.0404011607170105, 0.04189522564411163, 0.04338929057121277, 0.044883355498313904, 0.04637742042541504, 0.047871485352516174, 0.04936555027961731, 0.050859615206718445, 0.05235368013381958]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 7.0, 12.0, 8.0, 5.0, 12.0, 8.0, 9.0, 16.0, 14.0, 17.0, 22.0, 24.0, 34.0, 29.0, 14.0, 32.0, 33.0, 43.0, 33.0, 45.0, 37.0, 43.0, 32.0, 41.0, 33.0, 36.0, 32.0, 26.0, 25.0, 29.0, 42.0, 24.0, 23.0, 22.0, 26.0, 15.0, 10.0, 11.0, 15.0, 8.0, 10.0, 9.0, 9.0, 3.0, 4.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.4599609375, -1.41571044921875, -1.3714599609375, -1.32720947265625, -1.282958984375, -1.23870849609375, -1.1944580078125, -1.15020751953125, -1.10595703125, -1.06170654296875, -1.0174560546875, -0.97320556640625, -0.928955078125, -0.88470458984375, -0.8404541015625, -0.79620361328125, -0.751953125, -0.70770263671875, -0.6634521484375, -0.61920166015625, -0.574951171875, -0.53070068359375, -0.4864501953125, -0.44219970703125, -0.39794921875, -0.35369873046875, -0.3094482421875, -0.26519775390625, -0.220947265625, -0.17669677734375, -0.1324462890625, -0.08819580078125, -0.0439453125, 0.00030517578125, 0.0445556640625, 0.08880615234375, 0.133056640625, 0.17730712890625, 0.2215576171875, 0.26580810546875, 0.31005859375, 0.35430908203125, 0.3985595703125, 0.44281005859375, 0.487060546875, 0.53131103515625, 0.5755615234375, 0.61981201171875, 0.6640625, 0.70831298828125, 0.7525634765625, 0.79681396484375, 0.841064453125, 0.88531494140625, 0.9295654296875, 0.97381591796875, 1.01806640625, 1.06231689453125, 1.1065673828125, 1.15081787109375, 1.195068359375, 1.23931884765625, 1.2835693359375, 1.32781982421875, 1.3720703125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 11.0, 8.0, 11.0, 20.0, 32.0, 44.0, 74.0, 74.0, 131.0, 164.0, 242.0, 347.0, 498.0, 724.0, 1093.0, 1560.0, 2432.0, 3581.0, 5502.0, 8624.0, 13706.0, 22619.0, 38263.0, 65983.0, 114247.0, 190670.0, 225465.0, 143905.0, 84735.0, 47966.0, 28101.0, 17024.0, 10614.0, 6904.0, 4320.0, 2879.0, 1949.0, 1221.0, 893.0, 613.0, 393.0, 277.0, 193.0, 142.0, 100.0, 72.0, 37.0, 36.0, 21.0, 14.0, 7.0, 11.0, 6.0, 5.0, 0.0, 1.0, 1.0], "bins": [-1.5302734375, -1.4842071533203125, -1.438140869140625, -1.3920745849609375, -1.34600830078125, -1.2999420166015625, -1.253875732421875, -1.2078094482421875, -1.1617431640625, -1.1156768798828125, -1.069610595703125, -1.0235443115234375, -0.97747802734375, -0.9314117431640625, -0.885345458984375, -0.8392791748046875, -0.793212890625, -0.7471466064453125, -0.701080322265625, -0.6550140380859375, -0.60894775390625, -0.5628814697265625, -0.516815185546875, -0.4707489013671875, -0.4246826171875, -0.3786163330078125, -0.332550048828125, -0.2864837646484375, -0.24041748046875, -0.1943511962890625, -0.148284912109375, -0.1022186279296875, -0.05615234375, -0.0100860595703125, 0.035980224609375, 0.0820465087890625, 0.12811279296875, 0.1741790771484375, 0.220245361328125, 0.2663116455078125, 0.3123779296875, 0.3584442138671875, 0.404510498046875, 0.4505767822265625, 0.49664306640625, 0.5427093505859375, 0.588775634765625, 0.6348419189453125, 0.680908203125, 0.7269744873046875, 0.773040771484375, 0.8191070556640625, 0.86517333984375, 0.9112396240234375, 0.957305908203125, 1.0033721923828125, 1.0494384765625, 1.0955047607421875, 1.141571044921875, 1.1876373291015625, 1.23370361328125, 1.2797698974609375, 1.325836181640625, 1.3719024658203125, 1.41796875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 8.0, 12.0, 12.0, 10.0, 19.0, 20.0, 28.0, 34.0, 35.0, 55.0, 45.0, 44.0, 72.0, 105.0, 195.0, 1378.0, 298.0, 157.0, 98.0, 71.0, 42.0, 48.0, 33.0, 25.0, 25.0, 28.0, 13.0, 24.0, 18.0, 15.0, 12.0, 10.0, 13.0, 7.0, 5.0, 3.0, 4.0, 7.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.6015625, -5.40728759765625, -5.2130126953125, -5.01873779296875, -4.824462890625, -4.63018798828125, -4.4359130859375, -4.24163818359375, -4.04736328125, -3.85308837890625, -3.6588134765625, -3.46453857421875, -3.270263671875, -3.07598876953125, -2.8817138671875, -2.68743896484375, -2.4931640625, -2.29888916015625, -2.1046142578125, -1.91033935546875, -1.716064453125, -1.52178955078125, -1.3275146484375, -1.13323974609375, -0.93896484375, -0.74468994140625, -0.5504150390625, -0.35614013671875, -0.161865234375, 0.03240966796875, 0.2266845703125, 0.42095947265625, 0.615234375, 0.80950927734375, 1.0037841796875, 1.19805908203125, 1.392333984375, 1.58660888671875, 1.7808837890625, 1.97515869140625, 2.16943359375, 2.36370849609375, 2.5579833984375, 2.75225830078125, 2.946533203125, 3.14080810546875, 3.3350830078125, 3.52935791015625, 3.7236328125, 3.91790771484375, 4.1121826171875, 4.30645751953125, 4.500732421875, 4.69500732421875, 4.8892822265625, 5.08355712890625, 5.27783203125, 5.47210693359375, 5.6663818359375, 5.86065673828125, 6.054931640625, 6.24920654296875, 6.4434814453125, 6.63775634765625, 6.83203125]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 7.0, 5.0, 11.0, 16.0, 15.0, 25.0, 37.0, 51.0, 54.0, 120.0, 191.0, 379.0, 944.0, 7090.0, 843514.0, 2279384.0, 11686.0, 1235.0, 422.0, 193.0, 112.0, 61.0, 43.0, 42.0, 15.0, 23.0, 13.0, 8.0, 5.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.640625, -19.0963134765625, -18.552001953125, -18.0076904296875, -17.46337890625, -16.9190673828125, -16.374755859375, -15.8304443359375, -15.2861328125, -14.7418212890625, -14.197509765625, -13.6531982421875, -13.10888671875, -12.5645751953125, -12.020263671875, -11.4759521484375, -10.931640625, -10.3873291015625, -9.843017578125, -9.2987060546875, -8.75439453125, -8.2100830078125, -7.665771484375, -7.1214599609375, -6.5771484375, -6.0328369140625, -5.488525390625, -4.9442138671875, -4.39990234375, -3.8555908203125, -3.311279296875, -2.7669677734375, -2.22265625, -1.6783447265625, -1.134033203125, -0.5897216796875, -0.04541015625, 0.4989013671875, 1.043212890625, 1.5875244140625, 2.1318359375, 2.6761474609375, 3.220458984375, 3.7647705078125, 4.30908203125, 4.8533935546875, 5.397705078125, 5.9420166015625, 6.486328125, 7.0306396484375, 7.574951171875, 8.1192626953125, 8.66357421875, 9.2078857421875, 9.752197265625, 10.2965087890625, 10.8408203125, 11.3851318359375, 11.929443359375, 12.4737548828125, 13.01806640625, 13.5623779296875, 14.106689453125, 14.6510009765625, 15.1953125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 31.0, 325.0, 543.0, 113.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.222177505493164, -23.89309310913086, -21.564008712768555, -19.23492431640625, -16.905841827392578, -14.576756477355957, -12.247673034667969, -9.918588638305664, -7.589504241943359, -5.260419845581055, -2.931335926055908, -0.6022520065307617, 1.726832389831543, 4.055916786193848, 6.385000228881836, 8.71408462524414, 11.043169021606445, 13.37225341796875, 15.701337814331055, 18.03042221069336, 20.35950469970703, 22.68859100341797, 25.01767349243164, 27.346757888793945, 29.67584228515625, 32.00492477416992, 34.33401107788086, 36.66309356689453, 38.99217987060547, 41.32126235961914, 43.65034484863281, 45.97943115234375, 48.30851745605469, 50.63759994506836, 52.9666862487793, 55.29576873779297, 57.624855041503906, 59.95393753051758, 62.28302001953125, 64.61210632324219, 66.94119262695312, 69.27027893066406, 71.59935760498047, 73.9284439086914, 76.25753021240234, 78.58661651611328, 80.91569519042969, 83.24478149414062, 85.57386779785156, 87.9029541015625, 90.2320327758789, 92.56111907958984, 94.89020538330078, 97.21929168701172, 99.54837036132812, 101.87745666503906, 104.20653533935547, 106.5356216430664, 108.86470031738281, 111.19378662109375, 113.52287292480469, 115.85195922851562, 118.18103790283203, 120.51012420654297, 122.8392105102539]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 0.0, 4.0, 0.0, 3.0, 3.0, 4.0, 2.0, 7.0, 10.0, 12.0, 13.0, 14.0, 13.0, 17.0, 32.0, 22.0, 26.0, 37.0, 26.0, 33.0, 37.0, 42.0, 32.0, 45.0, 34.0, 35.0, 39.0, 45.0, 41.0, 38.0, 36.0, 47.0, 44.0, 27.0, 34.0, 28.0, 25.0, 14.0, 15.0, 19.0, 14.0, 7.0, 8.0, 9.0, 6.0, 3.0, 8.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.820556640625, -13.345344543457031, -12.870133399963379, -12.39492130279541, -11.919709205627441, -11.444498062133789, -10.96928596496582, -10.494073867797852, -10.0188627243042, -9.54365062713623, -9.068439483642578, -8.59322738647461, -8.11801528930664, -7.642804145812988, -7.1675920486450195, -6.692380428314209, -6.21716833114624, -5.74195671081543, -5.266744613647461, -4.79153299331665, -4.31632137298584, -3.84110951423645, -3.3658976554870605, -2.89068603515625, -2.4154741764068604, -1.9402624368667603, -1.4650506973266602, -0.9898388385772705, -0.5146270990371704, -0.03941535949707031, 0.43579649925231934, 0.9110081195831299, 1.3862199783325195, 1.8614317178726196, 2.3366434574127197, 2.8118553161621094, 3.28706693649292, 3.7622787952423096, 4.237490653991699, 4.71270227432251, 5.18791389465332, 5.663125514984131, 6.1383376121521, 6.61354923248291, 7.088760852813721, 7.563972473144531, 8.0391845703125, 8.514396667480469, 8.989608764648438, 9.464820861816406, 9.940032005310059, 10.415244102478027, 10.890456199645996, 11.365667343139648, 11.840879440307617, 12.316091537475586, 12.791302680969238, 13.266514778137207, 13.74172592163086, 14.216938018798828, 14.692150115966797, 15.16736125946045, 15.642573356628418, 16.11778450012207, 16.59299659729004]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 1.0, 8.0, 7.0, 9.0, 7.0, 12.0, 11.0, 15.0, 9.0, 18.0, 13.0, 14.0, 25.0, 25.0, 20.0, 32.0, 31.0, 34.0, 34.0, 37.0, 44.0, 33.0, 40.0, 46.0, 33.0, 30.0, 33.0, 32.0, 30.0, 31.0, 34.0, 24.0, 28.0, 23.0, 20.0, 28.0, 13.0, 17.0, 15.0, 14.0, 14.0, 15.0, 13.0, 5.0, 4.0, 5.0, 2.0, 6.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.5029296875, -1.45697021484375, -1.4110107421875, -1.36505126953125, -1.319091796875, -1.27313232421875, -1.2271728515625, -1.18121337890625, -1.13525390625, -1.08929443359375, -1.0433349609375, -0.99737548828125, -0.951416015625, -0.90545654296875, -0.8594970703125, -0.81353759765625, -0.767578125, -0.72161865234375, -0.6756591796875, -0.62969970703125, -0.583740234375, -0.53778076171875, -0.4918212890625, -0.44586181640625, -0.39990234375, -0.35394287109375, -0.3079833984375, -0.26202392578125, -0.216064453125, -0.17010498046875, -0.1241455078125, -0.07818603515625, -0.0322265625, 0.01373291015625, 0.0596923828125, 0.10565185546875, 0.151611328125, 0.19757080078125, 0.2435302734375, 0.28948974609375, 0.33544921875, 0.38140869140625, 0.4273681640625, 0.47332763671875, 0.519287109375, 0.56524658203125, 0.6112060546875, 0.65716552734375, 0.703125, 0.74908447265625, 0.7950439453125, 0.84100341796875, 0.886962890625, 0.93292236328125, 0.9788818359375, 1.02484130859375, 1.07080078125, 1.11676025390625, 1.1627197265625, 1.20867919921875, 1.254638671875, 1.30059814453125, 1.3465576171875, 1.39251708984375, 1.4384765625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 4.0, 7.0, 6.0, 3.0, 9.0, 10.0, 6.0, 12.0, 19.0, 15.0, 18.0, 26.0, 24.0, 33.0, 49.0, 41.0, 66.0, 79.0, 94.0, 139.0, 267.0, 769.0, 2595.0, 11423.0, 67296.0, 578819.0, 2781719.0, 658411.0, 75164.0, 12644.0, 2802.0, 756.0, 298.0, 156.0, 98.0, 65.0, 50.0, 51.0, 42.0, 34.0, 34.0, 28.0, 23.0, 19.0, 14.0, 14.0, 7.0, 11.0, 5.0, 8.0, 4.0, 2.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.8984375, -4.7325439453125, -4.566650390625, -4.4007568359375, -4.23486328125, -4.0689697265625, -3.903076171875, -3.7371826171875, -3.5712890625, -3.4053955078125, -3.239501953125, -3.0736083984375, -2.90771484375, -2.7418212890625, -2.575927734375, -2.4100341796875, -2.244140625, -2.0782470703125, -1.912353515625, -1.7464599609375, -1.58056640625, -1.4146728515625, -1.248779296875, -1.0828857421875, -0.9169921875, -0.7510986328125, -0.585205078125, -0.4193115234375, -0.25341796875, -0.0875244140625, 0.078369140625, 0.2442626953125, 0.41015625, 0.5760498046875, 0.741943359375, 0.9078369140625, 1.07373046875, 1.2396240234375, 1.405517578125, 1.5714111328125, 1.7373046875, 1.9031982421875, 2.069091796875, 2.2349853515625, 2.40087890625, 2.5667724609375, 2.732666015625, 2.8985595703125, 3.064453125, 3.2303466796875, 3.396240234375, 3.5621337890625, 3.72802734375, 3.8939208984375, 4.059814453125, 4.2257080078125, 4.3916015625, 4.5574951171875, 4.723388671875, 4.8892822265625, 5.05517578125, 5.2210693359375, 5.386962890625, 5.5528564453125, 5.71875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 11.0, 11.0, 21.0, 29.0, 35.0, 71.0, 89.0, 130.0, 206.0, 305.0, 480.0, 613.0, 631.0, 488.0, 315.0, 203.0, 135.0, 87.0, 81.0, 40.0, 32.0, 19.0, 10.0, 7.0, 6.0, 5.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.41796875, -7.22271728515625, -7.0274658203125, -6.83221435546875, -6.636962890625, -6.44171142578125, -6.2464599609375, -6.05120849609375, -5.85595703125, -5.66070556640625, -5.4654541015625, -5.27020263671875, -5.074951171875, -4.87969970703125, -4.6844482421875, -4.48919677734375, -4.2939453125, -4.09869384765625, -3.9034423828125, -3.70819091796875, -3.512939453125, -3.31768798828125, -3.1224365234375, -2.92718505859375, -2.73193359375, -2.53668212890625, -2.3414306640625, -2.14617919921875, -1.950927734375, -1.75567626953125, -1.5604248046875, -1.36517333984375, -1.169921875, -0.97467041015625, -0.7794189453125, -0.58416748046875, -0.388916015625, -0.19366455078125, 0.0015869140625, 0.19683837890625, 0.39208984375, 0.58734130859375, 0.7825927734375, 0.97784423828125, 1.173095703125, 1.36834716796875, 1.5635986328125, 1.75885009765625, 1.9541015625, 2.14935302734375, 2.3446044921875, 2.53985595703125, 2.735107421875, 2.93035888671875, 3.1256103515625, 3.32086181640625, 3.51611328125, 3.71136474609375, 3.9066162109375, 4.10186767578125, 4.297119140625, 4.49237060546875, 4.6876220703125, 4.88287353515625, 5.078125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 11.0, 11.0, 33.0, 44.0, 84.0, 132.0, 214.0, 526.0, 2032.0, 30677.0, 2043759.0, 2082324.0, 31433.0, 1987.0, 495.0, 201.0, 110.0, 82.0, 44.0, 12.0, 21.0, 16.0, 7.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.84375, -11.328857421875, -10.81396484375, -10.299072265625, -9.7841796875, -9.269287109375, -8.75439453125, -8.239501953125, -7.724609375, -7.209716796875, -6.69482421875, -6.179931640625, -5.6650390625, -5.150146484375, -4.63525390625, -4.120361328125, -3.60546875, -3.090576171875, -2.57568359375, -2.060791015625, -1.5458984375, -1.031005859375, -0.51611328125, -0.001220703125, 0.513671875, 1.028564453125, 1.54345703125, 2.058349609375, 2.5732421875, 3.088134765625, 3.60302734375, 4.117919921875, 4.6328125, 5.147705078125, 5.66259765625, 6.177490234375, 6.6923828125, 7.207275390625, 7.72216796875, 8.237060546875, 8.751953125, 9.266845703125, 9.78173828125, 10.296630859375, 10.8115234375, 11.326416015625, 11.84130859375, 12.356201171875, 12.87109375, 13.385986328125, 13.90087890625, 14.415771484375, 14.9306640625, 15.445556640625, 15.96044921875, 16.475341796875, 16.990234375, 17.505126953125, 18.02001953125, 18.534912109375, 19.0498046875, 19.564697265625, 20.07958984375, 20.594482421875, 21.109375]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 15.0, 22.0, 24.0, 18.0, 24.0, 40.0, 37.0, 45.0, 66.0, 68.0, 63.0, 60.0, 61.0, 61.0, 58.0, 67.0, 51.0, 35.0, 30.0, 25.0, 36.0, 22.0, 20.0, 18.0, 9.0, 3.0, 1.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.389070510864258, -15.908631324768066, -15.428192138671875, -14.947752952575684, -14.467313766479492, -13.9868745803833, -13.50643539428711, -13.025996208190918, -12.545557022094727, -12.065117835998535, -11.584678649902344, -11.104239463806152, -10.623800277709961, -10.14336109161377, -9.662921905517578, -9.182482719421387, -8.702043533325195, -8.221604347229004, -7.7411651611328125, -7.260725975036621, -6.78028678894043, -6.299847602844238, -5.819408416748047, -5.3389692306518555, -4.858530044555664, -4.378090858459473, -3.8976516723632812, -3.41721248626709, -2.9367733001708984, -2.456334114074707, -1.9758949279785156, -1.4954557418823242, -1.0150165557861328, -0.5345773696899414, -0.05413818359375, 0.4263010025024414, 0.9067401885986328, 1.3871793746948242, 1.8676185607910156, 2.348057746887207, 2.8284969329833984, 3.30893611907959, 3.7893753051757812, 4.269814491271973, 4.750253677368164, 5.2306928634643555, 5.711132049560547, 6.191571235656738, 6.67201042175293, 7.152449607849121, 7.6328887939453125, 8.113327980041504, 8.593767166137695, 9.074206352233887, 9.554645538330078, 10.03508472442627, 10.515523910522461, 10.995963096618652, 11.476402282714844, 11.956841468811035, 12.437280654907227, 12.917719841003418, 13.39815902709961, 13.8785982131958, 14.359037399291992]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 2.0, 5.0, 11.0, 4.0, 8.0, 15.0, 17.0, 16.0, 23.0, 24.0, 34.0, 23.0, 38.0, 37.0, 40.0, 44.0, 47.0, 32.0, 54.0, 47.0, 42.0, 48.0, 47.0, 33.0, 38.0, 27.0, 36.0, 30.0, 31.0, 19.0, 25.0, 12.0, 22.0, 16.0, 15.0, 10.0, 8.0, 5.0, 5.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-19.84613037109375, -19.331809997558594, -18.81749153137207, -18.303171157836914, -17.788850784301758, -17.2745304107666, -16.760211944580078, -16.245891571044922, -15.731571197509766, -15.217251777648926, -14.70293140411377, -14.18861198425293, -13.674291610717773, -13.159972190856934, -12.645652770996094, -12.131332397460938, -11.617012977600098, -11.102693557739258, -10.588373184204102, -10.074053764343262, -9.559733390808105, -9.045413970947266, -8.53109359741211, -8.01677417755127, -7.5024542808532715, -6.988134384155273, -6.473814487457275, -5.959494590759277, -5.4451751708984375, -4.930854797363281, -4.416535377502441, -3.9022154808044434, -3.3878955841064453, -2.8735756874084473, -2.359255790710449, -1.8449361324310303, -1.3306162357330322, -0.8162963390350342, -0.30197668075561523, 0.2123432159423828, 0.7266631126403809, 1.240983009338379, 1.7553027868270874, 2.269622564315796, 2.783942461013794, 3.298262357711792, 3.812582015991211, 4.326901912689209, 4.841221809387207, 5.355541706085205, 5.869861602783203, 6.384181022644043, 6.898501396179199, 7.412820816040039, 7.927140712738037, 8.441460609436035, 8.955780029296875, 9.470099449157715, 9.984419822692871, 10.498739242553711, 11.013059616088867, 11.527379035949707, 12.041698455810547, 12.556018829345703, 13.07033920288086]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 5.0, 2.0, 1.0, 9.0, 8.0, 5.0, 6.0, 6.0, 9.0, 10.0, 14.0, 21.0, 12.0, 23.0, 25.0, 16.0, 33.0, 22.0, 35.0, 30.0, 24.0, 33.0, 37.0, 38.0, 37.0, 31.0, 32.0, 31.0, 32.0, 38.0, 30.0, 40.0, 31.0, 34.0, 24.0, 24.0, 25.0, 27.0, 14.0, 13.0, 9.0, 21.0, 17.0, 11.0, 16.0, 10.0, 5.0, 6.0, 8.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.4365234375, -1.3918914794921875, -1.347259521484375, -1.3026275634765625, -1.25799560546875, -1.2133636474609375, -1.168731689453125, -1.1240997314453125, -1.0794677734375, -1.0348358154296875, -0.990203857421875, -0.9455718994140625, -0.90093994140625, -0.8563079833984375, -0.811676025390625, -0.7670440673828125, -0.722412109375, -0.6777801513671875, -0.633148193359375, -0.5885162353515625, -0.54388427734375, -0.4992523193359375, -0.454620361328125, -0.4099884033203125, -0.3653564453125, -0.3207244873046875, -0.276092529296875, -0.2314605712890625, -0.18682861328125, -0.1421966552734375, -0.097564697265625, -0.0529327392578125, -0.00830078125, 0.0363311767578125, 0.080963134765625, 0.1255950927734375, 0.17022705078125, 0.2148590087890625, 0.259490966796875, 0.3041229248046875, 0.3487548828125, 0.3933868408203125, 0.438018798828125, 0.4826507568359375, 0.52728271484375, 0.5719146728515625, 0.616546630859375, 0.6611785888671875, 0.705810546875, 0.7504425048828125, 0.795074462890625, 0.8397064208984375, 0.88433837890625, 0.9289703369140625, 0.973602294921875, 1.0182342529296875, 1.0628662109375, 1.1074981689453125, 1.152130126953125, 1.1967620849609375, 1.24139404296875, 1.2860260009765625, 1.330657958984375, 1.3752899169921875, 1.419921875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 12.0, 3.0, 15.0, 30.0, 38.0, 58.0, 92.0, 142.0, 211.0, 324.0, 486.0, 771.0, 1143.0, 1678.0, 2631.0, 3845.0, 6118.0, 9237.0, 13981.0, 21609.0, 33323.0, 51112.0, 77216.0, 113347.0, 152383.0, 162407.0, 129419.0, 91174.0, 61104.0, 39924.0, 25976.0, 16816.0, 11217.0, 7136.0, 4555.0, 3068.0, 2100.0, 1298.0, 881.0, 557.0, 388.0, 254.0, 179.0, 107.0, 72.0, 40.0, 29.0, 25.0, 12.0, 5.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0], "bins": [-0.1644287109375, -0.15947723388671875, -0.1545257568359375, -0.14957427978515625, -0.144622802734375, -0.13967132568359375, -0.1347198486328125, -0.12976837158203125, -0.12481689453125, -0.11986541748046875, -0.1149139404296875, -0.10996246337890625, -0.105010986328125, -0.10005950927734375, -0.0951080322265625, -0.09015655517578125, -0.085205078125, -0.08025360107421875, -0.0753021240234375, -0.07035064697265625, -0.065399169921875, -0.06044769287109375, -0.0554962158203125, -0.05054473876953125, -0.04559326171875, -0.04064178466796875, -0.0356903076171875, -0.03073883056640625, -0.025787353515625, -0.02083587646484375, -0.0158843994140625, -0.01093292236328125, -0.0059814453125, -0.00102996826171875, 0.0039215087890625, 0.00887298583984375, 0.013824462890625, 0.01877593994140625, 0.0237274169921875, 0.02867889404296875, 0.03363037109375, 0.03858184814453125, 0.0435333251953125, 0.04848480224609375, 0.053436279296875, 0.05838775634765625, 0.0633392333984375, 0.06829071044921875, 0.0732421875, 0.07819366455078125, 0.0831451416015625, 0.08809661865234375, 0.093048095703125, 0.09799957275390625, 0.1029510498046875, 0.10790252685546875, 0.11285400390625, 0.11780548095703125, 0.1227569580078125, 0.12770843505859375, 0.132659912109375, 0.13761138916015625, 0.1425628662109375, 0.14751434326171875, 0.1524658203125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 2.0, 7.0, 4.0, 8.0, 16.0, 11.0, 14.0, 13.0, 17.0, 17.0, 18.0, 17.0, 14.0, 31.0, 28.0, 26.0, 29.0, 24.0, 32.0, 33.0, 42.0, 41.0, 31.0, 1056.0, 53.0, 41.0, 46.0, 37.0, 26.0, 29.0, 37.0, 33.0, 23.0, 21.0, 23.0, 23.0, 21.0, 18.0, 24.0, 4.0, 5.0, 5.0, 5.0, 5.0, 4.0, 3.0, 4.0, 3.0, 1.0, 3.0, 4.0], "bins": [-1.3359375, -1.298919677734375, -1.26190185546875, -1.224884033203125, -1.1878662109375, -1.150848388671875, -1.11383056640625, -1.076812744140625, -1.039794921875, -1.002777099609375, -0.96575927734375, -0.928741455078125, -0.8917236328125, -0.854705810546875, -0.81768798828125, -0.780670166015625, -0.74365234375, -0.706634521484375, -0.66961669921875, -0.632598876953125, -0.5955810546875, -0.558563232421875, -0.52154541015625, -0.484527587890625, -0.447509765625, -0.410491943359375, -0.37347412109375, -0.336456298828125, -0.2994384765625, -0.262420654296875, -0.22540283203125, -0.188385009765625, -0.1513671875, -0.114349365234375, -0.07733154296875, -0.040313720703125, -0.0032958984375, 0.033721923828125, 0.07073974609375, 0.107757568359375, 0.144775390625, 0.181793212890625, 0.21881103515625, 0.255828857421875, 0.2928466796875, 0.329864501953125, 0.36688232421875, 0.403900146484375, 0.44091796875, 0.477935791015625, 0.51495361328125, 0.551971435546875, 0.5889892578125, 0.626007080078125, 0.66302490234375, 0.700042724609375, 0.737060546875, 0.774078369140625, 0.81109619140625, 0.848114013671875, 0.8851318359375, 0.922149658203125, 0.95916748046875, 0.996185302734375, 1.033203125]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 6.0, 15.0, 17.0, 22.0, 21.0, 36.0, 60.0, 75.0, 138.0, 203.0, 355.0, 487.0, 829.0, 1299.0, 2155.0, 3642.0, 6045.0, 9645.0, 16192.0, 26170.0, 44263.0, 73750.0, 119911.0, 205968.0, 1206632.0, 145925.0, 92186.0, 56245.0, 33503.0, 20055.0, 12190.0, 7517.0, 4457.0, 2723.0, 1626.0, 994.0, 665.0, 406.0, 237.0, 173.0, 99.0, 72.0, 44.0, 38.0, 17.0, 11.0, 7.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.10174560546875, -0.09868335723876953, -0.09562110900878906, -0.0925588607788086, -0.08949661254882812, -0.08643436431884766, -0.08337211608886719, -0.08030986785888672, -0.07724761962890625, -0.07418537139892578, -0.07112312316894531, -0.06806087493896484, -0.06499862670898438, -0.061936378479003906, -0.05887413024902344, -0.05581188201904297, -0.0527496337890625, -0.04968738555908203, -0.04662513732910156, -0.043562889099121094, -0.040500640869140625, -0.037438392639160156, -0.03437614440917969, -0.03131389617919922, -0.02825164794921875, -0.02518939971923828, -0.022127151489257812, -0.019064903259277344, -0.016002655029296875, -0.012940406799316406, -0.009878158569335938, -0.006815910339355469, -0.003753662109375, -0.0006914138793945312, 0.0023708343505859375, 0.005433082580566406, 0.008495330810546875, 0.011557579040527344, 0.014619827270507812, 0.01768207550048828, 0.02074432373046875, 0.02380657196044922, 0.026868820190429688, 0.029931068420410156, 0.032993316650390625, 0.036055564880371094, 0.03911781311035156, 0.04218006134033203, 0.0452423095703125, 0.04830455780029297, 0.05136680603027344, 0.054429054260253906, 0.057491302490234375, 0.060553550720214844, 0.06361579895019531, 0.06667804718017578, 0.06974029541015625, 0.07280254364013672, 0.07586479187011719, 0.07892704010009766, 0.08198928833007812, 0.0850515365600586, 0.08811378479003906, 0.09117603302001953, 0.09423828125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 1.0, 7.0, 7.0, 9.0, 7.0, 10.0, 7.0, 14.0, 12.0, 15.0, 16.0, 11.0, 25.0, 29.0, 27.0, 54.0, 51.0, 82.0, 80.0, 97.0, 76.0, 55.0, 42.0, 56.0, 38.0, 18.0, 25.0, 15.0, 16.0, 11.0, 14.0, 13.0, 8.0, 6.0, 13.0, 6.0, 5.0, 9.0, 3.0, 3.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0064697265625, -0.006255030632019043, -0.006040334701538086, -0.005825638771057129, -0.005610942840576172, -0.005396246910095215, -0.005181550979614258, -0.004966855049133301, -0.004752159118652344, -0.004537463188171387, -0.00432276725769043, -0.004108071327209473, -0.0038933753967285156, -0.0036786794662475586, -0.0034639835357666016, -0.0032492876052856445, -0.0030345916748046875, -0.0028198957443237305, -0.0026051998138427734, -0.0023905038833618164, -0.0021758079528808594, -0.0019611120223999023, -0.0017464160919189453, -0.0015317201614379883, -0.0013170242309570312, -0.0011023283004760742, -0.0008876323699951172, -0.0006729364395141602, -0.0004582405090332031, -0.0002435445785522461, -2.8848648071289062e-05, 0.00018584728240966797, 0.000400543212890625, 0.000615239143371582, 0.0008299350738525391, 0.001044631004333496, 0.0012593269348144531, 0.0014740228652954102, 0.0016887187957763672, 0.0019034147262573242, 0.0021181106567382812, 0.0023328065872192383, 0.0025475025177001953, 0.0027621984481811523, 0.0029768943786621094, 0.0031915903091430664, 0.0034062862396240234, 0.0036209821701049805, 0.0038356781005859375, 0.0040503740310668945, 0.0042650699615478516, 0.004479765892028809, 0.004694461822509766, 0.004909157752990723, 0.00512385368347168, 0.005338549613952637, 0.005553245544433594, 0.005767941474914551, 0.005982637405395508, 0.006197333335876465, 0.006412029266357422, 0.006626725196838379, 0.006841421127319336, 0.007056117057800293, 0.00727081298828125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 7.0, 6.0, 5.0, 6.0, 8.0, 9.0, 9.0, 16.0, 17.0, 20.0, 29.0, 41.0, 59.0, 93.0, 166.0, 366.0, 1008.0, 3882.0, 26948.0, 766563.0, 232038.0, 13296.0, 2558.0, 703.0, 290.0, 127.0, 87.0, 46.0, 33.0, 29.0, 16.0, 16.0, 9.0, 7.0, 9.0, 8.0, 10.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.12445068359375, -0.12066173553466797, -0.11687278747558594, -0.1130838394165039, -0.10929489135742188, -0.10550594329833984, -0.10171699523925781, -0.09792804718017578, -0.09413909912109375, -0.09035015106201172, -0.08656120300292969, -0.08277225494384766, -0.07898330688476562, -0.0751943588256836, -0.07140541076660156, -0.06761646270751953, -0.0638275146484375, -0.06003856658935547, -0.05624961853027344, -0.052460670471191406, -0.048671722412109375, -0.044882774353027344, -0.04109382629394531, -0.03730487823486328, -0.03351593017578125, -0.02972698211669922, -0.025938034057617188, -0.022149085998535156, -0.018360137939453125, -0.014571189880371094, -0.010782241821289062, -0.006993293762207031, -0.003204345703125, 0.0005846023559570312, 0.0043735504150390625, 0.008162498474121094, 0.011951446533203125, 0.015740394592285156, 0.019529342651367188, 0.02331829071044922, 0.02710723876953125, 0.03089618682861328, 0.03468513488769531, 0.038474082946777344, 0.042263031005859375, 0.046051979064941406, 0.04984092712402344, 0.05362987518310547, 0.0574188232421875, 0.06120777130126953, 0.06499671936035156, 0.0687856674194336, 0.07257461547851562, 0.07636356353759766, 0.08015251159667969, 0.08394145965576172, 0.08773040771484375, 0.09151935577392578, 0.09530830383300781, 0.09909725189208984, 0.10288619995117188, 0.1066751480102539, 0.11046409606933594, 0.11425304412841797, 0.1180419921875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 4.0, 2.0, 9.0, 6.0, 24.0, 21.0, 39.0, 55.0, 72.0, 109.0, 232.0, 160.0, 89.0, 57.0, 31.0, 29.0, 23.0, 12.0, 7.0, 3.0, 6.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044838305562734604, -0.04316065460443497, -0.04148300364613533, -0.03980535268783569, -0.03812769800424576, -0.03645004704594612, -0.034772396087646484, -0.03309474512934685, -0.03141709417104721, -0.029739443212747574, -0.028061790391802788, -0.02638413943350315, -0.024706486612558365, -0.023028835654258728, -0.02135118469595909, -0.019673533737659454, -0.01799587905406952, -0.016318228095769882, -0.014640575274825096, -0.01296292431652546, -0.011285272426903248, -0.009607620537281036, -0.0079299695789814, -0.006252317689359188, -0.004574665799736977, -0.002897014142945409, -0.001219362486153841, 0.00045828893780708313, 0.0021359408274292946, 0.003813592717051506, 0.005491243675351143, 0.007168895564973354, 0.008846551179885864, 0.010524203069508076, 0.012201854959130287, 0.013879505917429924, 0.015557157807052135, 0.017234809696674347, 0.018912460654973984, 0.02059011161327362, 0.022267764434218407, 0.023945415392518044, 0.02562306821346283, 0.027300719171762466, 0.028978370130062103, 0.03065602295100689, 0.03233367204666138, 0.03401132673025131, 0.03568897768855095, 0.037366628646850586, 0.03904427960515022, 0.04072193056344986, 0.042399585247039795, 0.04407723620533943, 0.04575488716363907, 0.047432538121938705, 0.04911018908023834, 0.05078784003853798, 0.052465490996837616, 0.05414314568042755, 0.05582079663872719, 0.057498447597026825, 0.05917609855532646, 0.0608537495136261, 0.06253140419721603]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 5.0, 8.0, 4.0, 6.0, 9.0, 10.0, 10.0, 11.0, 13.0, 18.0, 20.0, 20.0, 27.0, 27.0, 32.0, 26.0, 19.0, 40.0, 33.0, 27.0, 28.0, 24.0, 30.0, 30.0, 37.0, 35.0, 30.0, 43.0, 38.0, 23.0, 26.0, 32.0, 26.0, 21.0, 27.0, 23.0, 21.0, 16.0, 19.0, 15.0, 14.0, 10.0, 12.0, 9.0, 6.0, 7.0, 7.0, 6.0, 3.0, 7.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 2.0], "bins": [-0.0170099139213562, -0.01646992191672325, -0.01592993177473545, -0.015389940701425076, -0.0148499496281147, -0.014309958554804325, -0.01376996748149395, -0.013229976408183575, -0.0126899853348732, -0.012149994261562824, -0.011610003188252449, -0.011070012114942074, -0.010530021041631699, -0.009990029968321323, -0.009450038895010948, -0.008910047821700573, -0.008370056748390198, -0.007830065675079823, -0.007290074601769447, -0.006750083528459072, -0.006210092455148697, -0.005670101381838322, -0.0051301103085279465, -0.004590119235217571, -0.004050128161907196, -0.003510137088596821, -0.0029701460152864456, -0.0024301549419760704, -0.0018901638686656952, -0.00135017279535532, -0.0008101817220449448, -0.00027019064873456955, 0.00026980042457580566, 0.0008097914978861809, 0.001349782571196556, 0.0018897736445069313, 0.0024297647178173065, 0.0029697557911276817, 0.003509746864438057, 0.004049737937748432, 0.004589729011058807, 0.005129720084369183, 0.005669711157679558, 0.006209702230989933, 0.006749693304300308, 0.0072896843776106834, 0.007829675450921059, 0.008369666524231434, 0.008909657597541809, 0.009449648670852184, 0.00998963974416256, 0.010529630817472935, 0.01106962189078331, 0.011609612964093685, 0.01214960403740406, 0.012689595110714436, 0.01322958618402481, 0.013769577257335186, 0.014309568330645561, 0.014849559403955936, 0.015389550477266312, 0.01592954248189926, 0.016469532623887062, 0.017009522765874863, 0.017549514770507812]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 2.0, 1.0, 9.0, 8.0, 5.0, 6.0, 6.0, 9.0, 10.0, 15.0, 20.0, 12.0, 23.0, 26.0, 15.0, 33.0, 22.0, 35.0, 30.0, 24.0, 33.0, 37.0, 38.0, 37.0, 31.0, 32.0, 32.0, 31.0, 38.0, 30.0, 40.0, 31.0, 34.0, 24.0, 23.0, 26.0, 27.0, 13.0, 14.0, 10.0, 19.0, 17.0, 12.0, 16.0, 10.0, 5.0, 6.0, 8.0, 4.0, 4.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.435546875, -1.3909454345703125, -1.346343994140625, -1.3017425537109375, -1.25714111328125, -1.2125396728515625, -1.167938232421875, -1.1233367919921875, -1.0787353515625, -1.0341339111328125, -0.989532470703125, -0.9449310302734375, -0.90032958984375, -0.8557281494140625, -0.811126708984375, -0.7665252685546875, -0.721923828125, -0.6773223876953125, -0.632720947265625, -0.5881195068359375, -0.54351806640625, -0.4989166259765625, -0.454315185546875, -0.4097137451171875, -0.3651123046875, -0.3205108642578125, -0.275909423828125, -0.2313079833984375, -0.18670654296875, -0.1421051025390625, -0.097503662109375, -0.0529022216796875, -0.00830078125, 0.0363006591796875, 0.080902099609375, 0.1255035400390625, 0.17010498046875, 0.2147064208984375, 0.259307861328125, 0.3039093017578125, 0.3485107421875, 0.3931121826171875, 0.437713623046875, 0.4823150634765625, 0.52691650390625, 0.5715179443359375, 0.616119384765625, 0.6607208251953125, 0.705322265625, 0.7499237060546875, 0.794525146484375, 0.8391265869140625, 0.88372802734375, 0.9283294677734375, 0.972930908203125, 1.0175323486328125, 1.0621337890625, 1.1067352294921875, 1.151336669921875, 1.1959381103515625, 1.24053955078125, 1.2851409912109375, 1.329742431640625, 1.3743438720703125, 1.4189453125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 7.0, 12.0, 23.0, 35.0, 50.0, 83.0, 120.0, 201.0, 332.0, 526.0, 839.0, 1368.0, 2165.0, 3490.0, 5660.0, 8775.0, 14038.0, 22238.0, 36184.0, 59925.0, 107393.0, 198495.0, 242074.0, 145261.0, 78499.0, 45682.0, 28075.0, 17430.0, 10961.0, 6924.0, 4409.0, 2760.0, 1680.0, 1078.0, 667.0, 391.0, 242.0, 195.0, 108.0, 64.0, 45.0, 19.0, 15.0, 10.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4638671875, -1.4170074462890625, -1.370147705078125, -1.3232879638671875, -1.27642822265625, -1.2295684814453125, -1.182708740234375, -1.1358489990234375, -1.0889892578125, -1.0421295166015625, -0.995269775390625, -0.9484100341796875, -0.90155029296875, -0.8546905517578125, -0.807830810546875, -0.7609710693359375, -0.714111328125, -0.6672515869140625, -0.620391845703125, -0.5735321044921875, -0.52667236328125, -0.4798126220703125, -0.432952880859375, -0.3860931396484375, -0.3392333984375, -0.2923736572265625, -0.245513916015625, -0.1986541748046875, -0.15179443359375, -0.1049346923828125, -0.058074951171875, -0.0112152099609375, 0.03564453125, 0.0825042724609375, 0.129364013671875, 0.1762237548828125, 0.22308349609375, 0.2699432373046875, 0.316802978515625, 0.3636627197265625, 0.4105224609375, 0.4573822021484375, 0.504241943359375, 0.5511016845703125, 0.59796142578125, 0.6448211669921875, 0.691680908203125, 0.7385406494140625, 0.785400390625, 0.8322601318359375, 0.879119873046875, 0.9259796142578125, 0.97283935546875, 1.0196990966796875, 1.066558837890625, 1.1134185791015625, 1.1602783203125, 1.2071380615234375, 1.253997802734375, 1.3008575439453125, 1.34771728515625, 1.3945770263671875, 1.441436767578125, 1.4882965087890625, 1.53515625]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 3.0, 8.0, 3.0, 18.0, 8.0, 11.0, 15.0, 20.0, 21.0, 35.0, 24.0, 31.0, 35.0, 46.0, 51.0, 81.0, 149.0, 272.0, 1483.0, 230.0, 101.0, 57.0, 49.0, 48.0, 41.0, 34.0, 40.0, 30.0, 15.0, 17.0, 17.0, 15.0, 9.0, 6.0, 2.0, 10.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.04296875, -6.8104248046875, -6.577880859375, -6.3453369140625, -6.11279296875, -5.8802490234375, -5.647705078125, -5.4151611328125, -5.1826171875, -4.9500732421875, -4.717529296875, -4.4849853515625, -4.25244140625, -4.0198974609375, -3.787353515625, -3.5548095703125, -3.322265625, -3.0897216796875, -2.857177734375, -2.6246337890625, -2.39208984375, -2.1595458984375, -1.927001953125, -1.6944580078125, -1.4619140625, -1.2293701171875, -0.996826171875, -0.7642822265625, -0.53173828125, -0.2991943359375, -0.066650390625, 0.1658935546875, 0.3984375, 0.6309814453125, 0.863525390625, 1.0960693359375, 1.32861328125, 1.5611572265625, 1.793701171875, 2.0262451171875, 2.2587890625, 2.4913330078125, 2.723876953125, 2.9564208984375, 3.18896484375, 3.4215087890625, 3.654052734375, 3.8865966796875, 4.119140625, 4.3516845703125, 4.584228515625, 4.8167724609375, 5.04931640625, 5.2818603515625, 5.514404296875, 5.7469482421875, 5.9794921875, 6.2120361328125, 6.444580078125, 6.6771240234375, 6.90966796875, 7.1422119140625, 7.374755859375, 7.6072998046875, 7.83984375]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 4.0, 1.0, 3.0, 6.0, 9.0, 23.0, 20.0, 21.0, 21.0, 44.0, 51.0, 57.0, 113.0, 169.0, 219.0, 404.0, 1052.0, 11597.0, 1238559.0, 1876664.0, 14315.0, 1172.0, 406.0, 244.0, 149.0, 99.0, 80.0, 45.0, 46.0, 30.0, 20.0, 13.0, 14.0, 10.0, 8.0, 6.0, 4.0, 6.0, 0.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.984375, -13.502685546875, -13.02099609375, -12.539306640625, -12.0576171875, -11.575927734375, -11.09423828125, -10.612548828125, -10.130859375, -9.649169921875, -9.16748046875, -8.685791015625, -8.2041015625, -7.722412109375, -7.24072265625, -6.759033203125, -6.27734375, -5.795654296875, -5.31396484375, -4.832275390625, -4.3505859375, -3.868896484375, -3.38720703125, -2.905517578125, -2.423828125, -1.942138671875, -1.46044921875, -0.978759765625, -0.4970703125, -0.015380859375, 0.46630859375, 0.947998046875, 1.4296875, 1.911376953125, 2.39306640625, 2.874755859375, 3.3564453125, 3.838134765625, 4.31982421875, 4.801513671875, 5.283203125, 5.764892578125, 6.24658203125, 6.728271484375, 7.2099609375, 7.691650390625, 8.17333984375, 8.655029296875, 9.13671875, 9.618408203125, 10.10009765625, 10.581787109375, 11.0634765625, 11.545166015625, 12.02685546875, 12.508544921875, 12.990234375, 13.471923828125, 13.95361328125, 14.435302734375, 14.9169921875, 15.398681640625, 15.88037109375, 16.362060546875, 16.84375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [609.0, 410.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.447629928588867, 0.2961602210998535, 6.039950370788574, 11.783740997314453, 17.527530670166016, 23.271320343017578, 29.015111923217773, 34.75890350341797, 40.50269317626953, 46.246482849121094, 51.990272521972656, 57.73406219482422, 63.47785186767578, 69.22164154052734, 74.96543884277344, 80.709228515625, 86.45301055908203, 92.1968002319336, 97.94058990478516, 103.68437957763672, 109.42816925048828, 115.17195892333984, 120.91575622558594, 126.6595458984375, 132.40333557128906, 138.14712524414062, 143.8909149169922, 149.63470458984375, 155.3784942626953, 161.12228393554688, 166.86607360839844, 172.60986328125, 178.35365295410156, 184.09744262695312, 189.8412322998047, 195.58502197265625, 201.3288116455078, 207.07260131835938, 212.81639099121094, 218.5601806640625, 224.30397033691406, 230.04776000976562, 235.7915496826172, 241.53533935546875, 247.2791290283203, 253.02291870117188, 258.7667236328125, 264.510498046875, 270.2543029785156, 275.99810791015625, 281.74188232421875, 287.4856872558594, 293.2294616699219, 298.9732666015625, 304.717041015625, 310.4608459472656, 316.2046203613281, 321.94842529296875, 327.69219970703125, 333.4360046386719, 339.1797790527344, 344.923583984375, 350.6673583984375, 356.4111633300781, 362.1549377441406]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 5.0, 5.0, 7.0, 23.0, 10.0, 26.0, 17.0, 27.0, 26.0, 36.0, 33.0, 34.0, 39.0, 37.0, 34.0, 28.0, 33.0, 39.0, 34.0, 42.0, 51.0, 31.0, 38.0, 43.0, 35.0, 30.0, 37.0, 37.0, 32.0, 22.0, 22.0, 9.0, 13.0, 8.0, 10.0, 10.0, 9.0, 5.0, 3.0, 1.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.397764205932617, -17.783998489379883, -17.17023277282715, -16.556467056274414, -15.94270133972168, -15.328935623168945, -14.715168952941895, -14.10140323638916, -13.487637519836426, -12.873871803283691, -12.260106086730957, -11.646340370178223, -11.032573699951172, -10.418807983398438, -9.805042266845703, -9.191276550292969, -8.577510833740234, -7.9637451171875, -7.349979400634766, -6.736213207244873, -6.122447490692139, -5.508681774139404, -4.894915580749512, -4.281149864196777, -3.667384147644043, -3.0536184310913086, -2.439852476119995, -1.8260866403579712, -1.2123208045959473, -0.5985550880432129, 0.015210866928100586, 0.6289768218994141, 1.2427406311035156, 1.8565064668655396, 2.4702723026275635, 3.084038257598877, 3.6978039741516113, 4.311569690704346, 4.925335884094238, 5.539101600646973, 6.152867317199707, 6.766633033752441, 7.380398750305176, 7.994164943695068, 8.607931137084961, 9.221696853637695, 9.83546257019043, 10.449228286743164, 11.062994003295898, 11.676759719848633, 12.290525436401367, 12.904291152954102, 13.518056869506836, 14.13182258605957, 14.745589256286621, 15.359354972839355, 15.97312068939209, 16.58688735961914, 17.200653076171875, 17.81441879272461, 18.428184509277344, 19.041950225830078, 19.655715942382812, 20.269481658935547, 20.88324737548828]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 4.0, 5.0, 8.0, 4.0, 11.0, 9.0, 12.0, 19.0, 10.0, 22.0, 20.0, 19.0, 19.0, 30.0, 26.0, 21.0, 33.0, 28.0, 46.0, 39.0, 39.0, 37.0, 33.0, 49.0, 31.0, 37.0, 39.0, 37.0, 26.0, 41.0, 31.0, 27.0, 25.0, 15.0, 26.0, 17.0, 22.0, 14.0, 12.0, 12.0, 11.0, 6.0, 16.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.853515625, -1.8003082275390625, -1.747100830078125, -1.6938934326171875, -1.64068603515625, -1.5874786376953125, -1.534271240234375, -1.4810638427734375, -1.4278564453125, -1.3746490478515625, -1.321441650390625, -1.2682342529296875, -1.21502685546875, -1.1618194580078125, -1.108612060546875, -1.0554046630859375, -1.002197265625, -0.9489898681640625, -0.895782470703125, -0.8425750732421875, -0.78936767578125, -0.7361602783203125, -0.682952880859375, -0.6297454833984375, -0.5765380859375, -0.5233306884765625, -0.470123291015625, -0.4169158935546875, -0.36370849609375, -0.3105010986328125, -0.257293701171875, -0.2040863037109375, -0.15087890625, -0.0976715087890625, -0.044464111328125, 0.0087432861328125, 0.06195068359375, 0.1151580810546875, 0.168365478515625, 0.2215728759765625, 0.2747802734375, 0.3279876708984375, 0.381195068359375, 0.4344024658203125, 0.48760986328125, 0.5408172607421875, 0.594024658203125, 0.6472320556640625, 0.700439453125, 0.7536468505859375, 0.806854248046875, 0.8600616455078125, 0.91326904296875, 0.9664764404296875, 1.019683837890625, 1.0728912353515625, 1.1260986328125, 1.1793060302734375, 1.232513427734375, 1.2857208251953125, 1.33892822265625, 1.3921356201171875, 1.445343017578125, 1.4985504150390625, 1.5517578125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 1.0, 5.0, 6.0, 10.0, 6.0, 10.0, 16.0, 16.0, 22.0, 40.0, 45.0, 71.0, 99.0, 208.0, 350.0, 787.0, 1679.0, 4104.0, 11068.0, 31638.0, 98148.0, 326939.0, 1073322.0, 1646033.0, 698281.0, 204727.0, 62542.0, 21050.0, 7560.0, 2965.0, 1213.0, 585.0, 285.0, 154.0, 87.0, 58.0, 32.0, 26.0, 21.0, 13.0, 19.0, 8.0, 4.0, 4.0, 3.0, 11.0, 1.0, 4.0, 5.0, 2.0, 1.0, 0.0, 3.0], "bins": [-3.107421875, -3.016845703125, -2.92626953125, -2.835693359375, -2.7451171875, -2.654541015625, -2.56396484375, -2.473388671875, -2.3828125, -2.292236328125, -2.20166015625, -2.111083984375, -2.0205078125, -1.929931640625, -1.83935546875, -1.748779296875, -1.658203125, -1.567626953125, -1.47705078125, -1.386474609375, -1.2958984375, -1.205322265625, -1.11474609375, -1.024169921875, -0.93359375, -0.843017578125, -0.75244140625, -0.661865234375, -0.5712890625, -0.480712890625, -0.39013671875, -0.299560546875, -0.208984375, -0.118408203125, -0.02783203125, 0.062744140625, 0.1533203125, 0.243896484375, 0.33447265625, 0.425048828125, 0.515625, 0.606201171875, 0.69677734375, 0.787353515625, 0.8779296875, 0.968505859375, 1.05908203125, 1.149658203125, 1.240234375, 1.330810546875, 1.42138671875, 1.511962890625, 1.6025390625, 1.693115234375, 1.78369140625, 1.874267578125, 1.96484375, 2.055419921875, 2.14599609375, 2.236572265625, 2.3271484375, 2.417724609375, 2.50830078125, 2.598876953125, 2.689453125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 8.0, 10.0, 20.0, 23.0, 26.0, 52.0, 76.0, 114.0, 146.0, 207.0, 300.0, 378.0, 484.0, 498.0, 494.0, 346.0, 246.0, 183.0, 134.0, 103.0, 59.0, 49.0, 44.0, 22.0, 18.0, 10.0, 9.0, 3.0, 5.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-6.81640625, -6.65155029296875, -6.4866943359375, -6.32183837890625, -6.156982421875, -5.99212646484375, -5.8272705078125, -5.66241455078125, -5.49755859375, -5.33270263671875, -5.1678466796875, -5.00299072265625, -4.838134765625, -4.67327880859375, -4.5084228515625, -4.34356689453125, -4.1787109375, -4.01385498046875, -3.8489990234375, -3.68414306640625, -3.519287109375, -3.35443115234375, -3.1895751953125, -3.02471923828125, -2.85986328125, -2.69500732421875, -2.5301513671875, -2.36529541015625, -2.200439453125, -2.03558349609375, -1.8707275390625, -1.70587158203125, -1.541015625, -1.37615966796875, -1.2113037109375, -1.04644775390625, -0.881591796875, -0.71673583984375, -0.5518798828125, -0.38702392578125, -0.22216796875, -0.05731201171875, 0.1075439453125, 0.27239990234375, 0.437255859375, 0.60211181640625, 0.7669677734375, 0.93182373046875, 1.0966796875, 1.26153564453125, 1.4263916015625, 1.59124755859375, 1.756103515625, 1.92095947265625, 2.0858154296875, 2.25067138671875, 2.41552734375, 2.58038330078125, 2.7452392578125, 2.91009521484375, 3.074951171875, 3.23980712890625, 3.4046630859375, 3.56951904296875, 3.734375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 8.0, 9.0, 15.0, 18.0, 32.0, 44.0, 70.0, 92.0, 130.0, 216.0, 338.0, 761.0, 2472.0, 15581.0, 158292.0, 1744910.0, 2051636.0, 196117.0, 18910.0, 2888.0, 780.0, 345.0, 221.0, 138.0, 85.0, 63.0, 39.0, 29.0, 15.0, 14.0, 7.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.0625, -5.7874755859375, -5.512451171875, -5.2374267578125, -4.96240234375, -4.6873779296875, -4.412353515625, -4.1373291015625, -3.8623046875, -3.5872802734375, -3.312255859375, -3.0372314453125, -2.76220703125, -2.4871826171875, -2.212158203125, -1.9371337890625, -1.662109375, -1.3870849609375, -1.112060546875, -0.8370361328125, -0.56201171875, -0.2869873046875, -0.011962890625, 0.2630615234375, 0.5380859375, 0.8131103515625, 1.088134765625, 1.3631591796875, 1.63818359375, 1.9132080078125, 2.188232421875, 2.4632568359375, 2.73828125, 3.0133056640625, 3.288330078125, 3.5633544921875, 3.83837890625, 4.1134033203125, 4.388427734375, 4.6634521484375, 4.9384765625, 5.2135009765625, 5.488525390625, 5.7635498046875, 6.03857421875, 6.3135986328125, 6.588623046875, 6.8636474609375, 7.138671875, 7.4136962890625, 7.688720703125, 7.9637451171875, 8.23876953125, 8.5137939453125, 8.788818359375, 9.0638427734375, 9.3388671875, 9.6138916015625, 9.888916015625, 10.1639404296875, 10.43896484375, 10.7139892578125, 10.989013671875, 11.2640380859375, 11.5390625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 29.0, 68.0, 127.0, 170.0, 211.0, 188.0, 136.0, 56.0, 15.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.99323272705078, -41.537227630615234, -40.08122253417969, -38.625213623046875, -37.16920852661133, -35.71320343017578, -34.257198333740234, -32.80119323730469, -31.345186233520508, -29.88918113708496, -28.43317413330078, -26.977169036865234, -25.521163940429688, -24.065156936645508, -22.60915184020996, -21.15314483642578, -19.697139739990234, -18.241134643554688, -16.785127639770508, -15.329122543334961, -13.873116493225098, -12.417110443115234, -10.961105346679688, -9.505099296569824, -8.049093246459961, -6.593087196350098, -5.137081623077393, -3.6810760498046875, -2.225069999694824, -0.7690639495849609, 0.6869411468505859, 2.142947196960449, 3.598949432373047, 5.05495548248291, 6.510961055755615, 7.96696662902832, 9.422972679138184, 10.878978729248047, 12.334983825683594, 13.790989875793457, 15.24699592590332, 16.703001022338867, 18.159008026123047, 19.615013122558594, 21.07101821899414, 22.52702522277832, 23.983030319213867, 25.439037322998047, 26.895042419433594, 28.35104751586914, 29.80705451965332, 31.263059616088867, 32.71906661987305, 34.175071716308594, 35.63107681274414, 37.08708190917969, 38.5430908203125, 39.99909591674805, 41.455101013183594, 42.911109924316406, 44.36711502075195, 45.8231201171875, 47.27912521362305, 48.735130310058594, 50.19113540649414]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 6.0, 4.0, 3.0, 10.0, 11.0, 9.0, 13.0, 14.0, 18.0, 19.0, 24.0, 27.0, 28.0, 32.0, 44.0, 44.0, 41.0, 35.0, 47.0, 37.0, 40.0, 38.0, 44.0, 45.0, 51.0, 40.0, 32.0, 30.0, 37.0, 25.0, 21.0, 16.0, 28.0, 18.0, 17.0, 11.0, 9.0, 9.0, 10.0, 7.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.689109802246094, -12.217751502990723, -11.746392250061035, -11.275033950805664, -10.803675651550293, -10.332316398620605, -9.860958099365234, -9.389598846435547, -8.918240547180176, -8.446882247924805, -7.975523471832275, -7.504164695739746, -7.032805919647217, -6.5614471435546875, -6.090088844299316, -5.618730068206787, -5.147371768951416, -4.676012992858887, -4.204654693603516, -3.7332959175109863, -3.261937141418457, -2.790578603744507, -2.3192200660705566, -1.8478612899780273, -1.3765027523040771, -0.9051440954208374, -0.43378549814224243, 0.03757309913635254, 0.5089317560195923, 0.980290412902832, 1.4516489505767822, 1.9230077266693115, 2.3943662643432617, 2.865724802017212, 3.337083578109741, 3.8084421157836914, 4.279800891876221, 4.75115966796875, 5.222517967224121, 5.69387674331665, 6.16523551940918, 6.636594295501709, 7.10795259475708, 7.579311370849609, 8.05066967010498, 8.522028923034668, 8.993387222290039, 9.464746475219727, 9.936103820800781, 10.407462120056152, 10.87882137298584, 11.350179672241211, 11.821537971496582, 12.29289722442627, 12.76425552368164, 13.235614776611328, 13.7069730758667, 14.17833137512207, 14.649690628051758, 15.121048927307129, 15.5924072265625, 16.063766479492188, 16.535125732421875, 17.00648307800293, 17.477842330932617]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 6.0, 8.0, 7.0, 8.0, 13.0, 11.0, 23.0, 19.0, 23.0, 13.0, 20.0, 29.0, 22.0, 30.0, 36.0, 36.0, 31.0, 36.0, 40.0, 36.0, 36.0, 47.0, 35.0, 40.0, 38.0, 30.0, 26.0, 40.0, 36.0, 27.0, 34.0, 23.0, 20.0, 13.0, 13.0, 18.0, 10.0, 13.0, 11.0, 8.0, 8.0, 8.0, 8.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-1.97265625, -1.9188232421875, -1.864990234375, -1.8111572265625, -1.75732421875, -1.7034912109375, -1.649658203125, -1.5958251953125, -1.5419921875, -1.4881591796875, -1.434326171875, -1.3804931640625, -1.32666015625, -1.2728271484375, -1.218994140625, -1.1651611328125, -1.111328125, -1.0574951171875, -1.003662109375, -0.9498291015625, -0.89599609375, -0.8421630859375, -0.788330078125, -0.7344970703125, -0.6806640625, -0.6268310546875, -0.572998046875, -0.5191650390625, -0.46533203125, -0.4114990234375, -0.357666015625, -0.3038330078125, -0.25, -0.1961669921875, -0.142333984375, -0.0885009765625, -0.03466796875, 0.0191650390625, 0.072998046875, 0.1268310546875, 0.1806640625, 0.2344970703125, 0.288330078125, 0.3421630859375, 0.39599609375, 0.4498291015625, 0.503662109375, 0.5574951171875, 0.611328125, 0.6651611328125, 0.718994140625, 0.7728271484375, 0.82666015625, 0.8804931640625, 0.934326171875, 0.9881591796875, 1.0419921875, 1.0958251953125, 1.149658203125, 1.2034912109375, 1.25732421875, 1.3111572265625, 1.364990234375, 1.4188232421875, 1.47265625]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 7.0, 5.0, 8.0, 16.0, 28.0, 44.0, 81.0, 104.0, 151.0, 255.0, 374.0, 546.0, 869.0, 1387.0, 2021.0, 3130.0, 4690.0, 6912.0, 10736.0, 16274.0, 24552.0, 38400.0, 58738.0, 88667.0, 129066.0, 165426.0, 156757.0, 114622.0, 77333.0, 51201.0, 33230.0, 21500.0, 14159.0, 9142.0, 6130.0, 4002.0, 2773.0, 1801.0, 1186.0, 766.0, 546.0, 295.0, 204.0, 158.0, 106.0, 77.0, 32.0, 18.0, 17.0, 10.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1728515625, -0.16724586486816406, -0.16164016723632812, -0.1560344696044922, -0.15042877197265625, -0.1448230743408203, -0.13921737670898438, -0.13361167907714844, -0.1280059814453125, -0.12240028381347656, -0.11679458618164062, -0.11118888854980469, -0.10558319091796875, -0.09997749328613281, -0.09437179565429688, -0.08876609802246094, -0.083160400390625, -0.07755470275878906, -0.07194900512695312, -0.06634330749511719, -0.06073760986328125, -0.05513191223144531, -0.049526214599609375, -0.04392051696777344, -0.0383148193359375, -0.03270912170410156, -0.027103424072265625, -0.021497726440429688, -0.01589202880859375, -0.010286331176757812, -0.004680633544921875, 0.0009250640869140625, 0.00653076171875, 0.012136459350585938, 0.017742156982421875, 0.023347854614257812, 0.02895355224609375, 0.03455924987792969, 0.040164947509765625, 0.04577064514160156, 0.0513763427734375, 0.05698204040527344, 0.06258773803710938, 0.06819343566894531, 0.07379913330078125, 0.07940483093261719, 0.08501052856445312, 0.09061622619628906, 0.096221923828125, 0.10182762145996094, 0.10743331909179688, 0.11303901672363281, 0.11864471435546875, 0.12425041198730469, 0.12985610961914062, 0.13546180725097656, 0.1410675048828125, 0.14667320251464844, 0.15227890014648438, 0.1578845977783203, 0.16349029541015625, 0.1690959930419922, 0.17470169067382812, 0.18030738830566406, 0.1859130859375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 3.0, 6.0, 4.0, 9.0, 10.0, 15.0, 12.0, 12.0, 16.0, 21.0, 13.0, 17.0, 22.0, 26.0, 37.0, 24.0, 36.0, 36.0, 30.0, 44.0, 30.0, 41.0, 1062.0, 32.0, 35.0, 34.0, 37.0, 36.0, 28.0, 40.0, 33.0, 29.0, 17.0, 24.0, 25.0, 14.0, 16.0, 13.0, 13.0, 9.0, 15.0, 7.0, 12.0, 1.0, 9.0, 6.0, 4.0, 1.0, 3.0, 5.0, 2.0, 2.0], "bins": [-1.521484375, -1.4777984619140625, -1.434112548828125, -1.3904266357421875, -1.34674072265625, -1.3030548095703125, -1.259368896484375, -1.2156829833984375, -1.1719970703125, -1.1283111572265625, -1.084625244140625, -1.0409393310546875, -0.99725341796875, -0.9535675048828125, -0.909881591796875, -0.8661956787109375, -0.822509765625, -0.7788238525390625, -0.735137939453125, -0.6914520263671875, -0.64776611328125, -0.6040802001953125, -0.560394287109375, -0.5167083740234375, -0.4730224609375, -0.4293365478515625, -0.385650634765625, -0.3419647216796875, -0.29827880859375, -0.2545928955078125, -0.210906982421875, -0.1672210693359375, -0.12353515625, -0.0798492431640625, -0.036163330078125, 0.0075225830078125, 0.05120849609375, 0.0948944091796875, 0.138580322265625, 0.1822662353515625, 0.2259521484375, 0.2696380615234375, 0.313323974609375, 0.3570098876953125, 0.40069580078125, 0.4443817138671875, 0.488067626953125, 0.5317535400390625, 0.575439453125, 0.6191253662109375, 0.662811279296875, 0.7064971923828125, 0.75018310546875, 0.7938690185546875, 0.837554931640625, 0.8812408447265625, 0.9249267578125, 0.9686126708984375, 1.012298583984375, 1.0559844970703125, 1.09967041015625, 1.1433563232421875, 1.187042236328125, 1.2307281494140625, 1.2744140625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 15.0, 15.0, 14.0, 34.0, 46.0, 60.0, 93.0, 143.0, 237.0, 364.0, 577.0, 826.0, 1347.0, 2360.0, 3728.0, 6139.0, 10069.0, 16606.0, 27446.0, 45364.0, 75145.0, 121060.0, 212735.0, 1199920.0, 142757.0, 90667.0, 54858.0, 33003.0, 20022.0, 12222.0, 7424.0, 4483.0, 2799.0, 1623.0, 1045.0, 653.0, 454.0, 249.0, 175.0, 115.0, 72.0, 50.0, 34.0, 34.0, 18.0, 17.0, 4.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.10809326171875, -0.10462760925292969, -0.10116195678710938, -0.09769630432128906, -0.09423065185546875, -0.09076499938964844, -0.08729934692382812, -0.08383369445800781, -0.0803680419921875, -0.07690238952636719, -0.07343673706054688, -0.06997108459472656, -0.06650543212890625, -0.06303977966308594, -0.059574127197265625, -0.05610847473144531, -0.052642822265625, -0.04917716979980469, -0.045711517333984375, -0.04224586486816406, -0.03878021240234375, -0.03531455993652344, -0.031848907470703125, -0.028383255004882812, -0.0249176025390625, -0.021451950073242188, -0.017986297607421875, -0.014520645141601562, -0.01105499267578125, -0.0075893402099609375, -0.004123687744140625, -0.0006580352783203125, 0.0028076171875, 0.0062732696533203125, 0.009738922119140625, 0.013204574584960938, 0.01667022705078125, 0.020135879516601562, 0.023601531982421875, 0.027067184448242188, 0.0305328369140625, 0.03399848937988281, 0.037464141845703125, 0.04092979431152344, 0.04439544677734375, 0.04786109924316406, 0.051326751708984375, 0.05479240417480469, 0.058258056640625, 0.06172370910644531, 0.06518936157226562, 0.06865501403808594, 0.07212066650390625, 0.07558631896972656, 0.07905197143554688, 0.08251762390136719, 0.0859832763671875, 0.08944892883300781, 0.09291458129882812, 0.09638023376464844, 0.09984588623046875, 0.10331153869628906, 0.10677719116210938, 0.11024284362792969, 0.11370849609375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 1.0, 5.0, 5.0, 7.0, 10.0, 4.0, 13.0, 9.0, 13.0, 9.0, 21.0, 18.0, 19.0, 21.0, 20.0, 27.0, 38.0, 43.0, 56.0, 74.0, 67.0, 67.0, 53.0, 63.0, 41.0, 47.0, 32.0, 29.0, 13.0, 24.0, 18.0, 19.0, 15.0, 17.0, 11.0, 9.0, 13.0, 16.0, 10.0, 5.0, 7.0, 5.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004978179931640625, -0.004803657531738281, -0.0046291351318359375, -0.004454612731933594, -0.00428009033203125, -0.004105567932128906, -0.0039310455322265625, -0.0037565231323242188, -0.003582000732421875, -0.0034074783325195312, -0.0032329559326171875, -0.0030584335327148438, -0.0028839111328125, -0.0027093887329101562, -0.0025348663330078125, -0.0023603439331054688, -0.002185821533203125, -0.0020112991333007812, -0.0018367767333984375, -0.0016622543334960938, -0.00148773193359375, -0.0013132095336914062, -0.0011386871337890625, -0.0009641647338867188, -0.000789642333984375, -0.0006151199340820312, -0.0004405975341796875, -0.00026607513427734375, -9.1552734375e-05, 8.296966552734375e-05, 0.0002574920654296875, 0.00043201446533203125, 0.000606536865234375, 0.0007810592651367188, 0.0009555816650390625, 0.0011301040649414062, 0.00130462646484375, 0.0014791488647460938, 0.0016536712646484375, 0.0018281936645507812, 0.002002716064453125, 0.0021772384643554688, 0.0023517608642578125, 0.0025262832641601562, 0.0027008056640625, 0.0028753280639648438, 0.0030498504638671875, 0.0032243728637695312, 0.003398895263671875, 0.0035734176635742188, 0.0037479400634765625, 0.003922462463378906, 0.00409698486328125, 0.004271507263183594, 0.0044460296630859375, 0.004620552062988281, 0.004795074462890625, 0.004969596862792969, 0.0051441192626953125, 0.005318641662597656, 0.0054931640625, 0.005667686462402344, 0.0058422088623046875, 0.006016731262207031, 0.006191253662109375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 8.0, 11.0, 6.0, 12.0, 15.0, 9.0, 11.0, 13.0, 21.0, 19.0, 39.0, 40.0, 49.0, 82.0, 170.0, 319.0, 811.0, 2223.0, 9709.0, 160164.0, 844840.0, 23751.0, 3994.0, 1114.0, 494.0, 229.0, 121.0, 62.0, 50.0, 29.0, 19.0, 18.0, 15.0, 18.0, 20.0, 6.0, 4.0, 10.0, 5.0, 8.0, 5.0, 2.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0], "bins": [-0.11114501953125, -0.10798835754394531, -0.10483169555664062, -0.10167503356933594, -0.09851837158203125, -0.09536170959472656, -0.09220504760742188, -0.08904838562011719, -0.0858917236328125, -0.08273506164550781, -0.07957839965820312, -0.07642173767089844, -0.07326507568359375, -0.07010841369628906, -0.06695175170898438, -0.06379508972167969, -0.060638427734375, -0.05748176574707031, -0.054325103759765625, -0.05116844177246094, -0.04801177978515625, -0.04485511779785156, -0.041698455810546875, -0.03854179382324219, -0.0353851318359375, -0.03222846984863281, -0.029071807861328125, -0.025915145874023438, -0.02275848388671875, -0.019601821899414062, -0.016445159912109375, -0.013288497924804688, -0.0101318359375, -0.0069751739501953125, -0.003818511962890625, -0.0006618499755859375, 0.00249481201171875, 0.0056514739990234375, 0.008808135986328125, 0.011964797973632812, 0.0151214599609375, 0.018278121948242188, 0.021434783935546875, 0.024591445922851562, 0.02774810791015625, 0.030904769897460938, 0.034061431884765625, 0.03721809387207031, 0.040374755859375, 0.04353141784667969, 0.046688079833984375, 0.04984474182128906, 0.05300140380859375, 0.05615806579589844, 0.059314727783203125, 0.06247138977050781, 0.0656280517578125, 0.06878471374511719, 0.07194137573242188, 0.07509803771972656, 0.07825469970703125, 0.08141136169433594, 0.08456802368164062, 0.08772468566894531, 0.09088134765625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 6.0, 4.0, 9.0, 13.0, 24.0, 61.0, 110.0, 280.0, 265.0, 115.0, 55.0, 26.0, 25.0, 7.0, 7.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09323345124721527, -0.09124884009361267, -0.08926422148942947, -0.08727961033582687, -0.08529499918222427, -0.08331038802862167, -0.08132576942443848, -0.07934115827083588, -0.07735654711723328, -0.07537193596363068, -0.07338731735944748, -0.07140270620584488, -0.06941809505224228, -0.06743348389863968, -0.06544886529445648, -0.06346425414085388, -0.06147963926196098, -0.059495024383068085, -0.057510413229465485, -0.055525798350572586, -0.053541187196969986, -0.05155657231807709, -0.04957196116447449, -0.04758734628558159, -0.04560273140668869, -0.04361811652779579, -0.04163350537419319, -0.03964889049530029, -0.03766427934169769, -0.035679664462804794, -0.033695049583911896, -0.031710438430309296, -0.029725831001996994, -0.027741217985749245, -0.025756604969501495, -0.023771990090608597, -0.021787378937005997, -0.019802764058113098, -0.01781815104186535, -0.0158335380256176, -0.01384892500936985, -0.0118643119931221, -0.009879698976874352, -0.007895085029304028, -0.005910472013056278, -0.003925858996808529, -0.001941245049238205, 4.336796700954437e-05, 0.0020279809832572937, 0.004012593999505043, 0.00599720748141408, 0.007981820963323116, 0.009966433979570866, 0.011951046995818615, 0.013935660943388939, 0.015920273959636688, 0.017904886975884438, 0.019889499992132187, 0.021874113008379936, 0.023858726024627686, 0.025843340903520584, 0.027827952057123184, 0.029812566936016083, 0.03179717808961868, 0.03378179296851158]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 3.0, 3.0, 5.0, 5.0, 6.0, 6.0, 11.0, 15.0, 16.0, 16.0, 15.0, 14.0, 22.0, 30.0, 27.0, 19.0, 26.0, 25.0, 25.0, 28.0, 33.0, 40.0, 32.0, 44.0, 30.0, 31.0, 44.0, 34.0, 45.0, 34.0, 25.0, 27.0, 35.0, 32.0, 23.0, 33.0, 19.0, 24.0, 13.0, 21.0, 9.0, 11.0, 10.0, 8.0, 5.0, 9.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.011769711971282959, -0.011364804580807686, -0.010959897190332413, -0.01055498979985714, -0.010150082409381866, -0.009745175018906593, -0.00934026762843132, -0.008935360237956047, -0.008530452847480774, -0.0081255454570055, -0.007720638066530228, -0.0073157306760549545, -0.006910823285579681, -0.006505915895104408, -0.006101008504629135, -0.005696101114153862, -0.005291193723678589, -0.004886286333203316, -0.004481378942728043, -0.0040764715522527695, -0.0036715641617774963, -0.003266656771302223, -0.00286174938082695, -0.002456841990351677, -0.002051934599876404, -0.0016470272094011307, -0.0012421198189258575, -0.0008372124284505844, -0.0004323050379753113, -2.7397647500038147e-05, 0.000377509742975235, 0.0007824171334505081, 0.0011873245239257812, 0.0015922319144010544, 0.0019971393048763275, 0.0024020466953516006, 0.0028069540858268738, 0.003211861476302147, 0.00361676886677742, 0.004021676257252693, 0.004426583647727966, 0.0048314910382032394, 0.005236398428678513, 0.005641305819153786, 0.006046213209629059, 0.006451120600104332, 0.006856027990579605, 0.007260935381054878, 0.007665842771530151, 0.008070750162005424, 0.008475657552480698, 0.00888056494295597, 0.009285472333431244, 0.009690379723906517, 0.01009528711438179, 0.010500194504857063, 0.010905101895332336, 0.01131000928580761, 0.011714916676282883, 0.012119824066758156, 0.012524731457233429, 0.012929638847708702, 0.013334546238183975, 0.013739453628659248, 0.014144361019134521]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 5.0, 2.0, 7.0, 5.0, 9.0, 7.0, 8.0, 12.0, 12.0, 23.0, 18.0, 24.0, 12.0, 21.0, 29.0, 22.0, 30.0, 36.0, 35.0, 31.0, 37.0, 40.0, 36.0, 36.0, 47.0, 34.0, 41.0, 38.0, 30.0, 26.0, 40.0, 36.0, 26.0, 34.0, 24.0, 18.0, 15.0, 13.0, 18.0, 10.0, 13.0, 11.0, 8.0, 8.0, 7.0, 9.0, 1.0, 0.0, 4.0, 0.0, 1.0], "bins": [-1.9736328125, -1.9197845458984375, -1.865936279296875, -1.8120880126953125, -1.75823974609375, -1.7043914794921875, -1.650543212890625, -1.5966949462890625, -1.5428466796875, -1.4889984130859375, -1.435150146484375, -1.3813018798828125, -1.32745361328125, -1.2736053466796875, -1.219757080078125, -1.1659088134765625, -1.112060546875, -1.0582122802734375, -1.004364013671875, -0.9505157470703125, -0.89666748046875, -0.8428192138671875, -0.788970947265625, -0.7351226806640625, -0.6812744140625, -0.6274261474609375, -0.573577880859375, -0.5197296142578125, -0.46588134765625, -0.4120330810546875, -0.358184814453125, -0.3043365478515625, -0.25048828125, -0.1966400146484375, -0.142791748046875, -0.0889434814453125, -0.03509521484375, 0.0187530517578125, 0.072601318359375, 0.1264495849609375, 0.1802978515625, 0.2341461181640625, 0.287994384765625, 0.3418426513671875, 0.39569091796875, 0.4495391845703125, 0.503387451171875, 0.5572357177734375, 0.611083984375, 0.6649322509765625, 0.718780517578125, 0.7726287841796875, 0.82647705078125, 0.8803253173828125, 0.934173583984375, 0.9880218505859375, 1.0418701171875, 1.0957183837890625, 1.149566650390625, 1.2034149169921875, 1.25726318359375, 1.3111114501953125, 1.364959716796875, 1.4188079833984375, 1.47265625]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 9.0, 24.0, 16.0, 26.0, 35.0, 57.0, 87.0, 114.0, 173.0, 272.0, 359.0, 600.0, 835.0, 1333.0, 2033.0, 3109.0, 5380.0, 8982.0, 15617.0, 27677.0, 49957.0, 93171.0, 166817.0, 237457.0, 189839.0, 108821.0, 59023.0, 32187.0, 17695.0, 10296.0, 6095.0, 3692.0, 2330.0, 1514.0, 971.0, 602.0, 428.0, 289.0, 194.0, 137.0, 88.0, 72.0, 36.0, 25.0, 22.0, 15.0, 9.0, 13.0, 4.0, 3.0, 2.0, 3.0, 4.0], "bins": [-1.9228515625, -1.8673248291015625, -1.811798095703125, -1.7562713623046875, -1.70074462890625, -1.6452178955078125, -1.589691162109375, -1.5341644287109375, -1.4786376953125, -1.4231109619140625, -1.367584228515625, -1.3120574951171875, -1.25653076171875, -1.2010040283203125, -1.145477294921875, -1.0899505615234375, -1.034423828125, -0.9788970947265625, -0.923370361328125, -0.8678436279296875, -0.81231689453125, -0.7567901611328125, -0.701263427734375, -0.6457366943359375, -0.5902099609375, -0.5346832275390625, -0.479156494140625, -0.4236297607421875, -0.36810302734375, -0.3125762939453125, -0.257049560546875, -0.2015228271484375, -0.14599609375, -0.0904693603515625, -0.034942626953125, 0.0205841064453125, 0.07611083984375, 0.1316375732421875, 0.187164306640625, 0.2426910400390625, 0.2982177734375, 0.3537445068359375, 0.409271240234375, 0.4647979736328125, 0.52032470703125, 0.5758514404296875, 0.631378173828125, 0.6869049072265625, 0.742431640625, 0.7979583740234375, 0.853485107421875, 0.9090118408203125, 0.96453857421875, 1.0200653076171875, 1.075592041015625, 1.1311187744140625, 1.1866455078125, 1.2421722412109375, 1.297698974609375, 1.3532257080078125, 1.40875244140625, 1.4642791748046875, 1.519805908203125, 1.5753326416015625, 1.630859375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 6.0, 6.0, 6.0, 6.0, 15.0, 12.0, 22.0, 19.0, 19.0, 35.0, 28.0, 46.0, 34.0, 54.0, 59.0, 97.0, 145.0, 306.0, 1377.0, 205.0, 117.0, 73.0, 52.0, 56.0, 41.0, 35.0, 33.0, 29.0, 23.0, 14.0, 15.0, 8.0, 10.0, 6.0, 10.0, 5.0, 5.0, 5.0, 5.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.04296875, -6.79302978515625, -6.5430908203125, -6.29315185546875, -6.043212890625, -5.79327392578125, -5.5433349609375, -5.29339599609375, -5.04345703125, -4.79351806640625, -4.5435791015625, -4.29364013671875, -4.043701171875, -3.79376220703125, -3.5438232421875, -3.29388427734375, -3.0439453125, -2.79400634765625, -2.5440673828125, -2.29412841796875, -2.044189453125, -1.79425048828125, -1.5443115234375, -1.29437255859375, -1.04443359375, -0.79449462890625, -0.5445556640625, -0.29461669921875, -0.044677734375, 0.20526123046875, 0.4552001953125, 0.70513916015625, 0.955078125, 1.20501708984375, 1.4549560546875, 1.70489501953125, 1.954833984375, 2.20477294921875, 2.4547119140625, 2.70465087890625, 2.95458984375, 3.20452880859375, 3.4544677734375, 3.70440673828125, 3.954345703125, 4.20428466796875, 4.4542236328125, 4.70416259765625, 4.9541015625, 5.20404052734375, 5.4539794921875, 5.70391845703125, 5.953857421875, 6.20379638671875, 6.4537353515625, 6.70367431640625, 6.95361328125, 7.20355224609375, 7.4534912109375, 7.70343017578125, 7.953369140625, 8.20330810546875, 8.4532470703125, 8.70318603515625, 8.953125]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 5.0, 6.0, 10.0, 19.0, 10.0, 16.0, 29.0, 27.0, 35.0, 45.0, 63.0, 80.0, 130.0, 171.0, 250.0, 448.0, 1241.0, 7791.0, 279052.0, 2793801.0, 57037.0, 3516.0, 759.0, 362.0, 201.0, 174.0, 94.0, 69.0, 49.0, 33.0, 37.0, 35.0, 26.0, 17.0, 12.0, 12.0, 10.0, 4.0, 6.0, 7.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-15.5859375, -15.1181640625, -14.650390625, -14.1826171875, -13.71484375, -13.2470703125, -12.779296875, -12.3115234375, -11.84375, -11.3759765625, -10.908203125, -10.4404296875, -9.97265625, -9.5048828125, -9.037109375, -8.5693359375, -8.1015625, -7.6337890625, -7.166015625, -6.6982421875, -6.23046875, -5.7626953125, -5.294921875, -4.8271484375, -4.359375, -3.8916015625, -3.423828125, -2.9560546875, -2.48828125, -2.0205078125, -1.552734375, -1.0849609375, -0.6171875, -0.1494140625, 0.318359375, 0.7861328125, 1.25390625, 1.7216796875, 2.189453125, 2.6572265625, 3.125, 3.5927734375, 4.060546875, 4.5283203125, 4.99609375, 5.4638671875, 5.931640625, 6.3994140625, 6.8671875, 7.3349609375, 7.802734375, 8.2705078125, 8.73828125, 9.2060546875, 9.673828125, 10.1416015625, 10.609375, 11.0771484375, 11.544921875, 12.0126953125, 12.48046875, 12.9482421875, 13.416015625, 13.8837890625, 14.3515625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 306.0, 709.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.964099884033203, -18.96812629699707, -12.972151756286621, -6.976177215576172, -0.9802036285400391, 5.015769958496094, 11.01174545288086, 17.00771713256836, 23.003692626953125, 28.999666213989258, 34.99563980102539, 40.991615295410156, 46.987586975097656, 52.98356246948242, 58.97953796386719, 64.97550964355469, 70.97148132324219, 76.96745300292969, 82.96343231201172, 88.95940399169922, 94.95537567138672, 100.95135498046875, 106.94732666015625, 112.94329833984375, 118.93927764892578, 124.93524932861328, 130.9312286376953, 136.9272003173828, 142.9231719970703, 148.9191436767578, 154.91513061523438, 160.91110229492188, 166.9070587158203, 172.9030303955078, 178.8990020751953, 184.89498901367188, 190.89096069335938, 196.88693237304688, 202.88290405273438, 208.87887573242188, 214.87484741210938, 220.87081909179688, 226.86679077148438, 232.86276245117188, 238.85874938964844, 244.85472106933594, 250.85069274902344, 256.8466796875, 262.8426513671875, 268.838623046875, 274.8345947265625, 280.83056640625, 286.8265380859375, 292.822509765625, 298.8184814453125, 304.814453125, 310.8104248046875, 316.806396484375, 322.8023681640625, 328.79833984375, 334.7943115234375, 340.790283203125, 346.7862548828125, 352.7822265625, 358.7782287597656]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 3.0, 6.0, 2.0, 13.0, 4.0, 9.0, 10.0, 9.0, 21.0, 17.0, 21.0, 15.0, 28.0, 30.0, 24.0, 32.0, 40.0, 45.0, 39.0, 50.0, 47.0, 43.0, 42.0, 41.0, 36.0, 40.0, 37.0, 38.0, 33.0, 36.0, 18.0, 32.0, 27.0, 24.0, 17.0, 15.0, 9.0, 17.0, 11.0, 7.0, 7.0, 2.0, 6.0, 2.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-20.82842254638672, -20.219711303710938, -19.611000061035156, -19.002290725708008, -18.393579483032227, -17.784868240356445, -17.176158905029297, -16.567447662353516, -15.958736419677734, -15.350025177001953, -14.741314888000488, -14.132604598999023, -13.523893356323242, -12.915182113647461, -12.306471824645996, -11.697761535644531, -11.08905029296875, -10.480339050292969, -9.871628761291504, -9.262918472290039, -8.654207229614258, -8.045495986938477, -7.436785697937012, -6.828074932098389, -6.219364166259766, -5.610653400421143, -5.0019426345825195, -4.3932318687438965, -3.7845211029052734, -3.1758103370666504, -2.5670995712280273, -1.9583888053894043, -1.3496780395507812, -0.7409672737121582, -0.13225650787353516, 0.4764542579650879, 1.085165023803711, 1.693875789642334, 2.302586555480957, 2.91129732131958, 3.520008087158203, 4.128718852996826, 4.737429618835449, 5.346140384674072, 5.954851150512695, 6.563561916351318, 7.172272682189941, 7.7809834480285645, 8.389694213867188, 8.998405456542969, 9.607115745544434, 10.215826034545898, 10.82453727722168, 11.433248519897461, 12.041958808898926, 12.65066909790039, 13.259380340576172, 13.868091583251953, 14.476801872253418, 15.085512161254883, 15.694223403930664, 16.302934646606445, 16.911643981933594, 17.520355224609375, 18.129066467285156]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 5.0, 3.0, 6.0, 5.0, 7.0, 13.0, 14.0, 11.0, 14.0, 19.0, 15.0, 19.0, 25.0, 23.0, 29.0, 25.0, 38.0, 34.0, 27.0, 34.0, 47.0, 23.0, 41.0, 35.0, 47.0, 40.0, 31.0, 27.0, 41.0, 29.0, 24.0, 28.0, 25.0, 27.0, 34.0, 26.0, 16.0, 22.0, 12.0, 9.0, 10.0, 8.0, 5.0, 4.0, 13.0, 3.0, 7.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-2.091796875, -2.0325469970703125, -1.973297119140625, -1.9140472412109375, -1.85479736328125, -1.7955474853515625, -1.736297607421875, -1.6770477294921875, -1.6177978515625, -1.5585479736328125, -1.499298095703125, -1.4400482177734375, -1.38079833984375, -1.3215484619140625, -1.262298583984375, -1.2030487060546875, -1.143798828125, -1.0845489501953125, -1.025299072265625, -0.9660491943359375, -0.90679931640625, -0.8475494384765625, -0.788299560546875, -0.7290496826171875, -0.6697998046875, -0.6105499267578125, -0.551300048828125, -0.4920501708984375, -0.43280029296875, -0.3735504150390625, -0.314300537109375, -0.2550506591796875, -0.19580078125, -0.1365509033203125, -0.077301025390625, -0.0180511474609375, 0.04119873046875, 0.1004486083984375, 0.159698486328125, 0.2189483642578125, 0.2781982421875, 0.3374481201171875, 0.396697998046875, 0.4559478759765625, 0.51519775390625, 0.5744476318359375, 0.633697509765625, 0.6929473876953125, 0.752197265625, 0.8114471435546875, 0.870697021484375, 0.9299468994140625, 0.98919677734375, 1.0484466552734375, 1.107696533203125, 1.1669464111328125, 1.2261962890625, 1.2854461669921875, 1.344696044921875, 1.4039459228515625, 1.46319580078125, 1.5224456787109375, 1.581695556640625, 1.6409454345703125, 1.7001953125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 3.0, 2.0, 5.0, 7.0, 11.0, 10.0, 14.0, 12.0, 11.0, 11.0, 18.0, 15.0, 27.0, 26.0, 49.0, 62.0, 85.0, 168.0, 387.0, 1074.0, 3834.0, 21157.0, 148665.0, 1109429.0, 2310547.0, 516472.0, 68106.0, 10415.0, 2200.0, 705.0, 259.0, 136.0, 67.0, 50.0, 38.0, 34.0, 30.0, 18.0, 19.0, 16.0, 9.0, 16.0, 11.0, 10.0, 12.0, 5.0, 6.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-5.52734375, -5.3662109375, -5.205078125, -5.0439453125, -4.8828125, -4.7216796875, -4.560546875, -4.3994140625, -4.23828125, -4.0771484375, -3.916015625, -3.7548828125, -3.59375, -3.4326171875, -3.271484375, -3.1103515625, -2.94921875, -2.7880859375, -2.626953125, -2.4658203125, -2.3046875, -2.1435546875, -1.982421875, -1.8212890625, -1.66015625, -1.4990234375, -1.337890625, -1.1767578125, -1.015625, -0.8544921875, -0.693359375, -0.5322265625, -0.37109375, -0.2099609375, -0.048828125, 0.1123046875, 0.2734375, 0.4345703125, 0.595703125, 0.7568359375, 0.91796875, 1.0791015625, 1.240234375, 1.4013671875, 1.5625, 1.7236328125, 1.884765625, 2.0458984375, 2.20703125, 2.3681640625, 2.529296875, 2.6904296875, 2.8515625, 3.0126953125, 3.173828125, 3.3349609375, 3.49609375, 3.6572265625, 3.818359375, 3.9794921875, 4.140625, 4.3017578125, 4.462890625, 4.6240234375, 4.78515625]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 6.0, 13.0, 20.0, 40.0, 49.0, 76.0, 106.0, 153.0, 195.0, 300.0, 419.0, 510.0, 558.0, 443.0, 351.0, 240.0, 181.0, 123.0, 96.0, 61.0, 38.0, 28.0, 30.0, 14.0, 6.0, 3.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5703125, -4.3883056640625, -4.206298828125, -4.0242919921875, -3.84228515625, -3.6602783203125, -3.478271484375, -3.2962646484375, -3.1142578125, -2.9322509765625, -2.750244140625, -2.5682373046875, -2.38623046875, -2.2042236328125, -2.022216796875, -1.8402099609375, -1.658203125, -1.4761962890625, -1.294189453125, -1.1121826171875, -0.93017578125, -0.7481689453125, -0.566162109375, -0.3841552734375, -0.2021484375, -0.0201416015625, 0.161865234375, 0.3438720703125, 0.52587890625, 0.7078857421875, 0.889892578125, 1.0718994140625, 1.25390625, 1.4359130859375, 1.617919921875, 1.7999267578125, 1.98193359375, 2.1639404296875, 2.345947265625, 2.5279541015625, 2.7099609375, 2.8919677734375, 3.073974609375, 3.2559814453125, 3.43798828125, 3.6199951171875, 3.802001953125, 3.9840087890625, 4.166015625, 4.3480224609375, 4.530029296875, 4.7120361328125, 4.89404296875, 5.0760498046875, 5.258056640625, 5.4400634765625, 5.6220703125, 5.8040771484375, 5.986083984375, 6.1680908203125, 6.35009765625, 6.5321044921875, 6.714111328125, 6.8961181640625, 7.078125]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 7.0, 3.0, 12.0, 15.0, 33.0, 39.0, 69.0, 92.0, 150.0, 291.0, 566.0, 1628.0, 14975.0, 407400.0, 3319168.0, 431163.0, 15868.0, 1648.0, 483.0, 282.0, 156.0, 91.0, 46.0, 33.0, 24.0, 18.0, 7.0, 7.0, 6.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2578125, -13.877685546875, -13.49755859375, -13.117431640625, -12.7373046875, -12.357177734375, -11.97705078125, -11.596923828125, -11.216796875, -10.836669921875, -10.45654296875, -10.076416015625, -9.6962890625, -9.316162109375, -8.93603515625, -8.555908203125, -8.17578125, -7.795654296875, -7.41552734375, -7.035400390625, -6.6552734375, -6.275146484375, -5.89501953125, -5.514892578125, -5.134765625, -4.754638671875, -4.37451171875, -3.994384765625, -3.6142578125, -3.234130859375, -2.85400390625, -2.473876953125, -2.09375, -1.713623046875, -1.33349609375, -0.953369140625, -0.5732421875, -0.193115234375, 0.18701171875, 0.567138671875, 0.947265625, 1.327392578125, 1.70751953125, 2.087646484375, 2.4677734375, 2.847900390625, 3.22802734375, 3.608154296875, 3.98828125, 4.368408203125, 4.74853515625, 5.128662109375, 5.5087890625, 5.888916015625, 6.26904296875, 6.649169921875, 7.029296875, 7.409423828125, 7.78955078125, 8.169677734375, 8.5498046875, 8.929931640625, 9.31005859375, 9.690185546875, 10.0703125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 15.0, 30.0, 67.0, 135.0, 166.0, 188.0, 158.0, 124.0, 78.0, 33.0, 14.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-43.829986572265625, -42.477596282958984, -41.12520980834961, -39.77281951904297, -38.42042922973633, -37.06804275512695, -35.71565246582031, -34.36326599121094, -33.0108757019043, -31.65848731994629, -30.30609703063965, -28.95370864868164, -27.601320266723633, -26.248931884765625, -24.896541595458984, -23.544153213500977, -22.191762924194336, -20.839374542236328, -19.486984252929688, -18.13459587097168, -16.782207489013672, -15.429818153381348, -14.077428817749023, -12.725040435791016, -11.372651100158691, -10.020261764526367, -8.66787338256836, -7.315484046936035, -5.963095188140869, -4.610706329345703, -3.258316993713379, -1.905928611755371, -0.5535392761230469, 0.7988497018814087, 2.1512386798858643, 3.5036277770996094, 4.856016635894775, 6.208405494689941, 7.560794830322266, 8.913183212280273, 10.265572547912598, 11.617961883544922, 12.97035026550293, 14.322739601135254, 15.675128936767578, 17.027517318725586, 18.379905700683594, 19.732295989990234, 21.084684371948242, 22.43707275390625, 23.78946304321289, 25.1418514251709, 26.494239807128906, 27.846630096435547, 29.199018478393555, 30.551406860351562, 31.903797149658203, 33.256187438964844, 34.60857391357422, 35.96096420288086, 37.3133544921875, 38.665740966796875, 40.018131256103516, 41.370521545410156, 42.72290802001953]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 1.0, 4.0, 4.0, 8.0, 14.0, 12.0, 13.0, 16.0, 12.0, 14.0, 21.0, 26.0, 28.0, 38.0, 36.0, 39.0, 60.0, 46.0, 42.0, 41.0, 51.0, 37.0, 54.0, 31.0, 39.0, 36.0, 39.0, 34.0, 42.0, 30.0, 23.0, 22.0, 16.0, 18.0, 12.0, 11.0, 12.0, 6.0, 9.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.98637580871582, -17.468435287475586, -16.95049476623535, -16.43255615234375, -15.914615631103516, -15.396675109863281, -14.878734588623047, -14.360795021057129, -13.842855453491211, -13.324914932250977, -12.806975364685059, -12.289034843444824, -11.771095275878906, -11.253154754638672, -10.735214233398438, -10.21727466583252, -9.699334144592285, -9.18139362335205, -8.663454055786133, -8.145513534545898, -7.6275739669799805, -7.109633445739746, -6.59169340133667, -6.073753356933594, -5.555813312530518, -5.037873268127441, -4.519933223724365, -4.001993179321289, -3.484052896499634, -2.9661128520965576, -2.4481725692749023, -1.9302325248718262, -1.41229248046875, -0.894352376461029, -0.3764122724533081, 0.14152789115905762, 0.6594679355621338, 1.17740797996521, 1.6953482627868652, 2.2132883071899414, 2.7312283515930176, 3.2491683959960938, 3.76710844039917, 4.285048484802246, 4.8029890060424805, 5.320928573608398, 5.838869094848633, 6.356809139251709, 6.874749183654785, 7.392689228057861, 7.9106292724609375, 8.428569793701172, 8.94650936126709, 9.464449882507324, 9.982389450073242, 10.500329971313477, 11.018270492553711, 11.536211013793945, 12.054150581359863, 12.572091102600098, 13.090030670166016, 13.60797119140625, 14.125911712646484, 14.643851280212402, 15.16179084777832]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 8.0, 7.0, 13.0, 11.0, 21.0, 15.0, 18.0, 21.0, 16.0, 34.0, 27.0, 28.0, 23.0, 40.0, 46.0, 49.0, 45.0, 46.0, 36.0, 45.0, 29.0, 43.0, 45.0, 47.0, 42.0, 34.0, 27.0, 25.0, 23.0, 27.0, 15.0, 19.0, 18.0, 7.0, 11.0, 11.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.349609375, -2.2816162109375, -2.213623046875, -2.1456298828125, -2.07763671875, -2.0096435546875, -1.941650390625, -1.8736572265625, -1.8056640625, -1.7376708984375, -1.669677734375, -1.6016845703125, -1.53369140625, -1.4656982421875, -1.397705078125, -1.3297119140625, -1.26171875, -1.1937255859375, -1.125732421875, -1.0577392578125, -0.98974609375, -0.9217529296875, -0.853759765625, -0.7857666015625, -0.7177734375, -0.6497802734375, -0.581787109375, -0.5137939453125, -0.44580078125, -0.3778076171875, -0.309814453125, -0.2418212890625, -0.173828125, -0.1058349609375, -0.037841796875, 0.0301513671875, 0.09814453125, 0.1661376953125, 0.234130859375, 0.3021240234375, 0.3701171875, 0.4381103515625, 0.506103515625, 0.5740966796875, 0.64208984375, 0.7100830078125, 0.778076171875, 0.8460693359375, 0.9140625, 0.9820556640625, 1.050048828125, 1.1180419921875, 1.18603515625, 1.2540283203125, 1.322021484375, 1.3900146484375, 1.4580078125, 1.5260009765625, 1.593994140625, 1.6619873046875, 1.72998046875, 1.7979736328125, 1.865966796875, 1.9339599609375, 2.001953125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 1.0, 6.0, 15.0, 14.0, 27.0, 51.0, 68.0, 95.0, 129.0, 216.0, 287.0, 414.0, 637.0, 941.0, 1355.0, 2042.0, 2768.0, 4181.0, 6143.0, 9158.0, 13821.0, 20547.0, 30900.0, 46044.0, 68569.0, 98738.0, 135388.0, 156219.0, 136875.0, 100758.0, 69446.0, 46951.0, 31534.0, 21029.0, 13853.0, 9306.0, 6388.0, 4336.0, 2980.0, 1992.0, 1388.0, 943.0, 657.0, 445.0, 303.0, 211.0, 132.0, 86.0, 67.0, 38.0, 28.0, 16.0, 6.0, 13.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1739501953125, -0.16843223571777344, -0.16291427612304688, -0.1573963165283203, -0.15187835693359375, -0.1463603973388672, -0.14084243774414062, -0.13532447814941406, -0.1298065185546875, -0.12428855895996094, -0.11877059936523438, -0.11325263977050781, -0.10773468017578125, -0.10221672058105469, -0.09669876098632812, -0.09118080139160156, -0.085662841796875, -0.08014488220214844, -0.07462692260742188, -0.06910896301269531, -0.06359100341796875, -0.05807304382324219, -0.052555084228515625, -0.04703712463378906, -0.0415191650390625, -0.03600120544433594, -0.030483245849609375, -0.024965286254882812, -0.01944732666015625, -0.013929367065429688, -0.008411407470703125, -0.0028934478759765625, 0.00262451171875, 0.008142471313476562, 0.013660430908203125, 0.019178390502929688, 0.02469635009765625, 0.030214309692382812, 0.035732269287109375, 0.04125022888183594, 0.0467681884765625, 0.05228614807128906, 0.057804107666015625, 0.06332206726074219, 0.06884002685546875, 0.07435798645019531, 0.07987594604492188, 0.08539390563964844, 0.090911865234375, 0.09642982482910156, 0.10194778442382812, 0.10746574401855469, 0.11298370361328125, 0.11850166320800781, 0.12401962280273438, 0.12953758239746094, 0.1350555419921875, 0.14057350158691406, 0.14609146118164062, 0.1516094207763672, 0.15712738037109375, 0.1626453399658203, 0.16816329956054688, 0.17368125915527344, 0.17919921875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 7.0, 8.0, 8.0, 5.0, 13.0, 10.0, 11.0, 19.0, 23.0, 23.0, 28.0, 28.0, 30.0, 31.0, 41.0, 32.0, 41.0, 46.0, 34.0, 1067.0, 38.0, 43.0, 35.0, 49.0, 39.0, 34.0, 37.0, 25.0, 29.0, 31.0, 30.0, 16.0, 18.0, 13.0, 14.0, 12.0, 9.0, 8.0, 6.0, 8.0, 6.0, 8.0, 5.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6328125, -1.574371337890625, -1.51593017578125, -1.457489013671875, -1.3990478515625, -1.340606689453125, -1.28216552734375, -1.223724365234375, -1.165283203125, -1.106842041015625, -1.04840087890625, -0.989959716796875, -0.9315185546875, -0.873077392578125, -0.81463623046875, -0.756195068359375, -0.69775390625, -0.639312744140625, -0.58087158203125, -0.522430419921875, -0.4639892578125, -0.405548095703125, -0.34710693359375, -0.288665771484375, -0.230224609375, -0.171783447265625, -0.11334228515625, -0.054901123046875, 0.0035400390625, 0.061981201171875, 0.12042236328125, 0.178863525390625, 0.2373046875, 0.295745849609375, 0.35418701171875, 0.412628173828125, 0.4710693359375, 0.529510498046875, 0.58795166015625, 0.646392822265625, 0.704833984375, 0.763275146484375, 0.82171630859375, 0.880157470703125, 0.9385986328125, 0.997039794921875, 1.05548095703125, 1.113922119140625, 1.17236328125, 1.230804443359375, 1.28924560546875, 1.347686767578125, 1.4061279296875, 1.464569091796875, 1.52301025390625, 1.581451416015625, 1.639892578125, 1.698333740234375, 1.75677490234375, 1.815216064453125, 1.8736572265625, 1.932098388671875, 1.99053955078125, 2.048980712890625, 2.107421875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 4.0, 1.0, 4.0, 10.0, 15.0, 19.0, 18.0, 33.0, 50.0, 66.0, 129.0, 184.0, 252.0, 378.0, 595.0, 891.0, 1404.0, 2313.0, 3722.0, 5956.0, 9456.0, 15308.0, 24618.0, 40449.0, 65013.0, 104113.0, 157031.0, 1234183.0, 156808.0, 104064.0, 64413.0, 39986.0, 24565.0, 15277.0, 9526.0, 5978.0, 3776.0, 2291.0, 1470.0, 984.0, 606.0, 377.0, 259.0, 171.0, 105.0, 66.0, 58.0, 50.0, 34.0, 26.0, 15.0, 9.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.1268310546875, -0.12292861938476562, -0.11902618408203125, -0.11512374877929688, -0.1112213134765625, -0.10731887817382812, -0.10341644287109375, -0.09951400756835938, -0.095611572265625, -0.09170913696289062, -0.08780670166015625, -0.08390426635742188, -0.0800018310546875, -0.07609939575195312, -0.07219696044921875, -0.06829452514648438, -0.06439208984375, -0.060489654541015625, -0.05658721923828125, -0.052684783935546875, -0.0487823486328125, -0.044879913330078125, -0.04097747802734375, -0.037075042724609375, -0.033172607421875, -0.029270172119140625, -0.02536773681640625, -0.021465301513671875, -0.0175628662109375, -0.013660430908203125, -0.00975799560546875, -0.005855560302734375, -0.001953125, 0.001949310302734375, 0.00585174560546875, 0.009754180908203125, 0.0136566162109375, 0.017559051513671875, 0.02146148681640625, 0.025363922119140625, 0.029266357421875, 0.033168792724609375, 0.03707122802734375, 0.040973663330078125, 0.0448760986328125, 0.048778533935546875, 0.05268096923828125, 0.056583404541015625, 0.06048583984375, 0.06438827514648438, 0.06829071044921875, 0.07219314575195312, 0.0760955810546875, 0.07999801635742188, 0.08390045166015625, 0.08780288696289062, 0.091705322265625, 0.09560775756835938, 0.09951019287109375, 0.10341262817382812, 0.1073150634765625, 0.11121749877929688, 0.11511993408203125, 0.11902236938476562, 0.1229248046875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 5.0, 5.0, 4.0, 5.0, 6.0, 7.0, 13.0, 9.0, 14.0, 25.0, 27.0, 25.0, 28.0, 41.0, 46.0, 73.0, 113.0, 149.0, 101.0, 48.0, 35.0, 37.0, 26.0, 30.0, 19.0, 23.0, 21.0, 11.0, 9.0, 7.0, 1.0, 9.0, 9.0, 2.0, 3.0, 4.0, 3.0, 7.0, 6.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0128936767578125, -0.012509584426879883, -0.012125492095947266, -0.011741399765014648, -0.011357307434082031, -0.010973215103149414, -0.010589122772216797, -0.01020503044128418, -0.009820938110351562, -0.009436845779418945, -0.009052753448486328, -0.008668661117553711, -0.008284568786621094, -0.007900476455688477, -0.007516384124755859, -0.007132291793823242, -0.006748199462890625, -0.006364107131958008, -0.005980014801025391, -0.0055959224700927734, -0.005211830139160156, -0.004827737808227539, -0.004443645477294922, -0.004059553146362305, -0.0036754608154296875, -0.0032913684844970703, -0.002907276153564453, -0.002523183822631836, -0.0021390914916992188, -0.0017549991607666016, -0.0013709068298339844, -0.0009868144989013672, -0.00060272216796875, -0.0002186298370361328, 0.00016546249389648438, 0.0005495548248291016, 0.0009336471557617188, 0.001317739486694336, 0.0017018318176269531, 0.0020859241485595703, 0.0024700164794921875, 0.0028541088104248047, 0.003238201141357422, 0.003622293472290039, 0.004006385803222656, 0.0043904781341552734, 0.004774570465087891, 0.005158662796020508, 0.005542755126953125, 0.005926847457885742, 0.006310939788818359, 0.0066950321197509766, 0.007079124450683594, 0.007463216781616211, 0.007847309112548828, 0.008231401443481445, 0.008615493774414062, 0.00899958610534668, 0.009383678436279297, 0.009767770767211914, 0.010151863098144531, 0.010535955429077148, 0.010920047760009766, 0.011304140090942383, 0.011688232421875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 5.0, 8.0, 1.0, 3.0, 3.0, 3.0, 10.0, 8.0, 3.0, 12.0, 22.0, 28.0, 32.0, 44.0, 62.0, 105.0, 191.0, 367.0, 1248.0, 46945.0, 985940.0, 11926.0, 806.0, 298.0, 156.0, 100.0, 47.0, 63.0, 36.0, 21.0, 12.0, 8.0, 11.0, 4.0, 7.0, 5.0, 4.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2042236328125, -0.1974945068359375, -0.190765380859375, -0.1840362548828125, -0.17730712890625, -0.1705780029296875, -0.163848876953125, -0.1571197509765625, -0.150390625, -0.1436614990234375, -0.136932373046875, -0.1302032470703125, -0.12347412109375, -0.1167449951171875, -0.110015869140625, -0.1032867431640625, -0.0965576171875, -0.0898284912109375, -0.083099365234375, -0.0763702392578125, -0.06964111328125, -0.0629119873046875, -0.056182861328125, -0.0494537353515625, -0.042724609375, -0.0359954833984375, -0.029266357421875, -0.0225372314453125, -0.01580810546875, -0.0090789794921875, -0.002349853515625, 0.0043792724609375, 0.0111083984375, 0.0178375244140625, 0.024566650390625, 0.0312957763671875, 0.03802490234375, 0.0447540283203125, 0.051483154296875, 0.0582122802734375, 0.06494140625, 0.0716705322265625, 0.078399658203125, 0.0851287841796875, 0.09185791015625, 0.0985870361328125, 0.105316162109375, 0.1120452880859375, 0.1187744140625, 0.1255035400390625, 0.132232666015625, 0.1389617919921875, 0.14569091796875, 0.1524200439453125, 0.159149169921875, 0.1658782958984375, 0.172607421875, 0.1793365478515625, 0.186065673828125, 0.1927947998046875, 0.19952392578125, 0.2062530517578125, 0.212982177734375, 0.2197113037109375, 0.2264404296875]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 4.0, 3.0, 11.0, 11.0, 23.0, 28.0, 70.0, 106.0, 245.0, 278.0, 108.0, 53.0, 31.0, 18.0, 9.0, 7.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07136812806129456, -0.06899288296699524, -0.06661764532327652, -0.0642424002289772, -0.06186715513467789, -0.05949191376566887, -0.05711667239665985, -0.054741427302360535, -0.05236618220806122, -0.0499909408390522, -0.047615695744752884, -0.045240454375743866, -0.04286520928144455, -0.04048996791243553, -0.038114726543426514, -0.0357394814491272, -0.03336424008011818, -0.030988996848464012, -0.028613753616809845, -0.026238512247800827, -0.02386326715350151, -0.021488025784492493, -0.019112782552838326, -0.01673753932118416, -0.014362296089529991, -0.011987052857875824, -0.009611809626221657, -0.007236567325890064, -0.004861324094235897, -0.00248608086258173, -0.00011083856225013733, 0.00226440466940403, 0.004639647901058197, 0.007014891132712364, 0.009390134364366531, 0.011765376664698124, 0.014140619896352291, 0.016515862196683884, 0.01889110542833805, 0.021266348659992218, 0.023641591891646385, 0.026016835123300552, 0.02839207835495472, 0.030767321586608887, 0.033142562955617905, 0.03551780804991722, 0.03789304941892624, 0.040268294513225555, 0.04264353588223457, 0.04501877725124359, 0.04739402234554291, 0.049769263714551926, 0.05214450880885124, 0.05451975017786026, 0.056894995272159576, 0.059270236641168594, 0.06164547801017761, 0.06402072310447693, 0.06639596074819565, 0.06877120584249496, 0.07114645093679428, 0.0735216960310936, 0.07589693367481232, 0.07827217876911163, 0.08064742386341095]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 4.0, 5.0, 7.0, 12.0, 11.0, 5.0, 15.0, 18.0, 24.0, 23.0, 21.0, 29.0, 28.0, 32.0, 43.0, 33.0, 37.0, 36.0, 33.0, 30.0, 47.0, 43.0, 43.0, 36.0, 34.0, 42.0, 39.0, 32.0, 26.0, 33.0, 24.0, 26.0, 20.0, 23.0, 15.0, 17.0, 12.0, 9.0, 8.0, 8.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03070664405822754, -0.029656948521733284, -0.02860725298523903, -0.027557557448744774, -0.02650786191225052, -0.025458166375756264, -0.02440847083926201, -0.023358775302767754, -0.0223090797662735, -0.021259384229779243, -0.02020968869328499, -0.019159993156790733, -0.01811029762029648, -0.017060602083802223, -0.016010906547307968, -0.014961211010813713, -0.013911515474319458, -0.012861819937825203, -0.011812124401330948, -0.010762428864836693, -0.009712733328342438, -0.008663037791848183, -0.007613342255353928, -0.0065636467188596725, -0.0055139511823654175, -0.004464255645871162, -0.0034145601093769073, -0.0023648645728826523, -0.0013151690363883972, -0.00026547349989414215, 0.0007842220366001129, 0.001833917573094368, 0.002883613109588623, 0.003933308646082878, 0.004983004182577133, 0.006032699719071388, 0.007082395255565643, 0.008132090792059898, 0.009181786328554153, 0.010231481865048409, 0.011281177401542664, 0.012330872938036919, 0.013380568474531174, 0.014430264011025429, 0.015479959547519684, 0.01652965508401394, 0.017579350620508194, 0.01862904615700245, 0.019678741693496704, 0.02072843722999096, 0.021778132766485214, 0.02282782830297947, 0.023877523839473724, 0.02492721937596798, 0.025976914912462234, 0.02702661044895649, 0.028076305985450745, 0.029126001521945, 0.030175697058439255, 0.03122539259493351, 0.032275088131427765, 0.03332478553056717, 0.034374479204416275, 0.03542417287826538, 0.036473870277404785]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 7.0, 8.0, 7.0, 13.0, 11.0, 21.0, 15.0, 18.0, 21.0, 16.0, 34.0, 26.0, 29.0, 19.0, 44.0, 42.0, 51.0, 47.0, 45.0, 36.0, 44.0, 31.0, 43.0, 43.0, 48.0, 43.0, 31.0, 29.0, 26.0, 19.0, 28.0, 17.0, 19.0, 18.0, 8.0, 11.0, 10.0, 9.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.3515625, -2.2835693359375, -2.215576171875, -2.1475830078125, -2.07958984375, -2.0115966796875, -1.943603515625, -1.8756103515625, -1.8076171875, -1.7396240234375, -1.671630859375, -1.6036376953125, -1.53564453125, -1.4676513671875, -1.399658203125, -1.3316650390625, -1.263671875, -1.1956787109375, -1.127685546875, -1.0596923828125, -0.99169921875, -0.9237060546875, -0.855712890625, -0.7877197265625, -0.7197265625, -0.6517333984375, -0.583740234375, -0.5157470703125, -0.44775390625, -0.3797607421875, -0.311767578125, -0.2437744140625, -0.17578125, -0.1077880859375, -0.039794921875, 0.0281982421875, 0.09619140625, 0.1641845703125, 0.232177734375, 0.3001708984375, 0.3681640625, 0.4361572265625, 0.504150390625, 0.5721435546875, 0.64013671875, 0.7081298828125, 0.776123046875, 0.8441162109375, 0.912109375, 0.9801025390625, 1.048095703125, 1.1160888671875, 1.18408203125, 1.2520751953125, 1.320068359375, 1.3880615234375, 1.4560546875, 1.5240478515625, 1.592041015625, 1.6600341796875, 1.72802734375, 1.7960205078125, 1.864013671875, 1.9320068359375, 2.0]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 7.0, 6.0, 7.0, 16.0, 21.0, 27.0, 17.0, 46.0, 67.0, 112.0, 200.0, 306.0, 561.0, 1142.0, 2078.0, 3942.0, 7315.0, 14005.0, 27028.0, 52738.0, 106632.0, 225679.0, 304654.0, 151011.0, 73748.0, 36950.0, 18859.0, 9881.0, 5222.0, 2824.0, 1560.0, 794.0, 425.0, 258.0, 149.0, 82.0, 55.0, 41.0, 26.0, 17.0, 12.0, 10.0, 5.0, 6.0, 8.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-2.515625, -2.435089111328125, -2.35455322265625, -2.274017333984375, -2.1934814453125, -2.112945556640625, -2.03240966796875, -1.951873779296875, -1.871337890625, -1.790802001953125, -1.71026611328125, -1.629730224609375, -1.5491943359375, -1.468658447265625, -1.38812255859375, -1.307586669921875, -1.22705078125, -1.146514892578125, -1.06597900390625, -0.985443115234375, -0.9049072265625, -0.824371337890625, -0.74383544921875, -0.663299560546875, -0.582763671875, -0.502227783203125, -0.42169189453125, -0.341156005859375, -0.2606201171875, -0.180084228515625, -0.09954833984375, -0.019012451171875, 0.0615234375, 0.142059326171875, 0.22259521484375, 0.303131103515625, 0.3836669921875, 0.464202880859375, 0.54473876953125, 0.625274658203125, 0.705810546875, 0.786346435546875, 0.86688232421875, 0.947418212890625, 1.0279541015625, 1.108489990234375, 1.18902587890625, 1.269561767578125, 1.35009765625, 1.430633544921875, 1.51116943359375, 1.591705322265625, 1.6722412109375, 1.752777099609375, 1.83331298828125, 1.913848876953125, 1.994384765625, 2.074920654296875, 2.15545654296875, 2.235992431640625, 2.3165283203125, 2.397064208984375, 2.47760009765625, 2.558135986328125, 2.638671875]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 2.0, 5.0, 5.0, 11.0, 10.0, 9.0, 16.0, 21.0, 22.0, 27.0, 31.0, 28.0, 39.0, 44.0, 44.0, 62.0, 78.0, 121.0, 226.0, 1446.0, 233.0, 118.0, 92.0, 42.0, 52.0, 38.0, 46.0, 33.0, 27.0, 27.0, 18.0, 16.0, 15.0, 11.0, 10.0, 3.0, 3.0, 8.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.2890625, -7.0494384765625, -6.809814453125, -6.5701904296875, -6.33056640625, -6.0909423828125, -5.851318359375, -5.6116943359375, -5.3720703125, -5.1324462890625, -4.892822265625, -4.6531982421875, -4.41357421875, -4.1739501953125, -3.934326171875, -3.6947021484375, -3.455078125, -3.2154541015625, -2.975830078125, -2.7362060546875, -2.49658203125, -2.2569580078125, -2.017333984375, -1.7777099609375, -1.5380859375, -1.2984619140625, -1.058837890625, -0.8192138671875, -0.57958984375, -0.3399658203125, -0.100341796875, 0.1392822265625, 0.37890625, 0.6185302734375, 0.858154296875, 1.0977783203125, 1.33740234375, 1.5770263671875, 1.816650390625, 2.0562744140625, 2.2958984375, 2.5355224609375, 2.775146484375, 3.0147705078125, 3.25439453125, 3.4940185546875, 3.733642578125, 3.9732666015625, 4.212890625, 4.4525146484375, 4.692138671875, 4.9317626953125, 5.17138671875, 5.4110107421875, 5.650634765625, 5.8902587890625, 6.1298828125, 6.3695068359375, 6.609130859375, 6.8487548828125, 7.08837890625, 7.3280029296875, 7.567626953125, 7.8072509765625, 8.046875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 5.0, 4.0, 5.0, 8.0, 6.0, 10.0, 13.0, 12.0, 28.0, 28.0, 38.0, 52.0, 59.0, 96.0, 99.0, 131.0, 187.0, 302.0, 580.0, 1907.0, 32662.0, 2557351.0, 539954.0, 9734.0, 1079.0, 404.0, 234.0, 195.0, 110.0, 85.0, 66.0, 60.0, 46.0, 35.0, 26.0, 20.0, 18.0, 12.0, 12.0, 12.0, 5.0, 8.0, 2.0, 4.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.703125, -15.224609375, -14.74609375, -14.267578125, -13.7890625, -13.310546875, -12.83203125, -12.353515625, -11.875, -11.396484375, -10.91796875, -10.439453125, -9.9609375, -9.482421875, -9.00390625, -8.525390625, -8.046875, -7.568359375, -7.08984375, -6.611328125, -6.1328125, -5.654296875, -5.17578125, -4.697265625, -4.21875, -3.740234375, -3.26171875, -2.783203125, -2.3046875, -1.826171875, -1.34765625, -0.869140625, -0.390625, 0.087890625, 0.56640625, 1.044921875, 1.5234375, 2.001953125, 2.48046875, 2.958984375, 3.4375, 3.916015625, 4.39453125, 4.873046875, 5.3515625, 5.830078125, 6.30859375, 6.787109375, 7.265625, 7.744140625, 8.22265625, 8.701171875, 9.1796875, 9.658203125, 10.13671875, 10.615234375, 11.09375, 11.572265625, 12.05078125, 12.529296875, 13.0078125, 13.486328125, 13.96484375, 14.443359375, 14.921875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 57.0, 618.0, 332.0, 10.0], "bins": [-199.62710571289062, -196.3944091796875, -193.16172790527344, -189.9290313720703, -186.69635009765625, -183.46365356445312, -180.23097229003906, -176.99827575683594, -173.76559448242188, -170.53289794921875, -167.3002166748047, -164.06752014160156, -160.8348388671875, -157.60214233398438, -154.3694610595703, -151.1367645263672, -147.90406799316406, -144.67137145996094, -141.43869018554688, -138.20599365234375, -134.9733123779297, -131.74061584472656, -128.5079345703125, -125.27523803710938, -122.04255676269531, -118.80986785888672, -115.57717895507812, -112.34449005126953, -109.11180114746094, -105.87910461425781, -102.64642333984375, -99.41372680664062, -96.1810302734375, -92.9483413696289, -89.71565246582031, -86.48296356201172, -83.25027465820312, -80.017578125, -76.78489685058594, -73.55220031738281, -70.31951141357422, -67.08682250976562, -63.85413360595703, -60.62144470214844, -57.38875198364258, -54.156063079833984, -50.92337417602539, -47.69068145751953, -44.4579963684082, -41.22530746459961, -37.992618560791016, -34.759925842285156, -31.527236938476562, -28.29454803466797, -25.061859130859375, -21.82916831970215, -18.596479415893555, -15.363789558410645, -12.131099700927734, -8.89841079711914, -5.6657209396362305, -2.4330310821533203, 0.7996578216552734, 4.0323486328125, 7.2650370597839355]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 3.0, 10.0, 8.0, 13.0, 15.0, 12.0, 19.0, 21.0, 27.0, 26.0, 32.0, 36.0, 38.0, 33.0, 33.0, 36.0, 38.0, 41.0, 50.0, 38.0, 33.0, 35.0, 48.0, 25.0, 30.0, 29.0, 30.0, 31.0, 32.0, 24.0, 18.0, 18.0, 22.0, 24.0, 9.0, 13.0, 6.0, 6.0, 5.0, 5.0, 4.0, 4.0, 6.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-19.61960792541504, -18.98553466796875, -18.351463317871094, -17.717390060424805, -17.08331871032715, -16.44924545288086, -15.815174102783203, -15.181100845336914, -14.547029495239258, -13.912957191467285, -13.278884887695312, -12.64481258392334, -12.010740280151367, -11.376667976379395, -10.742595672607422, -10.108522415161133, -9.47445011138916, -8.840377807617188, -8.206305503845215, -7.572233200073242, -6.9381608963012695, -6.304088592529297, -5.670015811920166, -5.035943508148193, -4.401871204376221, -3.767798900604248, -3.1337265968322754, -2.4996540546417236, -1.865581750869751, -1.2315094470977783, -0.5974369049072266, 0.036635398864746094, 0.6707077026367188, 1.3047800064086914, 1.9388524293899536, 2.572924852371216, 3.2069971561431885, 3.841069459915161, 4.475142002105713, 5.1092143058776855, 5.743286609649658, 6.377358913421631, 7.0114312171936035, 7.645503997802734, 8.279576301574707, 8.91364860534668, 9.547720909118652, 10.181793212890625, 10.815865516662598, 11.44993782043457, 12.084010124206543, 12.718082427978516, 13.352154731750488, 13.986227035522461, 14.62030029296875, 15.254371643066406, 15.888444900512695, 16.522518157958984, 17.15658950805664, 17.79066276550293, 18.424734115600586, 19.058807373046875, 19.69287872314453, 20.32695198059082, 20.961023330688477]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 5.0, 11.0, 6.0, 9.0, 10.0, 16.0, 12.0, 23.0, 23.0, 27.0, 23.0, 24.0, 26.0, 30.0, 47.0, 36.0, 43.0, 39.0, 58.0, 35.0, 38.0, 50.0, 49.0, 43.0, 40.0, 40.0, 26.0, 27.0, 33.0, 21.0, 23.0, 16.0, 17.0, 16.0, 12.0, 13.0, 11.0, 6.0, 7.0, 1.0, 6.0, 2.0, 0.0, 0.0, 3.0, 3.0], "bins": [-2.857421875, -2.781524658203125, -2.70562744140625, -2.629730224609375, -2.5538330078125, -2.477935791015625, -2.40203857421875, -2.326141357421875, -2.250244140625, -2.174346923828125, -2.09844970703125, -2.022552490234375, -1.9466552734375, -1.870758056640625, -1.79486083984375, -1.718963623046875, -1.64306640625, -1.567169189453125, -1.49127197265625, -1.415374755859375, -1.3394775390625, -1.263580322265625, -1.18768310546875, -1.111785888671875, -1.035888671875, -0.959991455078125, -0.88409423828125, -0.808197021484375, -0.7322998046875, -0.656402587890625, -0.58050537109375, -0.504608154296875, -0.4287109375, -0.352813720703125, -0.27691650390625, -0.201019287109375, -0.1251220703125, -0.049224853515625, 0.02667236328125, 0.102569580078125, 0.178466796875, 0.254364013671875, 0.33026123046875, 0.406158447265625, 0.4820556640625, 0.557952880859375, 0.63385009765625, 0.709747314453125, 0.78564453125, 0.861541748046875, 0.93743896484375, 1.013336181640625, 1.0892333984375, 1.165130615234375, 1.24102783203125, 1.316925048828125, 1.392822265625, 1.468719482421875, 1.54461669921875, 1.620513916015625, 1.6964111328125, 1.772308349609375, 1.84820556640625, 1.924102783203125, 2.0]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 5.0, 6.0, 7.0, 6.0, 5.0, 17.0, 17.0, 14.0, 28.0, 38.0, 33.0, 62.0, 87.0, 163.0, 345.0, 958.0, 3302.0, 15447.0, 96181.0, 677982.0, 2249055.0, 975324.0, 145870.0, 22574.0, 4652.0, 1171.0, 417.0, 163.0, 95.0, 71.0, 42.0, 29.0, 24.0, 18.0, 13.0, 11.0, 19.0, 7.0, 3.0, 8.0, 6.0, 1.0, 6.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.16796875, -5.00946044921875, -4.8509521484375, -4.69244384765625, -4.533935546875, -4.37542724609375, -4.2169189453125, -4.05841064453125, -3.89990234375, -3.74139404296875, -3.5828857421875, -3.42437744140625, -3.265869140625, -3.10736083984375, -2.9488525390625, -2.79034423828125, -2.6318359375, -2.47332763671875, -2.3148193359375, -2.15631103515625, -1.997802734375, -1.83929443359375, -1.6807861328125, -1.52227783203125, -1.36376953125, -1.20526123046875, -1.0467529296875, -0.88824462890625, -0.729736328125, -0.57122802734375, -0.4127197265625, -0.25421142578125, -0.095703125, 0.06280517578125, 0.2213134765625, 0.37982177734375, 0.538330078125, 0.69683837890625, 0.8553466796875, 1.01385498046875, 1.17236328125, 1.33087158203125, 1.4893798828125, 1.64788818359375, 1.806396484375, 1.96490478515625, 2.1234130859375, 2.28192138671875, 2.4404296875, 2.59893798828125, 2.7574462890625, 2.91595458984375, 3.074462890625, 3.23297119140625, 3.3914794921875, 3.54998779296875, 3.70849609375, 3.86700439453125, 4.0255126953125, 4.18402099609375, 4.342529296875, 4.50103759765625, 4.6595458984375, 4.81805419921875, 4.9765625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 2.0, 4.0, 5.0, 3.0, 3.0, 7.0, 2.0, 9.0, 8.0, 12.0, 11.0, 24.0, 29.0, 34.0, 41.0, 57.0, 61.0, 113.0, 125.0, 160.0, 206.0, 228.0, 288.0, 336.0, 343.0, 398.0, 298.0, 248.0, 223.0, 169.0, 146.0, 125.0, 81.0, 63.0, 51.0, 44.0, 35.0, 20.0, 19.0, 17.0, 10.0, 3.0, 5.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.59375, -3.46429443359375, -3.3348388671875, -3.20538330078125, -3.075927734375, -2.94647216796875, -2.8170166015625, -2.68756103515625, -2.55810546875, -2.42864990234375, -2.2991943359375, -2.16973876953125, -2.040283203125, -1.91082763671875, -1.7813720703125, -1.65191650390625, -1.5224609375, -1.39300537109375, -1.2635498046875, -1.13409423828125, -1.004638671875, -0.87518310546875, -0.7457275390625, -0.61627197265625, -0.48681640625, -0.35736083984375, -0.2279052734375, -0.09844970703125, 0.031005859375, 0.16046142578125, 0.2899169921875, 0.41937255859375, 0.548828125, 0.67828369140625, 0.8077392578125, 0.93719482421875, 1.066650390625, 1.19610595703125, 1.3255615234375, 1.45501708984375, 1.58447265625, 1.71392822265625, 1.8433837890625, 1.97283935546875, 2.102294921875, 2.23175048828125, 2.3612060546875, 2.49066162109375, 2.6201171875, 2.74957275390625, 2.8790283203125, 3.00848388671875, 3.137939453125, 3.26739501953125, 3.3968505859375, 3.52630615234375, 3.65576171875, 3.78521728515625, 3.9146728515625, 4.04412841796875, 4.173583984375, 4.30303955078125, 4.4324951171875, 4.56195068359375, 4.69140625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 6.0, 5.0, 9.0, 10.0, 19.0, 32.0, 32.0, 40.0, 60.0, 71.0, 95.0, 132.0, 180.0, 246.0, 445.0, 1229.0, 10293.0, 299382.0, 3366054.0, 497045.0, 15920.0, 1492.0, 463.0, 283.0, 193.0, 148.0, 88.0, 57.0, 61.0, 44.0, 31.0, 29.0, 15.0, 16.0, 10.0, 7.0, 6.0, 4.0, 7.0, 4.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0], "bins": [-14.3984375, -13.99365234375, -13.5888671875, -13.18408203125, -12.779296875, -12.37451171875, -11.9697265625, -11.56494140625, -11.16015625, -10.75537109375, -10.3505859375, -9.94580078125, -9.541015625, -9.13623046875, -8.7314453125, -8.32666015625, -7.921875, -7.51708984375, -7.1123046875, -6.70751953125, -6.302734375, -5.89794921875, -5.4931640625, -5.08837890625, -4.68359375, -4.27880859375, -3.8740234375, -3.46923828125, -3.064453125, -2.65966796875, -2.2548828125, -1.85009765625, -1.4453125, -1.04052734375, -0.6357421875, -0.23095703125, 0.173828125, 0.57861328125, 0.9833984375, 1.38818359375, 1.79296875, 2.19775390625, 2.6025390625, 3.00732421875, 3.412109375, 3.81689453125, 4.2216796875, 4.62646484375, 5.03125, 5.43603515625, 5.8408203125, 6.24560546875, 6.650390625, 7.05517578125, 7.4599609375, 7.86474609375, 8.26953125, 8.67431640625, 9.0791015625, 9.48388671875, 9.888671875, 10.29345703125, 10.6982421875, 11.10302734375, 11.5078125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 7.0, 12.0, 22.0, 45.0, 87.0, 121.0, 153.0, 162.0, 155.0, 112.0, 70.0, 44.0, 19.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.078163146972656, -58.88465881347656, -57.69115447998047, -56.497650146484375, -55.30414581298828, -54.11064147949219, -52.917137145996094, -51.7236328125, -50.530128479003906, -49.33662414550781, -48.14311981201172, -46.949615478515625, -45.75611114501953, -44.56260681152344, -43.369102478027344, -42.17559814453125, -40.982093811035156, -39.78858947753906, -38.59508514404297, -37.401580810546875, -36.20807647705078, -35.01457214355469, -33.821067810058594, -32.6275634765625, -31.43405532836914, -30.240550994873047, -29.047046661376953, -27.85354232788086, -26.660037994384766, -25.466533660888672, -24.273029327392578, -23.079524993896484, -21.886022567749023, -20.69251823425293, -19.499013900756836, -18.305509567260742, -17.11200523376465, -15.918500900268555, -14.724995613098145, -13.53149127960205, -12.337986946105957, -11.144482612609863, -9.95097827911377, -8.75747299194336, -7.563969135284424, -6.37046480178833, -5.176959991455078, -3.9834556579589844, -2.7899513244628906, -1.5964468717575073, -0.402942419052124, 0.7905621528625488, 1.9840664863586426, 3.1775708198547363, 4.371075630187988, 5.564579963684082, 6.758084297180176, 7.9515886306762695, 9.145092964172363, 10.338598251342773, 11.532102584838867, 12.725606918334961, 13.919111251831055, 15.112615585327148, 16.306119918823242]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 9.0, 5.0, 16.0, 15.0, 10.0, 19.0, 30.0, 26.0, 24.0, 22.0, 31.0, 29.0, 31.0, 29.0, 28.0, 41.0, 44.0, 37.0, 40.0, 38.0, 31.0, 47.0, 45.0, 44.0, 26.0, 34.0, 34.0, 28.0, 23.0, 26.0, 20.0, 24.0, 13.0, 22.0, 13.0, 9.0, 7.0, 4.0, 6.0, 3.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.418663024902344, -13.909097671508789, -13.399532318115234, -12.889967918395996, -12.380402565002441, -11.870837211608887, -11.361272811889648, -10.851707458496094, -10.342142105102539, -9.832576751708984, -9.32301139831543, -8.813446998596191, -8.303881645202637, -7.794316291809082, -7.2847514152526855, -6.775186538696289, -6.265621185302734, -5.75605583190918, -5.246490955352783, -4.736926078796387, -4.227360725402832, -3.7177956104278564, -3.208230495452881, -2.6986653804779053, -2.1891002655029297, -1.679535150527954, -1.1699700355529785, -0.6604049205780029, -0.15083980560302734, 0.35872530937194824, 0.8682904243469238, 1.3778555393218994, 1.887420654296875, 2.3969857692718506, 2.906550884246826, 3.4161159992218018, 3.9256811141967773, 4.435246467590332, 4.9448113441467285, 5.454376220703125, 5.96394157409668, 6.473506927490234, 6.983071804046631, 7.492636680603027, 8.002202033996582, 8.511767387390137, 9.021331787109375, 9.53089714050293, 10.040462493896484, 10.550027847290039, 11.059593200683594, 11.569157600402832, 12.078722953796387, 12.588288307189941, 13.09785270690918, 13.607418060302734, 14.116983413696289, 14.626548767089844, 15.136114120483398, 15.645678520202637, 16.155242919921875, 16.66480827331543, 17.174373626708984, 17.68393898010254, 18.193504333496094]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 10.0, 14.0, 16.0, 16.0, 17.0, 28.0, 24.0, 21.0, 35.0, 30.0, 35.0, 33.0, 41.0, 39.0, 53.0, 44.0, 40.0, 40.0, 45.0, 47.0, 42.0, 35.0, 35.0, 44.0, 17.0, 23.0, 34.0, 28.0, 22.0, 22.0, 12.0, 12.0, 5.0, 7.0, 4.0, 6.0, 4.0, 5.0, 0.0, 5.0, 0.0, 2.0], "bins": [-2.90625, -2.830902099609375, -2.75555419921875, -2.680206298828125, -2.6048583984375, -2.529510498046875, -2.45416259765625, -2.378814697265625, -2.303466796875, -2.228118896484375, -2.15277099609375, -2.077423095703125, -2.0020751953125, -1.926727294921875, -1.85137939453125, -1.776031494140625, -1.70068359375, -1.625335693359375, -1.54998779296875, -1.474639892578125, -1.3992919921875, -1.323944091796875, -1.24859619140625, -1.173248291015625, -1.097900390625, -1.022552490234375, -0.94720458984375, -0.871856689453125, -0.7965087890625, -0.721160888671875, -0.64581298828125, -0.570465087890625, -0.4951171875, -0.419769287109375, -0.34442138671875, -0.269073486328125, -0.1937255859375, -0.118377685546875, -0.04302978515625, 0.032318115234375, 0.107666015625, 0.183013916015625, 0.25836181640625, 0.333709716796875, 0.4090576171875, 0.484405517578125, 0.55975341796875, 0.635101318359375, 0.71044921875, 0.785797119140625, 0.86114501953125, 0.936492919921875, 1.0118408203125, 1.087188720703125, 1.16253662109375, 1.237884521484375, 1.313232421875, 1.388580322265625, 1.46392822265625, 1.539276123046875, 1.6146240234375, 1.689971923828125, 1.76531982421875, 1.840667724609375, 1.916015625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 6.0, 2.0, 6.0, 5.0, 20.0, 19.0, 25.0, 45.0, 71.0, 97.0, 178.0, 253.0, 355.0, 652.0, 1098.0, 1661.0, 2754.0, 4503.0, 7442.0, 12504.0, 20758.0, 34415.0, 57068.0, 92102.0, 141241.0, 187423.0, 171236.0, 119669.0, 75981.0, 46457.0, 28430.0, 16503.0, 10121.0, 5989.0, 3611.0, 2220.0, 1351.0, 835.0, 535.0, 331.0, 199.0, 137.0, 86.0, 53.0, 37.0, 23.0, 17.0, 13.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.23486328125, -0.22770118713378906, -0.22053909301757812, -0.2133769989013672, -0.20621490478515625, -0.1990528106689453, -0.19189071655273438, -0.18472862243652344, -0.1775665283203125, -0.17040443420410156, -0.16324234008789062, -0.1560802459716797, -0.14891815185546875, -0.1417560577392578, -0.13459396362304688, -0.12743186950683594, -0.120269775390625, -0.11310768127441406, -0.10594558715820312, -0.09878349304199219, -0.09162139892578125, -0.08445930480957031, -0.07729721069335938, -0.07013511657714844, -0.0629730224609375, -0.05581092834472656, -0.048648834228515625, -0.04148674011230469, -0.03432464599609375, -0.027162551879882812, -0.020000457763671875, -0.012838363647460938, -0.00567626953125, 0.0014858245849609375, 0.008647918701171875, 0.015810012817382812, 0.02297210693359375, 0.030134201049804688, 0.037296295166015625, 0.04445838928222656, 0.0516204833984375, 0.05878257751464844, 0.06594467163085938, 0.07310676574707031, 0.08026885986328125, 0.08743095397949219, 0.09459304809570312, 0.10175514221191406, 0.108917236328125, 0.11607933044433594, 0.12324142456054688, 0.1304035186767578, 0.13756561279296875, 0.1447277069091797, 0.15188980102539062, 0.15905189514160156, 0.1662139892578125, 0.17337608337402344, 0.18053817749023438, 0.1877002716064453, 0.19486236572265625, 0.2020244598388672, 0.20918655395507812, 0.21634864807128906, 0.2235107421875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 6.0, 1.0, 5.0, 1.0, 5.0, 5.0, 3.0, 7.0, 9.0, 13.0, 12.0, 18.0, 17.0, 18.0, 26.0, 31.0, 26.0, 26.0, 29.0, 29.0, 42.0, 37.0, 37.0, 37.0, 27.0, 31.0, 32.0, 1060.0, 24.0, 39.0, 36.0, 29.0, 35.0, 30.0, 28.0, 19.0, 24.0, 29.0, 23.0, 17.0, 20.0, 16.0, 9.0, 14.0, 9.0, 8.0, 7.0, 13.0, 8.0, 3.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-1.9453125, -1.8903961181640625, -1.835479736328125, -1.7805633544921875, -1.72564697265625, -1.6707305908203125, -1.615814208984375, -1.5608978271484375, -1.5059814453125, -1.4510650634765625, -1.396148681640625, -1.3412322998046875, -1.28631591796875, -1.2313995361328125, -1.176483154296875, -1.1215667724609375, -1.066650390625, -1.0117340087890625, -0.956817626953125, -0.9019012451171875, -0.84698486328125, -0.7920684814453125, -0.737152099609375, -0.6822357177734375, -0.6273193359375, -0.5724029541015625, -0.517486572265625, -0.4625701904296875, -0.40765380859375, -0.3527374267578125, -0.297821044921875, -0.2429046630859375, -0.18798828125, -0.1330718994140625, -0.078155517578125, -0.0232391357421875, 0.03167724609375, 0.0865936279296875, 0.141510009765625, 0.1964263916015625, 0.2513427734375, 0.3062591552734375, 0.361175537109375, 0.4160919189453125, 0.47100830078125, 0.5259246826171875, 0.580841064453125, 0.6357574462890625, 0.690673828125, 0.7455902099609375, 0.800506591796875, 0.8554229736328125, 0.91033935546875, 0.9652557373046875, 1.020172119140625, 1.0750885009765625, 1.1300048828125, 1.1849212646484375, 1.239837646484375, 1.2947540283203125, 1.34967041015625, 1.4045867919921875, 1.459503173828125, 1.5144195556640625, 1.5693359375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 10.0, 11.0, 13.0, 20.0, 26.0, 37.0, 42.0, 78.0, 119.0, 174.0, 267.0, 435.0, 649.0, 1083.0, 1643.0, 2743.0, 4458.0, 7409.0, 11763.0, 18799.0, 30365.0, 48268.0, 75304.0, 116203.0, 185040.0, 1197203.0, 139172.0, 94907.0, 60457.0, 38192.0, 23498.0, 14646.0, 9363.0, 5545.0, 3413.0, 2126.0, 1392.0, 799.0, 526.0, 318.0, 209.0, 141.0, 84.0, 65.0, 45.0, 26.0, 19.0, 15.0, 3.0, 5.0, 4.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.12005615234375, -0.11608600616455078, -0.11211585998535156, -0.10814571380615234, -0.10417556762695312, -0.1002054214477539, -0.09623527526855469, -0.09226512908935547, -0.08829498291015625, -0.08432483673095703, -0.08035469055175781, -0.0763845443725586, -0.07241439819335938, -0.06844425201416016, -0.06447410583496094, -0.06050395965576172, -0.0565338134765625, -0.05256366729736328, -0.04859352111816406, -0.044623374938964844, -0.040653228759765625, -0.036683082580566406, -0.03271293640136719, -0.02874279022216797, -0.02477264404296875, -0.02080249786376953, -0.016832351684570312, -0.012862205505371094, -0.008892059326171875, -0.004921913146972656, -0.0009517669677734375, 0.0030183792114257812, 0.006988525390625, 0.010958671569824219, 0.014928817749023438, 0.018898963928222656, 0.022869110107421875, 0.026839256286621094, 0.030809402465820312, 0.03477954864501953, 0.03874969482421875, 0.04271984100341797, 0.04668998718261719, 0.050660133361816406, 0.054630279541015625, 0.058600425720214844, 0.06257057189941406, 0.06654071807861328, 0.0705108642578125, 0.07448101043701172, 0.07845115661621094, 0.08242130279541016, 0.08639144897460938, 0.0903615951538086, 0.09433174133300781, 0.09830188751220703, 0.10227203369140625, 0.10624217987060547, 0.11021232604980469, 0.1141824722290039, 0.11815261840820312, 0.12212276458740234, 0.12609291076660156, 0.13006305694580078, 0.134033203125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 5.0, 10.0, 14.0, 17.0, 15.0, 21.0, 19.0, 42.0, 43.0, 38.0, 48.0, 47.0, 94.0, 99.0, 89.0, 86.0, 49.0, 43.0, 32.0, 33.0, 23.0, 22.0, 22.0, 16.0, 12.0, 10.0, 9.0, 9.0, 4.0, 9.0, 1.0, 3.0, 1.0, 6.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01479339599609375, -0.014354825019836426, -0.013916254043579102, -0.013477683067321777, -0.013039112091064453, -0.012600541114807129, -0.012161970138549805, -0.01172339916229248, -0.011284828186035156, -0.010846257209777832, -0.010407686233520508, -0.009969115257263184, -0.00953054428100586, -0.009091973304748535, -0.008653402328491211, -0.008214831352233887, -0.0077762603759765625, -0.007337689399719238, -0.006899118423461914, -0.00646054744720459, -0.006021976470947266, -0.005583405494689941, -0.005144834518432617, -0.004706263542175293, -0.004267692565917969, -0.0038291215896606445, -0.0033905506134033203, -0.002951979637145996, -0.002513408660888672, -0.0020748376846313477, -0.0016362667083740234, -0.0011976957321166992, -0.000759124755859375, -0.0003205537796020508, 0.00011801719665527344, 0.0005565881729125977, 0.0009951591491699219, 0.001433730125427246, 0.0018723011016845703, 0.0023108720779418945, 0.0027494430541992188, 0.003188014030456543, 0.003626585006713867, 0.004065155982971191, 0.004503726959228516, 0.00494229793548584, 0.005380868911743164, 0.005819439888000488, 0.0062580108642578125, 0.006696581840515137, 0.007135152816772461, 0.007573723793029785, 0.00801229476928711, 0.008450865745544434, 0.008889436721801758, 0.009328007698059082, 0.009766578674316406, 0.01020514965057373, 0.010643720626831055, 0.011082291603088379, 0.011520862579345703, 0.011959433555603027, 0.012398004531860352, 0.012836575508117676, 0.013275146484375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 2.0, 3.0, 4.0, 4.0, 0.0, 10.0, 6.0, 10.0, 15.0, 10.0, 16.0, 22.0, 33.0, 34.0, 66.0, 105.0, 188.0, 374.0, 1309.0, 25617.0, 996411.0, 22174.0, 1237.0, 368.0, 181.0, 122.0, 76.0, 44.0, 26.0, 25.0, 17.0, 9.0, 13.0, 8.0, 5.0, 5.0, 4.0, 3.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2626953125, -0.254608154296875, -0.24652099609375, -0.238433837890625, -0.2303466796875, -0.222259521484375, -0.21417236328125, -0.206085205078125, -0.197998046875, -0.189910888671875, -0.18182373046875, -0.173736572265625, -0.1656494140625, -0.157562255859375, -0.14947509765625, -0.141387939453125, -0.13330078125, -0.125213623046875, -0.11712646484375, -0.109039306640625, -0.1009521484375, -0.092864990234375, -0.08477783203125, -0.076690673828125, -0.068603515625, -0.060516357421875, -0.05242919921875, -0.044342041015625, -0.0362548828125, -0.028167724609375, -0.02008056640625, -0.011993408203125, -0.00390625, 0.004180908203125, 0.01226806640625, 0.020355224609375, 0.0284423828125, 0.036529541015625, 0.04461669921875, 0.052703857421875, 0.060791015625, 0.068878173828125, 0.07696533203125, 0.085052490234375, 0.0931396484375, 0.101226806640625, 0.10931396484375, 0.117401123046875, 0.12548828125, 0.133575439453125, 0.14166259765625, 0.149749755859375, 0.1578369140625, 0.165924072265625, 0.17401123046875, 0.182098388671875, 0.190185546875, 0.198272705078125, 0.20635986328125, 0.214447021484375, 0.2225341796875, 0.230621337890625, 0.23870849609375, 0.246795654296875, 0.2548828125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 23.0, 22.0, 43.0, 71.0, 198.0, 353.0, 142.0, 77.0, 40.0, 16.0, 10.0, 8.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06489820033311844, -0.06136474385857582, -0.0578312873840332, -0.054297834634780884, -0.05076437443494797, -0.04723092168569565, -0.04369746521115303, -0.04016400873661041, -0.036630552262067795, -0.03309709578752518, -0.02956363931298256, -0.02603018470108509, -0.022496728226542473, -0.018963271751999855, -0.015429817140102386, -0.011896360665559769, -0.008362904191017151, -0.00482944818213582, -0.00129599217325449, 0.0022374633699655533, 0.005770919844508171, 0.009304376319050789, 0.012837830930948257, 0.016371287405490875, 0.019904743880033493, 0.02343820035457611, 0.02697165682911873, 0.030505111441016197, 0.034038566052913666, 0.03757202625274658, 0.0411054790019989, 0.04463893547654152, 0.048172399401664734, 0.05170585587620735, 0.05523931235074997, 0.05877276510000229, 0.062306225299835205, 0.06583967804908752, 0.06937313079833984, 0.07290659099817276, 0.07644005119800568, 0.079973503947258, 0.08350696414709091, 0.08704041689634323, 0.09057387709617615, 0.09410732984542847, 0.09764078259468079, 0.1011742427945137, 0.10470769554376602, 0.10824114829301834, 0.11177460849285126, 0.11530806124210358, 0.11884152144193649, 0.12237497419118881, 0.12590843439102173, 0.12944188714027405, 0.13297533988952637, 0.1365087926387787, 0.140042245388031, 0.14357571303844452, 0.14710916578769684, 0.15064261853694916, 0.15417607128620148, 0.157709538936615, 0.1612429916858673]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 4.0, 6.0, 14.0, 10.0, 18.0, 27.0, 22.0, 25.0, 31.0, 29.0, 33.0, 30.0, 47.0, 35.0, 37.0, 35.0, 25.0, 44.0, 47.0, 36.0, 37.0, 47.0, 37.0, 34.0, 35.0, 26.0, 34.0, 31.0, 30.0, 21.0, 22.0, 17.0, 17.0, 16.0, 12.0, 5.0, 6.0, 3.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.044296205043792725, -0.04289322346448898, -0.04149023815989494, -0.0400872528553009, -0.03868427127599716, -0.03728128969669342, -0.03587830439209938, -0.03447531908750534, -0.0330723375082016, -0.03166935592889786, -0.030266370624303818, -0.028863387182354927, -0.027460403740406036, -0.026057420298457146, -0.024654436856508255, -0.023251453414559364, -0.021848469972610474, -0.020445486530661583, -0.019042503088712692, -0.0176395196467638, -0.01623653620481491, -0.01483355276286602, -0.01343056932091713, -0.012027585878968239, -0.010624602437019348, -0.009221618995070457, -0.007818635553121567, -0.006415652111172676, -0.005012668669223785, -0.0036096852272748947, -0.002206701785326004, -0.0008037183433771133, 0.0005992650985717773, 0.002002248540520668, 0.0034052319824695587, 0.004808215424418449, 0.00621119886636734, 0.007614182308316231, 0.009017165750265121, 0.010420149192214012, 0.011823132634162903, 0.013226116076111794, 0.014629099518060684, 0.016032082960009575, 0.017435066401958466, 0.018838049843907356, 0.020241033285856247, 0.021644016727805138, 0.02304700016975403, 0.02444998361170292, 0.02585296705365181, 0.0272559504956007, 0.02865893393754959, 0.030061917379498482, 0.03146490082144737, 0.03286788612604141, 0.034270867705345154, 0.035673849284648895, 0.037076834589242935, 0.038479819893836975, 0.03988280147314072, 0.04128578305244446, 0.0426887683570385, 0.04409175366163254, 0.04549473524093628]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 5.0, 4.0, 5.0, 9.0, 10.0, 14.0, 16.0, 16.0, 17.0, 28.0, 24.0, 21.0, 35.0, 30.0, 34.0, 33.0, 42.0, 39.0, 53.0, 44.0, 40.0, 41.0, 44.0, 47.0, 42.0, 34.0, 36.0, 44.0, 18.0, 22.0, 34.0, 28.0, 22.0, 22.0, 12.0, 12.0, 5.0, 7.0, 4.0, 6.0, 4.0, 5.0, 0.0, 5.0, 0.0, 2.0], "bins": [-2.908203125, -2.8328094482421875, -2.757415771484375, -2.6820220947265625, -2.60662841796875, -2.5312347412109375, -2.455841064453125, -2.3804473876953125, -2.3050537109375, -2.2296600341796875, -2.154266357421875, -2.0788726806640625, -2.00347900390625, -1.9280853271484375, -1.852691650390625, -1.7772979736328125, -1.701904296875, -1.6265106201171875, -1.551116943359375, -1.4757232666015625, -1.40032958984375, -1.3249359130859375, -1.249542236328125, -1.1741485595703125, -1.0987548828125, -1.0233612060546875, -0.947967529296875, -0.8725738525390625, -0.79718017578125, -0.7217864990234375, -0.646392822265625, -0.5709991455078125, -0.49560546875, -0.4202117919921875, -0.344818115234375, -0.2694244384765625, -0.19403076171875, -0.1186370849609375, -0.043243408203125, 0.0321502685546875, 0.1075439453125, 0.1829376220703125, 0.258331298828125, 0.3337249755859375, 0.40911865234375, 0.4845123291015625, 0.559906005859375, 0.6352996826171875, 0.710693359375, 0.7860870361328125, 0.861480712890625, 0.9368743896484375, 1.01226806640625, 1.0876617431640625, 1.163055419921875, 1.2384490966796875, 1.3138427734375, 1.3892364501953125, 1.464630126953125, 1.5400238037109375, 1.61541748046875, 1.6908111572265625, 1.766204833984375, 1.8415985107421875, 1.9169921875]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 14.0, 18.0, 34.0, 54.0, 87.0, 144.0, 273.0, 426.0, 902.0, 1693.0, 3323.0, 7091.0, 15766.0, 36530.0, 85525.0, 211046.0, 358496.0, 190139.0, 76983.0, 32684.0, 14225.0, 6548.0, 3138.0, 1568.0, 791.0, 439.0, 253.0, 142.0, 96.0, 40.0, 41.0, 16.0, 12.0, 11.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.43359375, -2.34490966796875, -2.2562255859375, -2.16754150390625, -2.078857421875, -1.99017333984375, -1.9014892578125, -1.81280517578125, -1.72412109375, -1.63543701171875, -1.5467529296875, -1.45806884765625, -1.369384765625, -1.28070068359375, -1.1920166015625, -1.10333251953125, -1.0146484375, -0.92596435546875, -0.8372802734375, -0.74859619140625, -0.659912109375, -0.57122802734375, -0.4825439453125, -0.39385986328125, -0.30517578125, -0.21649169921875, -0.1278076171875, -0.03912353515625, 0.049560546875, 0.13824462890625, 0.2269287109375, 0.31561279296875, 0.404296875, 0.49298095703125, 0.5816650390625, 0.67034912109375, 0.759033203125, 0.84771728515625, 0.9364013671875, 1.02508544921875, 1.11376953125, 1.20245361328125, 1.2911376953125, 1.37982177734375, 1.468505859375, 1.55718994140625, 1.6458740234375, 1.73455810546875, 1.8232421875, 1.91192626953125, 2.0006103515625, 2.08929443359375, 2.177978515625, 2.26666259765625, 2.3553466796875, 2.44403076171875, 2.53271484375, 2.62139892578125, 2.7100830078125, 2.79876708984375, 2.887451171875, 2.97613525390625, 3.0648193359375, 3.15350341796875, 3.2421875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 12.0, 7.0, 8.0, 10.0, 14.0, 28.0, 18.0, 25.0, 31.0, 20.0, 43.0, 38.0, 43.0, 48.0, 80.0, 138.0, 285.0, 1414.0, 224.0, 131.0, 71.0, 45.0, 49.0, 34.0, 38.0, 31.0, 17.0, 25.0, 20.0, 14.0, 18.0, 15.0, 16.0, 16.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-8.5703125, -8.32080078125, -8.0712890625, -7.82177734375, -7.572265625, -7.32275390625, -7.0732421875, -6.82373046875, -6.57421875, -6.32470703125, -6.0751953125, -5.82568359375, -5.576171875, -5.32666015625, -5.0771484375, -4.82763671875, -4.578125, -4.32861328125, -4.0791015625, -3.82958984375, -3.580078125, -3.33056640625, -3.0810546875, -2.83154296875, -2.58203125, -2.33251953125, -2.0830078125, -1.83349609375, -1.583984375, -1.33447265625, -1.0849609375, -0.83544921875, -0.5859375, -0.33642578125, -0.0869140625, 0.16259765625, 0.412109375, 0.66162109375, 0.9111328125, 1.16064453125, 1.41015625, 1.65966796875, 1.9091796875, 2.15869140625, 2.408203125, 2.65771484375, 2.9072265625, 3.15673828125, 3.40625, 3.65576171875, 3.9052734375, 4.15478515625, 4.404296875, 4.65380859375, 4.9033203125, 5.15283203125, 5.40234375, 5.65185546875, 5.9013671875, 6.15087890625, 6.400390625, 6.64990234375, 6.8994140625, 7.14892578125, 7.3984375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 2.0, 9.0, 3.0, 6.0, 7.0, 12.0, 11.0, 23.0, 28.0, 50.0, 68.0, 84.0, 108.0, 167.0, 256.0, 379.0, 723.0, 5558.0, 2113038.0, 1019400.0, 3974.0, 642.0, 369.0, 225.0, 161.0, 109.0, 98.0, 64.0, 38.0, 23.0, 23.0, 13.0, 11.0, 12.0, 1.0, 8.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-20.65625, -19.966552734375, -19.27685546875, -18.587158203125, -17.8974609375, -17.207763671875, -16.51806640625, -15.828369140625, -15.138671875, -14.448974609375, -13.75927734375, -13.069580078125, -12.3798828125, -11.690185546875, -11.00048828125, -10.310791015625, -9.62109375, -8.931396484375, -8.24169921875, -7.552001953125, -6.8623046875, -6.172607421875, -5.48291015625, -4.793212890625, -4.103515625, -3.413818359375, -2.72412109375, -2.034423828125, -1.3447265625, -0.655029296875, 0.03466796875, 0.724365234375, 1.4140625, 2.103759765625, 2.79345703125, 3.483154296875, 4.1728515625, 4.862548828125, 5.55224609375, 6.241943359375, 6.931640625, 7.621337890625, 8.31103515625, 9.000732421875, 9.6904296875, 10.380126953125, 11.06982421875, 11.759521484375, 12.44921875, 13.138916015625, 13.82861328125, 14.518310546875, 15.2080078125, 15.897705078125, 16.58740234375, 17.277099609375, 17.966796875, 18.656494140625, 19.34619140625, 20.035888671875, 20.7255859375, 21.415283203125, 22.10498046875, 22.794677734375, 23.484375]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 11.0, 39.0, 87.0, 188.0, 256.0, 229.0, 145.0, 40.0, 11.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.544193267822266, -5.57241678237915, -4.600640296936035, -3.6288633346557617, -2.6570868492126465, -1.6853103637695312, -0.7135334014892578, 0.2582430839538574, 1.2300195693969727, 2.201796054840088, 3.1735727787017822, 4.145349502563477, 5.117125988006592, 6.088902473449707, 7.0606794357299805, 8.032455444335938, 9.004232406616211, 9.976009368896484, 10.947785377502441, 11.919562339782715, 12.891338348388672, 13.863115310668945, 14.834892272949219, 15.806669235229492, 16.778446197509766, 17.75022315979004, 18.722000122070312, 19.693775177001953, 20.665552139282227, 21.6373291015625, 22.609106063842773, 23.580883026123047, 24.552658081054688, 25.52443504333496, 26.496212005615234, 27.467987060546875, 28.43976402282715, 29.411540985107422, 30.383317947387695, 31.35509490966797, 32.32686996459961, 33.29864501953125, 34.270423889160156, 35.2421989440918, 36.2139778137207, 37.185752868652344, 38.15753173828125, 39.12930679321289, 40.10108184814453, 41.07285690307617, 42.04463577270508, 43.01641082763672, 43.988189697265625, 44.959964752197266, 45.931739807128906, 46.90351867675781, 47.87529754638672, 48.84707260131836, 49.818851470947266, 50.790626525878906, 51.76240539550781, 52.73418045043945, 53.705955505371094, 54.677734375, 55.64950942993164]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 6.0, 10.0, 4.0, 3.0, 7.0, 6.0, 7.0, 16.0, 14.0, 15.0, 16.0, 24.0, 25.0, 22.0, 20.0, 23.0, 35.0, 26.0, 36.0, 35.0, 40.0, 45.0, 35.0, 48.0, 33.0, 31.0, 34.0, 45.0, 35.0, 38.0, 24.0, 32.0, 25.0, 25.0, 24.0, 17.0, 15.0, 20.0, 18.0, 15.0, 6.0, 10.0, 8.0, 4.0, 12.0, 9.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.562644958496094, -14.989542007446289, -14.4164400100708, -13.843338012695312, -13.270235061645508, -12.697132110595703, -12.124030113220215, -11.550928115844727, -10.977825164794922, -10.404722213745117, -9.831620216369629, -9.25851821899414, -8.685415267944336, -8.112312316894531, -7.539210319519043, -6.9661078453063965, -6.39300537109375, -5.8199028968811035, -5.246800422668457, -4.6736979484558105, -4.100595474243164, -3.5274930000305176, -2.954390525817871, -2.3812880516052246, -1.8081855773925781, -1.2350831031799316, -0.6619806289672852, -0.08887815475463867, 0.4842243194580078, 1.0573267936706543, 1.6304292678833008, 2.2035317420959473, 2.7766342163085938, 3.3497366905212402, 3.9228391647338867, 4.495941638946533, 5.06904411315918, 5.642146587371826, 6.215249061584473, 6.788351535797119, 7.361454010009766, 7.934556484222412, 8.507658958435059, 9.080760955810547, 9.653863906860352, 10.226966857910156, 10.800068855285645, 11.373170852661133, 11.946273803710938, 12.519376754760742, 13.09247875213623, 13.665580749511719, 14.238683700561523, 14.811786651611328, 15.384888648986816, 15.957990646362305, 16.53109359741211, 17.104196548461914, 17.67729949951172, 18.25040054321289, 18.823503494262695, 19.3966064453125, 19.969707489013672, 20.542810440063477, 21.11591339111328]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 10.0, 7.0, 10.0, 13.0, 16.0, 17.0, 19.0, 23.0, 25.0, 29.0, 41.0, 26.0, 39.0, 31.0, 37.0, 43.0, 54.0, 36.0, 47.0, 41.0, 36.0, 44.0, 56.0, 40.0, 39.0, 23.0, 35.0, 32.0, 17.0, 20.0, 23.0, 19.0, 15.0, 7.0, 3.0, 11.0, 6.0, 3.0, 7.0, 4.0, 1.0, 1.0, 2.0, 1.0], "bins": [-3.232421875, -3.14813232421875, -3.0638427734375, -2.97955322265625, -2.895263671875, -2.81097412109375, -2.7266845703125, -2.64239501953125, -2.55810546875, -2.47381591796875, -2.3895263671875, -2.30523681640625, -2.220947265625, -2.13665771484375, -2.0523681640625, -1.96807861328125, -1.8837890625, -1.79949951171875, -1.7152099609375, -1.63092041015625, -1.546630859375, -1.46234130859375, -1.3780517578125, -1.29376220703125, -1.20947265625, -1.12518310546875, -1.0408935546875, -0.95660400390625, -0.872314453125, -0.78802490234375, -0.7037353515625, -0.61944580078125, -0.53515625, -0.45086669921875, -0.3665771484375, -0.28228759765625, -0.197998046875, -0.11370849609375, -0.0294189453125, 0.05487060546875, 0.13916015625, 0.22344970703125, 0.3077392578125, 0.39202880859375, 0.476318359375, 0.56060791015625, 0.6448974609375, 0.72918701171875, 0.8134765625, 0.89776611328125, 0.9820556640625, 1.06634521484375, 1.150634765625, 1.23492431640625, 1.3192138671875, 1.40350341796875, 1.48779296875, 1.57208251953125, 1.6563720703125, 1.74066162109375, 1.824951171875, 1.90924072265625, 1.9935302734375, 2.07781982421875, 2.162109375]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 7.0, 5.0, 3.0, 7.0, 15.0, 16.0, 34.0, 29.0, 64.0, 81.0, 139.0, 232.0, 404.0, 868.0, 2173.0, 6860.0, 24638.0, 99373.0, 411844.0, 1353464.0, 1566847.0, 545344.0, 134456.0, 33441.0, 8982.0, 2842.0, 974.0, 458.0, 214.0, 151.0, 99.0, 65.0, 55.0, 25.0, 21.0, 18.0, 18.0, 5.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.17578125, -4.06011962890625, -3.9444580078125, -3.82879638671875, -3.713134765625, -3.59747314453125, -3.4818115234375, -3.36614990234375, -3.25048828125, -3.13482666015625, -3.0191650390625, -2.90350341796875, -2.787841796875, -2.67218017578125, -2.5565185546875, -2.44085693359375, -2.3251953125, -2.20953369140625, -2.0938720703125, -1.97821044921875, -1.862548828125, -1.74688720703125, -1.6312255859375, -1.51556396484375, -1.39990234375, -1.28424072265625, -1.1685791015625, -1.05291748046875, -0.937255859375, -0.82159423828125, -0.7059326171875, -0.59027099609375, -0.474609375, -0.35894775390625, -0.2432861328125, -0.12762451171875, -0.011962890625, 0.10369873046875, 0.2193603515625, 0.33502197265625, 0.45068359375, 0.56634521484375, 0.6820068359375, 0.79766845703125, 0.913330078125, 1.02899169921875, 1.1446533203125, 1.26031494140625, 1.3759765625, 1.49163818359375, 1.6072998046875, 1.72296142578125, 1.838623046875, 1.95428466796875, 2.0699462890625, 2.18560791015625, 2.30126953125, 2.41693115234375, 2.5325927734375, 2.64825439453125, 2.763916015625, 2.87957763671875, 2.9952392578125, 3.11090087890625, 3.2265625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 5.0, 2.0, 7.0, 10.0, 21.0, 25.0, 33.0, 29.0, 56.0, 66.0, 77.0, 106.0, 140.0, 164.0, 240.0, 298.0, 381.0, 401.0, 402.0, 323.0, 305.0, 232.0, 191.0, 139.0, 109.0, 72.0, 64.0, 47.0, 44.0, 22.0, 17.0, 22.0, 7.0, 6.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.640625, -3.4996337890625, -3.358642578125, -3.2176513671875, -3.07666015625, -2.9356689453125, -2.794677734375, -2.6536865234375, -2.5126953125, -2.3717041015625, -2.230712890625, -2.0897216796875, -1.94873046875, -1.8077392578125, -1.666748046875, -1.5257568359375, -1.384765625, -1.2437744140625, -1.102783203125, -0.9617919921875, -0.82080078125, -0.6798095703125, -0.538818359375, -0.3978271484375, -0.2568359375, -0.1158447265625, 0.025146484375, 0.1661376953125, 0.30712890625, 0.4481201171875, 0.589111328125, 0.7301025390625, 0.87109375, 1.0120849609375, 1.153076171875, 1.2940673828125, 1.43505859375, 1.5760498046875, 1.717041015625, 1.8580322265625, 1.9990234375, 2.1400146484375, 2.281005859375, 2.4219970703125, 2.56298828125, 2.7039794921875, 2.844970703125, 2.9859619140625, 3.126953125, 3.2679443359375, 3.408935546875, 3.5499267578125, 3.69091796875, 3.8319091796875, 3.972900390625, 4.1138916015625, 4.2548828125, 4.3958740234375, 4.536865234375, 4.6778564453125, 4.81884765625, 4.9598388671875, 5.100830078125, 5.2418212890625, 5.3828125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 3.0, 5.0, 6.0, 10.0, 16.0, 20.0, 26.0, 48.0, 65.0, 83.0, 99.0, 145.0, 213.0, 338.0, 577.0, 3529.0, 157739.0, 3536212.0, 484894.0, 8406.0, 732.0, 343.0, 228.0, 162.0, 99.0, 82.0, 51.0, 44.0, 38.0, 27.0, 16.0, 11.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.640625, -17.1590576171875, -16.677490234375, -16.1959228515625, -15.71435546875, -15.2327880859375, -14.751220703125, -14.2696533203125, -13.7880859375, -13.3065185546875, -12.824951171875, -12.3433837890625, -11.86181640625, -11.3802490234375, -10.898681640625, -10.4171142578125, -9.935546875, -9.4539794921875, -8.972412109375, -8.4908447265625, -8.00927734375, -7.5277099609375, -7.046142578125, -6.5645751953125, -6.0830078125, -5.6014404296875, -5.119873046875, -4.6383056640625, -4.15673828125, -3.6751708984375, -3.193603515625, -2.7120361328125, -2.23046875, -1.7489013671875, -1.267333984375, -0.7857666015625, -0.30419921875, 0.1773681640625, 0.658935546875, 1.1405029296875, 1.6220703125, 2.1036376953125, 2.585205078125, 3.0667724609375, 3.54833984375, 4.0299072265625, 4.511474609375, 4.9930419921875, 5.474609375, 5.9561767578125, 6.437744140625, 6.9193115234375, 7.40087890625, 7.8824462890625, 8.364013671875, 8.8455810546875, 9.3271484375, 9.8087158203125, 10.290283203125, 10.7718505859375, 11.25341796875, 11.7349853515625, 12.216552734375, 12.6981201171875, 13.1796875]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 10.0, 3.0, 16.0, 21.0, 28.0, 33.0, 47.0, 76.0, 85.0, 105.0, 106.0, 108.0, 76.0, 86.0, 61.0, 48.0, 40.0, 28.0, 25.0, 6.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-31.58955955505371, -30.914949417114258, -30.240339279174805, -29.56572914123535, -28.8911190032959, -28.216506958007812, -27.54189682006836, -26.867286682128906, -26.192676544189453, -25.51806640625, -24.843456268310547, -24.168846130371094, -23.49423599243164, -22.819625854492188, -22.145015716552734, -21.47040367126465, -20.795795440673828, -20.121185302734375, -19.446575164794922, -18.77196502685547, -18.097354888916016, -17.422744750976562, -16.74813461303711, -16.073522567749023, -15.39891242980957, -14.724302291870117, -14.049692153930664, -13.375082015991211, -12.700470924377441, -12.025860786437988, -11.351250648498535, -10.676639556884766, -10.002030372619629, -9.327420234680176, -8.652810096740723, -7.978199481964111, -7.3035888671875, -6.628978729248047, -5.954368591308594, -5.279757976531982, -4.605147838592529, -3.930537462234497, -3.255927085876465, -2.5813169479370117, -1.9067065715789795, -1.2320961952209473, -0.5574860572814941, 0.11712455749511719, 0.7917346954345703, 1.4663450717926025, 2.1409554481506348, 2.815565586090088, 3.49017596244812, 4.164786338806152, 4.8393964767456055, 5.514007091522217, 6.18861722946167, 6.863227367401123, 7.537837982177734, 8.212448120117188, 8.88705825805664, 9.561668395996094, 10.236278533935547, 10.910889625549316, 11.58549976348877]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 0.0, 6.0, 7.0, 7.0, 8.0, 13.0, 7.0, 15.0, 16.0, 22.0, 25.0, 19.0, 17.0, 23.0, 19.0, 33.0, 34.0, 34.0, 36.0, 31.0, 41.0, 39.0, 44.0, 51.0, 40.0, 44.0, 42.0, 35.0, 34.0, 33.0, 35.0, 25.0, 21.0, 23.0, 25.0, 20.0, 12.0, 13.0, 19.0, 9.0, 9.0, 2.0, 6.0, 6.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.154518127441406, -16.663501739501953, -16.1724853515625, -15.681469917297363, -15.190454483032227, -14.699438095092773, -14.20842170715332, -13.717405319213867, -13.22638988494873, -12.735373497009277, -12.24435806274414, -11.753341674804688, -11.262325286865234, -10.771309852600098, -10.280293464660645, -9.789278030395508, -9.298261642456055, -8.807245254516602, -8.316229820251465, -7.825213432312012, -7.334197521209717, -6.843181610107422, -6.352165222167969, -5.861149311065674, -5.370133399963379, -4.879117488861084, -4.388101577758789, -3.897085189819336, -3.406069278717041, -2.915053367614746, -2.424037218093872, -1.933021068572998, -1.4420051574707031, -0.9509891271591187, -0.4599730968475342, 0.031042933464050293, 0.5220589637756348, 1.0130748748779297, 1.5040910243988037, 1.9951071739196777, 2.4861230850219727, 2.9771389961242676, 3.4681551456451416, 3.9591712951660156, 4.4501872062683105, 4.9412031173706055, 5.432219505310059, 5.9232354164123535, 6.414251327514648, 6.905267238616943, 7.396283149719238, 7.887299537658691, 8.378314971923828, 8.869331359863281, 9.360347747802734, 9.851364135742188, 10.342379570007324, 10.833395957946777, 11.324411392211914, 11.815427780151367, 12.30644416809082, 12.797459602355957, 13.28847599029541, 13.779491424560547, 14.2705078125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 13.0, 14.0, 21.0, 20.0, 9.0, 19.0, 30.0, 34.0, 48.0, 37.0, 36.0, 33.0, 37.0, 35.0, 38.0, 49.0, 45.0, 51.0, 47.0, 41.0, 46.0, 39.0, 30.0, 30.0, 31.0, 26.0, 24.0, 14.0, 23.0, 16.0, 11.0, 15.0, 6.0, 2.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.037109375, -2.956939697265625, -2.87677001953125, -2.796600341796875, -2.7164306640625, -2.636260986328125, -2.55609130859375, -2.475921630859375, -2.395751953125, -2.315582275390625, -2.23541259765625, -2.155242919921875, -2.0750732421875, -1.994903564453125, -1.91473388671875, -1.834564208984375, -1.75439453125, -1.674224853515625, -1.59405517578125, -1.513885498046875, -1.4337158203125, -1.353546142578125, -1.27337646484375, -1.193206787109375, -1.113037109375, -1.032867431640625, -0.95269775390625, -0.872528076171875, -0.7923583984375, -0.712188720703125, -0.63201904296875, -0.551849365234375, -0.4716796875, -0.391510009765625, -0.31134033203125, -0.231170654296875, -0.1510009765625, -0.070831298828125, 0.00933837890625, 0.089508056640625, 0.169677734375, 0.249847412109375, 0.33001708984375, 0.410186767578125, 0.4903564453125, 0.570526123046875, 0.65069580078125, 0.730865478515625, 0.81103515625, 0.891204833984375, 0.97137451171875, 1.051544189453125, 1.1317138671875, 1.211883544921875, 1.29205322265625, 1.372222900390625, 1.452392578125, 1.532562255859375, 1.61273193359375, 1.692901611328125, 1.7730712890625, 1.853240966796875, 1.93341064453125, 2.013580322265625, 2.09375]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 3.0, 4.0, 7.0, 11.0, 8.0, 9.0, 16.0, 25.0, 30.0, 52.0, 74.0, 158.0, 245.0, 471.0, 813.0, 1519.0, 2795.0, 5341.0, 10052.0, 19052.0, 35782.0, 68127.0, 122117.0, 197718.0, 226378.0, 159398.0, 91847.0, 50187.0, 26585.0, 13970.0, 7214.0, 3840.0, 2160.0, 1100.0, 585.0, 346.0, 216.0, 107.0, 61.0, 27.0, 30.0, 20.0, 15.0, 13.0, 10.0, 4.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.281494140625, -0.2724876403808594, -0.26348114013671875, -0.2544746398925781, -0.2454681396484375, -0.23646163940429688, -0.22745513916015625, -0.21844863891601562, -0.209442138671875, -0.20043563842773438, -0.19142913818359375, -0.18242263793945312, -0.1734161376953125, -0.16440963745117188, -0.15540313720703125, -0.14639663696289062, -0.13739013671875, -0.12838363647460938, -0.11937713623046875, -0.11037063598632812, -0.1013641357421875, -0.09235763549804688, -0.08335113525390625, -0.07434463500976562, -0.065338134765625, -0.056331634521484375, -0.04732513427734375, -0.038318634033203125, -0.0293121337890625, -0.020305633544921875, -0.01129913330078125, -0.002292633056640625, 0.0067138671875, 0.015720367431640625, 0.02472686767578125, 0.033733367919921875, 0.0427398681640625, 0.051746368408203125, 0.06075286865234375, 0.06975936889648438, 0.078765869140625, 0.08777236938476562, 0.09677886962890625, 0.10578536987304688, 0.1147918701171875, 0.12379837036132812, 0.13280487060546875, 0.14181137084960938, 0.15081787109375, 0.15982437133789062, 0.16883087158203125, 0.17783737182617188, 0.1868438720703125, 0.19585037231445312, 0.20485687255859375, 0.21386337280273438, 0.222869873046875, 0.23187637329101562, 0.24088287353515625, 0.24988937377929688, 0.2588958740234375, 0.2679023742675781, 0.27690887451171875, 0.2859153747558594, 0.294921875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 12.0, 7.0, 8.0, 3.0, 13.0, 7.0, 9.0, 13.0, 14.0, 19.0, 21.0, 22.0, 31.0, 25.0, 39.0, 35.0, 32.0, 37.0, 48.0, 43.0, 30.0, 1067.0, 44.0, 38.0, 30.0, 36.0, 52.0, 31.0, 34.0, 28.0, 28.0, 25.0, 18.0, 19.0, 15.0, 24.0, 18.0, 6.0, 5.0, 7.0, 4.0, 4.0, 6.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-1.861328125, -1.8037261962890625, -1.746124267578125, -1.6885223388671875, -1.63092041015625, -1.5733184814453125, -1.515716552734375, -1.4581146240234375, -1.4005126953125, -1.3429107666015625, -1.285308837890625, -1.2277069091796875, -1.17010498046875, -1.1125030517578125, -1.054901123046875, -0.9972991943359375, -0.939697265625, -0.8820953369140625, -0.824493408203125, -0.7668914794921875, -0.70928955078125, -0.6516876220703125, -0.594085693359375, -0.5364837646484375, -0.4788818359375, -0.4212799072265625, -0.363677978515625, -0.3060760498046875, -0.24847412109375, -0.1908721923828125, -0.133270263671875, -0.0756683349609375, -0.01806640625, 0.0395355224609375, 0.097137451171875, 0.1547393798828125, 0.21234130859375, 0.2699432373046875, 0.327545166015625, 0.3851470947265625, 0.4427490234375, 0.5003509521484375, 0.557952880859375, 0.6155548095703125, 0.67315673828125, 0.7307586669921875, 0.788360595703125, 0.8459625244140625, 0.903564453125, 0.9611663818359375, 1.018768310546875, 1.0763702392578125, 1.13397216796875, 1.1915740966796875, 1.249176025390625, 1.3067779541015625, 1.3643798828125, 1.4219818115234375, 1.479583740234375, 1.5371856689453125, 1.59478759765625, 1.6523895263671875, 1.709991455078125, 1.7675933837890625, 1.8251953125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 7.0, 10.0, 11.0, 14.0, 21.0, 27.0, 44.0, 66.0, 106.0, 154.0, 209.0, 352.0, 516.0, 883.0, 1410.0, 2266.0, 3875.0, 6428.0, 10468.0, 17821.0, 30564.0, 50639.0, 85218.0, 135265.0, 1002548.0, 416291.0, 130501.0, 81432.0, 48469.0, 28737.0, 16929.0, 10286.0, 6044.0, 3699.0, 2130.0, 1351.0, 864.0, 491.0, 355.0, 202.0, 138.0, 100.0, 61.0, 47.0, 35.0, 18.0, 16.0, 7.0, 3.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.1510009765625, -0.14641952514648438, -0.14183807373046875, -0.13725662231445312, -0.1326751708984375, -0.12809371948242188, -0.12351226806640625, -0.11893081665039062, -0.114349365234375, -0.10976791381835938, -0.10518646240234375, -0.10060501098632812, -0.0960235595703125, -0.09144210815429688, -0.08686065673828125, -0.08227920532226562, -0.07769775390625, -0.07311630249023438, -0.06853485107421875, -0.06395339965820312, -0.0593719482421875, -0.054790496826171875, -0.05020904541015625, -0.045627593994140625, -0.041046142578125, -0.036464691162109375, -0.03188323974609375, -0.027301788330078125, -0.0227203369140625, -0.018138885498046875, -0.01355743408203125, -0.008975982666015625, -0.00439453125, 0.000186920166015625, 0.00476837158203125, 0.009349822998046875, 0.0139312744140625, 0.018512725830078125, 0.02309417724609375, 0.027675628662109375, 0.032257080078125, 0.036838531494140625, 0.04141998291015625, 0.046001434326171875, 0.0505828857421875, 0.055164337158203125, 0.05974578857421875, 0.06432723999023438, 0.06890869140625, 0.07349014282226562, 0.07807159423828125, 0.08265304565429688, 0.0872344970703125, 0.09181594848632812, 0.09639739990234375, 0.10097885131835938, 0.105560302734375, 0.11014175415039062, 0.11472320556640625, 0.11930465698242188, 0.1238861083984375, 0.12846755981445312, 0.13304901123046875, 0.13763046264648438, 0.1422119140625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 5.0, 6.0, 2.0, 6.0, 12.0, 6.0, 15.0, 9.0, 21.0, 15.0, 24.0, 24.0, 36.0, 35.0, 47.0, 59.0, 73.0, 71.0, 73.0, 63.0, 84.0, 44.0, 32.0, 33.0, 24.0, 30.0, 31.0, 23.0, 19.0, 14.0, 13.0, 9.0, 9.0, 10.0, 4.0, 10.0, 1.0, 7.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.008514404296875, -0.008266806602478027, -0.008019208908081055, -0.007771611213684082, -0.007524013519287109, -0.007276415824890137, -0.007028818130493164, -0.006781220436096191, -0.006533622741699219, -0.006286025047302246, -0.0060384273529052734, -0.005790829658508301, -0.005543231964111328, -0.0052956342697143555, -0.005048036575317383, -0.00480043888092041, -0.0045528411865234375, -0.004305243492126465, -0.004057645797729492, -0.0038100481033325195, -0.003562450408935547, -0.0033148527145385742, -0.0030672550201416016, -0.002819657325744629, -0.0025720596313476562, -0.0023244619369506836, -0.002076864242553711, -0.0018292665481567383, -0.0015816688537597656, -0.001334071159362793, -0.0010864734649658203, -0.0008388757705688477, -0.000591278076171875, -0.00034368038177490234, -9.608268737792969e-05, 0.00015151500701904297, 0.0003991127014160156, 0.0006467103958129883, 0.0008943080902099609, 0.0011419057846069336, 0.0013895034790039062, 0.001637101173400879, 0.0018846988677978516, 0.0021322965621948242, 0.002379894256591797, 0.0026274919509887695, 0.002875089645385742, 0.003122687339782715, 0.0033702850341796875, 0.00361788272857666, 0.003865480422973633, 0.0041130781173706055, 0.004360675811767578, 0.004608273506164551, 0.0048558712005615234, 0.005103468894958496, 0.005351066589355469, 0.005598664283752441, 0.005846261978149414, 0.006093859672546387, 0.006341457366943359, 0.006589055061340332, 0.006836652755737305, 0.007084250450134277, 0.00733184814453125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 11.0, 6.0, 9.0, 11.0, 11.0, 13.0, 27.0, 32.0, 43.0, 57.0, 78.0, 120.0, 239.0, 792.0, 12871.0, 962782.0, 68869.0, 1714.0, 361.0, 178.0, 93.0, 60.0, 47.0, 24.0, 18.0, 10.0, 18.0, 10.0, 5.0, 12.0, 2.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.165283203125, -0.1597156524658203, -0.15414810180664062, -0.14858055114746094, -0.14301300048828125, -0.13744544982910156, -0.13187789916992188, -0.1263103485107422, -0.1207427978515625, -0.11517524719238281, -0.10960769653320312, -0.10404014587402344, -0.09847259521484375, -0.09290504455566406, -0.08733749389648438, -0.08176994323730469, -0.076202392578125, -0.07063484191894531, -0.06506729125976562, -0.05949974060058594, -0.05393218994140625, -0.04836463928222656, -0.042797088623046875, -0.03722953796386719, -0.0316619873046875, -0.026094436645507812, -0.020526885986328125, -0.014959335327148438, -0.00939178466796875, -0.0038242340087890625, 0.001743316650390625, 0.0073108673095703125, 0.01287841796875, 0.018445968627929688, 0.024013519287109375, 0.029581069946289062, 0.03514862060546875, 0.04071617126464844, 0.046283721923828125, 0.05185127258300781, 0.0574188232421875, 0.06298637390136719, 0.06855392456054688, 0.07412147521972656, 0.07968902587890625, 0.08525657653808594, 0.09082412719726562, 0.09639167785644531, 0.101959228515625, 0.10752677917480469, 0.11309432983398438, 0.11866188049316406, 0.12422943115234375, 0.12979698181152344, 0.13536453247070312, 0.1409320831298828, 0.1464996337890625, 0.1520671844482422, 0.15763473510742188, 0.16320228576660156, 0.16876983642578125, 0.17433738708496094, 0.17990493774414062, 0.1854724884033203, 0.1910400390625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 10.0, 7.0, 18.0, 30.0, 54.0, 99.0, 226.0, 285.0, 110.0, 65.0, 43.0, 21.0, 20.0, 8.0, 7.0, 0.0, 1.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042905036360025406, -0.0408683717250824, -0.03883171081542969, -0.03679504618048668, -0.03475838154554367, -0.03272172063589096, -0.030685056000947952, -0.028648393228650093, -0.026611730456352234, -0.024575067684054375, -0.022538404911756516, -0.020501740276813507, -0.018465077504515648, -0.01642841473221779, -0.014391751028597355, -0.012355087324976921, -0.010318424552679062, -0.008281761780381203, -0.006245098076760769, -0.004208434838801622, -0.002171771600842476, -0.0001351088285446167, 0.001901554875075817, 0.003938218578696251, 0.00597488135099411, 0.00801154412329197, 0.010048207826912403, 0.012084871530532837, 0.014121534302830696, 0.016158197075128555, 0.018194861710071564, 0.020231524482369423, 0.02226819097995758, 0.02430485375225544, 0.0263415165245533, 0.028378181159496307, 0.030414843931794167, 0.032451506704092026, 0.034488171339035034, 0.036524832248687744, 0.03856149688363075, 0.04059816151857376, 0.04263482242822647, 0.04467148706316948, 0.04670815169811249, 0.0487448126077652, 0.050781477242708206, 0.052818141877651215, 0.054854802787303925, 0.05689146742224693, 0.05892812833189964, 0.06096479296684265, 0.06300145387649536, 0.06503811478614807, 0.06707478314638138, 0.06911144405603409, 0.0711481124162674, 0.0731847733259201, 0.07522144168615341, 0.07725810259580612, 0.07929476350545883, 0.08133143186569214, 0.08336809277534485, 0.08540475368499756, 0.08744141459465027]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 6.0, 4.0, 7.0, 15.0, 8.0, 14.0, 18.0, 18.0, 24.0, 24.0, 28.0, 22.0, 38.0, 32.0, 28.0, 47.0, 35.0, 29.0, 41.0, 48.0, 35.0, 29.0, 33.0, 43.0, 33.0, 29.0, 33.0, 34.0, 36.0, 36.0, 24.0, 33.0, 16.0, 17.0, 26.0, 12.0, 9.0, 12.0, 3.0, 8.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.017187058925628662, -0.016643870621919632, -0.01610068418085575, -0.015557496808469296, -0.01501430943608284, -0.014471122063696384, -0.013927934691309929, -0.013384747318923473, -0.012841559946537018, -0.012298372574150562, -0.011755185201764107, -0.011211997829377651, -0.010668810456991196, -0.01012562308460474, -0.009582435712218285, -0.009039248339831829, -0.008496060967445374, -0.007952873595058918, -0.0074096862226724625, -0.006866498850286007, -0.006323311477899551, -0.005780124105513096, -0.00523693673312664, -0.004693749360740185, -0.004150561988353729, -0.0036073746159672737, -0.003064187243580818, -0.0025209998711943626, -0.001977812498807907, -0.0014346251264214516, -0.000891437754034996, -0.0003482503816485405, 0.00019493699073791504, 0.0007381243631243706, 0.0012813117355108261, 0.0018244991078972816, 0.002367686480283737, 0.0029108738526701927, 0.0034540612250566483, 0.003997248597443104, 0.004540435969829559, 0.005083623342216015, 0.00562681071460247, 0.006169998086988926, 0.0067131854593753815, 0.007256372831761837, 0.0077995602041482925, 0.008342747576534748, 0.008885934948921204, 0.00942912232130766, 0.009972309693694115, 0.01051549706608057, 0.011058684438467026, 0.011601871810853481, 0.012145059183239937, 0.012688246555626392, 0.013231433928012848, 0.013774621300399303, 0.014317808672785759, 0.014860996045172215, 0.01540418341755867, 0.0159473717212677, 0.01649055816233158, 0.017033744603395462, 0.017576932907104492]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 6.0, 9.0, 13.0, 14.0, 21.0, 20.0, 9.0, 19.0, 30.0, 33.0, 49.0, 37.0, 36.0, 33.0, 37.0, 35.0, 38.0, 49.0, 44.0, 53.0, 45.0, 42.0, 47.0, 38.0, 30.0, 30.0, 31.0, 26.0, 24.0, 14.0, 23.0, 16.0, 11.0, 15.0, 6.0, 2.0, 6.0, 3.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.037109375, -2.956939697265625, -2.87677001953125, -2.796600341796875, -2.7164306640625, -2.636260986328125, -2.55609130859375, -2.475921630859375, -2.395751953125, -2.315582275390625, -2.23541259765625, -2.155242919921875, -2.0750732421875, -1.994903564453125, -1.91473388671875, -1.834564208984375, -1.75439453125, -1.674224853515625, -1.59405517578125, -1.513885498046875, -1.4337158203125, -1.353546142578125, -1.27337646484375, -1.193206787109375, -1.113037109375, -1.032867431640625, -0.95269775390625, -0.872528076171875, -0.7923583984375, -0.712188720703125, -0.63201904296875, -0.551849365234375, -0.4716796875, -0.391510009765625, -0.31134033203125, -0.231170654296875, -0.1510009765625, -0.070831298828125, 0.00933837890625, 0.089508056640625, 0.169677734375, 0.249847412109375, 0.33001708984375, 0.410186767578125, 0.4903564453125, 0.570526123046875, 0.65069580078125, 0.730865478515625, 0.81103515625, 0.891204833984375, 0.97137451171875, 1.051544189453125, 1.1317138671875, 1.211883544921875, 1.29205322265625, 1.372222900390625, 1.452392578125, 1.532562255859375, 1.61273193359375, 1.692901611328125, 1.7730712890625, 1.853240966796875, 1.93341064453125, 2.013580322265625, 2.09375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 3.0, 5.0, 12.0, 12.0, 25.0, 20.0, 67.0, 74.0, 113.0, 218.0, 314.0, 560.0, 964.0, 1823.0, 3308.0, 6719.0, 14093.0, 32151.0, 78999.0, 196987.0, 362874.0, 203959.0, 82478.0, 33454.0, 14729.0, 6891.0, 3324.0, 1864.0, 1018.0, 600.0, 320.0, 209.0, 118.0, 86.0, 60.0, 28.0, 26.0, 16.0, 14.0, 10.0, 5.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.919921875, -2.84210205078125, -2.7642822265625, -2.68646240234375, -2.608642578125, -2.53082275390625, -2.4530029296875, -2.37518310546875, -2.29736328125, -2.21954345703125, -2.1417236328125, -2.06390380859375, -1.986083984375, -1.90826416015625, -1.8304443359375, -1.75262451171875, -1.6748046875, -1.59698486328125, -1.5191650390625, -1.44134521484375, -1.363525390625, -1.28570556640625, -1.2078857421875, -1.13006591796875, -1.05224609375, -0.97442626953125, -0.8966064453125, -0.81878662109375, -0.740966796875, -0.66314697265625, -0.5853271484375, -0.50750732421875, -0.4296875, -0.35186767578125, -0.2740478515625, -0.19622802734375, -0.118408203125, -0.04058837890625, 0.0372314453125, 0.11505126953125, 0.19287109375, 0.27069091796875, 0.3485107421875, 0.42633056640625, 0.504150390625, 0.58197021484375, 0.6597900390625, 0.73760986328125, 0.8154296875, 0.89324951171875, 0.9710693359375, 1.04888916015625, 1.126708984375, 1.20452880859375, 1.2823486328125, 1.36016845703125, 1.43798828125, 1.51580810546875, 1.5936279296875, 1.67144775390625, 1.749267578125, 1.82708740234375, 1.9049072265625, 1.98272705078125, 2.060546875]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 9.0, 5.0, 10.0, 13.0, 15.0, 12.0, 24.0, 20.0, 28.0, 32.0, 28.0, 38.0, 36.0, 51.0, 60.0, 108.0, 214.0, 1464.0, 315.0, 127.0, 72.0, 52.0, 37.0, 40.0, 35.0, 29.0, 28.0, 25.0, 24.0, 22.0, 19.0, 11.0, 16.0, 6.0, 7.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9765625, -8.6844482421875, -8.392333984375, -8.1002197265625, -7.80810546875, -7.5159912109375, -7.223876953125, -6.9317626953125, -6.6396484375, -6.3475341796875, -6.055419921875, -5.7633056640625, -5.47119140625, -5.1790771484375, -4.886962890625, -4.5948486328125, -4.302734375, -4.0106201171875, -3.718505859375, -3.4263916015625, -3.13427734375, -2.8421630859375, -2.550048828125, -2.2579345703125, -1.9658203125, -1.6737060546875, -1.381591796875, -1.0894775390625, -0.79736328125, -0.5052490234375, -0.213134765625, 0.0789794921875, 0.37109375, 0.6632080078125, 0.955322265625, 1.2474365234375, 1.53955078125, 1.8316650390625, 2.123779296875, 2.4158935546875, 2.7080078125, 3.0001220703125, 3.292236328125, 3.5843505859375, 3.87646484375, 4.1685791015625, 4.460693359375, 4.7528076171875, 5.044921875, 5.3370361328125, 5.629150390625, 5.9212646484375, 6.21337890625, 6.5054931640625, 6.797607421875, 7.0897216796875, 7.3818359375, 7.6739501953125, 7.966064453125, 8.2581787109375, 8.55029296875, 8.8424072265625, 9.134521484375, 9.4266357421875, 9.71875]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 12.0, 17.0, 30.0, 38.0, 45.0, 82.0, 122.0, 191.0, 379.0, 766.0, 3493.0, 1874984.0, 1260732.0, 3091.0, 787.0, 360.0, 187.0, 120.0, 81.0, 61.0, 28.0, 24.0, 15.0, 15.0, 9.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-30.171875, -29.283935546875, -28.39599609375, -27.508056640625, -26.6201171875, -25.732177734375, -24.84423828125, -23.956298828125, -23.068359375, -22.180419921875, -21.29248046875, -20.404541015625, -19.5166015625, -18.628662109375, -17.74072265625, -16.852783203125, -15.96484375, -15.076904296875, -14.18896484375, -13.301025390625, -12.4130859375, -11.525146484375, -10.63720703125, -9.749267578125, -8.861328125, -7.973388671875, -7.08544921875, -6.197509765625, -5.3095703125, -4.421630859375, -3.53369140625, -2.645751953125, -1.7578125, -0.869873046875, 0.01806640625, 0.906005859375, 1.7939453125, 2.681884765625, 3.56982421875, 4.457763671875, 5.345703125, 6.233642578125, 7.12158203125, 8.009521484375, 8.8974609375, 9.785400390625, 10.67333984375, 11.561279296875, 12.44921875, 13.337158203125, 14.22509765625, 15.113037109375, 16.0009765625, 16.888916015625, 17.77685546875, 18.664794921875, 19.552734375, 20.440673828125, 21.32861328125, 22.216552734375, 23.1044921875, 23.992431640625, 24.88037109375, 25.768310546875, 26.65625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 10.0, 184.0, 657.0, 158.0, 9.0], "bins": [-149.5689697265625, -147.13258361816406, -144.6962127685547, -142.25982666015625, -139.8234405517578, -137.38706970214844, -134.95068359375, -132.51431274414062, -130.0779266357422, -127.64154815673828, -125.20516204833984, -122.76878356933594, -120.33240509033203, -117.89602661132812, -115.45964050292969, -113.02326202392578, -110.58688354492188, -108.15050506591797, -105.71411895751953, -103.27774047851562, -100.84136199951172, -98.40498352050781, -95.96859741210938, -93.53221893310547, -91.09583282470703, -88.65945434570312, -86.22306823730469, -83.78668975830078, -81.35031127929688, -78.91393280029297, -76.47754669189453, -74.04116821289062, -71.60479736328125, -69.16841888427734, -66.7320327758789, -64.295654296875, -61.859275817871094, -59.42289352416992, -56.98651123046875, -54.550132751464844, -52.11375045776367, -49.6773681640625, -47.240989685058594, -44.80460739135742, -42.368228912353516, -39.931846618652344, -37.49546813964844, -35.059085845947266, -32.62270736694336, -30.18632698059082, -27.74994659423828, -25.31356430053711, -22.877185821533203, -20.44080352783203, -18.004423141479492, -15.568042755126953, -13.131662368774414, -10.695281982421875, -8.258901596069336, -5.8225202560424805, -3.3861398696899414, -0.9497594833374023, 1.4866218566894531, 3.923002243041992, 6.3593831062316895]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 3.0, 5.0, 5.0, 9.0, 9.0, 14.0, 10.0, 21.0, 16.0, 25.0, 18.0, 20.0, 22.0, 19.0, 34.0, 28.0, 36.0, 38.0, 39.0, 36.0, 26.0, 35.0, 36.0, 40.0, 31.0, 32.0, 32.0, 38.0, 27.0, 30.0, 30.0, 27.0, 29.0, 23.0, 25.0, 23.0, 9.0, 23.0, 14.0, 22.0, 8.0, 8.0, 6.0, 10.0, 3.0, 4.0, 3.0, 1.0, 0.0, 5.0, 0.0, 1.0], "bins": [-21.335079193115234, -20.725122451782227, -20.11516761779785, -19.505210876464844, -18.89525604248047, -18.28529930114746, -17.675344467163086, -17.065387725830078, -16.455432891845703, -15.845477104187012, -15.23552131652832, -14.625565528869629, -14.015609741210938, -13.40565299987793, -12.795697212219238, -12.185741424560547, -11.575784683227539, -10.965828895568848, -10.355873107910156, -9.745917320251465, -9.135961532592773, -8.526004791259766, -7.916049003601074, -7.306093215942383, -6.696137428283691, -6.086181640625, -5.476225852966309, -4.866269588470459, -4.256313800811768, -3.646358013153076, -3.0364019870758057, -2.426445960998535, -1.816488265991211, -1.20653235912323, -0.596576452255249, 0.013379454612731934, 0.6233353614807129, 1.2332911491394043, 1.8432471752166748, 2.4532032012939453, 3.0631589889526367, 3.673114776611328, 4.2830705642700195, 4.893026828765869, 5.5029826164245605, 6.112938404083252, 6.722894668579102, 7.332850456237793, 7.942806243896484, 8.552762031555176, 9.162717819213867, 9.772673606872559, 10.38262939453125, 10.992586135864258, 11.60254192352295, 12.21249771118164, 12.822453498840332, 13.432409286499023, 14.042365074157715, 14.652320861816406, 15.262277603149414, 15.872232437133789, 16.482189178466797, 17.092144012451172, 17.70210075378418]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 11.0, 5.0, 7.0, 13.0, 20.0, 15.0, 28.0, 29.0, 31.0, 38.0, 30.0, 42.0, 35.0, 30.0, 48.0, 42.0, 47.0, 60.0, 46.0, 46.0, 30.0, 42.0, 38.0, 37.0, 47.0, 24.0, 25.0, 19.0, 19.0, 10.0, 21.0, 15.0, 10.0, 10.0, 10.0, 4.0, 6.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.18359375, -3.097930908203125, -3.01226806640625, -2.926605224609375, -2.8409423828125, -2.755279541015625, -2.66961669921875, -2.583953857421875, -2.498291015625, -2.412628173828125, -2.32696533203125, -2.241302490234375, -2.1556396484375, -2.069976806640625, -1.98431396484375, -1.898651123046875, -1.81298828125, -1.727325439453125, -1.64166259765625, -1.555999755859375, -1.4703369140625, -1.384674072265625, -1.29901123046875, -1.213348388671875, -1.127685546875, -1.042022705078125, -0.95635986328125, -0.870697021484375, -0.7850341796875, -0.699371337890625, -0.61370849609375, -0.528045654296875, -0.4423828125, -0.356719970703125, -0.27105712890625, -0.185394287109375, -0.0997314453125, -0.014068603515625, 0.07159423828125, 0.157257080078125, 0.242919921875, 0.328582763671875, 0.41424560546875, 0.499908447265625, 0.5855712890625, 0.671234130859375, 0.75689697265625, 0.842559814453125, 0.92822265625, 1.013885498046875, 1.09954833984375, 1.185211181640625, 1.2708740234375, 1.356536865234375, 1.44219970703125, 1.527862548828125, 1.613525390625, 1.699188232421875, 1.78485107421875, 1.870513916015625, 1.9561767578125, 2.041839599609375, 2.12750244140625, 2.213165283203125, 2.298828125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 5.0, 6.0, 11.0, 9.0, 14.0, 17.0, 19.0, 31.0, 40.0, 41.0, 71.0, 126.0, 192.0, 351.0, 730.0, 1666.0, 4438.0, 12364.0, 38328.0, 125033.0, 414948.0, 1158347.0, 1476472.0, 658944.0, 207672.0, 63039.0, 19765.0, 6767.0, 2622.0, 1042.0, 483.0, 209.0, 159.0, 62.0, 62.0, 39.0, 39.0, 29.0, 25.0, 20.0, 8.0, 6.0, 9.0, 5.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.46484375, -3.360504150390625, -3.25616455078125, -3.151824951171875, -3.0474853515625, -2.943145751953125, -2.83880615234375, -2.734466552734375, -2.630126953125, -2.525787353515625, -2.42144775390625, -2.317108154296875, -2.2127685546875, -2.108428955078125, -2.00408935546875, -1.899749755859375, -1.79541015625, -1.691070556640625, -1.58673095703125, -1.482391357421875, -1.3780517578125, -1.273712158203125, -1.16937255859375, -1.065032958984375, -0.960693359375, -0.856353759765625, -0.75201416015625, -0.647674560546875, -0.5433349609375, -0.438995361328125, -0.33465576171875, -0.230316162109375, -0.1259765625, -0.021636962890625, 0.08270263671875, 0.187042236328125, 0.2913818359375, 0.395721435546875, 0.50006103515625, 0.604400634765625, 0.708740234375, 0.813079833984375, 0.91741943359375, 1.021759033203125, 1.1260986328125, 1.230438232421875, 1.33477783203125, 1.439117431640625, 1.54345703125, 1.647796630859375, 1.75213623046875, 1.856475830078125, 1.9608154296875, 2.065155029296875, 2.16949462890625, 2.273834228515625, 2.378173828125, 2.482513427734375, 2.58685302734375, 2.691192626953125, 2.7955322265625, 2.899871826171875, 3.00421142578125, 3.108551025390625, 3.212890625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 2.0, 8.0, 1.0, 12.0, 11.0, 16.0, 28.0, 21.0, 30.0, 58.0, 64.0, 75.0, 109.0, 138.0, 188.0, 238.0, 308.0, 390.0, 435.0, 402.0, 337.0, 291.0, 222.0, 196.0, 137.0, 73.0, 65.0, 67.0, 36.0, 27.0, 31.0, 21.0, 13.0, 1.0, 9.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.6328125, -4.4871826171875, -4.341552734375, -4.1959228515625, -4.05029296875, -3.9046630859375, -3.759033203125, -3.6134033203125, -3.4677734375, -3.3221435546875, -3.176513671875, -3.0308837890625, -2.88525390625, -2.7396240234375, -2.593994140625, -2.4483642578125, -2.302734375, -2.1571044921875, -2.011474609375, -1.8658447265625, -1.72021484375, -1.5745849609375, -1.428955078125, -1.2833251953125, -1.1376953125, -0.9920654296875, -0.846435546875, -0.7008056640625, -0.55517578125, -0.4095458984375, -0.263916015625, -0.1182861328125, 0.02734375, 0.1729736328125, 0.318603515625, 0.4642333984375, 0.60986328125, 0.7554931640625, 0.901123046875, 1.0467529296875, 1.1923828125, 1.3380126953125, 1.483642578125, 1.6292724609375, 1.77490234375, 1.9205322265625, 2.066162109375, 2.2117919921875, 2.357421875, 2.5030517578125, 2.648681640625, 2.7943115234375, 2.93994140625, 3.0855712890625, 3.231201171875, 3.3768310546875, 3.5224609375, 3.6680908203125, 3.813720703125, 3.9593505859375, 4.10498046875, 4.2506103515625, 4.396240234375, 4.5418701171875, 4.6875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 4.0, 5.0, 11.0, 9.0, 15.0, 20.0, 31.0, 27.0, 43.0, 63.0, 67.0, 106.0, 168.0, 242.0, 375.0, 950.0, 16011.0, 2372300.0, 1790128.0, 11746.0, 820.0, 352.0, 209.0, 146.0, 108.0, 88.0, 58.0, 45.0, 38.0, 22.0, 27.0, 10.0, 11.0, 9.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.390625, -18.764404296875, -18.13818359375, -17.511962890625, -16.8857421875, -16.259521484375, -15.63330078125, -15.007080078125, -14.380859375, -13.754638671875, -13.12841796875, -12.502197265625, -11.8759765625, -11.249755859375, -10.62353515625, -9.997314453125, -9.37109375, -8.744873046875, -8.11865234375, -7.492431640625, -6.8662109375, -6.239990234375, -5.61376953125, -4.987548828125, -4.361328125, -3.735107421875, -3.10888671875, -2.482666015625, -1.8564453125, -1.230224609375, -0.60400390625, 0.022216796875, 0.6484375, 1.274658203125, 1.90087890625, 2.527099609375, 3.1533203125, 3.779541015625, 4.40576171875, 5.031982421875, 5.658203125, 6.284423828125, 6.91064453125, 7.536865234375, 8.1630859375, 8.789306640625, 9.41552734375, 10.041748046875, 10.66796875, 11.294189453125, 11.92041015625, 12.546630859375, 13.1728515625, 13.799072265625, 14.42529296875, 15.051513671875, 15.677734375, 16.303955078125, 16.93017578125, 17.556396484375, 18.1826171875, 18.808837890625, 19.43505859375, 20.061279296875, 20.6875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 11.0, 37.0, 107.0, 210.0, 272.0, 214.0, 111.0, 46.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.58159637451172, -61.69062423706055, -59.799652099609375, -57.9086799621582, -56.01770782470703, -54.12673568725586, -52.23576354980469, -50.344791412353516, -48.453819274902344, -46.56284713745117, -44.671875, -42.78090286254883, -40.889930725097656, -38.998958587646484, -37.10798645019531, -35.21701431274414, -33.32604217529297, -31.435070037841797, -29.544097900390625, -27.653125762939453, -25.76215362548828, -23.87118148803711, -21.980209350585938, -20.089237213134766, -18.198265075683594, -16.307292938232422, -14.41632080078125, -12.525348663330078, -10.634376525878906, -8.743404388427734, -6.8524322509765625, -4.961460113525391, -3.0704917907714844, -1.1795196533203125, 0.7114524841308594, 2.6024246215820312, 4.493396759033203, 6.384368896484375, 8.275341033935547, 10.166313171386719, 12.05728530883789, 13.948257446289062, 15.839229583740234, 17.730201721191406, 19.621173858642578, 21.51214599609375, 23.403118133544922, 25.294090270996094, 27.185062408447266, 29.076034545898438, 30.96700668334961, 32.85797882080078, 34.74895095825195, 36.639923095703125, 38.5308952331543, 40.42186737060547, 42.31283950805664, 44.20381164550781, 46.094783782958984, 47.985755920410156, 49.87672805786133, 51.7677001953125, 53.65867233276367, 55.549644470214844, 57.440616607666016]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 8.0, 7.0, 8.0, 5.0, 6.0, 13.0, 12.0, 21.0, 15.0, 19.0, 16.0, 26.0, 26.0, 37.0, 37.0, 25.0, 39.0, 32.0, 35.0, 41.0, 47.0, 41.0, 42.0, 43.0, 41.0, 39.0, 41.0, 28.0, 36.0, 30.0, 22.0, 31.0, 26.0, 23.0, 9.0, 20.0, 12.0, 9.0, 12.0, 9.0, 6.0, 2.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-16.500185012817383, -16.022724151611328, -15.545263290405273, -15.067802429199219, -14.590341567993164, -14.11288070678711, -13.635419845581055, -13.157959938049316, -12.680499076843262, -12.203038215637207, -11.725577354431152, -11.248116493225098, -10.770655632019043, -10.293195724487305, -9.81573486328125, -9.338274002075195, -8.86081314086914, -8.383352279663086, -7.905891418457031, -7.428430557250977, -6.95097017288208, -6.473509311676025, -5.996048450469971, -5.518588066101074, -5.041126251220703, -4.563665390014648, -4.086204528808594, -3.608743906021118, -3.1312832832336426, -2.653822422027588, -2.176361560821533, -1.6989009380340576, -1.221440315246582, -0.7439795732498169, -0.266518771648407, 0.21094202995300293, 0.6884027719497681, 1.1658635139465332, 1.643324375152588, 2.1207849979400635, 2.598245859146118, 3.075706720352173, 3.5531673431396484, 4.030628204345703, 4.508089065551758, 4.9855499267578125, 5.463010787963867, 5.940471172332764, 6.417932033538818, 6.895392894744873, 7.372853755950928, 7.850314140319824, 8.327775001525879, 8.805235862731934, 9.282696723937988, 9.760157585144043, 10.237618446350098, 10.715079307556152, 11.192540168762207, 11.670001029968262, 12.147461891174316, 12.624921798706055, 13.10238265991211, 13.579843521118164, 14.057304382324219]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 8.0, 6.0, 7.0, 8.0, 11.0, 19.0, 15.0, 16.0, 21.0, 26.0, 29.0, 29.0, 37.0, 37.0, 40.0, 27.0, 38.0, 47.0, 46.0, 37.0, 45.0, 42.0, 36.0, 54.0, 42.0, 31.0, 24.0, 28.0, 25.0, 31.0, 24.0, 25.0, 14.0, 13.0, 14.0, 12.0, 8.0, 6.0, 8.0, 4.0, 0.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-2.806640625, -2.727691650390625, -2.64874267578125, -2.569793701171875, -2.4908447265625, -2.411895751953125, -2.33294677734375, -2.253997802734375, -2.175048828125, -2.096099853515625, -2.01715087890625, -1.938201904296875, -1.8592529296875, -1.780303955078125, -1.70135498046875, -1.622406005859375, -1.54345703125, -1.464508056640625, -1.38555908203125, -1.306610107421875, -1.2276611328125, -1.148712158203125, -1.06976318359375, -0.990814208984375, -0.911865234375, -0.832916259765625, -0.75396728515625, -0.675018310546875, -0.5960693359375, -0.517120361328125, -0.43817138671875, -0.359222412109375, -0.2802734375, -0.201324462890625, -0.12237548828125, -0.043426513671875, 0.0355224609375, 0.114471435546875, 0.19342041015625, 0.272369384765625, 0.351318359375, 0.430267333984375, 0.50921630859375, 0.588165283203125, 0.6671142578125, 0.746063232421875, 0.82501220703125, 0.903961181640625, 0.98291015625, 1.061859130859375, 1.14080810546875, 1.219757080078125, 1.2987060546875, 1.377655029296875, 1.45660400390625, 1.535552978515625, 1.614501953125, 1.693450927734375, 1.77239990234375, 1.851348876953125, 1.9302978515625, 2.009246826171875, 2.08819580078125, 2.167144775390625, 2.24609375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 13.0, 17.0, 23.0, 27.0, 46.0, 91.0, 147.0, 257.0, 453.0, 817.0, 1535.0, 3000.0, 5709.0, 11127.0, 21409.0, 42360.0, 84895.0, 164362.0, 251765.0, 215666.0, 121254.0, 60655.0, 30249.0, 15710.0, 7893.0, 4269.0, 2172.0, 1181.0, 604.0, 349.0, 190.0, 106.0, 65.0, 39.0, 34.0, 12.0, 8.0, 12.0, 9.0, 6.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.306396484375, -0.2967491149902344, -0.28710174560546875, -0.2774543762207031, -0.2678070068359375, -0.2581596374511719, -0.24851226806640625, -0.23886489868164062, -0.229217529296875, -0.21957015991210938, -0.20992279052734375, -0.20027542114257812, -0.1906280517578125, -0.18098068237304688, -0.17133331298828125, -0.16168594360351562, -0.15203857421875, -0.14239120483398438, -0.13274383544921875, -0.12309646606445312, -0.1134490966796875, -0.10380172729492188, -0.09415435791015625, -0.08450698852539062, -0.074859619140625, -0.06521224975585938, -0.05556488037109375, -0.045917510986328125, -0.0362701416015625, -0.026622772216796875, -0.01697540283203125, -0.007328033447265625, 0.0023193359375, 0.011966705322265625, 0.02161407470703125, 0.031261444091796875, 0.0409088134765625, 0.050556182861328125, 0.06020355224609375, 0.06985092163085938, 0.079498291015625, 0.08914566040039062, 0.09879302978515625, 0.10844039916992188, 0.1180877685546875, 0.12773513793945312, 0.13738250732421875, 0.14702987670898438, 0.15667724609375, 0.16632461547851562, 0.17597198486328125, 0.18561935424804688, 0.1952667236328125, 0.20491409301757812, 0.21456146240234375, 0.22420883178710938, 0.233856201171875, 0.24350357055664062, 0.25315093994140625, 0.2627983093261719, 0.2724456787109375, 0.2820930480957031, 0.29174041748046875, 0.3013877868652344, 0.31103515625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 1.0, 2.0, 5.0, 9.0, 12.0, 9.0, 9.0, 13.0, 12.0, 21.0, 25.0, 23.0, 33.0, 16.0, 33.0, 33.0, 29.0, 50.0, 31.0, 43.0, 41.0, 46.0, 1058.0, 40.0, 43.0, 35.0, 34.0, 32.0, 40.0, 30.0, 41.0, 33.0, 32.0, 15.0, 20.0, 16.0, 7.0, 13.0, 11.0, 6.0, 11.0, 13.0, 3.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.60546875, -2.535125732421875, -2.46478271484375, -2.394439697265625, -2.3240966796875, -2.253753662109375, -2.18341064453125, -2.113067626953125, -2.042724609375, -1.972381591796875, -1.90203857421875, -1.831695556640625, -1.7613525390625, -1.691009521484375, -1.62066650390625, -1.550323486328125, -1.47998046875, -1.409637451171875, -1.33929443359375, -1.268951416015625, -1.1986083984375, -1.128265380859375, -1.05792236328125, -0.987579345703125, -0.917236328125, -0.846893310546875, -0.77655029296875, -0.706207275390625, -0.6358642578125, -0.565521240234375, -0.49517822265625, -0.424835205078125, -0.3544921875, -0.284149169921875, -0.21380615234375, -0.143463134765625, -0.0731201171875, -0.002777099609375, 0.06756591796875, 0.137908935546875, 0.208251953125, 0.278594970703125, 0.34893798828125, 0.419281005859375, 0.4896240234375, 0.559967041015625, 0.63031005859375, 0.700653076171875, 0.77099609375, 0.841339111328125, 0.91168212890625, 0.982025146484375, 1.0523681640625, 1.122711181640625, 1.19305419921875, 1.263397216796875, 1.333740234375, 1.404083251953125, 1.47442626953125, 1.544769287109375, 1.6151123046875, 1.685455322265625, 1.75579833984375, 1.826141357421875, 1.896484375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 12.0, 16.0, 20.0, 33.0, 42.0, 60.0, 102.0, 144.0, 234.0, 356.0, 589.0, 995.0, 1567.0, 2573.0, 4540.0, 7754.0, 13192.0, 22375.0, 38333.0, 64844.0, 107450.0, 165246.0, 1241434.0, 163118.0, 106549.0, 63518.0, 37938.0, 22374.0, 12853.0, 7666.0, 4504.0, 2658.0, 1495.0, 956.0, 560.0, 378.0, 233.0, 128.0, 98.0, 54.0, 39.0, 28.0, 22.0, 13.0, 12.0, 8.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.153076171875, -0.14836502075195312, -0.14365386962890625, -0.13894271850585938, -0.1342315673828125, -0.12952041625976562, -0.12480926513671875, -0.12009811401367188, -0.115386962890625, -0.11067581176757812, -0.10596466064453125, -0.10125350952148438, -0.0965423583984375, -0.09183120727539062, -0.08712005615234375, -0.08240890502929688, -0.07769775390625, -0.07298660278320312, -0.06827545166015625, -0.06356430053710938, -0.0588531494140625, -0.054141998291015625, -0.04943084716796875, -0.044719696044921875, -0.040008544921875, -0.035297393798828125, -0.03058624267578125, -0.025875091552734375, -0.0211639404296875, -0.016452789306640625, -0.01174163818359375, -0.007030487060546875, -0.0023193359375, 0.002391815185546875, 0.00710296630859375, 0.011814117431640625, 0.0165252685546875, 0.021236419677734375, 0.02594757080078125, 0.030658721923828125, 0.035369873046875, 0.040081024169921875, 0.04479217529296875, 0.049503326416015625, 0.0542144775390625, 0.058925628662109375, 0.06363677978515625, 0.06834793090820312, 0.07305908203125, 0.07777023315429688, 0.08248138427734375, 0.08719253540039062, 0.0919036865234375, 0.09661483764648438, 0.10132598876953125, 0.10603713989257812, 0.110748291015625, 0.11545944213867188, 0.12017059326171875, 0.12488174438476562, 0.1295928955078125, 0.13430404663085938, 0.13901519775390625, 0.14372634887695312, 0.1484375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 4.0, 6.0, 5.0, 1.0, 5.0, 2.0, 6.0, 12.0, 11.0, 8.0, 13.0, 16.0, 38.0, 39.0, 58.0, 104.0, 107.0, 153.0, 134.0, 72.0, 51.0, 37.0, 22.0, 18.0, 12.0, 13.0, 9.0, 7.0, 6.0, 3.0, 5.0, 7.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0074615478515625, -0.007206320762634277, -0.006951093673706055, -0.006695866584777832, -0.006440639495849609, -0.006185412406921387, -0.005930185317993164, -0.005674958229064941, -0.005419731140136719, -0.005164504051208496, -0.0049092769622802734, -0.004654049873352051, -0.004398822784423828, -0.0041435956954956055, -0.003888368606567383, -0.00363314151763916, -0.0033779144287109375, -0.003122687339782715, -0.002867460250854492, -0.0026122331619262695, -0.002357006072998047, -0.0021017789840698242, -0.0018465518951416016, -0.001591324806213379, -0.0013360977172851562, -0.0010808706283569336, -0.0008256435394287109, -0.0005704164505004883, -0.0003151893615722656, -5.996227264404297e-05, 0.0001952648162841797, 0.00045049190521240234, 0.000705718994140625, 0.0009609460830688477, 0.0012161731719970703, 0.001471400260925293, 0.0017266273498535156, 0.0019818544387817383, 0.002237081527709961, 0.0024923086166381836, 0.0027475357055664062, 0.003002762794494629, 0.0032579898834228516, 0.0035132169723510742, 0.003768444061279297, 0.0040236711502075195, 0.004278898239135742, 0.004534125328063965, 0.0047893524169921875, 0.00504457950592041, 0.005299806594848633, 0.0055550336837768555, 0.005810260772705078, 0.006065487861633301, 0.0063207149505615234, 0.006575942039489746, 0.006831169128417969, 0.007086396217346191, 0.007341623306274414, 0.007596850395202637, 0.00785207748413086, 0.008107304573059082, 0.008362531661987305, 0.008617758750915527, 0.00887298583984375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 7.0, 6.0, 9.0, 2.0, 10.0, 7.0, 9.0, 20.0, 12.0, 35.0, 35.0, 59.0, 114.0, 383.0, 3889.0, 944253.0, 97553.0, 1620.0, 245.0, 107.0, 52.0, 29.0, 22.0, 16.0, 15.0, 13.0, 5.0, 3.0, 4.0, 5.0, 5.0, 0.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1954345703125, -0.18982696533203125, -0.1842193603515625, -0.17861175537109375, -0.173004150390625, -0.16739654541015625, -0.1617889404296875, -0.15618133544921875, -0.15057373046875, -0.14496612548828125, -0.1393585205078125, -0.13375091552734375, -0.128143310546875, -0.12253570556640625, -0.1169281005859375, -0.11132049560546875, -0.105712890625, -0.10010528564453125, -0.0944976806640625, -0.08889007568359375, -0.083282470703125, -0.07767486572265625, -0.0720672607421875, -0.06645965576171875, -0.06085205078125, -0.05524444580078125, -0.0496368408203125, -0.04402923583984375, -0.038421630859375, -0.03281402587890625, -0.0272064208984375, -0.02159881591796875, -0.0159912109375, -0.01038360595703125, -0.0047760009765625, 0.00083160400390625, 0.006439208984375, 0.01204681396484375, 0.0176544189453125, 0.02326202392578125, 0.02886962890625, 0.03447723388671875, 0.0400848388671875, 0.04569244384765625, 0.051300048828125, 0.05690765380859375, 0.0625152587890625, 0.06812286376953125, 0.07373046875, 0.07933807373046875, 0.0849456787109375, 0.09055328369140625, 0.096160888671875, 0.10176849365234375, 0.1073760986328125, 0.11298370361328125, 0.11859130859375, 0.12419891357421875, 0.1298065185546875, 0.13541412353515625, 0.141021728515625, 0.14662933349609375, 0.1522369384765625, 0.15784454345703125, 0.1634521484375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 10.0, 20.0, 59.0, 149.0, 465.0, 194.0, 55.0, 30.0, 22.0, 4.0, 1.0, 3.0], "bins": [-0.11061510443687439, -0.10866040736436844, -0.10670571029186249, -0.10475101321935654, -0.10279631614685059, -0.10084162652492523, -0.09888692200183868, -0.09693223237991333, -0.09497753530740738, -0.09302283823490143, -0.09106814116239548, -0.08911344408988953, -0.08715874701738358, -0.08520404994487762, -0.08324936032295227, -0.08129466325044632, -0.07933996617794037, -0.07738526910543442, -0.07543057203292847, -0.07347587496042252, -0.07152117788791656, -0.06956648826599121, -0.06761178374290466, -0.06565709412097931, -0.06370238959789276, -0.06174769252538681, -0.05979299545288086, -0.05783829838037491, -0.055883605033159256, -0.053928907960653305, -0.051974210888147354, -0.0500195138156414, -0.04806482791900635, -0.0461101308465004, -0.044155433773994446, -0.042200736701488495, -0.04024604335427284, -0.03829134628176689, -0.03633664920926094, -0.03438195213675499, -0.03242725506424904, -0.030472557991743088, -0.028517862781882286, -0.026563165709376335, -0.024608470499515533, -0.022653773427009583, -0.02069907635450363, -0.01874437928199768, -0.01678968407213688, -0.014834987930953503, -0.012880291789770126, -0.010925594717264175, -0.008970898576080799, -0.007016202434897423, -0.005061505362391472, -0.0031068092212080956, -0.0011521130800247192, 0.0008025832939893007, 0.0027572796680033207, 0.004711976274847984, 0.006666672416031361, 0.008621368557214737, 0.010576065629720688, 0.012530761770904064, 0.01448545791208744]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 5.0, 5.0, 6.0, 4.0, 6.0, 7.0, 9.0, 14.0, 11.0, 15.0, 9.0, 15.0, 18.0, 18.0, 23.0, 26.0, 31.0, 35.0, 34.0, 36.0, 35.0, 37.0, 33.0, 43.0, 33.0, 32.0, 31.0, 42.0, 38.0, 44.0, 28.0, 31.0, 23.0, 40.0, 34.0, 18.0, 23.0, 19.0, 13.0, 15.0, 15.0, 15.0, 11.0, 5.0, 5.0, 7.0, 7.0, 4.0, 0.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00542217493057251, -0.005230746231973171, -0.005039317533373833, -0.004847888834774494, -0.004656460136175156, -0.004465031437575817, -0.004273602738976479, -0.00408217404037714, -0.0038907453417778015, -0.003699316643178463, -0.0035078879445791245, -0.003316459245979786, -0.0031250305473804474, -0.002933601848781109, -0.0027421731501817703, -0.002550744451582432, -0.0023593157529830933, -0.0021678870543837547, -0.001976458355784416, -0.0017850296571850777, -0.0015936009585857391, -0.0014021722599864006, -0.001210743561387062, -0.0010193148627877235, -0.000827886164188385, -0.0006364574655890465, -0.00044502876698970795, -0.0002536000683903694, -6.217136979103088e-05, 0.00012925732880830765, 0.0003206860274076462, 0.0005121147260069847, 0.0007035434246063232, 0.0008949721232056618, 0.0010864008218050003, 0.0012778295204043388, 0.0014692582190036774, 0.001660686917603016, 0.0018521156162023544, 0.002043544314801693, 0.0022349730134010315, 0.00242640171200037, 0.0026178304105997086, 0.002809259109199047, 0.0030006878077983856, 0.003192116506397724, 0.0033835452049970627, 0.003574973903596401, 0.0037664026021957397, 0.003957831300795078, 0.004149259999394417, 0.004340688697993755, 0.004532117396593094, 0.004723546095192432, 0.004914974793791771, 0.0051064034923911095, 0.005297832190990448, 0.0054892608895897865, 0.005680689588189125, 0.005872118286788464, 0.006063546985387802, 0.006254975683987141, 0.006446404382586479, 0.006637833081185818, 0.006829261779785156]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 8.0, 6.0, 7.0, 8.0, 11.0, 19.0, 15.0, 16.0, 21.0, 25.0, 30.0, 30.0, 36.0, 36.0, 41.0, 27.0, 38.0, 48.0, 46.0, 36.0, 45.0, 42.0, 36.0, 54.0, 42.0, 31.0, 23.0, 29.0, 25.0, 31.0, 24.0, 25.0, 14.0, 13.0, 14.0, 12.0, 8.0, 6.0, 8.0, 4.0, 0.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0], "bins": [-2.806640625, -2.727691650390625, -2.64874267578125, -2.569793701171875, -2.4908447265625, -2.411895751953125, -2.33294677734375, -2.253997802734375, -2.175048828125, -2.096099853515625, -2.01715087890625, -1.938201904296875, -1.8592529296875, -1.780303955078125, -1.70135498046875, -1.622406005859375, -1.54345703125, -1.464508056640625, -1.38555908203125, -1.306610107421875, -1.2276611328125, -1.148712158203125, -1.06976318359375, -0.990814208984375, -0.911865234375, -0.832916259765625, -0.75396728515625, -0.675018310546875, -0.5960693359375, -0.517120361328125, -0.43817138671875, -0.359222412109375, -0.2802734375, -0.201324462890625, -0.12237548828125, -0.043426513671875, 0.0355224609375, 0.114471435546875, 0.19342041015625, 0.272369384765625, 0.351318359375, 0.430267333984375, 0.50921630859375, 0.588165283203125, 0.6671142578125, 0.746063232421875, 0.82501220703125, 0.903961181640625, 0.98291015625, 1.061859130859375, 1.14080810546875, 1.219757080078125, 1.2987060546875, 1.377655029296875, 1.45660400390625, 1.535552978515625, 1.614501953125, 1.693450927734375, 1.77239990234375, 1.851348876953125, 1.9302978515625, 2.009246826171875, 2.08819580078125, 2.167144775390625, 2.24609375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 3.0, 9.0, 13.0, 20.0, 37.0, 44.0, 59.0, 138.0, 210.0, 373.0, 721.0, 1407.0, 2737.0, 4952.0, 9441.0, 17963.0, 37531.0, 97761.0, 294135.0, 358522.0, 130430.0, 47116.0, 21462.0, 10876.0, 5953.0, 3076.0, 1634.0, 860.0, 481.0, 244.0, 119.0, 94.0, 53.0, 17.0, 16.0, 13.0, 13.0, 8.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-3.384765625, -3.29107666015625, -3.1973876953125, -3.10369873046875, -3.010009765625, -2.91632080078125, -2.8226318359375, -2.72894287109375, -2.63525390625, -2.54156494140625, -2.4478759765625, -2.35418701171875, -2.260498046875, -2.16680908203125, -2.0731201171875, -1.97943115234375, -1.8857421875, -1.79205322265625, -1.6983642578125, -1.60467529296875, -1.510986328125, -1.41729736328125, -1.3236083984375, -1.22991943359375, -1.13623046875, -1.04254150390625, -0.9488525390625, -0.85516357421875, -0.761474609375, -0.66778564453125, -0.5740966796875, -0.48040771484375, -0.38671875, -0.29302978515625, -0.1993408203125, -0.10565185546875, -0.011962890625, 0.08172607421875, 0.1754150390625, 0.26910400390625, 0.36279296875, 0.45648193359375, 0.5501708984375, 0.64385986328125, 0.737548828125, 0.83123779296875, 0.9249267578125, 1.01861572265625, 1.1123046875, 1.20599365234375, 1.2996826171875, 1.39337158203125, 1.487060546875, 1.58074951171875, 1.6744384765625, 1.76812744140625, 1.86181640625, 1.95550537109375, 2.0491943359375, 2.14288330078125, 2.236572265625, 2.33026123046875, 2.4239501953125, 2.51763916015625, 2.611328125]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 3.0, 3.0, 6.0, 8.0, 11.0, 14.0, 18.0, 12.0, 25.0, 30.0, 26.0, 35.0, 40.0, 46.0, 46.0, 79.0, 85.0, 314.0, 1501.0, 264.0, 97.0, 55.0, 43.0, 52.0, 31.0, 37.0, 31.0, 35.0, 24.0, 20.0, 12.0, 16.0, 7.0, 4.0, 4.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.84375, -11.4998779296875, -11.156005859375, -10.8121337890625, -10.46826171875, -10.1243896484375, -9.780517578125, -9.4366455078125, -9.0927734375, -8.7489013671875, -8.405029296875, -8.0611572265625, -7.71728515625, -7.3734130859375, -7.029541015625, -6.6856689453125, -6.341796875, -5.9979248046875, -5.654052734375, -5.3101806640625, -4.96630859375, -4.6224365234375, -4.278564453125, -3.9346923828125, -3.5908203125, -3.2469482421875, -2.903076171875, -2.5592041015625, -2.21533203125, -1.8714599609375, -1.527587890625, -1.1837158203125, -0.83984375, -0.4959716796875, -0.152099609375, 0.1917724609375, 0.53564453125, 0.8795166015625, 1.223388671875, 1.5672607421875, 1.9111328125, 2.2550048828125, 2.598876953125, 2.9427490234375, 3.28662109375, 3.6304931640625, 3.974365234375, 4.3182373046875, 4.662109375, 5.0059814453125, 5.349853515625, 5.6937255859375, 6.03759765625, 6.3814697265625, 6.725341796875, 7.0692138671875, 7.4130859375, 7.7569580078125, 8.100830078125, 8.4447021484375, 8.78857421875, 9.1324462890625, 9.476318359375, 9.8201904296875, 10.1640625]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 4.0, 6.0, 4.0, 5.0, 13.0, 19.0, 18.0, 30.0, 29.0, 40.0, 76.0, 61.0, 133.0, 160.0, 235.0, 396.0, 1174.0, 32617.0, 3066621.0, 41440.0, 1367.0, 413.0, 215.0, 178.0, 121.0, 80.0, 59.0, 49.0, 42.0, 20.0, 19.0, 12.0, 12.0, 14.0, 7.0, 7.0, 5.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.921875, -22.1455078125, -21.369140625, -20.5927734375, -19.81640625, -19.0400390625, -18.263671875, -17.4873046875, -16.7109375, -15.9345703125, -15.158203125, -14.3818359375, -13.60546875, -12.8291015625, -12.052734375, -11.2763671875, -10.5, -9.7236328125, -8.947265625, -8.1708984375, -7.39453125, -6.6181640625, -5.841796875, -5.0654296875, -4.2890625, -3.5126953125, -2.736328125, -1.9599609375, -1.18359375, -0.4072265625, 0.369140625, 1.1455078125, 1.921875, 2.6982421875, 3.474609375, 4.2509765625, 5.02734375, 5.8037109375, 6.580078125, 7.3564453125, 8.1328125, 8.9091796875, 9.685546875, 10.4619140625, 11.23828125, 12.0146484375, 12.791015625, 13.5673828125, 14.34375, 15.1201171875, 15.896484375, 16.6728515625, 17.44921875, 18.2255859375, 19.001953125, 19.7783203125, 20.5546875, 21.3310546875, 22.107421875, 22.8837890625, 23.66015625, 24.4365234375, 25.212890625, 25.9892578125, 26.765625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 7.0, 11.0, 20.0, 31.0, 56.0, 76.0, 103.0, 122.0, 131.0, 112.0, 99.0, 88.0, 57.0, 41.0, 32.0, 13.0, 11.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-11.380694389343262, -10.93441390991211, -10.488133430480957, -10.041852951049805, -9.595571517944336, -9.149291038513184, -8.703010559082031, -8.256730079650879, -7.810449123382568, -7.364168643951416, -6.9178876876831055, -6.471607208251953, -6.025326728820801, -5.57904577255249, -5.132765293121338, -4.686484336853027, -4.240203857421875, -3.7939231395721436, -3.347642421722412, -2.9013619422912598, -2.4550812244415283, -2.008800506591797, -1.5625200271606445, -1.116239309310913, -0.6699585914611816, -0.22367793321609497, 0.2226027250289917, 0.6688833236694336, 1.115164041519165, 1.5614447593688965, 2.007725238800049, 2.4540059566497803, 2.900287628173828, 3.3465683460235596, 3.792849063873291, 4.239129543304443, 4.685410499572754, 5.131690979003906, 5.577971458435059, 6.024251937866211, 6.4705328941345215, 6.916813373565674, 7.363094329833984, 7.809374809265137, 8.255655288696289, 8.701936721801758, 9.148216247558594, 9.594497680664062, 10.040778160095215, 10.487058639526367, 10.93333911895752, 11.379619598388672, 11.82590103149414, 12.272181510925293, 12.718461990356445, 13.164742469787598, 13.61102294921875, 14.057303428649902, 14.503583908081055, 14.949865341186523, 15.396145820617676, 15.842426300048828, 16.288707733154297, 16.734987258911133, 17.1812686920166]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 7.0, 11.0, 1.0, 6.0, 14.0, 12.0, 17.0, 21.0, 16.0, 27.0, 27.0, 27.0, 28.0, 36.0, 34.0, 38.0, 51.0, 51.0, 45.0, 43.0, 57.0, 50.0, 39.0, 40.0, 37.0, 33.0, 35.0, 21.0, 26.0, 24.0, 23.0, 23.0, 16.0, 14.0, 8.0, 8.0, 12.0, 15.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.827173233032227, -23.998550415039062, -23.16992950439453, -22.341306686401367, -21.512683868408203, -20.68406105041504, -19.855438232421875, -19.026817321777344, -18.19819450378418, -17.369571685791016, -16.540950775146484, -15.71232795715332, -14.883705139160156, -14.055082321166992, -13.226460456848145, -12.397838592529297, -11.569215774536133, -10.740592956542969, -9.911971092224121, -9.083349227905273, -8.25472640991211, -7.4261040687561035, -6.597481727600098, -5.768859386444092, -4.940237045288086, -4.11161470413208, -3.282992362976074, -2.4543700218200684, -1.6257476806640625, -0.7971253395080566, 0.03149700164794922, 0.8601193428039551, 1.6887397766113281, 2.517362117767334, 3.34598445892334, 4.174606800079346, 5.003229141235352, 5.831851482391357, 6.660473823547363, 7.489096164703369, 8.317718505859375, 9.146341323852539, 9.974963188171387, 10.803585052490234, 11.632207870483398, 12.460830688476562, 13.28945255279541, 14.118074417114258, 14.946697235107422, 15.775320053100586, 16.60394287109375, 17.43256378173828, 18.261186599731445, 19.08980941772461, 19.91843032836914, 20.747053146362305, 21.57567596435547, 22.404298782348633, 23.232921600341797, 24.061542510986328, 24.890165328979492, 25.718788146972656, 26.547409057617188, 27.37603187561035, 28.204654693603516]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 2.0, 9.0, 11.0, 11.0, 18.0, 14.0, 18.0, 26.0, 25.0, 26.0, 31.0, 29.0, 30.0, 33.0, 31.0, 31.0, 51.0, 41.0, 45.0, 37.0, 42.0, 36.0, 40.0, 38.0, 31.0, 34.0, 42.0, 32.0, 28.0, 20.0, 23.0, 17.0, 27.0, 9.0, 13.0, 11.0, 8.0, 4.0, 4.0, 8.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-3.068359375, -2.98345947265625, -2.8985595703125, -2.81365966796875, -2.728759765625, -2.64385986328125, -2.5589599609375, -2.47406005859375, -2.38916015625, -2.30426025390625, -2.2193603515625, -2.13446044921875, -2.049560546875, -1.96466064453125, -1.8797607421875, -1.79486083984375, -1.7099609375, -1.62506103515625, -1.5401611328125, -1.45526123046875, -1.370361328125, -1.28546142578125, -1.2005615234375, -1.11566162109375, -1.03076171875, -0.94586181640625, -0.8609619140625, -0.77606201171875, -0.691162109375, -0.60626220703125, -0.5213623046875, -0.43646240234375, -0.3515625, -0.26666259765625, -0.1817626953125, -0.09686279296875, -0.011962890625, 0.07293701171875, 0.1578369140625, 0.24273681640625, 0.32763671875, 0.41253662109375, 0.4974365234375, 0.58233642578125, 0.667236328125, 0.75213623046875, 0.8370361328125, 0.92193603515625, 1.0068359375, 1.09173583984375, 1.1766357421875, 1.26153564453125, 1.346435546875, 1.43133544921875, 1.5162353515625, 1.60113525390625, 1.68603515625, 1.77093505859375, 1.8558349609375, 1.94073486328125, 2.025634765625, 2.11053466796875, 2.1954345703125, 2.28033447265625, 2.365234375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 2.0, 5.0, 9.0, 6.0, 10.0, 13.0, 26.0, 29.0, 27.0, 39.0, 59.0, 96.0, 138.0, 237.0, 539.0, 1467.0, 5107.0, 21502.0, 106248.0, 584262.0, 2038651.0, 1153662.0, 225786.0, 42433.0, 9611.0, 2608.0, 879.0, 343.0, 155.0, 90.0, 68.0, 34.0, 19.0, 26.0, 24.0, 22.0, 10.0, 9.0, 8.0, 5.0, 6.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0], "bins": [-5.38671875, -5.2315673828125, -5.076416015625, -4.9212646484375, -4.76611328125, -4.6109619140625, -4.455810546875, -4.3006591796875, -4.1455078125, -3.9903564453125, -3.835205078125, -3.6800537109375, -3.52490234375, -3.3697509765625, -3.214599609375, -3.0594482421875, -2.904296875, -2.7491455078125, -2.593994140625, -2.4388427734375, -2.28369140625, -2.1285400390625, -1.973388671875, -1.8182373046875, -1.6630859375, -1.5079345703125, -1.352783203125, -1.1976318359375, -1.04248046875, -0.8873291015625, -0.732177734375, -0.5770263671875, -0.421875, -0.2667236328125, -0.111572265625, 0.0435791015625, 0.19873046875, 0.3538818359375, 0.509033203125, 0.6641845703125, 0.8193359375, 0.9744873046875, 1.129638671875, 1.2847900390625, 1.43994140625, 1.5950927734375, 1.750244140625, 1.9053955078125, 2.060546875, 2.2156982421875, 2.370849609375, 2.5260009765625, 2.68115234375, 2.8363037109375, 2.991455078125, 3.1466064453125, 3.3017578125, 3.4569091796875, 3.612060546875, 3.7672119140625, 3.92236328125, 4.0775146484375, 4.232666015625, 4.3878173828125, 4.54296875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 7.0, 1.0, 0.0, 3.0, 10.0, 9.0, 10.0, 15.0, 19.0, 33.0, 33.0, 49.0, 47.0, 65.0, 92.0, 110.0, 167.0, 198.0, 245.0, 340.0, 373.0, 365.0, 324.0, 329.0, 270.0, 227.0, 168.0, 113.0, 98.0, 70.0, 59.0, 51.0, 38.0, 32.0, 22.0, 29.0, 11.0, 11.0, 7.0, 6.0, 10.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.52734375, -3.3896484375, -3.251953125, -3.1142578125, -2.9765625, -2.8388671875, -2.701171875, -2.5634765625, -2.42578125, -2.2880859375, -2.150390625, -2.0126953125, -1.875, -1.7373046875, -1.599609375, -1.4619140625, -1.32421875, -1.1865234375, -1.048828125, -0.9111328125, -0.7734375, -0.6357421875, -0.498046875, -0.3603515625, -0.22265625, -0.0849609375, 0.052734375, 0.1904296875, 0.328125, 0.4658203125, 0.603515625, 0.7412109375, 0.87890625, 1.0166015625, 1.154296875, 1.2919921875, 1.4296875, 1.5673828125, 1.705078125, 1.8427734375, 1.98046875, 2.1181640625, 2.255859375, 2.3935546875, 2.53125, 2.6689453125, 2.806640625, 2.9443359375, 3.08203125, 3.2197265625, 3.357421875, 3.4951171875, 3.6328125, 3.7705078125, 3.908203125, 4.0458984375, 4.18359375, 4.3212890625, 4.458984375, 4.5966796875, 4.734375, 4.8720703125, 5.009765625, 5.1474609375, 5.28515625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 5.0, 8.0, 9.0, 9.0, 6.0, 14.0, 19.0, 31.0, 31.0, 40.0, 48.0, 49.0, 80.0, 103.0, 144.0, 192.0, 312.0, 572.0, 3028.0, 199859.0, 3806713.0, 178617.0, 2796.0, 541.0, 299.0, 209.0, 127.0, 113.0, 74.0, 49.0, 42.0, 42.0, 30.0, 19.0, 12.0, 14.0, 7.0, 7.0, 6.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-23.0, -22.386474609375, -21.77294921875, -21.159423828125, -20.5458984375, -19.932373046875, -19.31884765625, -18.705322265625, -18.091796875, -17.478271484375, -16.86474609375, -16.251220703125, -15.6376953125, -15.024169921875, -14.41064453125, -13.797119140625, -13.18359375, -12.570068359375, -11.95654296875, -11.343017578125, -10.7294921875, -10.115966796875, -9.50244140625, -8.888916015625, -8.275390625, -7.661865234375, -7.04833984375, -6.434814453125, -5.8212890625, -5.207763671875, -4.59423828125, -3.980712890625, -3.3671875, -2.753662109375, -2.14013671875, -1.526611328125, -0.9130859375, -0.299560546875, 0.31396484375, 0.927490234375, 1.541015625, 2.154541015625, 2.76806640625, 3.381591796875, 3.9951171875, 4.608642578125, 5.22216796875, 5.835693359375, 6.44921875, 7.062744140625, 7.67626953125, 8.289794921875, 8.9033203125, 9.516845703125, 10.13037109375, 10.743896484375, 11.357421875, 11.970947265625, 12.58447265625, 13.197998046875, 13.8115234375, 14.425048828125, 15.03857421875, 15.652099609375, 16.265625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 21.0, 44.0, 113.0, 222.0, 264.0, 183.0, 91.0, 53.0, 14.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.497007369995117, -10.824869155883789, -9.152731895446777, -7.480594158172607, -5.8084564208984375, -4.136318206787109, -2.4641809463500977, -0.7920436859130859, 0.8800945281982422, 2.552232265472412, 4.224370002746582, 5.896507740020752, 7.568645477294922, 9.24078369140625, 10.912920951843262, 12.585058212280273, 14.257196426391602, 15.92933464050293, 17.601470947265625, 19.273609161376953, 20.94574737548828, 22.61788558959961, 24.290023803710938, 25.962160110473633, 27.63429832458496, 29.30643653869629, 30.978572845458984, 32.65071105957031, 34.32284927368164, 35.99498748779297, 37.6671257019043, 39.339263916015625, 41.01139831542969, 42.683536529541016, 44.355674743652344, 46.02781295776367, 47.699951171875, 49.37208557128906, 51.04422378540039, 52.71636199951172, 54.38850021362305, 56.060638427734375, 57.7327766418457, 59.40491485595703, 61.077049255371094, 62.74919128417969, 64.42132568359375, 66.09346008300781, 67.7656021118164, 69.43773651123047, 71.10987854003906, 72.78201293945312, 74.45415496826172, 76.12628936767578, 77.79843139648438, 79.47056579589844, 81.1427001953125, 82.81483459472656, 84.48697662353516, 86.15911102294922, 87.83125305175781, 89.50338745117188, 91.17552947998047, 92.84766387939453, 94.51980590820312]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 3.0, 7.0, 6.0, 12.0, 8.0, 14.0, 9.0, 23.0, 23.0, 24.0, 23.0, 30.0, 32.0, 32.0, 37.0, 37.0, 38.0, 30.0, 33.0, 37.0, 45.0, 40.0, 46.0, 46.0, 33.0, 27.0, 32.0, 25.0, 30.0, 31.0, 23.0, 27.0, 32.0, 17.0, 15.0, 10.0, 12.0, 8.0, 9.0, 10.0, 6.0, 7.0, 4.0, 3.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-18.260726928710938, -17.751453399658203, -17.242177963256836, -16.7329044342041, -16.223630905151367, -15.71435546875, -15.205081939697266, -14.695807456970215, -14.186532974243164, -13.677258491516113, -13.167984962463379, -12.658710479736328, -12.149435997009277, -11.640161514282227, -11.130887985229492, -10.621613502502441, -10.112339973449707, -9.603065490722656, -9.093791961669922, -8.584517478942871, -8.07524299621582, -7.565968990325928, -7.056694984436035, -6.547420501708984, -6.038146495819092, -5.528872489929199, -5.019598007202148, -4.510324001312256, -4.001049995422363, -3.4917755126953125, -2.98250150680542, -2.4732272624969482, -1.9639530181884766, -1.4546787738800049, -0.9454046487808228, -0.4361305236816406, 0.07314372062683105, 0.5824179649353027, 1.0916919708251953, 1.600966215133667, 2.1102404594421387, 2.6195147037506104, 3.128788948059082, 3.6380629539489746, 4.147336959838867, 4.656611442565918, 5.1658854484558105, 5.675159454345703, 6.184433937072754, 6.6937079429626465, 7.202982425689697, 7.71225643157959, 8.22153091430664, 8.730804443359375, 9.240078926086426, 9.749353408813477, 10.258626937866211, 10.767901420593262, 11.277174949645996, 11.786449432373047, 12.295723915100098, 12.804998397827148, 13.314271926879883, 13.823546409606934, 14.332820892333984]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 3.0, 8.0, 6.0, 14.0, 7.0, 4.0, 11.0, 18.0, 25.0, 25.0, 30.0, 21.0, 32.0, 30.0, 29.0, 43.0, 30.0, 45.0, 43.0, 39.0, 30.0, 42.0, 36.0, 38.0, 36.0, 32.0, 48.0, 28.0, 20.0, 30.0, 37.0, 30.0, 19.0, 22.0, 21.0, 18.0, 9.0, 7.0, 6.0, 5.0, 9.0, 6.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.791015625, -2.711212158203125, -2.63140869140625, -2.551605224609375, -2.4718017578125, -2.391998291015625, -2.31219482421875, -2.232391357421875, -2.152587890625, -2.072784423828125, -1.99298095703125, -1.913177490234375, -1.8333740234375, -1.753570556640625, -1.67376708984375, -1.593963623046875, -1.51416015625, -1.434356689453125, -1.35455322265625, -1.274749755859375, -1.1949462890625, -1.115142822265625, -1.03533935546875, -0.955535888671875, -0.875732421875, -0.795928955078125, -0.71612548828125, -0.636322021484375, -0.5565185546875, -0.476715087890625, -0.39691162109375, -0.317108154296875, -0.2373046875, -0.157501220703125, -0.07769775390625, 0.002105712890625, 0.0819091796875, 0.161712646484375, 0.24151611328125, 0.321319580078125, 0.401123046875, 0.480926513671875, 0.56072998046875, 0.640533447265625, 0.7203369140625, 0.800140380859375, 0.87994384765625, 0.959747314453125, 1.03955078125, 1.119354248046875, 1.19915771484375, 1.278961181640625, 1.3587646484375, 1.438568115234375, 1.51837158203125, 1.598175048828125, 1.677978515625, 1.757781982421875, 1.83758544921875, 1.917388916015625, 1.9971923828125, 2.076995849609375, 2.15679931640625, 2.236602783203125, 2.31640625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 14.0, 11.0, 14.0, 22.0, 32.0, 46.0, 82.0, 129.0, 174.0, 262.0, 390.0, 572.0, 860.0, 1320.0, 2080.0, 3284.0, 5076.0, 7969.0, 12677.0, 20231.0, 30968.0, 48551.0, 72568.0, 105850.0, 141356.0, 159188.0, 137110.0, 101767.0, 69093.0, 45379.0, 29457.0, 18796.0, 11983.0, 7486.0, 4874.0, 3001.0, 1968.0, 1307.0, 878.0, 586.0, 378.0, 252.0, 154.0, 112.0, 82.0, 53.0, 37.0, 24.0, 17.0, 16.0, 12.0, 3.0, 4.0, 5.0, 0.0, 0.0, 1.0], "bins": [-0.1998291015625, -0.19366836547851562, -0.18750762939453125, -0.18134689331054688, -0.1751861572265625, -0.16902542114257812, -0.16286468505859375, -0.15670394897460938, -0.150543212890625, -0.14438247680664062, -0.13822174072265625, -0.13206100463867188, -0.1259002685546875, -0.11973953247070312, -0.11357879638671875, -0.10741806030273438, -0.10125732421875, -0.09509658813476562, -0.08893585205078125, -0.08277511596679688, -0.0766143798828125, -0.07045364379882812, -0.06429290771484375, -0.058132171630859375, -0.051971435546875, -0.045810699462890625, -0.03964996337890625, -0.033489227294921875, -0.0273284912109375, -0.021167755126953125, -0.01500701904296875, -0.008846282958984375, -0.002685546875, 0.003475189208984375, 0.00963592529296875, 0.015796661376953125, 0.0219573974609375, 0.028118133544921875, 0.03427886962890625, 0.040439605712890625, 0.046600341796875, 0.052761077880859375, 0.05892181396484375, 0.06508255004882812, 0.0712432861328125, 0.07740402221679688, 0.08356475830078125, 0.08972549438476562, 0.09588623046875, 0.10204696655273438, 0.10820770263671875, 0.11436843872070312, 0.1205291748046875, 0.12668991088867188, 0.13285064697265625, 0.13901138305664062, 0.145172119140625, 0.15133285522460938, 0.15749359130859375, 0.16365432739257812, 0.1698150634765625, 0.17597579956054688, 0.18213653564453125, 0.18829727172851562, 0.1944580078125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 5.0, 5.0, 6.0, 14.0, 14.0, 8.0, 13.0, 13.0, 31.0, 20.0, 25.0, 23.0, 30.0, 23.0, 42.0, 40.0, 33.0, 43.0, 42.0, 52.0, 1072.0, 33.0, 37.0, 38.0, 41.0, 34.0, 27.0, 27.0, 23.0, 37.0, 20.0, 21.0, 27.0, 22.0, 16.0, 9.0, 11.0, 13.0, 12.0, 6.0, 5.0, 5.0, 5.0, 0.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9912109375, -1.9209136962890625, -1.850616455078125, -1.7803192138671875, -1.71002197265625, -1.6397247314453125, -1.569427490234375, -1.4991302490234375, -1.4288330078125, -1.3585357666015625, -1.288238525390625, -1.2179412841796875, -1.14764404296875, -1.0773468017578125, -1.007049560546875, -0.9367523193359375, -0.866455078125, -0.7961578369140625, -0.725860595703125, -0.6555633544921875, -0.58526611328125, -0.5149688720703125, -0.444671630859375, -0.3743743896484375, -0.3040771484375, -0.2337799072265625, -0.163482666015625, -0.0931854248046875, -0.02288818359375, 0.0474090576171875, 0.117706298828125, 0.1880035400390625, 0.25830078125, 0.3285980224609375, 0.398895263671875, 0.4691925048828125, 0.53948974609375, 0.6097869873046875, 0.680084228515625, 0.7503814697265625, 0.8206787109375, 0.8909759521484375, 0.961273193359375, 1.0315704345703125, 1.10186767578125, 1.1721649169921875, 1.242462158203125, 1.3127593994140625, 1.383056640625, 1.4533538818359375, 1.523651123046875, 1.5939483642578125, 1.66424560546875, 1.7345428466796875, 1.804840087890625, 1.8751373291015625, 1.9454345703125, 2.0157318115234375, 2.086029052734375, 2.1563262939453125, 2.22662353515625, 2.2969207763671875, 2.367218017578125, 2.4375152587890625, 2.5078125]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 11.0, 14.0, 11.0, 17.0, 24.0, 35.0, 51.0, 88.0, 134.0, 205.0, 330.0, 497.0, 893.0, 1467.0, 2568.0, 4194.0, 7409.0, 12545.0, 20850.0, 35338.0, 58552.0, 94359.0, 143004.0, 1217186.0, 181406.0, 121380.0, 77590.0, 47672.0, 28132.0, 16761.0, 9990.0, 5911.0, 3418.0, 1977.0, 1203.0, 723.0, 395.0, 305.0, 159.0, 122.0, 63.0, 49.0, 29.0, 24.0, 18.0, 7.0, 6.0, 3.0, 3.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14013671875, -0.1358623504638672, -0.13158798217773438, -0.12731361389160156, -0.12303924560546875, -0.11876487731933594, -0.11449050903320312, -0.11021614074707031, -0.1059417724609375, -0.10166740417480469, -0.09739303588867188, -0.09311866760253906, -0.08884429931640625, -0.08456993103027344, -0.08029556274414062, -0.07602119445800781, -0.071746826171875, -0.06747245788574219, -0.06319808959960938, -0.05892372131347656, -0.05464935302734375, -0.05037498474121094, -0.046100616455078125, -0.04182624816894531, -0.0375518798828125, -0.03327751159667969, -0.029003143310546875, -0.024728775024414062, -0.02045440673828125, -0.016180038452148438, -0.011905670166015625, -0.0076313018798828125, -0.00335693359375, 0.0009174346923828125, 0.005191802978515625, 0.009466171264648438, 0.01374053955078125, 0.018014907836914062, 0.022289276123046875, 0.026563644409179688, 0.0308380126953125, 0.03511238098144531, 0.039386749267578125, 0.04366111755371094, 0.04793548583984375, 0.05220985412597656, 0.056484222412109375, 0.06075859069824219, 0.065032958984375, 0.06930732727050781, 0.07358169555664062, 0.07785606384277344, 0.08213043212890625, 0.08640480041503906, 0.09067916870117188, 0.09495353698730469, 0.0992279052734375, 0.10350227355957031, 0.10777664184570312, 0.11205101013183594, 0.11632537841796875, 0.12059974670410156, 0.12487411499023438, 0.1291484832763672, 0.1334228515625]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 4.0, 7.0, 11.0, 11.0, 19.0, 21.0, 19.0, 28.0, 33.0, 31.0, 46.0, 53.0, 71.0, 92.0, 95.0, 109.0, 53.0, 60.0, 42.0, 36.0, 29.0, 19.0, 19.0, 20.0, 17.0, 10.0, 13.0, 7.0, 3.0, 5.0, 7.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.004817962646484375, -0.004668831825256348, -0.00451970100402832, -0.004370570182800293, -0.004221439361572266, -0.004072308540344238, -0.003923177719116211, -0.0037740468978881836, -0.0036249160766601562, -0.003475785255432129, -0.0033266544342041016, -0.0031775236129760742, -0.003028392791748047, -0.0028792619705200195, -0.002730131149291992, -0.002581000328063965, -0.0024318695068359375, -0.00228273868560791, -0.002133607864379883, -0.0019844770431518555, -0.0018353462219238281, -0.0016862154006958008, -0.0015370845794677734, -0.001387953758239746, -0.0012388229370117188, -0.0010896921157836914, -0.0009405612945556641, -0.0007914304733276367, -0.0006422996520996094, -0.000493168830871582, -0.0003440380096435547, -0.00019490718841552734, -4.57763671875e-05, 0.00010335445404052734, 0.0002524852752685547, 0.00040161609649658203, 0.0005507469177246094, 0.0006998777389526367, 0.0008490085601806641, 0.0009981393814086914, 0.0011472702026367188, 0.001296401023864746, 0.0014455318450927734, 0.0015946626663208008, 0.0017437934875488281, 0.0018929243087768555, 0.002042055130004883, 0.00219118595123291, 0.0023403167724609375, 0.002489447593688965, 0.002638578414916992, 0.0027877092361450195, 0.002936840057373047, 0.0030859708786010742, 0.0032351016998291016, 0.003384232521057129, 0.0035333633422851562, 0.0036824941635131836, 0.003831624984741211, 0.003980755805969238, 0.004129886627197266, 0.004279017448425293, 0.00442814826965332, 0.004577279090881348, 0.004726409912109375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 7.0, 9.0, 13.0, 11.0, 23.0, 15.0, 18.0, 34.0, 40.0, 64.0, 94.0, 165.0, 481.0, 6474.0, 927933.0, 110603.0, 1871.0, 277.0, 143.0, 56.0, 48.0, 41.0, 28.0, 25.0, 19.0, 10.0, 14.0, 6.0, 9.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10150146484375, -0.09831047058105469, -0.09511947631835938, -0.09192848205566406, -0.08873748779296875, -0.08554649353027344, -0.08235549926757812, -0.07916450500488281, -0.0759735107421875, -0.07278251647949219, -0.06959152221679688, -0.06640052795410156, -0.06320953369140625, -0.06001853942871094, -0.056827545166015625, -0.05363655090332031, -0.050445556640625, -0.04725456237792969, -0.044063568115234375, -0.04087257385253906, -0.03768157958984375, -0.03449058532714844, -0.031299591064453125, -0.028108596801757812, -0.0249176025390625, -0.021726608276367188, -0.018535614013671875, -0.015344619750976562, -0.01215362548828125, -0.008962631225585938, -0.005771636962890625, -0.0025806427001953125, 0.0006103515625, 0.0038013458251953125, 0.006992340087890625, 0.010183334350585938, 0.01337432861328125, 0.016565322875976562, 0.019756317138671875, 0.022947311401367188, 0.0261383056640625, 0.029329299926757812, 0.032520294189453125, 0.03571128845214844, 0.03890228271484375, 0.04209327697753906, 0.045284271240234375, 0.04847526550292969, 0.051666259765625, 0.05485725402832031, 0.058048248291015625, 0.06123924255371094, 0.06443023681640625, 0.06762123107910156, 0.07081222534179688, 0.07400321960449219, 0.0771942138671875, 0.08038520812988281, 0.08357620239257812, 0.08676719665527344, 0.08995819091796875, 0.09314918518066406, 0.09634017944335938, 0.09953117370605469, 0.10272216796875]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 7.0, 10.0, 16.0, 32.0, 65.0, 104.0, 300.0, 263.0, 113.0, 45.0, 20.0, 12.0, 12.0, 2.0, 5.0, 2.0, 2.0, 3.0], "bins": [-0.050242114812135696, -0.049291785806417465, -0.048341453075408936, -0.047391124069690704, -0.046440791338682175, -0.045490462332963943, -0.04454013332724571, -0.04358980059623718, -0.04263947159051895, -0.04168914258480072, -0.04073880985379219, -0.03978848084807396, -0.03883814811706543, -0.0378878191113472, -0.03693749010562897, -0.03598715737462044, -0.035036828368902206, -0.034086499363183975, -0.033136166632175446, -0.032185837626457214, -0.031235506758093834, -0.030285175889730453, -0.029334845021367073, -0.028384514153003693, -0.027434183284640312, -0.026483852416276932, -0.02553352154791355, -0.02458319254219532, -0.02363286167383194, -0.02268253080546856, -0.02173219993710518, -0.020781870931386948, -0.019831541925668716, -0.018881211057305336, -0.017930880188941956, -0.016980551183223724, -0.016030220314860344, -0.015079889446496964, -0.014129558578133583, -0.013179228641092777, -0.012228896841406822, -0.011278565973043442, -0.010328236036002636, -0.009377905167639256, -0.00842757523059845, -0.007477244362235069, -0.006526913959532976, -0.005576583556830883, -0.004626253619790077, -0.003675923217087984, -0.002725592814385891, -0.0017752621788531542, -0.0008249317761510611, 0.00012539885938167572, 0.0010757292620837688, 0.002026059664785862, 0.002976390067487955, 0.003926720470190048, 0.004877050872892141, 0.0058273812755942345, 0.006777712143957615, 0.007728042546659708, 0.008678372949361801, 0.009628703817725182, 0.010579033754765987]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 2.0, 7.0, 8.0, 12.0, 10.0, 15.0, 12.0, 21.0, 18.0, 23.0, 24.0, 21.0, 42.0, 33.0, 41.0, 18.0, 35.0, 45.0, 44.0, 39.0, 38.0, 42.0, 37.0, 26.0, 30.0, 25.0, 44.0, 36.0, 19.0, 34.0, 34.0, 27.0, 14.0, 27.0, 22.0, 17.0, 15.0, 9.0, 10.0, 11.0, 3.0, 4.0, 0.0, 7.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-0.005157470703125, -0.005002596415579319, -0.004847722128033638, -0.004692847840487957, -0.004537973552942276, -0.004383099265396595, -0.004228224977850914, -0.004073350690305233, -0.003918476402759552, -0.003763602115213871, -0.00360872782766819, -0.003453853540122509, -0.003298979252576828, -0.003144104965031147, -0.002989230677485466, -0.002834356389939785, -0.002679482102394104, -0.002524607814848423, -0.002369733527302742, -0.002214859239757061, -0.00205998495221138, -0.001905110664665699, -0.001750236377120018, -0.001595362089574337, -0.001440487802028656, -0.001285613514482975, -0.001130739226937294, -0.000975864939391613, -0.000820990651845932, -0.000666116364300251, -0.00051124207675457, -0.000356367789208889, -0.000201493501663208, -4.661921411752701e-05, 0.00010825507342815399, 0.000263129360973835, 0.000418003648519516, 0.000572877936065197, 0.000727752223610878, 0.000882626511156559, 0.00103750079870224, 0.001192375086247921, 0.001347249373793602, 0.001502123661339283, 0.001656997948884964, 0.001811872236430645, 0.001966746523976326, 0.002121620811522007, 0.002276495099067688, 0.002431369386613369, 0.00258624367415905, 0.002741117961704731, 0.002895992249250412, 0.003050866536796093, 0.003205740824341774, 0.003360615111887455, 0.003515489399433136, 0.003670363686978817, 0.003825237974524498, 0.003980112262070179, 0.00413498654961586, 0.004289860837161541, 0.004444735124707222, 0.004599609412252903, 0.004754483699798584]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 4.0, 3.0, 8.0, 7.0, 13.0, 7.0, 4.0, 11.0, 18.0, 25.0, 27.0, 29.0, 20.0, 32.0, 30.0, 30.0, 42.0, 30.0, 45.0, 43.0, 39.0, 32.0, 40.0, 37.0, 38.0, 36.0, 31.0, 48.0, 28.0, 21.0, 29.0, 37.0, 30.0, 19.0, 22.0, 21.0, 18.0, 9.0, 7.0, 6.0, 5.0, 9.0, 6.0, 2.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.7890625, -2.70928955078125, -2.6295166015625, -2.54974365234375, -2.469970703125, -2.39019775390625, -2.3104248046875, -2.23065185546875, -2.15087890625, -2.07110595703125, -1.9913330078125, -1.91156005859375, -1.831787109375, -1.75201416015625, -1.6722412109375, -1.59246826171875, -1.5126953125, -1.43292236328125, -1.3531494140625, -1.27337646484375, -1.193603515625, -1.11383056640625, -1.0340576171875, -0.95428466796875, -0.87451171875, -0.79473876953125, -0.7149658203125, -0.63519287109375, -0.555419921875, -0.47564697265625, -0.3958740234375, -0.31610107421875, -0.236328125, -0.15655517578125, -0.0767822265625, 0.00299072265625, 0.082763671875, 0.16253662109375, 0.2423095703125, 0.32208251953125, 0.40185546875, 0.48162841796875, 0.5614013671875, 0.64117431640625, 0.720947265625, 0.80072021484375, 0.8804931640625, 0.96026611328125, 1.0400390625, 1.11981201171875, 1.1995849609375, 1.27935791015625, 1.359130859375, 1.43890380859375, 1.5186767578125, 1.59844970703125, 1.67822265625, 1.75799560546875, 1.8377685546875, 1.91754150390625, 1.997314453125, 2.07708740234375, 2.1568603515625, 2.23663330078125, 2.31640625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 8.0, 7.0, 6.0, 6.0, 17.0, 17.0, 23.0, 17.0, 44.0, 48.0, 82.0, 115.0, 194.0, 310.0, 566.0, 1142.0, 2164.0, 4288.0, 8471.0, 16463.0, 31590.0, 63922.0, 136455.0, 304183.0, 254604.0, 113676.0, 53729.0, 27100.0, 14160.0, 7319.0, 3717.0, 1813.0, 963.0, 509.0, 284.0, 177.0, 94.0, 79.0, 52.0, 34.0, 33.0, 21.0, 13.0, 12.0, 13.0, 8.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-2.953125, -2.86846923828125, -2.7838134765625, -2.69915771484375, -2.614501953125, -2.52984619140625, -2.4451904296875, -2.36053466796875, -2.27587890625, -2.19122314453125, -2.1065673828125, -2.02191162109375, -1.937255859375, -1.85260009765625, -1.7679443359375, -1.68328857421875, -1.5986328125, -1.51397705078125, -1.4293212890625, -1.34466552734375, -1.260009765625, -1.17535400390625, -1.0906982421875, -1.00604248046875, -0.92138671875, -0.83673095703125, -0.7520751953125, -0.66741943359375, -0.582763671875, -0.49810791015625, -0.4134521484375, -0.32879638671875, -0.244140625, -0.15948486328125, -0.0748291015625, 0.00982666015625, 0.094482421875, 0.17913818359375, 0.2637939453125, 0.34844970703125, 0.43310546875, 0.51776123046875, 0.6024169921875, 0.68707275390625, 0.771728515625, 0.85638427734375, 0.9410400390625, 1.02569580078125, 1.1103515625, 1.19500732421875, 1.2796630859375, 1.36431884765625, 1.448974609375, 1.53363037109375, 1.6182861328125, 1.70294189453125, 1.78759765625, 1.87225341796875, 1.9569091796875, 2.04156494140625, 2.126220703125, 2.21087646484375, 2.2955322265625, 2.38018798828125, 2.46484375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 0.0, 7.0, 10.0, 7.0, 9.0, 16.0, 14.0, 22.0, 28.0, 22.0, 32.0, 27.0, 29.0, 36.0, 43.0, 58.0, 62.0, 103.0, 194.0, 1443.0, 291.0, 144.0, 76.0, 61.0, 51.0, 29.0, 23.0, 41.0, 25.0, 29.0, 19.0, 23.0, 13.0, 5.0, 11.0, 12.0, 8.0, 4.0, 4.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.5, -8.22314453125, -7.9462890625, -7.66943359375, -7.392578125, -7.11572265625, -6.8388671875, -6.56201171875, -6.28515625, -6.00830078125, -5.7314453125, -5.45458984375, -5.177734375, -4.90087890625, -4.6240234375, -4.34716796875, -4.0703125, -3.79345703125, -3.5166015625, -3.23974609375, -2.962890625, -2.68603515625, -2.4091796875, -2.13232421875, -1.85546875, -1.57861328125, -1.3017578125, -1.02490234375, -0.748046875, -0.47119140625, -0.1943359375, 0.08251953125, 0.359375, 0.63623046875, 0.9130859375, 1.18994140625, 1.466796875, 1.74365234375, 2.0205078125, 2.29736328125, 2.57421875, 2.85107421875, 3.1279296875, 3.40478515625, 3.681640625, 3.95849609375, 4.2353515625, 4.51220703125, 4.7890625, 5.06591796875, 5.3427734375, 5.61962890625, 5.896484375, 6.17333984375, 6.4501953125, 6.72705078125, 7.00390625, 7.28076171875, 7.5576171875, 7.83447265625, 8.111328125, 8.38818359375, 8.6650390625, 8.94189453125, 9.21875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 1.0, 3.0, 5.0, 8.0, 8.0, 16.0, 14.0, 21.0, 33.0, 36.0, 52.0, 67.0, 109.0, 134.0, 207.0, 380.0, 842.0, 3245.0, 318855.0, 2810094.0, 9059.0, 1179.0, 473.0, 283.0, 149.0, 116.0, 89.0, 65.0, 45.0, 34.0, 20.0, 23.0, 8.0, 11.0, 5.0, 2.0, 2.0, 3.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.21875, -23.466064453125, -22.71337890625, -21.960693359375, -21.2080078125, -20.455322265625, -19.70263671875, -18.949951171875, -18.197265625, -17.444580078125, -16.69189453125, -15.939208984375, -15.1865234375, -14.433837890625, -13.68115234375, -12.928466796875, -12.17578125, -11.423095703125, -10.67041015625, -9.917724609375, -9.1650390625, -8.412353515625, -7.65966796875, -6.906982421875, -6.154296875, -5.401611328125, -4.64892578125, -3.896240234375, -3.1435546875, -2.390869140625, -1.63818359375, -0.885498046875, -0.1328125, 0.619873046875, 1.37255859375, 2.125244140625, 2.8779296875, 3.630615234375, 4.38330078125, 5.135986328125, 5.888671875, 6.641357421875, 7.39404296875, 8.146728515625, 8.8994140625, 9.652099609375, 10.40478515625, 11.157470703125, 11.91015625, 12.662841796875, 13.41552734375, 14.168212890625, 14.9208984375, 15.673583984375, 16.42626953125, 17.178955078125, 17.931640625, 18.684326171875, 19.43701171875, 20.189697265625, 20.9423828125, 21.695068359375, 22.44775390625, 23.200439453125, 23.953125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 17.0, 276.0, 577.0, 139.0, 7.0, 0.0, 1.0], "bins": [-129.88644409179688, -127.69596862792969, -125.5054931640625, -123.31501770019531, -121.12454223632812, -118.93406677246094, -116.74359130859375, -114.55311584472656, -112.36264038085938, -110.17216491699219, -107.981689453125, -105.79121398925781, -103.60073852539062, -101.41026306152344, -99.21978759765625, -97.02931213378906, -94.83883666992188, -92.64836120605469, -90.4578857421875, -88.26741027832031, -86.07693481445312, -83.88645935058594, -81.69598388671875, -79.50550842285156, -77.31502532958984, -75.12454986572266, -72.93407440185547, -70.74359893798828, -68.5531234741211, -66.3626480102539, -64.17217254638672, -61.98169708251953, -59.79121398925781, -57.600738525390625, -55.41026306152344, -53.21978759765625, -51.02931213378906, -48.838836669921875, -46.64836120605469, -44.4578857421875, -42.26741027832031, -40.076934814453125, -37.88645935058594, -35.69598388671875, -33.50550842285156, -31.315032958984375, -29.124555587768555, -26.934080123901367, -24.743602752685547, -22.55312728881836, -20.362651824951172, -18.172176361083984, -15.98169994354248, -13.791224479675293, -11.600748062133789, -9.410272598266602, -7.2197980880737305, -5.029322624206543, -2.8388466835021973, -0.6483707427978516, 1.542104721069336, 3.7325801849365234, 5.923056602478027, 8.113532066345215, 10.304007530212402]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 2.0, 3.0, 7.0, 8.0, 8.0, 14.0, 12.0, 8.0, 19.0, 19.0, 22.0, 23.0, 20.0, 17.0, 28.0, 25.0, 40.0, 37.0, 32.0, 25.0, 32.0, 34.0, 41.0, 43.0, 32.0, 42.0, 34.0, 39.0, 32.0, 36.0, 22.0, 20.0, 30.0, 24.0, 22.0, 20.0, 20.0, 16.0, 21.0, 9.0, 16.0, 19.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0], "bins": [-21.74846649169922, -21.087907791137695, -20.427349090576172, -19.76679039001465, -19.106231689453125, -18.4456729888916, -17.785114288330078, -17.124555587768555, -16.46399688720703, -15.803438186645508, -15.142879486083984, -14.482320785522461, -13.821762084960938, -13.161203384399414, -12.50064468383789, -11.840085983276367, -11.179526329040527, -10.518967628479004, -9.85840892791748, -9.197850227355957, -8.537291526794434, -7.87673282623291, -7.2161736488342285, -6.555614948272705, -5.895056247711182, -5.234497547149658, -4.573938846588135, -3.9133799076080322, -3.252821207046509, -2.5922625064849854, -1.9317035675048828, -1.2711448669433594, -0.6105861663818359, 0.049972593784332275, 0.7105313539505005, 1.3710901737213135, 2.031648874282837, 2.6922075748443604, 3.352766513824463, 4.013325214385986, 4.67388391494751, 5.334442615509033, 5.995001316070557, 6.655560493469238, 7.316119194030762, 7.976677894592285, 8.637236595153809, 9.297795295715332, 9.958353996276855, 10.618912696838379, 11.279471397399902, 11.940030097961426, 12.60058879852295, 13.261147499084473, 13.921707153320312, 14.582265853881836, 15.24282455444336, 15.903383255004883, 16.563941955566406, 17.22450065612793, 17.885059356689453, 18.545618057250977, 19.2061767578125, 19.866735458374023, 20.527294158935547]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 4.0, 2.0, 6.0, 5.0, 9.0, 10.0, 8.0, 10.0, 17.0, 15.0, 19.0, 22.0, 31.0, 23.0, 23.0, 45.0, 26.0, 33.0, 38.0, 32.0, 40.0, 54.0, 39.0, 32.0, 38.0, 35.0, 35.0, 31.0, 35.0, 38.0, 32.0, 33.0, 19.0, 27.0, 22.0, 22.0, 17.0, 13.0, 12.0, 8.0, 12.0, 4.0, 9.0, 9.0, 3.0, 4.0, 5.0, 0.0, 3.0, 1.0], "bins": [-3.1640625, -3.07830810546875, -2.9925537109375, -2.90679931640625, -2.821044921875, -2.73529052734375, -2.6495361328125, -2.56378173828125, -2.47802734375, -2.39227294921875, -2.3065185546875, -2.22076416015625, -2.135009765625, -2.04925537109375, -1.9635009765625, -1.87774658203125, -1.7919921875, -1.70623779296875, -1.6204833984375, -1.53472900390625, -1.448974609375, -1.36322021484375, -1.2774658203125, -1.19171142578125, -1.10595703125, -1.02020263671875, -0.9344482421875, -0.84869384765625, -0.762939453125, -0.67718505859375, -0.5914306640625, -0.50567626953125, -0.419921875, -0.33416748046875, -0.2484130859375, -0.16265869140625, -0.076904296875, 0.00885009765625, 0.0946044921875, 0.18035888671875, 0.26611328125, 0.35186767578125, 0.4376220703125, 0.52337646484375, 0.609130859375, 0.69488525390625, 0.7806396484375, 0.86639404296875, 0.9521484375, 1.03790283203125, 1.1236572265625, 1.20941162109375, 1.295166015625, 1.38092041015625, 1.4666748046875, 1.55242919921875, 1.63818359375, 1.72393798828125, 1.8096923828125, 1.89544677734375, 1.981201171875, 2.06695556640625, 2.1527099609375, 2.23846435546875, 2.32421875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 0.0, 4.0, 1.0, 6.0, 3.0, 6.0, 9.0, 8.0, 11.0, 11.0, 11.0, 12.0, 18.0, 22.0, 26.0, 38.0, 44.0, 105.0, 144.0, 316.0, 792.0, 2672.0, 10239.0, 49603.0, 281311.0, 1500116.0, 1863524.0, 397485.0, 68735.0, 13764.0, 3401.0, 983.0, 371.0, 150.0, 82.0, 57.0, 35.0, 33.0, 18.0, 18.0, 20.0, 17.0, 16.0, 7.0, 8.0, 9.0, 6.0, 9.0, 4.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0], "bins": [-5.95703125, -5.78729248046875, -5.6175537109375, -5.44781494140625, -5.278076171875, -5.10833740234375, -4.9385986328125, -4.76885986328125, -4.59912109375, -4.42938232421875, -4.2596435546875, -4.08990478515625, -3.920166015625, -3.75042724609375, -3.5806884765625, -3.41094970703125, -3.2412109375, -3.07147216796875, -2.9017333984375, -2.73199462890625, -2.562255859375, -2.39251708984375, -2.2227783203125, -2.05303955078125, -1.88330078125, -1.71356201171875, -1.5438232421875, -1.37408447265625, -1.204345703125, -1.03460693359375, -0.8648681640625, -0.69512939453125, -0.525390625, -0.35565185546875, -0.1859130859375, -0.01617431640625, 0.153564453125, 0.32330322265625, 0.4930419921875, 0.66278076171875, 0.83251953125, 1.00225830078125, 1.1719970703125, 1.34173583984375, 1.511474609375, 1.68121337890625, 1.8509521484375, 2.02069091796875, 2.1904296875, 2.36016845703125, 2.5299072265625, 2.69964599609375, 2.869384765625, 3.03912353515625, 3.2088623046875, 3.37860107421875, 3.54833984375, 3.71807861328125, 3.8878173828125, 4.05755615234375, 4.227294921875, 4.39703369140625, 4.5667724609375, 4.73651123046875, 4.90625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 2.0, 6.0, 15.0, 19.0, 10.0, 22.0, 20.0, 31.0, 60.0, 65.0, 60.0, 97.0, 145.0, 161.0, 209.0, 308.0, 363.0, 376.0, 409.0, 353.0, 293.0, 251.0, 203.0, 133.0, 109.0, 71.0, 59.0, 49.0, 27.0, 40.0, 19.0, 24.0, 21.0, 13.0, 8.0, 4.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.6640625, -4.5191650390625, -4.374267578125, -4.2293701171875, -4.08447265625, -3.9395751953125, -3.794677734375, -3.6497802734375, -3.5048828125, -3.3599853515625, -3.215087890625, -3.0701904296875, -2.92529296875, -2.7803955078125, -2.635498046875, -2.4906005859375, -2.345703125, -2.2008056640625, -2.055908203125, -1.9110107421875, -1.76611328125, -1.6212158203125, -1.476318359375, -1.3314208984375, -1.1865234375, -1.0416259765625, -0.896728515625, -0.7518310546875, -0.60693359375, -0.4620361328125, -0.317138671875, -0.1722412109375, -0.02734375, 0.1175537109375, 0.262451171875, 0.4073486328125, 0.55224609375, 0.6971435546875, 0.842041015625, 0.9869384765625, 1.1318359375, 1.2767333984375, 1.421630859375, 1.5665283203125, 1.71142578125, 1.8563232421875, 2.001220703125, 2.1461181640625, 2.291015625, 2.4359130859375, 2.580810546875, 2.7257080078125, 2.87060546875, 3.0155029296875, 3.160400390625, 3.3052978515625, 3.4501953125, 3.5950927734375, 3.739990234375, 3.8848876953125, 4.02978515625, 4.1746826171875, 4.319580078125, 4.4644775390625, 4.609375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 7.0, 7.0, 16.0, 21.0, 22.0, 32.0, 35.0, 44.0, 63.0, 64.0, 102.0, 176.0, 225.0, 348.0, 964.0, 25340.0, 3634202.0, 527335.0, 3697.0, 558.0, 280.0, 200.0, 150.0, 96.0, 59.0, 74.0, 33.0, 27.0, 25.0, 14.0, 17.0, 11.0, 13.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-26.0, -25.20654296875, -24.4130859375, -23.61962890625, -22.826171875, -22.03271484375, -21.2392578125, -20.44580078125, -19.65234375, -18.85888671875, -18.0654296875, -17.27197265625, -16.478515625, -15.68505859375, -14.8916015625, -14.09814453125, -13.3046875, -12.51123046875, -11.7177734375, -10.92431640625, -10.130859375, -9.33740234375, -8.5439453125, -7.75048828125, -6.95703125, -6.16357421875, -5.3701171875, -4.57666015625, -3.783203125, -2.98974609375, -2.1962890625, -1.40283203125, -0.609375, 0.18408203125, 0.9775390625, 1.77099609375, 2.564453125, 3.35791015625, 4.1513671875, 4.94482421875, 5.73828125, 6.53173828125, 7.3251953125, 8.11865234375, 8.912109375, 9.70556640625, 10.4990234375, 11.29248046875, 12.0859375, 12.87939453125, 13.6728515625, 14.46630859375, 15.259765625, 16.05322265625, 16.8466796875, 17.64013671875, 18.43359375, 19.22705078125, 20.0205078125, 20.81396484375, 21.607421875, 22.40087890625, 23.1943359375, 23.98779296875, 24.78125]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 16.0, 33.0, 103.0, 193.0, 230.0, 182.0, 137.0, 71.0, 30.0, 10.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.815752029418945, -25.31035614013672, -23.804962158203125, -22.2995662689209, -20.794170379638672, -19.288776397705078, -17.78338050842285, -16.277984619140625, -14.772589683532715, -13.267194747924805, -11.761798858642578, -10.256403923034668, -8.751008987426758, -7.245613098144531, -5.740218162536621, -4.2348222732543945, -2.7294273376464844, -1.2240320444107056, 0.28136324882507324, 1.7867584228515625, 3.292153835296631, 4.797549247741699, 6.302944183349609, 7.808340072631836, 9.313735008239746, 10.819129943847656, 12.324525833129883, 13.829920768737793, 15.335315704345703, 16.84071159362793, 18.346107482910156, 19.85150146484375, 21.35689926147461, 22.862295150756836, 24.36768913269043, 25.873085021972656, 27.378480911254883, 28.88387680053711, 30.389270782470703, 31.89466667175293, 33.400062561035156, 34.90545654296875, 36.41085433959961, 37.9162483215332, 39.4216423034668, 40.927040100097656, 42.43243408203125, 43.937828063964844, 45.44322204589844, 46.94861602783203, 48.45401382446289, 49.959407806396484, 51.46480178833008, 52.97019958496094, 54.47559356689453, 55.980987548828125, 57.486385345458984, 58.99177932739258, 60.49717712402344, 62.00257110595703, 63.507965087890625, 65.01335906982422, 66.51875305175781, 68.02415466308594, 69.52954864501953]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 9.0, 10.0, 6.0, 8.0, 14.0, 17.0, 15.0, 10.0, 20.0, 18.0, 28.0, 30.0, 31.0, 28.0, 23.0, 31.0, 42.0, 34.0, 35.0, 27.0, 34.0, 48.0, 42.0, 27.0, 26.0, 35.0, 33.0, 32.0, 29.0, 22.0, 31.0, 20.0, 17.0, 28.0, 21.0, 20.0, 16.0, 24.0, 10.0, 10.0, 8.0, 4.0, 5.0, 6.0, 6.0, 3.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0], "bins": [-16.525115966796875, -16.047571182250977, -15.570027351379395, -15.092483520507812, -14.614938735961914, -14.137394905090332, -13.65985107421875, -13.182306289672852, -12.704761505126953, -12.227217674255371, -11.749672889709473, -11.27212905883789, -10.794584274291992, -10.31704044342041, -9.839496612548828, -9.36195182800293, -8.884407997131348, -8.406864166259766, -7.929319381713867, -7.451775550842285, -6.974230766296387, -6.496686935424805, -6.0191426277160645, -5.541598320007324, -5.064054012298584, -4.586509704589844, -4.1089653968811035, -3.6314213275909424, -3.153877019882202, -2.676332712173462, -2.198788642883301, -1.7212443351745605, -1.243699073791504, -0.7661548256874084, -0.288610577583313, 0.1889336109161377, 0.6664779186248779, 1.1440222263336182, 1.6215662956237793, 2.0991106033325195, 2.5766549110412598, 3.05419921875, 3.5317435264587402, 4.0092878341674805, 4.4868316650390625, 4.964376449584961, 5.441920280456543, 5.919464588165283, 6.397008895874023, 6.874553203582764, 7.352097511291504, 7.829641342163086, 8.307186126708984, 8.784729957580566, 9.262273788452148, 9.739818572998047, 10.217363357543945, 10.694907188415527, 11.172451972961426, 11.649995803833008, 12.127540588378906, 12.605084419250488, 13.08262825012207, 13.560173034667969, 14.03771686553955]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 8.0, 3.0, 15.0, 8.0, 12.0, 15.0, 17.0, 25.0, 27.0, 26.0, 23.0, 32.0, 30.0, 44.0, 37.0, 27.0, 47.0, 40.0, 49.0, 46.0, 40.0, 34.0, 36.0, 41.0, 34.0, 40.0, 38.0, 16.0, 38.0, 23.0, 27.0, 15.0, 13.0, 14.0, 18.0, 9.0, 4.0, 7.0, 9.0, 7.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0], "bins": [-3.375, -3.2843017578125, -3.193603515625, -3.1029052734375, -3.01220703125, -2.9215087890625, -2.830810546875, -2.7401123046875, -2.6494140625, -2.5587158203125, -2.468017578125, -2.3773193359375, -2.28662109375, -2.1959228515625, -2.105224609375, -2.0145263671875, -1.923828125, -1.8331298828125, -1.742431640625, -1.6517333984375, -1.56103515625, -1.4703369140625, -1.379638671875, -1.2889404296875, -1.1982421875, -1.1075439453125, -1.016845703125, -0.9261474609375, -0.83544921875, -0.7447509765625, -0.654052734375, -0.5633544921875, -0.47265625, -0.3819580078125, -0.291259765625, -0.2005615234375, -0.10986328125, -0.0191650390625, 0.071533203125, 0.1622314453125, 0.2529296875, 0.3436279296875, 0.434326171875, 0.5250244140625, 0.61572265625, 0.7064208984375, 0.797119140625, 0.8878173828125, 0.978515625, 1.0692138671875, 1.159912109375, 1.2506103515625, 1.34130859375, 1.4320068359375, 1.522705078125, 1.6134033203125, 1.7041015625, 1.7947998046875, 1.885498046875, 1.9761962890625, 2.06689453125, 2.1575927734375, 2.248291015625, 2.3389892578125, 2.4296875]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 6.0, 9.0, 5.0, 12.0, 23.0, 28.0, 58.0, 74.0, 107.0, 163.0, 242.0, 385.0, 562.0, 900.0, 1319.0, 2024.0, 3149.0, 4952.0, 7796.0, 12359.0, 19439.0, 30981.0, 48337.0, 75311.0, 111199.0, 150551.0, 166215.0, 136902.0, 97636.0, 64703.0, 41295.0, 26163.0, 16246.0, 10506.0, 6648.0, 4292.0, 2752.0, 1755.0, 1177.0, 760.0, 518.0, 321.0, 238.0, 161.0, 85.0, 52.0, 42.0, 38.0, 23.0, 19.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0], "bins": [-0.23828125, -0.23113059997558594, -0.22397994995117188, -0.2168292999267578, -0.20967864990234375, -0.2025279998779297, -0.19537734985351562, -0.18822669982910156, -0.1810760498046875, -0.17392539978027344, -0.16677474975585938, -0.1596240997314453, -0.15247344970703125, -0.1453227996826172, -0.13817214965820312, -0.13102149963378906, -0.123870849609375, -0.11672019958496094, -0.10956954956054688, -0.10241889953613281, -0.09526824951171875, -0.08811759948730469, -0.08096694946289062, -0.07381629943847656, -0.0666656494140625, -0.05951499938964844, -0.052364349365234375, -0.04521369934082031, -0.03806304931640625, -0.030912399291992188, -0.023761749267578125, -0.016611099243164062, -0.00946044921875, -0.0023097991943359375, 0.004840850830078125, 0.011991500854492188, 0.01914215087890625, 0.026292800903320312, 0.033443450927734375, 0.04059410095214844, 0.0477447509765625, 0.05489540100097656, 0.062046051025390625, 0.06919670104980469, 0.07634735107421875, 0.08349800109863281, 0.09064865112304688, 0.09779930114746094, 0.104949951171875, 0.11210060119628906, 0.11925125122070312, 0.1264019012451172, 0.13355255126953125, 0.1407032012939453, 0.14785385131835938, 0.15500450134277344, 0.1621551513671875, 0.16930580139160156, 0.17645645141601562, 0.1836071014404297, 0.19075775146484375, 0.1979084014892578, 0.20505905151367188, 0.21220970153808594, 0.2193603515625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 5.0, 9.0, 9.0, 11.0, 13.0, 11.0, 8.0, 10.0, 19.0, 22.0, 17.0, 12.0, 18.0, 21.0, 28.0, 27.0, 27.0, 28.0, 46.0, 34.0, 45.0, 34.0, 39.0, 1056.0, 45.0, 30.0, 32.0, 40.0, 29.0, 34.0, 28.0, 16.0, 21.0, 24.0, 18.0, 19.0, 27.0, 19.0, 15.0, 11.0, 9.0, 9.0, 10.0, 7.0, 12.0, 7.0, 4.0, 3.0, 3.0, 5.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.1484375, -2.083587646484375, -2.01873779296875, -1.953887939453125, -1.8890380859375, -1.824188232421875, -1.75933837890625, -1.694488525390625, -1.629638671875, -1.564788818359375, -1.49993896484375, -1.435089111328125, -1.3702392578125, -1.305389404296875, -1.24053955078125, -1.175689697265625, -1.11083984375, -1.045989990234375, -0.98114013671875, -0.916290283203125, -0.8514404296875, -0.786590576171875, -0.72174072265625, -0.656890869140625, -0.592041015625, -0.527191162109375, -0.46234130859375, -0.397491455078125, -0.3326416015625, -0.267791748046875, -0.20294189453125, -0.138092041015625, -0.0732421875, -0.008392333984375, 0.05645751953125, 0.121307373046875, 0.1861572265625, 0.251007080078125, 0.31585693359375, 0.380706787109375, 0.445556640625, 0.510406494140625, 0.57525634765625, 0.640106201171875, 0.7049560546875, 0.769805908203125, 0.83465576171875, 0.899505615234375, 0.96435546875, 1.029205322265625, 1.09405517578125, 1.158905029296875, 1.2237548828125, 1.288604736328125, 1.35345458984375, 1.418304443359375, 1.483154296875, 1.548004150390625, 1.61285400390625, 1.677703857421875, 1.7425537109375, 1.807403564453125, 1.87225341796875, 1.937103271484375, 2.001953125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 10.0, 9.0, 18.0, 28.0, 45.0, 52.0, 89.0, 132.0, 189.0, 340.0, 469.0, 763.0, 1297.0, 2291.0, 3898.0, 6540.0, 10590.0, 18218.0, 30014.0, 49441.0, 80393.0, 123936.0, 193524.0, 1196032.0, 139076.0, 93267.0, 58437.0, 35133.0, 21375.0, 12546.0, 7635.0, 4544.0, 2675.0, 1570.0, 945.0, 539.0, 397.0, 226.0, 156.0, 90.0, 52.0, 53.0, 36.0, 20.0, 11.0, 6.0, 9.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1392822265625, -0.13466453552246094, -0.13004684448242188, -0.1254291534423828, -0.12081146240234375, -0.11619377136230469, -0.11157608032226562, -0.10695838928222656, -0.1023406982421875, -0.09772300720214844, -0.09310531616210938, -0.08848762512207031, -0.08386993408203125, -0.07925224304199219, -0.07463455200195312, -0.07001686096191406, -0.065399169921875, -0.06078147888183594, -0.056163787841796875, -0.05154609680175781, -0.04692840576171875, -0.04231071472167969, -0.037693023681640625, -0.03307533264160156, -0.0284576416015625, -0.023839950561523438, -0.019222259521484375, -0.014604568481445312, -0.00998687744140625, -0.0053691864013671875, -0.000751495361328125, 0.0038661956787109375, 0.00848388671875, 0.013101577758789062, 0.017719268798828125, 0.022336959838867188, 0.02695465087890625, 0.03157234191894531, 0.036190032958984375, 0.04080772399902344, 0.0454254150390625, 0.05004310607910156, 0.054660797119140625, 0.05927848815917969, 0.06389617919921875, 0.06851387023925781, 0.07313156127929688, 0.07774925231933594, 0.082366943359375, 0.08698463439941406, 0.09160232543945312, 0.09622001647949219, 0.10083770751953125, 0.10545539855957031, 0.11007308959960938, 0.11469078063964844, 0.1193084716796875, 0.12392616271972656, 0.12854385375976562, 0.1331615447998047, 0.13777923583984375, 0.1423969268798828, 0.14701461791992188, 0.15163230895996094, 0.15625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 3.0, 4.0, 7.0, 5.0, 7.0, 10.0, 7.0, 15.0, 14.0, 18.0, 29.0, 22.0, 28.0, 52.0, 36.0, 55.0, 90.0, 113.0, 106.0, 73.0, 61.0, 43.0, 36.0, 27.0, 24.0, 16.0, 15.0, 23.0, 11.0, 10.0, 7.0, 5.0, 4.0, 4.0, 5.0, 5.0, 6.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00916290283203125, -0.008872389793395996, -0.008581876754760742, -0.008291363716125488, -0.008000850677490234, -0.0077103376388549805, -0.0074198246002197266, -0.007129311561584473, -0.006838798522949219, -0.006548285484313965, -0.006257772445678711, -0.005967259407043457, -0.005676746368408203, -0.005386233329772949, -0.005095720291137695, -0.004805207252502441, -0.0045146942138671875, -0.004224181175231934, -0.00393366813659668, -0.0036431550979614258, -0.003352642059326172, -0.003062129020690918, -0.002771615982055664, -0.00248110294342041, -0.0021905899047851562, -0.0019000768661499023, -0.0016095638275146484, -0.0013190507888793945, -0.0010285377502441406, -0.0007380247116088867, -0.0004475116729736328, -0.0001569986343383789, 0.000133514404296875, 0.0004240274429321289, 0.0007145404815673828, 0.0010050535202026367, 0.0012955665588378906, 0.0015860795974731445, 0.0018765926361083984, 0.0021671056747436523, 0.0024576187133789062, 0.00274813175201416, 0.003038644790649414, 0.003329157829284668, 0.003619670867919922, 0.003910183906555176, 0.00420069694519043, 0.004491209983825684, 0.0047817230224609375, 0.005072236061096191, 0.005362749099731445, 0.005653262138366699, 0.005943775177001953, 0.006234288215637207, 0.006524801254272461, 0.006815314292907715, 0.007105827331542969, 0.007396340370178223, 0.0076868534088134766, 0.00797736644744873, 0.008267879486083984, 0.008558392524719238, 0.008848905563354492, 0.009139418601989746, 0.009429931640625]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 8.0, 5.0, 3.0, 5.0, 7.0, 7.0, 12.0, 13.0, 19.0, 22.0, 25.0, 27.0, 58.0, 66.0, 130.0, 224.0, 791.0, 41619.0, 995537.0, 9031.0, 418.0, 177.0, 101.0, 62.0, 38.0, 37.0, 25.0, 22.0, 11.0, 3.0, 14.0, 5.0, 5.0, 8.0, 3.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2099609375, -0.20347023010253906, -0.19697952270507812, -0.1904888153076172, -0.18399810791015625, -0.1775074005126953, -0.17101669311523438, -0.16452598571777344, -0.1580352783203125, -0.15154457092285156, -0.14505386352539062, -0.1385631561279297, -0.13207244873046875, -0.1255817413330078, -0.11909103393554688, -0.11260032653808594, -0.106109619140625, -0.09961891174316406, -0.09312820434570312, -0.08663749694824219, -0.08014678955078125, -0.07365608215332031, -0.06716537475585938, -0.06067466735839844, -0.0541839599609375, -0.04769325256347656, -0.041202545166015625, -0.03471183776855469, -0.02822113037109375, -0.021730422973632812, -0.015239715576171875, -0.008749008178710938, -0.00225830078125, 0.0042324066162109375, 0.010723114013671875, 0.017213821411132812, 0.02370452880859375, 0.030195236206054688, 0.036685943603515625, 0.04317665100097656, 0.0496673583984375, 0.05615806579589844, 0.06264877319335938, 0.06913948059082031, 0.07563018798828125, 0.08212089538574219, 0.08861160278320312, 0.09510231018066406, 0.101593017578125, 0.10808372497558594, 0.11457443237304688, 0.12106513977050781, 0.12755584716796875, 0.1340465545654297, 0.14053726196289062, 0.14702796936035156, 0.1535186767578125, 0.16000938415527344, 0.16650009155273438, 0.1729907989501953, 0.17948150634765625, 0.1859722137451172, 0.19246292114257812, 0.19895362854003906, 0.2054443359375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 19.0, 25.0, 37.0, 68.0, 147.0, 259.0, 200.0, 91.0, 64.0, 27.0, 18.0, 20.0, 9.0, 6.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048612404614686966, -0.04697245731949806, -0.04533250629901886, -0.043692559003829956, -0.04205261170864105, -0.04041266441345215, -0.038772713392972946, -0.03713276609778404, -0.03549281507730484, -0.033852867782115936, -0.032212916761636734, -0.03057296946644783, -0.028933022171258926, -0.027293073013424873, -0.02565312385559082, -0.024013176560401917, -0.022373229265213013, -0.02073328010737896, -0.019093332812190056, -0.017453383654356003, -0.0158134363591671, -0.014173487201333046, -0.012533538043498993, -0.010893589816987514, -0.009253641590476036, -0.007613693363964558, -0.005973744671791792, -0.004333795979619026, -0.0026938477531075478, -0.0010538995265960693, 0.0005860496312379837, 0.002225997857749462, 0.003865942358970642, 0.0055058905854821205, 0.007145839277654886, 0.008785787969827652, 0.01042573619633913, 0.012065684422850609, 0.013705633580684662, 0.01534558180719614, 0.01698553003370762, 0.018625479191541672, 0.020265426486730576, 0.02190537564456463, 0.02354532480239868, 0.025185272097587585, 0.02682522125542164, 0.02846517041325569, 0.030105117708444595, 0.0317450650036335, 0.0333850160241127, 0.035024963319301605, 0.03666491061449051, 0.03830485790967941, 0.039944808930158615, 0.04158475622534752, 0.04322470724582672, 0.044864654541015625, 0.04650460556149483, 0.04814455285668373, 0.049784500151872635, 0.05142445117235184, 0.05306439846754074, 0.054704345762729645, 0.05634429305791855]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 4.0, 6.0, 9.0, 9.0, 5.0, 11.0, 11.0, 12.0, 14.0, 24.0, 20.0, 24.0, 23.0, 39.0, 29.0, 26.0, 25.0, 23.0, 35.0, 25.0, 25.0, 29.0, 44.0, 32.0, 36.0, 28.0, 36.0, 41.0, 44.0, 36.0, 27.0, 17.0, 25.0, 11.0, 21.0, 25.0, 25.0, 20.0, 19.0, 7.0, 14.0, 9.0, 6.0, 10.0, 9.0, 6.0, 9.0, 6.0, 6.0, 1.0, 2.0, 2.0, 4.0, 3.0], "bins": [-0.013815760612487793, -0.013405535370111465, -0.012995310127735138, -0.01258508488535881, -0.012174859642982483, -0.011764634400606155, -0.011354409158229828, -0.0109441839158535, -0.010533958673477173, -0.010123733431100845, -0.009713508188724518, -0.00930328294634819, -0.008893057703971863, -0.008482832461595535, -0.008072607219219208, -0.00766238197684288, -0.007252156734466553, -0.006841931492090225, -0.006431706249713898, -0.00602148100733757, -0.005611255764961243, -0.005201030522584915, -0.004790805280208588, -0.00438058003783226, -0.003970354795455933, -0.003560129553079605, -0.0031499043107032776, -0.00273967906832695, -0.0023294538259506226, -0.001919228583574295, -0.0015090033411979675, -0.00109877809882164, -0.0006885528564453125, -0.000278327614068985, 0.00013189762830734253, 0.00054212287068367, 0.0009523481130599976, 0.001362573355436325, 0.0017727985978126526, 0.00218302384018898, 0.0025932490825653076, 0.003003474324941635, 0.0034136995673179626, 0.00382392480969429, 0.004234150052070618, 0.004644375294446945, 0.005054600536823273, 0.0054648257791996, 0.005875051021575928, 0.006285276263952255, 0.006695501506328583, 0.00710572674870491, 0.007515951991081238, 0.007926177233457565, 0.008336402475833893, 0.00874662771821022, 0.009156852960586548, 0.009567078202962875, 0.009977303445339203, 0.01038752868771553, 0.010797753930091858, 0.011207979172468185, 0.011618204414844513, 0.01202842965722084, 0.012438654899597168]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 3.0, 8.0, 2.0, 16.0, 7.0, 13.0, 15.0, 17.0, 25.0, 27.0, 26.0, 23.0, 32.0, 29.0, 45.0, 37.0, 26.0, 48.0, 40.0, 49.0, 45.0, 41.0, 34.0, 35.0, 42.0, 33.0, 41.0, 39.0, 15.0, 38.0, 23.0, 27.0, 15.0, 13.0, 14.0, 18.0, 9.0, 4.0, 7.0, 9.0, 7.0, 0.0, 4.0, 1.0, 2.0, 0.0, 3.0], "bins": [-3.376953125, -3.286224365234375, -3.19549560546875, -3.104766845703125, -3.0140380859375, -2.923309326171875, -2.83258056640625, -2.741851806640625, -2.651123046875, -2.560394287109375, -2.46966552734375, -2.378936767578125, -2.2882080078125, -2.197479248046875, -2.10675048828125, -2.016021728515625, -1.92529296875, -1.834564208984375, -1.74383544921875, -1.653106689453125, -1.5623779296875, -1.471649169921875, -1.38092041015625, -1.290191650390625, -1.199462890625, -1.108734130859375, -1.01800537109375, -0.927276611328125, -0.8365478515625, -0.745819091796875, -0.65509033203125, -0.564361572265625, -0.4736328125, -0.382904052734375, -0.29217529296875, -0.201446533203125, -0.1107177734375, -0.019989013671875, 0.07073974609375, 0.161468505859375, 0.252197265625, 0.342926025390625, 0.43365478515625, 0.524383544921875, 0.6151123046875, 0.705841064453125, 0.79656982421875, 0.887298583984375, 0.97802734375, 1.068756103515625, 1.15948486328125, 1.250213623046875, 1.3409423828125, 1.431671142578125, 1.52239990234375, 1.613128662109375, 1.703857421875, 1.794586181640625, 1.88531494140625, 1.976043701171875, 2.0667724609375, 2.157501220703125, 2.24822998046875, 2.338958740234375, 2.4296875]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 5.0, 9.0, 11.0, 13.0, 17.0, 27.0, 29.0, 46.0, 52.0, 85.0, 104.0, 186.0, 391.0, 855.0, 2459.0, 7550.0, 23696.0, 76364.0, 294265.0, 465848.0, 122354.0, 36259.0, 11660.0, 3755.0, 1272.0, 506.0, 251.0, 128.0, 75.0, 68.0, 45.0, 33.0, 37.0, 22.0, 18.0, 9.0, 11.0, 8.0, 7.0, 5.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-5.51953125, -5.36700439453125, -5.2144775390625, -5.06195068359375, -4.909423828125, -4.75689697265625, -4.6043701171875, -4.45184326171875, -4.29931640625, -4.14678955078125, -3.9942626953125, -3.84173583984375, -3.689208984375, -3.53668212890625, -3.3841552734375, -3.23162841796875, -3.0791015625, -2.92657470703125, -2.7740478515625, -2.62152099609375, -2.468994140625, -2.31646728515625, -2.1639404296875, -2.01141357421875, -1.85888671875, -1.70635986328125, -1.5538330078125, -1.40130615234375, -1.248779296875, -1.09625244140625, -0.9437255859375, -0.79119873046875, -0.638671875, -0.48614501953125, -0.3336181640625, -0.18109130859375, -0.028564453125, 0.12396240234375, 0.2764892578125, 0.42901611328125, 0.58154296875, 0.73406982421875, 0.8865966796875, 1.03912353515625, 1.191650390625, 1.34417724609375, 1.4967041015625, 1.64923095703125, 1.8017578125, 1.95428466796875, 2.1068115234375, 2.25933837890625, 2.411865234375, 2.56439208984375, 2.7169189453125, 2.86944580078125, 3.02197265625, 3.17449951171875, 3.3270263671875, 3.47955322265625, 3.632080078125, 3.78460693359375, 3.9371337890625, 4.08966064453125, 4.2421875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 8.0, 11.0, 15.0, 15.0, 13.0, 17.0, 19.0, 24.0, 32.0, 33.0, 23.0, 43.0, 52.0, 56.0, 98.0, 128.0, 279.0, 1463.0, 221.0, 92.0, 67.0, 55.0, 37.0, 41.0, 26.0, 25.0, 25.0, 32.0, 17.0, 15.0, 15.0, 16.0, 7.0, 9.0, 3.0, 8.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.203125, -8.88916015625, -8.5751953125, -8.26123046875, -7.947265625, -7.63330078125, -7.3193359375, -7.00537109375, -6.69140625, -6.37744140625, -6.0634765625, -5.74951171875, -5.435546875, -5.12158203125, -4.8076171875, -4.49365234375, -4.1796875, -3.86572265625, -3.5517578125, -3.23779296875, -2.923828125, -2.60986328125, -2.2958984375, -1.98193359375, -1.66796875, -1.35400390625, -1.0400390625, -0.72607421875, -0.412109375, -0.09814453125, 0.2158203125, 0.52978515625, 0.84375, 1.15771484375, 1.4716796875, 1.78564453125, 2.099609375, 2.41357421875, 2.7275390625, 3.04150390625, 3.35546875, 3.66943359375, 3.9833984375, 4.29736328125, 4.611328125, 4.92529296875, 5.2392578125, 5.55322265625, 5.8671875, 6.18115234375, 6.4951171875, 6.80908203125, 7.123046875, 7.43701171875, 7.7509765625, 8.06494140625, 8.37890625, 8.69287109375, 9.0068359375, 9.32080078125, 9.634765625, 9.94873046875, 10.2626953125, 10.57666015625, 10.890625]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 4.0, 6.0, 5.0, 10.0, 16.0, 21.0, 20.0, 24.0, 36.0, 42.0, 41.0, 55.0, 84.0, 125.0, 219.0, 461.0, 1397.0, 32290.0, 3054095.0, 53852.0, 1644.0, 469.0, 237.0, 169.0, 94.0, 46.0, 66.0, 34.0, 22.0, 28.0, 11.0, 27.0, 19.0, 10.0, 9.0, 6.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-29.265625, -28.41845703125, -27.5712890625, -26.72412109375, -25.876953125, -25.02978515625, -24.1826171875, -23.33544921875, -22.48828125, -21.64111328125, -20.7939453125, -19.94677734375, -19.099609375, -18.25244140625, -17.4052734375, -16.55810546875, -15.7109375, -14.86376953125, -14.0166015625, -13.16943359375, -12.322265625, -11.47509765625, -10.6279296875, -9.78076171875, -8.93359375, -8.08642578125, -7.2392578125, -6.39208984375, -5.544921875, -4.69775390625, -3.8505859375, -3.00341796875, -2.15625, -1.30908203125, -0.4619140625, 0.38525390625, 1.232421875, 2.07958984375, 2.9267578125, 3.77392578125, 4.62109375, 5.46826171875, 6.3154296875, 7.16259765625, 8.009765625, 8.85693359375, 9.7041015625, 10.55126953125, 11.3984375, 12.24560546875, 13.0927734375, 13.93994140625, 14.787109375, 15.63427734375, 16.4814453125, 17.32861328125, 18.17578125, 19.02294921875, 19.8701171875, 20.71728515625, 21.564453125, 22.41162109375, 23.2587890625, 24.10595703125, 24.953125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 28.0, 159.0, 399.0, 325.0, 84.0, 18.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.68353271484375, -76.9996566772461, -75.31578826904297, -73.63191223144531, -71.94803619384766, -70.26416015625, -68.58029174804688, -66.89641571044922, -65.21253967285156, -63.52866744995117, -61.844791412353516, -60.160919189453125, -58.47704315185547, -56.79317092895508, -55.10929489135742, -53.42542266845703, -51.741546630859375, -50.057674407958984, -48.37379837036133, -46.68992614746094, -45.00605010986328, -43.32217788696289, -41.638301849365234, -39.954429626464844, -38.27055740356445, -36.58668518066406, -34.902809143066406, -33.218936920166016, -31.53506088256836, -29.85118865966797, -28.167312622070312, -26.483440399169922, -24.7995662689209, -23.115692138671875, -21.43181800842285, -19.747943878173828, -18.064069747924805, -16.38019561767578, -14.696322441101074, -13.01244831085205, -11.328574180603027, -9.644700050354004, -7.9608259201049805, -6.276952266693115, -4.593078136444092, -2.9092044830322266, -1.2253303527832031, 0.4585437774658203, 2.1424179077148438, 3.826292037963867, 5.510166168212891, 7.194039821624756, 8.877914428710938, 10.561787605285645, 12.245661735534668, 13.929535865783691, 15.613409996032715, 17.297283172607422, 18.981157302856445, 20.66503143310547, 22.348905563354492, 24.032779693603516, 25.71665382385254, 27.400527954101562, 29.084402084350586]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 16.0, 9.0, 11.0, 9.0, 13.0, 16.0, 18.0, 15.0, 28.0, 40.0, 32.0, 38.0, 37.0, 31.0, 39.0, 35.0, 45.0, 30.0, 50.0, 41.0, 46.0, 53.0, 44.0, 38.0, 43.0, 31.0, 41.0, 25.0, 24.0, 16.0, 15.0, 13.0, 8.0, 5.0, 11.0, 10.0, 5.0, 5.0, 4.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.583093643188477, -30.59583282470703, -29.60857391357422, -28.621313095092773, -27.63405418395996, -26.646793365478516, -25.659534454345703, -24.672273635864258, -23.685012817382812, -22.697751998901367, -21.710493087768555, -20.72323226928711, -19.735973358154297, -18.74871253967285, -17.761451721191406, -16.774192810058594, -15.786933898925781, -14.799674034118652, -13.812414169311523, -12.825153350830078, -11.837894439697266, -10.85063362121582, -9.863373756408691, -8.876113891601562, -7.888854026794434, -6.901594161987305, -5.914334297180176, -4.927073955535889, -3.9398140907287598, -2.952554225921631, -1.9652938842773438, -0.9780340194702148, 0.00922393798828125, 0.9964839220046997, 1.9837439060211182, 2.971004009246826, 3.958263874053955, 4.945523738861084, 5.932784080505371, 6.9200439453125, 7.907303810119629, 8.894563674926758, 9.881823539733887, 10.869083404541016, 11.856344223022461, 12.843603134155273, 13.830863952636719, 14.818123817443848, 15.805383682250977, 16.792644500732422, 17.779903411865234, 18.76716423034668, 19.754423141479492, 20.741683959960938, 21.72894287109375, 22.716203689575195, 23.70346450805664, 24.690725326538086, 25.6779842376709, 26.665245056152344, 27.652503967285156, 28.6397647857666, 29.627025604248047, 30.61428451538086, 31.601543426513672]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 4.0, 8.0, 13.0, 14.0, 23.0, 14.0, 10.0, 20.0, 28.0, 26.0, 26.0, 24.0, 33.0, 27.0, 31.0, 39.0, 50.0, 39.0, 49.0, 48.0, 42.0, 41.0, 41.0, 35.0, 38.0, 30.0, 30.0, 29.0, 29.0, 30.0, 23.0, 18.0, 24.0, 11.0, 14.0, 8.0, 3.0, 5.0, 8.0, 4.0, 4.0, 5.0, 3.0, 0.0, 2.0, 2.0], "bins": [-3.806640625, -3.704498291015625, -3.60235595703125, -3.500213623046875, -3.3980712890625, -3.295928955078125, -3.19378662109375, -3.091644287109375, -2.989501953125, -2.887359619140625, -2.78521728515625, -2.683074951171875, -2.5809326171875, -2.478790283203125, -2.37664794921875, -2.274505615234375, -2.17236328125, -2.070220947265625, -1.96807861328125, -1.865936279296875, -1.7637939453125, -1.661651611328125, -1.55950927734375, -1.457366943359375, -1.355224609375, -1.253082275390625, -1.15093994140625, -1.048797607421875, -0.9466552734375, -0.844512939453125, -0.74237060546875, -0.640228271484375, -0.5380859375, -0.435943603515625, -0.33380126953125, -0.231658935546875, -0.1295166015625, -0.027374267578125, 0.07476806640625, 0.176910400390625, 0.279052734375, 0.381195068359375, 0.48333740234375, 0.585479736328125, 0.6876220703125, 0.789764404296875, 0.89190673828125, 0.994049072265625, 1.09619140625, 1.198333740234375, 1.30047607421875, 1.402618408203125, 1.5047607421875, 1.606903076171875, 1.70904541015625, 1.811187744140625, 1.913330078125, 2.015472412109375, 2.11761474609375, 2.219757080078125, 2.3218994140625, 2.424041748046875, 2.52618408203125, 2.628326416015625, 2.73046875]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 8.0, 15.0, 27.0, 34.0, 63.0, 73.0, 133.0, 197.0, 344.0, 582.0, 1040.0, 2086.0, 4263.0, 9318.0, 20758.0, 50146.0, 126326.0, 309532.0, 682419.0, 1117085.0, 975159.0, 516349.0, 223028.0, 89543.0, 36483.0, 15408.0, 6903.0, 3277.0, 1578.0, 797.0, 504.0, 264.0, 162.0, 123.0, 79.0, 50.0, 43.0, 23.0, 21.0, 13.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.146484375, -3.058624267578125, -2.97076416015625, -2.882904052734375, -2.7950439453125, -2.707183837890625, -2.61932373046875, -2.531463623046875, -2.443603515625, -2.355743408203125, -2.26788330078125, -2.180023193359375, -2.0921630859375, -2.004302978515625, -1.91644287109375, -1.828582763671875, -1.74072265625, -1.652862548828125, -1.56500244140625, -1.477142333984375, -1.3892822265625, -1.301422119140625, -1.21356201171875, -1.125701904296875, -1.037841796875, -0.949981689453125, -0.86212158203125, -0.774261474609375, -0.6864013671875, -0.598541259765625, -0.51068115234375, -0.422821044921875, -0.3349609375, -0.247100830078125, -0.15924072265625, -0.071380615234375, 0.0164794921875, 0.104339599609375, 0.19219970703125, 0.280059814453125, 0.367919921875, 0.455780029296875, 0.54364013671875, 0.631500244140625, 0.7193603515625, 0.807220458984375, 0.89508056640625, 0.982940673828125, 1.07080078125, 1.158660888671875, 1.24652099609375, 1.334381103515625, 1.4222412109375, 1.510101318359375, 1.59796142578125, 1.685821533203125, 1.773681640625, 1.861541748046875, 1.94940185546875, 2.037261962890625, 2.1251220703125, 2.212982177734375, 2.30084228515625, 2.388702392578125, 2.4765625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 6.0, 2.0, 6.0, 11.0, 9.0, 19.0, 23.0, 39.0, 59.0, 94.0, 106.0, 168.0, 231.0, 306.0, 404.0, 508.0, 539.0, 498.0, 309.0, 211.0, 146.0, 123.0, 90.0, 60.0, 33.0, 22.0, 14.0, 11.0, 9.0, 10.0, 4.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.83203125, -7.62054443359375, -7.4090576171875, -7.19757080078125, -6.986083984375, -6.77459716796875, -6.5631103515625, -6.35162353515625, -6.14013671875, -5.92864990234375, -5.7171630859375, -5.50567626953125, -5.294189453125, -5.08270263671875, -4.8712158203125, -4.65972900390625, -4.4482421875, -4.23675537109375, -4.0252685546875, -3.81378173828125, -3.602294921875, -3.39080810546875, -3.1793212890625, -2.96783447265625, -2.75634765625, -2.54486083984375, -2.3333740234375, -2.12188720703125, -1.910400390625, -1.69891357421875, -1.4874267578125, -1.27593994140625, -1.064453125, -0.85296630859375, -0.6414794921875, -0.42999267578125, -0.218505859375, -0.00701904296875, 0.2044677734375, 0.41595458984375, 0.62744140625, 0.83892822265625, 1.0504150390625, 1.26190185546875, 1.473388671875, 1.68487548828125, 1.8963623046875, 2.10784912109375, 2.3193359375, 2.53082275390625, 2.7423095703125, 2.95379638671875, 3.165283203125, 3.37677001953125, 3.5882568359375, 3.79974365234375, 4.01123046875, 4.22271728515625, 4.4342041015625, 4.64569091796875, 4.857177734375, 5.06866455078125, 5.2801513671875, 5.49163818359375, 5.703125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 4.0, 11.0, 17.0, 18.0, 35.0, 54.0, 90.0, 110.0, 171.0, 313.0, 621.0, 2100.0, 89719.0, 3989174.0, 108102.0, 2228.0, 611.0, 314.0, 202.0, 128.0, 80.0, 59.0, 34.0, 21.0, 17.0, 11.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.203125, -22.4169921875, -21.630859375, -20.8447265625, -20.05859375, -19.2724609375, -18.486328125, -17.7001953125, -16.9140625, -16.1279296875, -15.341796875, -14.5556640625, -13.76953125, -12.9833984375, -12.197265625, -11.4111328125, -10.625, -9.8388671875, -9.052734375, -8.2666015625, -7.48046875, -6.6943359375, -5.908203125, -5.1220703125, -4.3359375, -3.5498046875, -2.763671875, -1.9775390625, -1.19140625, -0.4052734375, 0.380859375, 1.1669921875, 1.953125, 2.7392578125, 3.525390625, 4.3115234375, 5.09765625, 5.8837890625, 6.669921875, 7.4560546875, 8.2421875, 9.0283203125, 9.814453125, 10.6005859375, 11.38671875, 12.1728515625, 12.958984375, 13.7451171875, 14.53125, 15.3173828125, 16.103515625, 16.8896484375, 17.67578125, 18.4619140625, 19.248046875, 20.0341796875, 20.8203125, 21.6064453125, 22.392578125, 23.1787109375, 23.96484375, 24.7509765625, 25.537109375, 26.3232421875, 27.109375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 24.0, 208.0, 500.0, 254.0, 26.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-175.95037841796875, -172.40451049804688, -168.85865783691406, -165.3127899169922, -161.7669219970703, -158.2210693359375, -154.67520141601562, -151.12933349609375, -147.58348083496094, -144.03761291503906, -140.49176025390625, -136.94589233398438, -133.4000244140625, -129.8541717529297, -126.30830383300781, -122.76244354248047, -119.2165756225586, -115.67071533203125, -112.12484741210938, -108.57898712158203, -105.03312683105469, -101.48725891113281, -97.94139862060547, -94.39553833007812, -90.84967041015625, -87.3038101196289, -83.75794219970703, -80.21208190917969, -76.66622161865234, -73.120361328125, -69.57449340820312, -66.02863311767578, -62.4827766418457, -58.936912536621094, -55.39105224609375, -51.84518814086914, -48.29932403564453, -44.75346374511719, -41.20759963989258, -37.66173553466797, -34.115875244140625, -30.57001304626465, -27.024150848388672, -23.478286743164062, -19.932424545288086, -16.38656234741211, -12.8406982421875, -9.294836044311523, -5.748973846435547, -2.203111171722412, 1.3427515029907227, 4.888614654541016, 8.434476852416992, 11.980339050292969, 15.526203155517578, 19.072065353393555, 22.61792755126953, 26.163789749145508, 29.709651947021484, 33.255516052246094, 36.80137634277344, 40.34724044799805, 43.893104553222656, 47.43896484375, 50.98482894897461]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 3.0, 12.0, 8.0, 9.0, 10.0, 14.0, 10.0, 11.0, 11.0, 28.0, 19.0, 32.0, 34.0, 29.0, 38.0, 49.0, 36.0, 37.0, 28.0, 35.0, 32.0, 39.0, 40.0, 29.0, 31.0, 41.0, 32.0, 29.0, 37.0, 29.0, 40.0, 24.0, 18.0, 20.0, 24.0, 12.0, 8.0, 14.0, 7.0, 7.0, 5.0, 5.0, 6.0, 7.0, 3.0, 2.0, 0.0, 1.0, 2.0, 4.0, 2.0, 1.0], "bins": [-19.174789428710938, -18.610828399658203, -18.046865463256836, -17.4829044342041, -16.918941497802734, -16.35498046875, -15.791019439697266, -15.227057456970215, -14.663095474243164, -14.099133491516113, -13.535171508789062, -12.971210479736328, -12.407248497009277, -11.843286514282227, -11.279325485229492, -10.715363502502441, -10.15140151977539, -9.58743953704834, -9.023477554321289, -8.459516525268555, -7.895554542541504, -7.331592559814453, -6.7676310539245605, -6.203669548034668, -5.639707565307617, -5.075745582580566, -4.511784076690674, -3.947822332382202, -3.3838605880737305, -2.819898843765259, -2.255937099456787, -1.6919753551483154, -1.1280136108398438, -0.5640518665313721, -9.012222290039062e-05, 0.5638716220855713, 1.127833366394043, 1.6917951107025146, 2.2557568550109863, 2.819718599319458, 3.3836803436279297, 3.9476420879364014, 4.511603832244873, 5.075565338134766, 5.639527320861816, 6.203489303588867, 6.76745080947876, 7.331412315368652, 7.895374298095703, 8.459336280822754, 9.023298263549805, 9.587259292602539, 10.15122127532959, 10.71518325805664, 11.279144287109375, 11.843106269836426, 12.407068252563477, 12.971030235290527, 13.534992218017578, 14.098953247070312, 14.662915229797363, 15.226877212524414, 15.790838241577148, 16.354801177978516, 16.91876220703125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 8.0, 10.0, 15.0, 13.0, 20.0, 23.0, 24.0, 27.0, 26.0, 27.0, 40.0, 38.0, 38.0, 28.0, 50.0, 37.0, 52.0, 36.0, 38.0, 41.0, 39.0, 39.0, 45.0, 38.0, 35.0, 32.0, 26.0, 30.0, 36.0, 12.0, 13.0, 15.0, 8.0, 7.0, 7.0, 5.0, 7.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.44921875, -3.345703125, -3.2421875, -3.138671875, -3.03515625, -2.931640625, -2.828125, -2.724609375, -2.62109375, -2.517578125, -2.4140625, -2.310546875, -2.20703125, -2.103515625, -2.0, -1.896484375, -1.79296875, -1.689453125, -1.5859375, -1.482421875, -1.37890625, -1.275390625, -1.171875, -1.068359375, -0.96484375, -0.861328125, -0.7578125, -0.654296875, -0.55078125, -0.447265625, -0.34375, -0.240234375, -0.13671875, -0.033203125, 0.0703125, 0.173828125, 0.27734375, 0.380859375, 0.484375, 0.587890625, 0.69140625, 0.794921875, 0.8984375, 1.001953125, 1.10546875, 1.208984375, 1.3125, 1.416015625, 1.51953125, 1.623046875, 1.7265625, 1.830078125, 1.93359375, 2.037109375, 2.140625, 2.244140625, 2.34765625, 2.451171875, 2.5546875, 2.658203125, 2.76171875, 2.865234375, 2.96875, 3.072265625, 3.17578125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 8.0, 2.0, 3.0, 1.0, 11.0, 9.0, 16.0, 36.0, 49.0, 80.0, 87.0, 149.0, 205.0, 268.0, 469.0, 698.0, 1055.0, 1610.0, 2575.0, 4074.0, 6461.0, 9920.0, 15996.0, 25639.0, 40754.0, 65111.0, 99558.0, 142248.0, 171324.0, 152917.0, 110292.0, 72766.0, 46016.0, 28880.0, 17901.0, 11211.0, 7224.0, 4591.0, 3013.0, 1855.0, 1217.0, 748.0, 501.0, 360.0, 226.0, 136.0, 109.0, 69.0, 34.0, 31.0, 23.0, 9.0, 13.0, 4.0, 7.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.250732421875, -0.24327659606933594, -0.23582077026367188, -0.2283649444580078, -0.22090911865234375, -0.2134532928466797, -0.20599746704101562, -0.19854164123535156, -0.1910858154296875, -0.18362998962402344, -0.17617416381835938, -0.1687183380126953, -0.16126251220703125, -0.1538066864013672, -0.14635086059570312, -0.13889503479003906, -0.131439208984375, -0.12398338317871094, -0.11652755737304688, -0.10907173156738281, -0.10161590576171875, -0.09416007995605469, -0.08670425415039062, -0.07924842834472656, -0.0717926025390625, -0.06433677673339844, -0.056880950927734375, -0.04942512512207031, -0.04196929931640625, -0.03451347351074219, -0.027057647705078125, -0.019601821899414062, -0.01214599609375, -0.0046901702880859375, 0.002765655517578125, 0.010221481323242188, 0.01767730712890625, 0.025133132934570312, 0.032588958740234375, 0.04004478454589844, 0.0475006103515625, 0.05495643615722656, 0.062412261962890625, 0.06986808776855469, 0.07732391357421875, 0.08477973937988281, 0.09223556518554688, 0.09969139099121094, 0.107147216796875, 0.11460304260253906, 0.12205886840820312, 0.1295146942138672, 0.13697052001953125, 0.1444263458251953, 0.15188217163085938, 0.15933799743652344, 0.1667938232421875, 0.17424964904785156, 0.18170547485351562, 0.1891613006591797, 0.19661712646484375, 0.2040729522705078, 0.21152877807617188, 0.21898460388183594, 0.2264404296875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 5.0, 6.0, 9.0, 13.0, 8.0, 14.0, 28.0, 21.0, 29.0, 16.0, 27.0, 27.0, 25.0, 35.0, 34.0, 39.0, 50.0, 43.0, 45.0, 1069.0, 43.0, 35.0, 40.0, 45.0, 30.0, 43.0, 29.0, 26.0, 24.0, 22.0, 29.0, 16.0, 14.0, 12.0, 10.0, 16.0, 6.0, 6.0, 10.0, 5.0, 5.0, 3.0, 0.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.53515625, -2.456695556640625, -2.37823486328125, -2.299774169921875, -2.2213134765625, -2.142852783203125, -2.06439208984375, -1.985931396484375, -1.907470703125, -1.829010009765625, -1.75054931640625, -1.672088623046875, -1.5936279296875, -1.515167236328125, -1.43670654296875, -1.358245849609375, -1.27978515625, -1.201324462890625, -1.12286376953125, -1.044403076171875, -0.9659423828125, -0.887481689453125, -0.80902099609375, -0.730560302734375, -0.652099609375, -0.573638916015625, -0.49517822265625, -0.416717529296875, -0.3382568359375, -0.259796142578125, -0.18133544921875, -0.102874755859375, -0.0244140625, 0.054046630859375, 0.13250732421875, 0.210968017578125, 0.2894287109375, 0.367889404296875, 0.44635009765625, 0.524810791015625, 0.603271484375, 0.681732177734375, 0.76019287109375, 0.838653564453125, 0.9171142578125, 0.995574951171875, 1.07403564453125, 1.152496337890625, 1.23095703125, 1.309417724609375, 1.38787841796875, 1.466339111328125, 1.5447998046875, 1.623260498046875, 1.70172119140625, 1.780181884765625, 1.858642578125, 1.937103271484375, 2.01556396484375, 2.094024658203125, 2.1724853515625, 2.250946044921875, 2.32940673828125, 2.407867431640625, 2.486328125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 3.0, 5.0, 9.0, 12.0, 23.0, 13.0, 28.0, 38.0, 53.0, 87.0, 139.0, 192.0, 300.0, 446.0, 660.0, 1005.0, 1588.0, 2524.0, 3798.0, 6153.0, 9902.0, 15510.0, 24526.0, 39127.0, 61035.0, 92198.0, 131296.0, 1164569.0, 196976.0, 118735.0, 81933.0, 52847.0, 33661.0, 21130.0, 13262.0, 8419.0, 5363.0, 3283.0, 2208.0, 1337.0, 936.0, 557.0, 416.0, 291.0, 181.0, 128.0, 62.0, 56.0, 33.0, 23.0, 18.0, 12.0, 10.0, 13.0, 3.0, 6.0, 3.0, 3.0, 2.0, 2.0], "bins": [-0.1356201171875, -0.1313610076904297, -0.12710189819335938, -0.12284278869628906, -0.11858367919921875, -0.11432456970214844, -0.11006546020507812, -0.10580635070800781, -0.1015472412109375, -0.09728813171386719, -0.09302902221679688, -0.08876991271972656, -0.08451080322265625, -0.08025169372558594, -0.07599258422851562, -0.07173347473144531, -0.067474365234375, -0.06321525573730469, -0.058956146240234375, -0.05469703674316406, -0.05043792724609375, -0.04617881774902344, -0.041919708251953125, -0.03766059875488281, -0.0334014892578125, -0.029142379760742188, -0.024883270263671875, -0.020624160766601562, -0.01636505126953125, -0.012105941772460938, -0.007846832275390625, -0.0035877227783203125, 0.00067138671875, 0.0049304962158203125, 0.009189605712890625, 0.013448715209960938, 0.01770782470703125, 0.021966934204101562, 0.026226043701171875, 0.030485153198242188, 0.0347442626953125, 0.03900337219238281, 0.043262481689453125, 0.04752159118652344, 0.05178070068359375, 0.05603981018066406, 0.060298919677734375, 0.06455802917480469, 0.068817138671875, 0.07307624816894531, 0.07733535766601562, 0.08159446716308594, 0.08585357666015625, 0.09011268615722656, 0.09437179565429688, 0.09863090515136719, 0.1028900146484375, 0.10714912414550781, 0.11140823364257812, 0.11566734313964844, 0.11992645263671875, 0.12418556213378906, 0.12844467163085938, 0.1327037811279297, 0.136962890625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 6.0, 6.0, 16.0, 9.0, 14.0, 17.0, 20.0, 35.0, 57.0, 77.0, 126.0, 129.0, 130.0, 101.0, 69.0, 57.0, 29.0, 27.0, 14.0, 12.0, 6.0, 8.0, 3.0, 5.0, 4.0, 0.0, 4.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.01039886474609375, -0.01013094186782837, -0.009863018989562988, -0.009595096111297607, -0.009327173233032227, -0.009059250354766846, -0.008791327476501465, -0.008523404598236084, -0.008255481719970703, -0.007987558841705322, -0.007719635963439941, -0.0074517130851745605, -0.00718379020690918, -0.006915867328643799, -0.006647944450378418, -0.006380021572113037, -0.006112098693847656, -0.005844175815582275, -0.0055762529373168945, -0.005308330059051514, -0.005040407180786133, -0.004772484302520752, -0.004504561424255371, -0.00423663854598999, -0.003968715667724609, -0.0037007927894592285, -0.0034328699111938477, -0.003164947032928467, -0.002897024154663086, -0.002629101276397705, -0.0023611783981323242, -0.0020932555198669434, -0.0018253326416015625, -0.0015574097633361816, -0.0012894868850708008, -0.00102156400680542, -0.0007536411285400391, -0.0004857182502746582, -0.00021779537200927734, 5.0127506256103516e-05, 0.0003180503845214844, 0.0005859732627868652, 0.0008538961410522461, 0.001121819019317627, 0.0013897418975830078, 0.0016576647758483887, 0.0019255876541137695, 0.0021935105323791504, 0.0024614334106445312, 0.002729356288909912, 0.002997279167175293, 0.003265202045440674, 0.0035331249237060547, 0.0038010478019714355, 0.004068970680236816, 0.004336893558502197, 0.004604816436767578, 0.004872739315032959, 0.00514066219329834, 0.005408585071563721, 0.0056765079498291016, 0.005944430828094482, 0.006212353706359863, 0.006480276584625244, 0.006748199462890625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 1.0, 6.0, 6.0, 5.0, 15.0, 14.0, 20.0, 24.0, 36.0, 58.0, 110.0, 210.0, 756.0, 39067.0, 1005683.0, 1858.0, 291.0, 120.0, 92.0, 38.0, 32.0, 24.0, 16.0, 18.0, 10.0, 9.0, 7.0, 1.0, 7.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1474609375, -0.14183425903320312, -0.13620758056640625, -0.13058090209960938, -0.1249542236328125, -0.11932754516601562, -0.11370086669921875, -0.10807418823242188, -0.102447509765625, -0.09682083129882812, -0.09119415283203125, -0.08556747436523438, -0.0799407958984375, -0.07431411743164062, -0.06868743896484375, -0.06306076049804688, -0.05743408203125, -0.051807403564453125, -0.04618072509765625, -0.040554046630859375, -0.0349273681640625, -0.029300689697265625, -0.02367401123046875, -0.018047332763671875, -0.012420654296875, -0.006793975830078125, -0.00116729736328125, 0.004459381103515625, 0.0100860595703125, 0.015712738037109375, 0.02133941650390625, 0.026966094970703125, 0.0325927734375, 0.038219451904296875, 0.04384613037109375, 0.049472808837890625, 0.0550994873046875, 0.060726165771484375, 0.06635284423828125, 0.07197952270507812, 0.077606201171875, 0.08323287963867188, 0.08885955810546875, 0.09448623657226562, 0.1001129150390625, 0.10573959350585938, 0.11136627197265625, 0.11699295043945312, 0.12261962890625, 0.12824630737304688, 0.13387298583984375, 0.13949966430664062, 0.1451263427734375, 0.15075302124023438, 0.15637969970703125, 0.16200637817382812, 0.167633056640625, 0.17325973510742188, 0.17888641357421875, 0.18451309204101562, 0.1901397705078125, 0.19576644897460938, 0.20139312744140625, 0.20701980590820312, 0.212646484375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 13.0, 27.0, 59.0, 132.0, 467.0, 211.0, 72.0, 15.0, 7.0, 3.0, 0.0, 2.0], "bins": [-0.06743063777685165, -0.06624156981706619, -0.06505250185728073, -0.06386343389749527, -0.06267436593770981, -0.061485301703214645, -0.060296233743429184, -0.05910716578364372, -0.05791809782385826, -0.0567290298640728, -0.05553996190428734, -0.05435089394450188, -0.053161829710006714, -0.05197276175022125, -0.05078369379043579, -0.04959462583065033, -0.04840555787086487, -0.04721648991107941, -0.046027421951293945, -0.044838353991508484, -0.04364928603172302, -0.04246022179722786, -0.0412711538374424, -0.04008208587765694, -0.038893017917871475, -0.037703949958086014, -0.03651488199830055, -0.03532581403851509, -0.03413674980401993, -0.03294768184423447, -0.031758613884449005, -0.030569545924663544, -0.02938048169016838, -0.02819141373038292, -0.027002345770597458, -0.025813279673457146, -0.024624211713671684, -0.023435143753886223, -0.02224607765674591, -0.02105700969696045, -0.019867941737174988, -0.018678873777389526, -0.017489805817604065, -0.016300739720463753, -0.015111671760678291, -0.01392260380089283, -0.012733536772429943, -0.011544469743967056, -0.010355401784181595, -0.009166333824396133, -0.007977266795933247, -0.0067881993018090725, -0.005599131807684898, -0.004410064313560724, -0.00322099681943655, -0.0020319297909736633, -0.0008428618311882019, 0.0003462056629359722, 0.0015352731570601463, 0.0027243406511843204, 0.003913408145308495, 0.005102475639432669, 0.006291543133556843, 0.00748061016201973, 0.008669678121805191]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 5.0, 7.0, 9.0, 7.0, 13.0, 8.0, 10.0, 15.0, 15.0, 19.0, 20.0, 18.0, 21.0, 32.0, 17.0, 30.0, 34.0, 32.0, 38.0, 40.0, 41.0, 35.0, 35.0, 43.0, 39.0, 29.0, 41.0, 33.0, 33.0, 41.0, 24.0, 37.0, 27.0, 18.0, 25.0, 22.0, 16.0, 14.0, 16.0, 8.0, 8.0, 6.0, 8.0, 0.0, 7.0, 6.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.01086878776550293, -0.01051870547235012, -0.010168623179197311, -0.009818540886044502, -0.009468458592891693, -0.009118376299738884, -0.008768294006586075, -0.008418211713433266, -0.008068129420280457, -0.007718047127127647, -0.007367964833974838, -0.007017882540822029, -0.00666780024766922, -0.006317717954516411, -0.005967635661363602, -0.0056175533682107925, -0.005267471075057983, -0.004917388781905174, -0.004567306488752365, -0.004217224195599556, -0.003867141902446747, -0.0035170596092939377, -0.0031669773161411285, -0.0028168950229883194, -0.0024668127298355103, -0.002116730436682701, -0.001766648143529892, -0.0014165658503770828, -0.0010664835572242737, -0.0007164012640714645, -0.0003663189709186554, -1.6236677765846252e-05, 0.0003338456153869629, 0.000683927908539772, 0.0010340102016925812, 0.0013840924948453903, 0.0017341747879981995, 0.0020842570811510086, 0.0024343393743038177, 0.002784421667456627, 0.003134503960609436, 0.003484586253762245, 0.0038346685469150543, 0.0041847508400678635, 0.004534833133220673, 0.004884915426373482, 0.005234997719526291, 0.0055850800126791, 0.005935162305831909, 0.006285244598984718, 0.0066353268921375275, 0.006985409185290337, 0.007335491478443146, 0.007685573771595955, 0.008035656064748764, 0.008385738357901573, 0.008735820651054382, 0.009085902944207191, 0.00943598523736, 0.00978606753051281, 0.010136149823665619, 0.010486232116818428, 0.010836314409971237, 0.011186396703124046, 0.011536478996276855]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 8.0, 10.0, 15.0, 13.0, 21.0, 22.0, 24.0, 27.0, 26.0, 27.0, 40.0, 38.0, 38.0, 28.0, 50.0, 37.0, 52.0, 36.0, 38.0, 41.0, 39.0, 39.0, 45.0, 38.0, 35.0, 32.0, 26.0, 30.0, 35.0, 13.0, 13.0, 15.0, 8.0, 7.0, 7.0, 6.0, 6.0, 3.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.44921875, -3.345703125, -3.2421875, -3.138671875, -3.03515625, -2.931640625, -2.828125, -2.724609375, -2.62109375, -2.517578125, -2.4140625, -2.310546875, -2.20703125, -2.103515625, -2.0, -1.896484375, -1.79296875, -1.689453125, -1.5859375, -1.482421875, -1.37890625, -1.275390625, -1.171875, -1.068359375, -0.96484375, -0.861328125, -0.7578125, -0.654296875, -0.55078125, -0.447265625, -0.34375, -0.240234375, -0.13671875, -0.033203125, 0.0703125, 0.173828125, 0.27734375, 0.380859375, 0.484375, 0.587890625, 0.69140625, 0.794921875, 0.8984375, 1.001953125, 1.10546875, 1.208984375, 1.3125, 1.416015625, 1.51953125, 1.623046875, 1.7265625, 1.830078125, 1.93359375, 2.037109375, 2.140625, 2.244140625, 2.34765625, 2.451171875, 2.5546875, 2.658203125, 2.76171875, 2.865234375, 2.96875, 3.072265625, 3.17578125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 5.0, 15.0, 4.0, 17.0, 31.0, 36.0, 76.0, 127.0, 206.0, 420.0, 782.0, 1591.0, 3258.0, 6287.0, 12308.0, 23723.0, 44201.0, 84147.0, 179650.0, 309282.0, 192962.0, 90659.0, 46903.0, 24810.0, 13300.0, 6798.0, 3380.0, 1710.0, 862.0, 440.0, 229.0, 132.0, 74.0, 45.0, 24.0, 14.0, 14.0, 12.0, 4.0, 5.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.92578125, -2.833038330078125, -2.74029541015625, -2.647552490234375, -2.5548095703125, -2.462066650390625, -2.36932373046875, -2.276580810546875, -2.183837890625, -2.091094970703125, -1.99835205078125, -1.905609130859375, -1.8128662109375, -1.720123291015625, -1.62738037109375, -1.534637451171875, -1.44189453125, -1.349151611328125, -1.25640869140625, -1.163665771484375, -1.0709228515625, -0.978179931640625, -0.88543701171875, -0.792694091796875, -0.699951171875, -0.607208251953125, -0.51446533203125, -0.421722412109375, -0.3289794921875, -0.236236572265625, -0.14349365234375, -0.050750732421875, 0.0419921875, 0.134735107421875, 0.22747802734375, 0.320220947265625, 0.4129638671875, 0.505706787109375, 0.59844970703125, 0.691192626953125, 0.783935546875, 0.876678466796875, 0.96942138671875, 1.062164306640625, 1.1549072265625, 1.247650146484375, 1.34039306640625, 1.433135986328125, 1.52587890625, 1.618621826171875, 1.71136474609375, 1.804107666015625, 1.8968505859375, 1.989593505859375, 2.08233642578125, 2.175079345703125, 2.267822265625, 2.360565185546875, 2.45330810546875, 2.546051025390625, 2.6387939453125, 2.731536865234375, 2.82427978515625, 2.917022705078125, 3.009765625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 9.0, 5.0, 2.0, 10.0, 10.0, 14.0, 8.0, 22.0, 17.0, 18.0, 22.0, 28.0, 21.0, 23.0, 38.0, 63.0, 36.0, 66.0, 105.0, 240.0, 1448.0, 271.0, 129.0, 69.0, 47.0, 46.0, 39.0, 35.0, 29.0, 29.0, 18.0, 27.0, 20.0, 21.0, 18.0, 7.0, 10.0, 8.0, 8.0, 3.0, 7.0, 5.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-12.1171875, -11.7862548828125, -11.455322265625, -11.1243896484375, -10.79345703125, -10.4625244140625, -10.131591796875, -9.8006591796875, -9.4697265625, -9.1387939453125, -8.807861328125, -8.4769287109375, -8.14599609375, -7.8150634765625, -7.484130859375, -7.1531982421875, -6.822265625, -6.4913330078125, -6.160400390625, -5.8294677734375, -5.49853515625, -5.1676025390625, -4.836669921875, -4.5057373046875, -4.1748046875, -3.8438720703125, -3.512939453125, -3.1820068359375, -2.85107421875, -2.5201416015625, -2.189208984375, -1.8582763671875, -1.52734375, -1.1964111328125, -0.865478515625, -0.5345458984375, -0.20361328125, 0.1273193359375, 0.458251953125, 0.7891845703125, 1.1201171875, 1.4510498046875, 1.781982421875, 2.1129150390625, 2.44384765625, 2.7747802734375, 3.105712890625, 3.4366455078125, 3.767578125, 4.0985107421875, 4.429443359375, 4.7603759765625, 5.09130859375, 5.4222412109375, 5.753173828125, 6.0841064453125, 6.4150390625, 6.7459716796875, 7.076904296875, 7.4078369140625, 7.73876953125, 8.0697021484375, 8.400634765625, 8.7315673828125, 9.0625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 7.0, 6.0, 9.0, 9.0, 12.0, 8.0, 16.0, 29.0, 19.0, 24.0, 38.0, 44.0, 63.0, 72.0, 108.0, 156.0, 207.0, 366.0, 800.0, 3102.0, 61275.0, 2721209.0, 345748.0, 9649.0, 1275.0, 480.0, 273.0, 159.0, 129.0, 96.0, 60.0, 58.0, 44.0, 36.0, 36.0, 19.0, 12.0, 15.0, 9.0, 9.0, 5.0, 2.0, 7.0, 4.0, 4.0, 2.0, 4.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-14.4375, -13.95166015625, -13.4658203125, -12.97998046875, -12.494140625, -12.00830078125, -11.5224609375, -11.03662109375, -10.55078125, -10.06494140625, -9.5791015625, -9.09326171875, -8.607421875, -8.12158203125, -7.6357421875, -7.14990234375, -6.6640625, -6.17822265625, -5.6923828125, -5.20654296875, -4.720703125, -4.23486328125, -3.7490234375, -3.26318359375, -2.77734375, -2.29150390625, -1.8056640625, -1.31982421875, -0.833984375, -0.34814453125, 0.1376953125, 0.62353515625, 1.109375, 1.59521484375, 2.0810546875, 2.56689453125, 3.052734375, 3.53857421875, 4.0244140625, 4.51025390625, 4.99609375, 5.48193359375, 5.9677734375, 6.45361328125, 6.939453125, 7.42529296875, 7.9111328125, 8.39697265625, 8.8828125, 9.36865234375, 9.8544921875, 10.34033203125, 10.826171875, 11.31201171875, 11.7978515625, 12.28369140625, 12.76953125, 13.25537109375, 13.7412109375, 14.22705078125, 14.712890625, 15.19873046875, 15.6845703125, 16.17041015625, 16.65625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 7.0, 22.0, 82.0, 137.0, 214.0, 225.0, 145.0, 96.0, 61.0, 13.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.62026023864746, -19.763843536376953, -18.907424926757812, -18.051008224487305, -17.194591522216797, -16.338172912597656, -15.481756210327148, -14.625338554382324, -13.7689208984375, -12.912503242492676, -12.056085586547852, -11.199668884277344, -10.34325122833252, -9.486833572387695, -8.630416870117188, -7.773999214172363, -6.917581558227539, -6.061163902282715, -5.204746723175049, -4.348329544067383, -3.4919118881225586, -2.6354942321777344, -1.7790770530700684, -0.9226598739624023, -0.06624221801757812, 0.790175199508667, 1.646592617034912, 2.5030100345611572, 3.3594274520874023, 4.215845108032227, 5.072262287139893, 5.928679466247559, 6.78509521484375, 7.641512870788574, 8.497930526733398, 9.354347229003906, 10.21076488494873, 11.067182540893555, 11.923599243164062, 12.780016899108887, 13.636434555053711, 14.492852210998535, 15.34926986694336, 16.205686569213867, 17.062103271484375, 17.918521881103516, 18.774938583374023, 19.63135528564453, 20.487773895263672, 21.34419059753418, 22.20060920715332, 23.057025909423828, 23.91344451904297, 24.769861221313477, 25.626277923583984, 26.482696533203125, 27.339113235473633, 28.19552993774414, 29.05194854736328, 29.90836524963379, 30.764781951904297, 31.621200561523438, 32.47761917114258, 33.33403396606445, 34.190452575683594]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 4.0, 3.0, 2.0, 5.0, 13.0, 7.0, 8.0, 13.0, 12.0, 15.0, 13.0, 12.0, 17.0, 13.0, 24.0, 21.0, 24.0, 37.0, 35.0, 31.0, 31.0, 42.0, 29.0, 33.0, 42.0, 36.0, 45.0, 41.0, 37.0, 38.0, 26.0, 34.0, 25.0, 36.0, 27.0, 26.0, 23.0, 18.0, 13.0, 10.0, 15.0, 11.0, 9.0, 12.0, 6.0, 7.0, 11.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0], "bins": [-27.23621368408203, -26.48138999938965, -25.726566314697266, -24.971742630004883, -24.2169189453125, -23.46209716796875, -22.707271575927734, -21.952449798583984, -21.1976261138916, -20.44280242919922, -19.687978744506836, -18.933155059814453, -18.17833137512207, -17.423507690429688, -16.668685913085938, -15.913862228393555, -15.159037590026855, -14.404213905334473, -13.64939022064209, -12.894567489624023, -12.13974380493164, -11.384920120239258, -10.630096435546875, -9.875272750854492, -9.12044906616211, -8.365625381469727, -7.610802173614502, -6.855978488922119, -6.1011552810668945, -5.346331596374512, -4.591507911682129, -3.8366847038269043, -3.0818614959716797, -2.327038049697876, -1.5722144842147827, -0.8173909187316895, -0.06256747245788574, 0.692255973815918, 1.4470796585083008, 2.2019028663635254, 2.956726551055908, 3.711549997329712, 4.466373443603516, 5.221197128295898, 5.976020812988281, 6.730844020843506, 7.485667705535889, 8.240490913391113, 8.995314598083496, 9.750138282775879, 10.504961967468262, 11.259784698486328, 12.014608383178711, 12.769432067871094, 13.524255752563477, 14.27907943725586, 15.033903121948242, 15.788726806640625, 16.543550491333008, 17.29837417602539, 18.053197860717773, 18.808021545410156, 19.562843322753906, 20.31766700744629, 21.072490692138672]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 4.0, 10.0, 5.0, 17.0, 14.0, 18.0, 25.0, 15.0, 21.0, 29.0, 29.0, 33.0, 25.0, 43.0, 28.0, 42.0, 44.0, 28.0, 50.0, 35.0, 41.0, 32.0, 41.0, 33.0, 39.0, 37.0, 36.0, 23.0, 37.0, 29.0, 27.0, 21.0, 18.0, 14.0, 13.0, 7.0, 7.0, 4.0, 9.0, 6.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-3.384765625, -3.283172607421875, -3.18157958984375, -3.079986572265625, -2.9783935546875, -2.876800537109375, -2.77520751953125, -2.673614501953125, -2.572021484375, -2.470428466796875, -2.36883544921875, -2.267242431640625, -2.1656494140625, -2.064056396484375, -1.96246337890625, -1.860870361328125, -1.75927734375, -1.657684326171875, -1.55609130859375, -1.454498291015625, -1.3529052734375, -1.251312255859375, -1.14971923828125, -1.048126220703125, -0.946533203125, -0.844940185546875, -0.74334716796875, -0.641754150390625, -0.5401611328125, -0.438568115234375, -0.33697509765625, -0.235382080078125, -0.1337890625, -0.032196044921875, 0.06939697265625, 0.170989990234375, 0.2725830078125, 0.374176025390625, 0.47576904296875, 0.577362060546875, 0.678955078125, 0.780548095703125, 0.88214111328125, 0.983734130859375, 1.0853271484375, 1.186920166015625, 1.28851318359375, 1.390106201171875, 1.49169921875, 1.593292236328125, 1.69488525390625, 1.796478271484375, 1.8980712890625, 1.999664306640625, 2.10125732421875, 2.202850341796875, 2.304443359375, 2.406036376953125, 2.50762939453125, 2.609222412109375, 2.7108154296875, 2.812408447265625, 2.91400146484375, 3.015594482421875, 3.1171875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 10.0, 5.0, 16.0, 10.0, 20.0, 21.0, 23.0, 14.0, 31.0, 38.0, 50.0, 85.0, 183.0, 644.0, 3114.0, 25173.0, 266299.0, 2290923.0, 1455079.0, 135832.0, 13716.0, 2027.0, 457.0, 194.0, 71.0, 56.0, 33.0, 39.0, 25.0, 20.0, 9.0, 14.0, 8.0, 10.0, 4.0, 5.0, 6.0, 7.0, 3.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.99609375, -7.7667236328125, -7.537353515625, -7.3079833984375, -7.07861328125, -6.8492431640625, -6.619873046875, -6.3905029296875, -6.1611328125, -5.9317626953125, -5.702392578125, -5.4730224609375, -5.24365234375, -5.0142822265625, -4.784912109375, -4.5555419921875, -4.326171875, -4.0968017578125, -3.867431640625, -3.6380615234375, -3.40869140625, -3.1793212890625, -2.949951171875, -2.7205810546875, -2.4912109375, -2.2618408203125, -2.032470703125, -1.8031005859375, -1.57373046875, -1.3443603515625, -1.114990234375, -0.8856201171875, -0.65625, -0.4268798828125, -0.197509765625, 0.0318603515625, 0.26123046875, 0.4906005859375, 0.719970703125, 0.9493408203125, 1.1787109375, 1.4080810546875, 1.637451171875, 1.8668212890625, 2.09619140625, 2.3255615234375, 2.554931640625, 2.7843017578125, 3.013671875, 3.2430419921875, 3.472412109375, 3.7017822265625, 3.93115234375, 4.1605224609375, 4.389892578125, 4.6192626953125, 4.8486328125, 5.0780029296875, 5.307373046875, 5.5367431640625, 5.76611328125, 5.9954833984375, 6.224853515625, 6.4542236328125, 6.68359375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 3.0, 5.0, 9.0, 9.0, 8.0, 16.0, 21.0, 26.0, 28.0, 47.0, 54.0, 69.0, 86.0, 105.0, 168.0, 180.0, 260.0, 346.0, 387.0, 427.0, 370.0, 351.0, 241.0, 201.0, 158.0, 121.0, 85.0, 65.0, 51.0, 43.0, 26.0, 25.0, 23.0, 13.0, 14.0, 13.0, 6.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.21875, -4.08050537109375, -3.9422607421875, -3.80401611328125, -3.665771484375, -3.52752685546875, -3.3892822265625, -3.25103759765625, -3.11279296875, -2.97454833984375, -2.8363037109375, -2.69805908203125, -2.559814453125, -2.42156982421875, -2.2833251953125, -2.14508056640625, -2.0068359375, -1.86859130859375, -1.7303466796875, -1.59210205078125, -1.453857421875, -1.31561279296875, -1.1773681640625, -1.03912353515625, -0.90087890625, -0.76263427734375, -0.6243896484375, -0.48614501953125, -0.347900390625, -0.20965576171875, -0.0714111328125, 0.06683349609375, 0.205078125, 0.34332275390625, 0.4815673828125, 0.61981201171875, 0.758056640625, 0.89630126953125, 1.0345458984375, 1.17279052734375, 1.31103515625, 1.44927978515625, 1.5875244140625, 1.72576904296875, 1.864013671875, 2.00225830078125, 2.1405029296875, 2.27874755859375, 2.4169921875, 2.55523681640625, 2.6934814453125, 2.83172607421875, 2.969970703125, 3.10821533203125, 3.2464599609375, 3.38470458984375, 3.52294921875, 3.66119384765625, 3.7994384765625, 3.93768310546875, 4.075927734375, 4.21417236328125, 4.3524169921875, 4.49066162109375, 4.62890625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 2.0, 5.0, 11.0, 9.0, 13.0, 17.0, 31.0, 42.0, 41.0, 50.0, 69.0, 108.0, 127.0, 188.0, 257.0, 439.0, 1167.0, 9331.0, 252506.0, 3574656.0, 340717.0, 11700.0, 1270.0, 468.0, 293.0, 195.0, 131.0, 114.0, 81.0, 70.0, 34.0, 36.0, 24.0, 17.0, 15.0, 17.0, 9.0, 9.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.59375, -16.0989990234375, -15.604248046875, -15.1094970703125, -14.61474609375, -14.1199951171875, -13.625244140625, -13.1304931640625, -12.6357421875, -12.1409912109375, -11.646240234375, -11.1514892578125, -10.65673828125, -10.1619873046875, -9.667236328125, -9.1724853515625, -8.677734375, -8.1829833984375, -7.688232421875, -7.1934814453125, -6.69873046875, -6.2039794921875, -5.709228515625, -5.2144775390625, -4.7197265625, -4.2249755859375, -3.730224609375, -3.2354736328125, -2.74072265625, -2.2459716796875, -1.751220703125, -1.2564697265625, -0.76171875, -0.2669677734375, 0.227783203125, 0.7225341796875, 1.21728515625, 1.7120361328125, 2.206787109375, 2.7015380859375, 3.1962890625, 3.6910400390625, 4.185791015625, 4.6805419921875, 5.17529296875, 5.6700439453125, 6.164794921875, 6.6595458984375, 7.154296875, 7.6490478515625, 8.143798828125, 8.6385498046875, 9.13330078125, 9.6280517578125, 10.122802734375, 10.6175537109375, 11.1123046875, 11.6070556640625, 12.101806640625, 12.5965576171875, 13.09130859375, 13.5860595703125, 14.080810546875, 14.5755615234375, 15.0703125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 11.0, 134.0, 465.0, 337.0, 70.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.39815139770508, -58.141178131103516, -54.88420867919922, -51.627235412597656, -48.370262145996094, -45.11328887939453, -41.85631561279297, -38.59934616088867, -35.34237289428711, -32.08539962768555, -28.828428268432617, -25.571456909179688, -22.314483642578125, -19.057510375976562, -15.800539016723633, -12.543567657470703, -9.28659439086914, -6.0296220779418945, -2.7726497650146484, 0.48432254791259766, 3.7412948608398438, 6.998268127441406, 10.255239486694336, 13.512210845947266, 16.769184112548828, 20.02615737915039, 23.28312873840332, 26.54010009765625, 29.797073364257812, 33.054046630859375, 36.31101989746094, 39.567989349365234, 42.82496643066406, 46.081939697265625, 49.33891296386719, 52.595882415771484, 55.85285568237305, 59.10982894897461, 62.366798400878906, 65.62377166748047, 68.88074493408203, 72.1377182006836, 75.39469146728516, 78.65166473388672, 81.90863037109375, 85.16560363769531, 88.42257690429688, 91.67955017089844, 94.9365234375, 98.19349670410156, 101.45046997070312, 104.70744323730469, 107.96441650390625, 111.22138977050781, 114.47835540771484, 117.7353286743164, 120.99230194091797, 124.24927520751953, 127.5062484741211, 130.76321411132812, 134.0201873779297, 137.27716064453125, 140.5341339111328, 143.79110717773438, 147.04808044433594]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 2.0, 4.0, 5.0, 7.0, 5.0, 3.0, 3.0, 5.0, 12.0, 24.0, 10.0, 17.0, 14.0, 22.0, 27.0, 23.0, 18.0, 31.0, 36.0, 31.0, 41.0, 34.0, 31.0, 36.0, 42.0, 44.0, 42.0, 38.0, 31.0, 34.0, 41.0, 43.0, 36.0, 25.0, 22.0, 18.0, 27.0, 21.0, 15.0, 29.0, 9.0, 9.0, 12.0, 5.0, 6.0, 4.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-16.938751220703125, -16.447296142578125, -15.955840110778809, -15.464385032653809, -14.972929954528809, -14.481473922729492, -13.990018844604492, -13.498563766479492, -13.007108688354492, -12.515653610229492, -12.024197578430176, -11.532742500305176, -11.041287422180176, -10.54983139038086, -10.05837631225586, -9.56692123413086, -9.07546615600586, -8.58401107788086, -8.092555046081543, -7.601099967956543, -7.109644889831543, -6.618189334869385, -6.126733779907227, -5.635278701782227, -5.14382266998291, -4.652367115020752, -4.160912036895752, -3.6694564819335938, -3.1780014038085938, -2.6865458488464355, -2.1950905323028564, -1.7036352157592773, -1.2121801376342773, -0.7207248210906982, -0.22926944494247437, 0.2621859312057495, 0.7536412477493286, 1.2450966835021973, 1.7365520000457764, 2.2280073165893555, 2.7194626331329346, 3.2109179496765137, 3.7023732662200928, 4.193828582763672, 4.68528413772583, 5.176739692687988, 5.668194770812988, 6.159649848937988, 6.6511054039001465, 7.142560958862305, 7.634016036987305, 8.125471115112305, 8.616927146911621, 9.108382225036621, 9.599837303161621, 10.091293334960938, 10.582748413085938, 11.074203491210938, 11.565659523010254, 12.057114601135254, 12.548569679260254, 13.04002571105957, 13.53148078918457, 14.02293586730957, 14.51439094543457]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 5.0, 15.0, 8.0, 11.0, 14.0, 8.0, 18.0, 26.0, 27.0, 41.0, 16.0, 35.0, 24.0, 34.0, 39.0, 40.0, 40.0, 36.0, 43.0, 43.0, 36.0, 32.0, 37.0, 32.0, 33.0, 36.0, 32.0, 36.0, 23.0, 28.0, 16.0, 24.0, 24.0, 18.0, 15.0, 10.0, 8.0, 12.0, 3.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.095703125, -3.0001220703125, -2.904541015625, -2.8089599609375, -2.71337890625, -2.6177978515625, -2.522216796875, -2.4266357421875, -2.3310546875, -2.2354736328125, -2.139892578125, -2.0443115234375, -1.94873046875, -1.8531494140625, -1.757568359375, -1.6619873046875, -1.56640625, -1.4708251953125, -1.375244140625, -1.2796630859375, -1.18408203125, -1.0885009765625, -0.992919921875, -0.8973388671875, -0.8017578125, -0.7061767578125, -0.610595703125, -0.5150146484375, -0.41943359375, -0.3238525390625, -0.228271484375, -0.1326904296875, -0.037109375, 0.0584716796875, 0.154052734375, 0.2496337890625, 0.34521484375, 0.4407958984375, 0.536376953125, 0.6319580078125, 0.7275390625, 0.8231201171875, 0.918701171875, 1.0142822265625, 1.10986328125, 1.2054443359375, 1.301025390625, 1.3966064453125, 1.4921875, 1.5877685546875, 1.683349609375, 1.7789306640625, 1.87451171875, 1.9700927734375, 2.065673828125, 2.1612548828125, 2.2568359375, 2.3524169921875, 2.447998046875, 2.5435791015625, 2.63916015625, 2.7347412109375, 2.830322265625, 2.9259033203125, 3.021484375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 7.0, 8.0, 9.0, 13.0, 31.0, 32.0, 55.0, 78.0, 116.0, 159.0, 274.0, 434.0, 704.0, 1071.0, 1796.0, 2962.0, 4921.0, 8098.0, 13803.0, 23492.0, 39610.0, 66479.0, 106001.0, 154667.0, 186176.0, 158401.0, 109767.0, 68667.0, 40919.0, 24323.0, 14155.0, 8391.0, 4983.0, 3010.0, 1843.0, 1156.0, 681.0, 446.0, 294.0, 173.0, 117.0, 75.0, 70.0, 40.0, 27.0, 13.0, 7.0, 4.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.2476806640625, -0.23956871032714844, -0.23145675659179688, -0.2233448028564453, -0.21523284912109375, -0.2071208953857422, -0.19900894165039062, -0.19089698791503906, -0.1827850341796875, -0.17467308044433594, -0.16656112670898438, -0.1584491729736328, -0.15033721923828125, -0.1422252655029297, -0.13411331176757812, -0.12600135803222656, -0.117889404296875, -0.10977745056152344, -0.10166549682617188, -0.09355354309082031, -0.08544158935546875, -0.07732963562011719, -0.06921768188476562, -0.06110572814941406, -0.0529937744140625, -0.04488182067871094, -0.036769866943359375, -0.028657913208007812, -0.02054595947265625, -0.012434005737304688, -0.004322052001953125, 0.0037899017333984375, 0.01190185546875, 0.020013809204101562, 0.028125762939453125, 0.03623771667480469, 0.04434967041015625, 0.05246162414550781, 0.060573577880859375, 0.06868553161621094, 0.0767974853515625, 0.08490943908691406, 0.09302139282226562, 0.10113334655761719, 0.10924530029296875, 0.11735725402832031, 0.12546920776367188, 0.13358116149902344, 0.141693115234375, 0.14980506896972656, 0.15791702270507812, 0.1660289764404297, 0.17414093017578125, 0.1822528839111328, 0.19036483764648438, 0.19847679138183594, 0.2065887451171875, 0.21470069885253906, 0.22281265258789062, 0.2309246063232422, 0.23903656005859375, 0.2471485137939453, 0.2552604675292969, 0.26337242126464844, 0.271484375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 7.0, 1.0, 7.0, 5.0, 11.0, 8.0, 3.0, 17.0, 19.0, 13.0, 19.0, 19.0, 22.0, 30.0, 29.0, 46.0, 38.0, 34.0, 36.0, 43.0, 48.0, 42.0, 1078.0, 37.0, 35.0, 33.0, 42.0, 32.0, 39.0, 36.0, 21.0, 28.0, 21.0, 27.0, 22.0, 18.0, 9.0, 11.0, 7.0, 10.0, 8.0, 5.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.1953125, -2.120361328125, -2.04541015625, -1.970458984375, -1.8955078125, -1.820556640625, -1.74560546875, -1.670654296875, -1.595703125, -1.520751953125, -1.44580078125, -1.370849609375, -1.2958984375, -1.220947265625, -1.14599609375, -1.071044921875, -0.99609375, -0.921142578125, -0.84619140625, -0.771240234375, -0.6962890625, -0.621337890625, -0.54638671875, -0.471435546875, -0.396484375, -0.321533203125, -0.24658203125, -0.171630859375, -0.0966796875, -0.021728515625, 0.05322265625, 0.128173828125, 0.203125, 0.278076171875, 0.35302734375, 0.427978515625, 0.5029296875, 0.577880859375, 0.65283203125, 0.727783203125, 0.802734375, 0.877685546875, 0.95263671875, 1.027587890625, 1.1025390625, 1.177490234375, 1.25244140625, 1.327392578125, 1.40234375, 1.477294921875, 1.55224609375, 1.627197265625, 1.7021484375, 1.777099609375, 1.85205078125, 1.927001953125, 2.001953125, 2.076904296875, 2.15185546875, 2.226806640625, 2.3017578125, 2.376708984375, 2.45166015625, 2.526611328125, 2.6015625]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 5.0, 11.0, 6.0, 12.0, 18.0, 26.0, 53.0, 42.0, 101.0, 135.0, 229.0, 324.0, 485.0, 718.0, 1054.0, 1672.0, 2669.0, 4252.0, 6372.0, 9686.0, 15292.0, 23084.0, 36345.0, 54244.0, 80119.0, 112928.0, 169259.0, 1172024.0, 126285.0, 93300.0, 63555.0, 42463.0, 27951.0, 18457.0, 11926.0, 7575.0, 5142.0, 3183.0, 2179.0, 1342.0, 909.0, 567.0, 357.0, 257.0, 181.0, 98.0, 80.0, 61.0, 41.0, 25.0, 10.0, 10.0, 11.0, 8.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1278076171875, -0.12371253967285156, -0.11961746215820312, -0.11552238464355469, -0.11142730712890625, -0.10733222961425781, -0.10323715209960938, -0.09914207458496094, -0.0950469970703125, -0.09095191955566406, -0.08685684204101562, -0.08276176452636719, -0.07866668701171875, -0.07457160949707031, -0.07047653198242188, -0.06638145446777344, -0.062286376953125, -0.05819129943847656, -0.054096221923828125, -0.05000114440917969, -0.04590606689453125, -0.04181098937988281, -0.037715911865234375, -0.03362083435058594, -0.0295257568359375, -0.025430679321289062, -0.021335601806640625, -0.017240524291992188, -0.01314544677734375, -0.009050369262695312, -0.004955291748046875, -0.0008602142333984375, 0.00323486328125, 0.0073299407958984375, 0.011425018310546875, 0.015520095825195312, 0.01961517333984375, 0.023710250854492188, 0.027805328369140625, 0.03190040588378906, 0.0359954833984375, 0.04009056091308594, 0.044185638427734375, 0.04828071594238281, 0.05237579345703125, 0.05647087097167969, 0.060565948486328125, 0.06466102600097656, 0.068756103515625, 0.07285118103027344, 0.07694625854492188, 0.08104133605957031, 0.08513641357421875, 0.08923149108886719, 0.09332656860351562, 0.09742164611816406, 0.1015167236328125, 0.10561180114746094, 0.10970687866210938, 0.11380195617675781, 0.11789703369140625, 0.12199211120605469, 0.12608718872070312, 0.13018226623535156, 0.13427734375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 4.0, 3.0, 0.0, 3.0, 6.0, 4.0, 7.0, 8.0, 11.0, 17.0, 15.0, 13.0, 21.0, 37.0, 29.0, 45.0, 58.0, 82.0, 123.0, 123.0, 82.0, 53.0, 46.0, 37.0, 27.0, 22.0, 30.0, 25.0, 18.0, 11.0, 7.0, 7.0, 7.0, 3.0, 6.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00868988037109375, -0.008412718772888184, -0.008135557174682617, -0.00785839557647705, -0.007581233978271484, -0.007304072380065918, -0.0070269107818603516, -0.006749749183654785, -0.006472587585449219, -0.006195425987243652, -0.005918264389038086, -0.0056411027908325195, -0.005363941192626953, -0.005086779594421387, -0.00480961799621582, -0.004532456398010254, -0.0042552947998046875, -0.003978133201599121, -0.0037009716033935547, -0.0034238100051879883, -0.003146648406982422, -0.0028694868087768555, -0.002592325210571289, -0.0023151636123657227, -0.0020380020141601562, -0.0017608404159545898, -0.0014836788177490234, -0.001206517219543457, -0.0009293556213378906, -0.0006521940231323242, -0.0003750324249267578, -9.78708267211914e-05, 0.000179290771484375, 0.0004564523696899414, 0.0007336139678955078, 0.0010107755661010742, 0.0012879371643066406, 0.001565098762512207, 0.0018422603607177734, 0.00211942195892334, 0.0023965835571289062, 0.0026737451553344727, 0.002950906753540039, 0.0032280683517456055, 0.003505229949951172, 0.0037823915481567383, 0.004059553146362305, 0.004336714744567871, 0.0046138763427734375, 0.004891037940979004, 0.00516819953918457, 0.005445361137390137, 0.005722522735595703, 0.0059996843338012695, 0.006276845932006836, 0.006554007530212402, 0.006831169128417969, 0.007108330726623535, 0.0073854923248291016, 0.007662653923034668, 0.007939815521240234, 0.0082169771194458, 0.008494138717651367, 0.008771300315856934, 0.0090484619140625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 6.0, 2.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 9.0, 7.0, 10.0, 17.0, 33.0, 39.0, 38.0, 40.0, 59.0, 121.0, 190.0, 440.0, 5058.0, 1027332.0, 13934.0, 552.0, 239.0, 123.0, 69.0, 59.0, 39.0, 21.0, 23.0, 22.0, 11.0, 13.0, 11.0, 6.0, 3.0, 5.0, 1.0, 3.0, 3.0, 4.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1954345703125, -0.1894378662109375, -0.183441162109375, -0.1774444580078125, -0.17144775390625, -0.1654510498046875, -0.159454345703125, -0.1534576416015625, -0.1474609375, -0.1414642333984375, -0.135467529296875, -0.1294708251953125, -0.12347412109375, -0.1174774169921875, -0.111480712890625, -0.1054840087890625, -0.0994873046875, -0.0934906005859375, -0.087493896484375, -0.0814971923828125, -0.07550048828125, -0.0695037841796875, -0.063507080078125, -0.0575103759765625, -0.051513671875, -0.0455169677734375, -0.039520263671875, -0.0335235595703125, -0.02752685546875, -0.0215301513671875, -0.015533447265625, -0.0095367431640625, -0.0035400390625, 0.0024566650390625, 0.008453369140625, 0.0144500732421875, 0.02044677734375, 0.0264434814453125, 0.032440185546875, 0.0384368896484375, 0.04443359375, 0.0504302978515625, 0.056427001953125, 0.0624237060546875, 0.06842041015625, 0.0744171142578125, 0.080413818359375, 0.0864105224609375, 0.0924072265625, 0.0984039306640625, 0.104400634765625, 0.1103973388671875, 0.11639404296875, 0.1223907470703125, 0.128387451171875, 0.1343841552734375, 0.140380859375, 0.1463775634765625, 0.152374267578125, 0.1583709716796875, 0.16436767578125, 0.1703643798828125, 0.176361083984375, 0.1823577880859375, 0.1883544921875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 5.0, 9.0, 15.0, 29.0, 62.0, 129.0, 394.0, 246.0, 78.0, 27.0, 11.0, 2.0, 2.0, 4.0], "bins": [-0.07770585268735886, -0.07633709907531738, -0.0749683529138565, -0.07359959930181503, -0.07223084568977356, -0.07086209207773209, -0.06949333846569061, -0.06812459230422974, -0.06675583869218826, -0.06538708508014679, -0.06401833891868591, -0.06264958530664444, -0.061280831694602966, -0.05991207808256149, -0.05854332819581032, -0.05717457830905914, -0.05580582469701767, -0.054437071084976196, -0.05306832119822502, -0.051699571311473846, -0.05033081769943237, -0.0489620640873909, -0.047593314200639725, -0.04622456431388855, -0.044855810701847076, -0.0434870570898056, -0.04211830720305443, -0.04074955731630325, -0.03938080370426178, -0.038012050092220306, -0.03664330020546913, -0.03527455031871796, -0.03390579670667648, -0.03253704309463501, -0.031168293207883835, -0.02979954145848751, -0.028430789709091187, -0.027062037959694862, -0.025693286210298538, -0.024324534460902214, -0.02295578271150589, -0.021587030962109566, -0.02021827921271324, -0.018849527463316917, -0.017480775713920593, -0.01611202396452427, -0.014743272215127945, -0.01337452046573162, -0.012005769647657871, -0.010637017898261547, -0.009268266148865223, -0.007899514399468899, -0.006530762650072575, -0.0051620109006762505, -0.0037932591512799263, -0.002424507401883602, -0.001055755652487278, 0.0003129960969090462, 0.0016817478463053703, 0.0030504995957016945, 0.004419251345098019, 0.005788003094494343, 0.007156754843890667, 0.008525506593286991, 0.009894258342683315]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 1.0, 8.0, 7.0, 9.0, 7.0, 12.0, 10.0, 10.0, 14.0, 32.0, 22.0, 18.0, 29.0, 37.0, 29.0, 41.0, 31.0, 47.0, 34.0, 41.0, 37.0, 45.0, 52.0, 31.0, 30.0, 26.0, 39.0, 34.0, 26.0, 26.0, 26.0, 22.0, 33.0, 20.0, 16.0, 13.0, 13.0, 19.0, 14.0, 5.0, 7.0, 5.0, 9.0, 3.0, 9.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0], "bins": [-0.016794323921203613, -0.016286468133330345, -0.015778612345457077, -0.015270756557583809, -0.01476290076971054, -0.014255044981837273, -0.013747189193964005, -0.013239333406090736, -0.012731477618217468, -0.0122236218303442, -0.011715766042470932, -0.011207910254597664, -0.010700054466724396, -0.010192198678851128, -0.00968434289097786, -0.009176487103104591, -0.008668631315231323, -0.008160775527358055, -0.007652919739484787, -0.007145063951611519, -0.006637208163738251, -0.006129352375864983, -0.0056214965879917145, -0.005113640800118446, -0.004605785012245178, -0.00409792922437191, -0.003590073436498642, -0.003082217648625374, -0.0025743618607521057, -0.0020665060728788376, -0.0015586502850055695, -0.0010507944971323013, -0.0005429387092590332, -3.5082921385765076e-05, 0.00047277286648750305, 0.0009806286543607712, 0.0014884844422340393, 0.0019963402301073074, 0.0025041960179805756, 0.0030120518058538437, 0.003519907593727112, 0.00402776338160038, 0.004535619169473648, 0.005043474957346916, 0.005551330745220184, 0.0060591865330934525, 0.006567042320966721, 0.007074898108839989, 0.007582753896713257, 0.008090609684586525, 0.008598465472459793, 0.009106321260333061, 0.00961417704820633, 0.010122032836079597, 0.010629888623952866, 0.011137744411826134, 0.011645600199699402, 0.01215345598757267, 0.012661311775445938, 0.013169167563319206, 0.013677023351192474, 0.014184879139065742, 0.01469273492693901, 0.015200590714812279, 0.015708446502685547]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 5.0, 15.0, 8.0, 11.0, 14.0, 8.0, 18.0, 26.0, 27.0, 41.0, 16.0, 35.0, 24.0, 34.0, 41.0, 38.0, 40.0, 36.0, 43.0, 45.0, 34.0, 32.0, 38.0, 32.0, 32.0, 36.0, 32.0, 36.0, 23.0, 28.0, 16.0, 25.0, 23.0, 18.0, 15.0, 10.0, 8.0, 12.0, 3.0, 7.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.095703125, -3.0001220703125, -2.904541015625, -2.8089599609375, -2.71337890625, -2.6177978515625, -2.522216796875, -2.4266357421875, -2.3310546875, -2.2354736328125, -2.139892578125, -2.0443115234375, -1.94873046875, -1.8531494140625, -1.757568359375, -1.6619873046875, -1.56640625, -1.4708251953125, -1.375244140625, -1.2796630859375, -1.18408203125, -1.0885009765625, -0.992919921875, -0.8973388671875, -0.8017578125, -0.7061767578125, -0.610595703125, -0.5150146484375, -0.41943359375, -0.3238525390625, -0.228271484375, -0.1326904296875, -0.037109375, 0.0584716796875, 0.154052734375, 0.2496337890625, 0.34521484375, 0.4407958984375, 0.536376953125, 0.6319580078125, 0.7275390625, 0.8231201171875, 0.918701171875, 1.0142822265625, 1.10986328125, 1.2054443359375, 1.301025390625, 1.3966064453125, 1.4921875, 1.5877685546875, 1.683349609375, 1.7789306640625, 1.87451171875, 1.9700927734375, 2.065673828125, 2.1612548828125, 2.2568359375, 2.3524169921875, 2.447998046875, 2.5435791015625, 2.63916015625, 2.7347412109375, 2.830322265625, 2.9259033203125, 3.021484375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 7.0, 4.0, 9.0, 6.0, 12.0, 15.0, 18.0, 25.0, 32.0, 37.0, 63.0, 82.0, 86.0, 144.0, 183.0, 306.0, 744.0, 1947.0, 5288.0, 15469.0, 51465.0, 264338.0, 542030.0, 121538.0, 29067.0, 9562.0, 3392.0, 1286.0, 533.0, 278.0, 144.0, 100.0, 72.0, 65.0, 45.0, 44.0, 30.0, 19.0, 25.0, 10.0, 14.0, 7.0, 6.0, 2.0, 1.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.79296875, -5.618896484375, -5.44482421875, -5.270751953125, -5.0966796875, -4.922607421875, -4.74853515625, -4.574462890625, -4.400390625, -4.226318359375, -4.05224609375, -3.878173828125, -3.7041015625, -3.530029296875, -3.35595703125, -3.181884765625, -3.0078125, -2.833740234375, -2.65966796875, -2.485595703125, -2.3115234375, -2.137451171875, -1.96337890625, -1.789306640625, -1.615234375, -1.441162109375, -1.26708984375, -1.093017578125, -0.9189453125, -0.744873046875, -0.57080078125, -0.396728515625, -0.22265625, -0.048583984375, 0.12548828125, 0.299560546875, 0.4736328125, 0.647705078125, 0.82177734375, 0.995849609375, 1.169921875, 1.343994140625, 1.51806640625, 1.692138671875, 1.8662109375, 2.040283203125, 2.21435546875, 2.388427734375, 2.5625, 2.736572265625, 2.91064453125, 3.084716796875, 3.2587890625, 3.432861328125, 3.60693359375, 3.781005859375, 3.955078125, 4.129150390625, 4.30322265625, 4.477294921875, 4.6513671875, 4.825439453125, 4.99951171875, 5.173583984375, 5.34765625]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 7.0, 2.0, 8.0, 6.0, 9.0, 17.0, 20.0, 14.0, 28.0, 28.0, 39.0, 31.0, 44.0, 42.0, 59.0, 73.0, 126.0, 373.0, 1509.0, 144.0, 86.0, 59.0, 58.0, 46.0, 37.0, 32.0, 33.0, 29.0, 18.0, 14.0, 19.0, 10.0, 6.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.1015625, -11.7247314453125, -11.347900390625, -10.9710693359375, -10.59423828125, -10.2174072265625, -9.840576171875, -9.4637451171875, -9.0869140625, -8.7100830078125, -8.333251953125, -7.9564208984375, -7.57958984375, -7.2027587890625, -6.825927734375, -6.4490966796875, -6.072265625, -5.6954345703125, -5.318603515625, -4.9417724609375, -4.56494140625, -4.1881103515625, -3.811279296875, -3.4344482421875, -3.0576171875, -2.6807861328125, -2.303955078125, -1.9271240234375, -1.55029296875, -1.1734619140625, -0.796630859375, -0.4197998046875, -0.04296875, 0.3338623046875, 0.710693359375, 1.0875244140625, 1.46435546875, 1.8411865234375, 2.218017578125, 2.5948486328125, 2.9716796875, 3.3485107421875, 3.725341796875, 4.1021728515625, 4.47900390625, 4.8558349609375, 5.232666015625, 5.6094970703125, 5.986328125, 6.3631591796875, 6.739990234375, 7.1168212890625, 7.49365234375, 7.8704833984375, 8.247314453125, 8.6241455078125, 9.0009765625, 9.3778076171875, 9.754638671875, 10.1314697265625, 10.50830078125, 10.8851318359375, 11.261962890625, 11.6387939453125, 12.015625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 8.0, 9.0, 23.0, 17.0, 27.0, 33.0, 44.0, 50.0, 75.0, 107.0, 175.0, 347.0, 1017.0, 12899.0, 3008441.0, 119024.0, 2164.0, 501.0, 249.0, 115.0, 90.0, 59.0, 51.0, 40.0, 26.0, 23.0, 20.0, 15.0, 7.0, 6.0, 5.0, 2.0, 9.0, 5.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.203125, -24.408447265625, -23.61376953125, -22.819091796875, -22.0244140625, -21.229736328125, -20.43505859375, -19.640380859375, -18.845703125, -18.051025390625, -17.25634765625, -16.461669921875, -15.6669921875, -14.872314453125, -14.07763671875, -13.282958984375, -12.48828125, -11.693603515625, -10.89892578125, -10.104248046875, -9.3095703125, -8.514892578125, -7.72021484375, -6.925537109375, -6.130859375, -5.336181640625, -4.54150390625, -3.746826171875, -2.9521484375, -2.157470703125, -1.36279296875, -0.568115234375, 0.2265625, 1.021240234375, 1.81591796875, 2.610595703125, 3.4052734375, 4.199951171875, 4.99462890625, 5.789306640625, 6.583984375, 7.378662109375, 8.17333984375, 8.968017578125, 9.7626953125, 10.557373046875, 11.35205078125, 12.146728515625, 12.94140625, 13.736083984375, 14.53076171875, 15.325439453125, 16.1201171875, 16.914794921875, 17.70947265625, 18.504150390625, 19.298828125, 20.093505859375, 20.88818359375, 21.682861328125, 22.4775390625, 23.272216796875, 24.06689453125, 24.861572265625, 25.65625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 110.0, 814.0, 94.0], "bins": [-211.14410400390625, -207.7620086669922, -204.37989807128906, -200.997802734375, -197.61569213867188, -194.2335968017578, -190.85150146484375, -187.46939086914062, -184.08729553222656, -180.7052001953125, -177.32308959960938, -173.9409942626953, -170.5588836669922, -167.17678833007812, -163.79469299316406, -160.41258239746094, -157.03048706054688, -153.6483917236328, -150.2662811279297, -146.88418579101562, -143.5020751953125, -140.11997985839844, -136.73788452148438, -133.35577392578125, -129.9736785888672, -126.5915756225586, -123.20947265625, -119.82737731933594, -116.44527435302734, -113.06317138671875, -109.68106842041016, -106.29896545410156, -102.91685485839844, -99.53475189208984, -96.15264892578125, -92.77055358886719, -89.3884506225586, -86.00634765625, -82.6242446899414, -79.24214172363281, -75.86004638671875, -72.47794342041016, -69.09584045410156, -65.7137451171875, -62.331642150878906, -58.94953918457031, -55.56743621826172, -52.18533706665039, -48.8032341003418, -45.4211311340332, -42.039031982421875, -38.65692901611328, -35.27482986450195, -31.89272689819336, -28.5106258392334, -25.128524780273438, -21.74642562866211, -18.36432456970215, -14.982223510742188, -11.60012149810791, -8.21802043914795, -4.835918426513672, -1.453817367553711, 1.92828369140625, 5.310385704040527]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 11.0, 5.0, 6.0, 11.0, 12.0, 13.0, 18.0, 16.0, 20.0, 16.0, 25.0, 30.0, 21.0, 28.0, 42.0, 39.0, 35.0, 38.0, 34.0, 42.0, 44.0, 40.0, 42.0, 25.0, 30.0, 35.0, 38.0, 33.0, 34.0, 28.0, 31.0, 21.0, 18.0, 16.0, 16.0, 18.0, 14.0, 13.0, 12.0, 9.0, 3.0, 4.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 4.0], "bins": [-24.510894775390625, -23.72867774963379, -22.946462631225586, -22.16424560546875, -21.382030487060547, -20.59981346130371, -19.817598342895508, -19.035381317138672, -18.25316619873047, -17.470949172973633, -16.68873405456543, -15.90651798248291, -15.12430191040039, -14.342085838317871, -13.559869766235352, -12.777652740478516, -11.995436668395996, -11.213220596313477, -10.431004524230957, -9.648788452148438, -8.866572380065918, -8.084356307983398, -7.302139759063721, -6.519923686981201, -5.737707614898682, -4.955491542816162, -4.173275470733643, -3.391059160232544, -2.6088430881500244, -1.8266270160675049, -1.0444107055664062, -0.2621946334838867, 0.5200214385986328, 1.3022375106811523, 2.084453582763672, 2.8666698932647705, 3.64888596534729, 4.4311017990112305, 5.213318347930908, 5.995534420013428, 6.777750492095947, 7.559966564178467, 8.342183113098145, 9.124399185180664, 9.906615257263184, 10.688831329345703, 11.471047401428223, 12.253263473510742, 13.035479545593262, 13.817695617675781, 14.5999116897583, 15.38212776184082, 16.164344787597656, 16.94655990600586, 17.728776931762695, 18.5109920501709, 19.293209075927734, 20.07542610168457, 20.857641220092773, 21.63985824584961, 22.422073364257812, 23.20429039001465, 23.98650550842285, 24.768722534179688, 25.55093765258789]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 5.0, 9.0, 10.0, 12.0, 9.0, 20.0, 11.0, 23.0, 22.0, 32.0, 23.0, 21.0, 41.0, 29.0, 37.0, 31.0, 28.0, 48.0, 36.0, 39.0, 47.0, 42.0, 29.0, 37.0, 26.0, 41.0, 39.0, 30.0, 39.0, 18.0, 22.0, 30.0, 22.0, 7.0, 16.0, 11.0, 12.0, 12.0, 4.0, 7.0, 6.0, 6.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.0859375, -2.986297607421875, -2.88665771484375, -2.787017822265625, -2.6873779296875, -2.587738037109375, -2.48809814453125, -2.388458251953125, -2.288818359375, -2.189178466796875, -2.08953857421875, -1.989898681640625, -1.8902587890625, -1.790618896484375, -1.69097900390625, -1.591339111328125, -1.49169921875, -1.392059326171875, -1.29241943359375, -1.192779541015625, -1.0931396484375, -0.993499755859375, -0.89385986328125, -0.794219970703125, -0.694580078125, -0.594940185546875, -0.49530029296875, -0.395660400390625, -0.2960205078125, -0.196380615234375, -0.09674072265625, 0.002899169921875, 0.1025390625, 0.202178955078125, 0.30181884765625, 0.401458740234375, 0.5010986328125, 0.600738525390625, 0.70037841796875, 0.800018310546875, 0.899658203125, 0.999298095703125, 1.09893798828125, 1.198577880859375, 1.2982177734375, 1.397857666015625, 1.49749755859375, 1.597137451171875, 1.69677734375, 1.796417236328125, 1.89605712890625, 1.995697021484375, 2.0953369140625, 2.194976806640625, 2.29461669921875, 2.394256591796875, 2.493896484375, 2.593536376953125, 2.69317626953125, 2.792816162109375, 2.8924560546875, 2.992095947265625, 3.09173583984375, 3.191375732421875, 3.291015625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 5.0, 2.0, 8.0, 12.0, 10.0, 13.0, 29.0, 20.0, 31.0, 40.0, 44.0, 79.0, 132.0, 264.0, 552.0, 1599.0, 4767.0, 17592.0, 77192.0, 359053.0, 1442045.0, 1688981.0, 468964.0, 100261.0, 22981.0, 6074.0, 1955.0, 777.0, 323.0, 148.0, 100.0, 54.0, 48.0, 34.0, 25.0, 16.0, 13.0, 11.0, 8.0, 5.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-4.546875, -4.395751953125, -4.24462890625, -4.093505859375, -3.9423828125, -3.791259765625, -3.64013671875, -3.489013671875, -3.337890625, -3.186767578125, -3.03564453125, -2.884521484375, -2.7333984375, -2.582275390625, -2.43115234375, -2.280029296875, -2.12890625, -1.977783203125, -1.82666015625, -1.675537109375, -1.5244140625, -1.373291015625, -1.22216796875, -1.071044921875, -0.919921875, -0.768798828125, -0.61767578125, -0.466552734375, -0.3154296875, -0.164306640625, -0.01318359375, 0.137939453125, 0.2890625, 0.440185546875, 0.59130859375, 0.742431640625, 0.8935546875, 1.044677734375, 1.19580078125, 1.346923828125, 1.498046875, 1.649169921875, 1.80029296875, 1.951416015625, 2.1025390625, 2.253662109375, 2.40478515625, 2.555908203125, 2.70703125, 2.858154296875, 3.00927734375, 3.160400390625, 3.3115234375, 3.462646484375, 3.61376953125, 3.764892578125, 3.916015625, 4.067138671875, 4.21826171875, 4.369384765625, 4.5205078125, 4.671630859375, 4.82275390625, 4.973876953125, 5.125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 5.0, 7.0, 4.0, 16.0, 19.0, 28.0, 31.0, 45.0, 58.0, 88.0, 104.0, 122.0, 213.0, 246.0, 336.0, 431.0, 451.0, 464.0, 359.0, 251.0, 214.0, 145.0, 102.0, 83.0, 69.0, 49.0, 35.0, 29.0, 16.0, 17.0, 7.0, 11.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.9140625, -4.7586669921875, -4.603271484375, -4.4478759765625, -4.29248046875, -4.1370849609375, -3.981689453125, -3.8262939453125, -3.6708984375, -3.5155029296875, -3.360107421875, -3.2047119140625, -3.04931640625, -2.8939208984375, -2.738525390625, -2.5831298828125, -2.427734375, -2.2723388671875, -2.116943359375, -1.9615478515625, -1.80615234375, -1.6507568359375, -1.495361328125, -1.3399658203125, -1.1845703125, -1.0291748046875, -0.873779296875, -0.7183837890625, -0.56298828125, -0.4075927734375, -0.252197265625, -0.0968017578125, 0.05859375, 0.2139892578125, 0.369384765625, 0.5247802734375, 0.68017578125, 0.8355712890625, 0.990966796875, 1.1463623046875, 1.3017578125, 1.4571533203125, 1.612548828125, 1.7679443359375, 1.92333984375, 2.0787353515625, 2.234130859375, 2.3895263671875, 2.544921875, 2.7003173828125, 2.855712890625, 3.0111083984375, 3.16650390625, 3.3218994140625, 3.477294921875, 3.6326904296875, 3.7880859375, 3.9434814453125, 4.098876953125, 4.2542724609375, 4.40966796875, 4.5650634765625, 4.720458984375, 4.8758544921875, 5.03125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 3.0, 5.0, 6.0, 10.0, 10.0, 18.0, 27.0, 36.0, 51.0, 62.0, 110.0, 141.0, 197.0, 354.0, 560.0, 1310.0, 5986.0, 73689.0, 1866121.0, 2150565.0, 85228.0, 6723.0, 1407.0, 641.0, 321.0, 218.0, 144.0, 103.0, 69.0, 62.0, 29.0, 27.0, 12.0, 11.0, 10.0, 6.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.71875, -13.3033447265625, -12.887939453125, -12.4725341796875, -12.05712890625, -11.6417236328125, -11.226318359375, -10.8109130859375, -10.3955078125, -9.9801025390625, -9.564697265625, -9.1492919921875, -8.73388671875, -8.3184814453125, -7.903076171875, -7.4876708984375, -7.072265625, -6.6568603515625, -6.241455078125, -5.8260498046875, -5.41064453125, -4.9952392578125, -4.579833984375, -4.1644287109375, -3.7490234375, -3.3336181640625, -2.918212890625, -2.5028076171875, -2.08740234375, -1.6719970703125, -1.256591796875, -0.8411865234375, -0.42578125, -0.0103759765625, 0.405029296875, 0.8204345703125, 1.23583984375, 1.6512451171875, 2.066650390625, 2.4820556640625, 2.8974609375, 3.3128662109375, 3.728271484375, 4.1436767578125, 4.55908203125, 4.9744873046875, 5.389892578125, 5.8052978515625, 6.220703125, 6.6361083984375, 7.051513671875, 7.4669189453125, 7.88232421875, 8.2977294921875, 8.713134765625, 9.1285400390625, 9.5439453125, 9.9593505859375, 10.374755859375, 10.7901611328125, 11.20556640625, 11.6209716796875, 12.036376953125, 12.4517822265625, 12.8671875]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 13.0, 80.0, 286.0, 366.0, 221.0, 45.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.412269592285156, -15.932291984558105, -13.452314376831055, -10.972336769104004, -8.492359161376953, -6.012381553649902, -3.5324039459228516, -1.0524253845214844, 1.42755126953125, 3.907528877258301, 6.387506484985352, 8.867484092712402, 11.347461700439453, 13.827439308166504, 16.307416915893555, 18.787395477294922, 21.267372131347656, 23.74734878540039, 26.227327346801758, 28.707305908203125, 31.18728256225586, 33.667259216308594, 36.147239685058594, 38.62721633911133, 41.10719299316406, 43.5871696472168, 46.06714630126953, 48.54712677001953, 51.027103424072266, 53.507080078125, 55.987060546875, 58.467037200927734, 60.947021484375, 63.426998138427734, 65.90697479248047, 68.38695526123047, 70.86692810058594, 73.34690856933594, 75.82688903808594, 78.30686950683594, 80.7868423461914, 83.2668228149414, 85.74679565429688, 88.22677612304688, 90.70675659179688, 93.18672943115234, 95.66670989990234, 98.14668273925781, 100.62666320800781, 103.10664367675781, 105.58661651611328, 108.06659698486328, 110.54656982421875, 113.02655029296875, 115.50653076171875, 117.98651123046875, 120.46648406982422, 122.94646453857422, 125.42643737792969, 127.90641784667969, 130.3863983154297, 132.8663787841797, 135.34634399414062, 137.82632446289062, 140.30630493164062]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 7.0, 5.0, 3.0, 10.0, 9.0, 9.0, 17.0, 24.0, 23.0, 27.0, 27.0, 21.0, 35.0, 39.0, 35.0, 32.0, 42.0, 36.0, 46.0, 51.0, 54.0, 35.0, 37.0, 50.0, 50.0, 39.0, 44.0, 25.0, 17.0, 30.0, 23.0, 24.0, 18.0, 16.0, 19.0, 3.0, 7.0, 8.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.12828254699707, -16.559585571289062, -15.990887641906738, -15.42219066619873, -14.853492736816406, -14.284795761108398, -13.71609878540039, -13.147401809692383, -12.578703880310059, -12.01000690460205, -11.441308975219727, -10.872611999511719, -10.303915023803711, -9.735217094421387, -9.166520118713379, -8.597822189331055, -8.029125213623047, -7.460427761077881, -6.891730308532715, -6.323033332824707, -5.754335880279541, -5.185638427734375, -4.616941452026367, -4.048243999481201, -3.479546546936035, -2.910849094390869, -2.3421518802642822, -1.7734545469284058, -1.2047572135925293, -0.6360597610473633, -0.06736254692077637, 0.5013346672058105, 1.0700340270996094, 1.6387313604354858, 2.2074286937713623, 2.776125907897949, 3.3448233604431152, 3.9135208129882812, 4.482217788696289, 5.050915241241455, 5.619612693786621, 6.188310146331787, 6.757007598876953, 7.325704574584961, 7.894402027130127, 8.463099479675293, 9.0317964553833, 9.600494384765625, 10.169191360473633, 10.73788833618164, 11.306586265563965, 11.875283241271973, 12.443981170654297, 13.012678146362305, 13.581375122070312, 14.15007209777832, 14.718770027160645, 15.287467002868652, 15.856164932250977, 16.424861907958984, 16.993558883666992, 17.562255859375, 18.13095474243164, 18.69965171813965, 19.268348693847656]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 8.0, 3.0, 4.0, 2.0, 14.0, 14.0, 11.0, 17.0, 17.0, 17.0, 25.0, 21.0, 20.0, 25.0, 25.0, 31.0, 43.0, 37.0, 41.0, 28.0, 44.0, 36.0, 37.0, 36.0, 48.0, 35.0, 39.0, 39.0, 38.0, 27.0, 25.0, 30.0, 20.0, 20.0, 24.0, 18.0, 23.0, 14.0, 7.0, 13.0, 9.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.326171875, -3.2264404296875, -3.126708984375, -3.0269775390625, -2.92724609375, -2.8275146484375, -2.727783203125, -2.6280517578125, -2.5283203125, -2.4285888671875, -2.328857421875, -2.2291259765625, -2.12939453125, -2.0296630859375, -1.929931640625, -1.8302001953125, -1.73046875, -1.6307373046875, -1.531005859375, -1.4312744140625, -1.33154296875, -1.2318115234375, -1.132080078125, -1.0323486328125, -0.9326171875, -0.8328857421875, -0.733154296875, -0.6334228515625, -0.53369140625, -0.4339599609375, -0.334228515625, -0.2344970703125, -0.134765625, -0.0350341796875, 0.064697265625, 0.1644287109375, 0.26416015625, 0.3638916015625, 0.463623046875, 0.5633544921875, 0.6630859375, 0.7628173828125, 0.862548828125, 0.9622802734375, 1.06201171875, 1.1617431640625, 1.261474609375, 1.3612060546875, 1.4609375, 1.5606689453125, 1.660400390625, 1.7601318359375, 1.85986328125, 1.9595947265625, 2.059326171875, 2.1590576171875, 2.2587890625, 2.3585205078125, 2.458251953125, 2.5579833984375, 2.65771484375, 2.7574462890625, 2.857177734375, 2.9569091796875, 3.056640625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 7.0, 15.0, 16.0, 23.0, 33.0, 42.0, 73.0, 100.0, 172.0, 225.0, 342.0, 575.0, 860.0, 1381.0, 2296.0, 3575.0, 6037.0, 10050.0, 16697.0, 28138.0, 46782.0, 75787.0, 117578.0, 166840.0, 183326.0, 142476.0, 94835.0, 59726.0, 36049.0, 21586.0, 12721.0, 7642.0, 4852.0, 2889.0, 1710.0, 1099.0, 698.0, 426.0, 295.0, 203.0, 131.0, 80.0, 56.0, 37.0, 25.0, 19.0, 12.0, 9.0, 4.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.2568359375, -0.248870849609375, -0.24090576171875, -0.232940673828125, -0.2249755859375, -0.217010498046875, -0.20904541015625, -0.201080322265625, -0.193115234375, -0.185150146484375, -0.17718505859375, -0.169219970703125, -0.1612548828125, -0.153289794921875, -0.14532470703125, -0.137359619140625, -0.12939453125, -0.121429443359375, -0.11346435546875, -0.105499267578125, -0.0975341796875, -0.089569091796875, -0.08160400390625, -0.073638916015625, -0.065673828125, -0.057708740234375, -0.04974365234375, -0.041778564453125, -0.0338134765625, -0.025848388671875, -0.01788330078125, -0.009918212890625, -0.001953125, 0.006011962890625, 0.01397705078125, 0.021942138671875, 0.0299072265625, 0.037872314453125, 0.04583740234375, 0.053802490234375, 0.061767578125, 0.069732666015625, 0.07769775390625, 0.085662841796875, 0.0936279296875, 0.101593017578125, 0.10955810546875, 0.117523193359375, 0.12548828125, 0.133453369140625, 0.14141845703125, 0.149383544921875, 0.1573486328125, 0.165313720703125, 0.17327880859375, 0.181243896484375, 0.189208984375, 0.197174072265625, 0.20513916015625, 0.213104248046875, 0.2210693359375, 0.229034423828125, 0.23699951171875, 0.244964599609375, 0.2529296875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 4.0, 7.0, 9.0, 9.0, 11.0, 15.0, 18.0, 17.0, 23.0, 21.0, 20.0, 25.0, 21.0, 26.0, 27.0, 46.0, 30.0, 53.0, 35.0, 36.0, 38.0, 1062.0, 38.0, 44.0, 36.0, 40.0, 45.0, 38.0, 27.0, 33.0, 18.0, 25.0, 22.0, 24.0, 11.0, 15.0, 9.0, 11.0, 7.0, 9.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-2.626953125, -2.54498291015625, -2.4630126953125, -2.38104248046875, -2.299072265625, -2.21710205078125, -2.1351318359375, -2.05316162109375, -1.97119140625, -1.88922119140625, -1.8072509765625, -1.72528076171875, -1.643310546875, -1.56134033203125, -1.4793701171875, -1.39739990234375, -1.3154296875, -1.23345947265625, -1.1514892578125, -1.06951904296875, -0.987548828125, -0.90557861328125, -0.8236083984375, -0.74163818359375, -0.65966796875, -0.57769775390625, -0.4957275390625, -0.41375732421875, -0.331787109375, -0.24981689453125, -0.1678466796875, -0.08587646484375, -0.00390625, 0.07806396484375, 0.1600341796875, 0.24200439453125, 0.323974609375, 0.40594482421875, 0.4879150390625, 0.56988525390625, 0.65185546875, 0.73382568359375, 0.8157958984375, 0.89776611328125, 0.979736328125, 1.06170654296875, 1.1436767578125, 1.22564697265625, 1.3076171875, 1.38958740234375, 1.4715576171875, 1.55352783203125, 1.635498046875, 1.71746826171875, 1.7994384765625, 1.88140869140625, 1.96337890625, 2.04534912109375, 2.1273193359375, 2.20928955078125, 2.291259765625, 2.37322998046875, 2.4552001953125, 2.53717041015625, 2.619140625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 7.0, 9.0, 17.0, 35.0, 49.0, 72.0, 107.0, 172.0, 297.0, 480.0, 783.0, 1257.0, 2231.0, 3825.0, 6571.0, 11590.0, 19731.0, 33729.0, 56704.0, 90713.0, 136011.0, 1116669.0, 276716.0, 128357.0, 84693.0, 52102.0, 31107.0, 18215.0, 10281.0, 6008.0, 3478.0, 2032.0, 1185.0, 752.0, 462.0, 227.0, 157.0, 113.0, 75.0, 36.0, 29.0, 20.0, 13.0, 10.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1417236328125, -0.13664817810058594, -0.13157272338867188, -0.1264972686767578, -0.12142181396484375, -0.11634635925292969, -0.11127090454101562, -0.10619544982910156, -0.1011199951171875, -0.09604454040527344, -0.09096908569335938, -0.08589363098144531, -0.08081817626953125, -0.07574272155761719, -0.07066726684570312, -0.06559181213378906, -0.060516357421875, -0.05544090270996094, -0.050365447998046875, -0.04528999328613281, -0.04021453857421875, -0.03513908386230469, -0.030063629150390625, -0.024988174438476562, -0.0199127197265625, -0.014837265014648438, -0.009761810302734375, -0.0046863555908203125, 0.00038909912109375, 0.0054645538330078125, 0.010540008544921875, 0.015615463256835938, 0.02069091796875, 0.025766372680664062, 0.030841827392578125, 0.03591728210449219, 0.04099273681640625, 0.04606819152832031, 0.051143646240234375, 0.05621910095214844, 0.0612945556640625, 0.06637001037597656, 0.07144546508789062, 0.07652091979980469, 0.08159637451171875, 0.08667182922363281, 0.09174728393554688, 0.09682273864746094, 0.101898193359375, 0.10697364807128906, 0.11204910278320312, 0.11712455749511719, 0.12220001220703125, 0.1272754669189453, 0.13235092163085938, 0.13742637634277344, 0.1425018310546875, 0.14757728576660156, 0.15265274047851562, 0.1577281951904297, 0.16280364990234375, 0.1678791046142578, 0.17295455932617188, 0.17803001403808594, 0.18310546875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 3.0, 9.0, 12.0, 6.0, 14.0, 24.0, 23.0, 15.0, 29.0, 26.0, 43.0, 68.0, 85.0, 137.0, 128.0, 95.0, 53.0, 46.0, 28.0, 29.0, 20.0, 22.0, 16.0, 14.0, 8.0, 9.0, 8.0, 9.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.007022857666015625, -0.006780445575714111, -0.006538033485412598, -0.006295621395111084, -0.00605320930480957, -0.005810797214508057, -0.005568385124206543, -0.005325973033905029, -0.005083560943603516, -0.004841148853302002, -0.004598736763000488, -0.004356324672698975, -0.004113912582397461, -0.0038715004920959473, -0.0036290884017944336, -0.00338667631149292, -0.0031442642211914062, -0.0029018521308898926, -0.002659440040588379, -0.0024170279502868652, -0.0021746158599853516, -0.0019322037696838379, -0.0016897916793823242, -0.0014473795890808105, -0.0012049674987792969, -0.0009625554084777832, -0.0007201433181762695, -0.00047773122787475586, -0.0002353191375732422, 7.092952728271484e-06, 0.00024950504302978516, 0.0004919171333312988, 0.0007343292236328125, 0.0009767413139343262, 0.0012191534042358398, 0.0014615654945373535, 0.0017039775848388672, 0.0019463896751403809, 0.0021888017654418945, 0.002431213855743408, 0.002673625946044922, 0.0029160380363464355, 0.0031584501266479492, 0.003400862216949463, 0.0036432743072509766, 0.0038856863975524902, 0.004128098487854004, 0.004370510578155518, 0.004612922668457031, 0.004855334758758545, 0.005097746849060059, 0.005340158939361572, 0.005582571029663086, 0.0058249831199646, 0.006067395210266113, 0.006309807300567627, 0.006552219390869141, 0.006794631481170654, 0.007037043571472168, 0.007279455661773682, 0.007521867752075195, 0.007764279842376709, 0.008006691932678223, 0.008249104022979736, 0.00849151611328125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 4.0, 7.0, 10.0, 11.0, 8.0, 1.0, 15.0, 21.0, 20.0, 30.0, 43.0, 65.0, 92.0, 143.0, 274.0, 877.0, 845205.0, 200271.0, 784.0, 243.0, 125.0, 88.0, 58.0, 30.0, 28.0, 27.0, 16.0, 13.0, 11.0, 15.0, 6.0, 5.0, 0.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.18359375, -0.17833900451660156, -0.17308425903320312, -0.1678295135498047, -0.16257476806640625, -0.1573200225830078, -0.15206527709960938, -0.14681053161621094, -0.1415557861328125, -0.13630104064941406, -0.13104629516601562, -0.1257915496826172, -0.12053680419921875, -0.11528205871582031, -0.11002731323242188, -0.10477256774902344, -0.099517822265625, -0.09426307678222656, -0.08900833129882812, -0.08375358581542969, -0.07849884033203125, -0.07324409484863281, -0.06798934936523438, -0.06273460388183594, -0.0574798583984375, -0.05222511291503906, -0.046970367431640625, -0.04171562194824219, -0.03646087646484375, -0.031206130981445312, -0.025951385498046875, -0.020696640014648438, -0.01544189453125, -0.010187149047851562, -0.004932403564453125, 0.0003223419189453125, 0.00557708740234375, 0.010831832885742188, 0.016086578369140625, 0.021341323852539062, 0.0265960693359375, 0.03185081481933594, 0.037105560302734375, 0.04236030578613281, 0.04761505126953125, 0.05286979675292969, 0.058124542236328125, 0.06337928771972656, 0.068634033203125, 0.07388877868652344, 0.07914352416992188, 0.08439826965332031, 0.08965301513671875, 0.09490776062011719, 0.10016250610351562, 0.10541725158691406, 0.1106719970703125, 0.11592674255371094, 0.12118148803710938, 0.1264362335205078, 0.13169097900390625, 0.1369457244873047, 0.14220046997070312, 0.14745521545410156, 0.1527099609375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 9.0, 18.0, 28.0, 93.0, 399.0, 376.0, 64.0, 15.0, 10.0, 2.0], "bins": [-0.06621676683425903, -0.06509514153003693, -0.06397351622581482, -0.06285188347101212, -0.06173025816679001, -0.0606086328625679, -0.059487007558345795, -0.05836538225412369, -0.05724375322461128, -0.056122127920389175, -0.05500049889087677, -0.05387887358665466, -0.052757248282432556, -0.05163561925292015, -0.050513993948698044, -0.04939236491918564, -0.04827073961496353, -0.047149114310741425, -0.04602748528122902, -0.04490585997700691, -0.04378423094749451, -0.0426626056432724, -0.04154098033905029, -0.040419355034828186, -0.03929772600531578, -0.038176100701093674, -0.03705447167158127, -0.03593284636735916, -0.034811221063137054, -0.03368959203362465, -0.03256796672940254, -0.03144633769989014, -0.03032471239566803, -0.029203085228800774, -0.028081458061933517, -0.02695983275771141, -0.025838205590844154, -0.024716578423976898, -0.02359495311975479, -0.022473325952887535, -0.02135169878602028, -0.020230071619153023, -0.019108444452285767, -0.01798681914806366, -0.016865191981196404, -0.015743564814329147, -0.014621938578784466, -0.013500312343239784, -0.012378685176372528, -0.011257058009505272, -0.01013543177396059, -0.009013805538415909, -0.007892178371548653, -0.006770551670342684, -0.005648924969136715, -0.004527298733592033, -0.00340567110106349, -0.002284044399857521, -0.0011624176986515522, -4.0790997445583344e-05, 0.0010808357037603855, 0.0022024624049663544, 0.0033240891061723232, 0.004445715341717005, 0.005567342508584261]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 5.0, 4.0, 2.0, 2.0, 5.0, 11.0, 17.0, 8.0, 11.0, 19.0, 10.0, 22.0, 17.0, 24.0, 25.0, 29.0, 31.0, 30.0, 31.0, 52.0, 40.0, 40.0, 41.0, 54.0, 40.0, 38.0, 35.0, 34.0, 29.0, 38.0, 25.0, 39.0, 27.0, 29.0, 23.0, 24.0, 16.0, 14.0, 15.0, 17.0, 13.0, 4.0, 7.0, 5.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.01119309663772583, -0.010841550305485725, -0.01049000397324562, -0.010138457641005516, -0.009786911308765411, -0.009435364976525307, -0.009083818644285202, -0.008732272312045097, -0.008380725979804993, -0.008029179647564888, -0.007677633315324783, -0.007326086983084679, -0.006974540650844574, -0.006622994318604469, -0.006271447986364365, -0.00591990165412426, -0.005568355321884155, -0.005216808989644051, -0.004865262657403946, -0.004513716325163841, -0.004162169992923737, -0.003810623660683632, -0.0034590773284435272, -0.0031075309962034225, -0.002755984663963318, -0.002404438331723213, -0.0020528919994831085, -0.0017013456672430038, -0.0013497993350028992, -0.0009982530027627945, -0.0006467066705226898, -0.00029516033828258514, 5.638599395751953e-05, 0.0004079323261976242, 0.0007594786584377289, 0.0011110249906778336, 0.0014625713229179382, 0.001814117655158043, 0.0021656639873981476, 0.0025172103196382523, 0.002868756651878357, 0.0032203029841184616, 0.0035718493163585663, 0.003923395648598671, 0.004274941980838776, 0.00462648831307888, 0.004978034645318985, 0.00532958097755909, 0.005681127309799194, 0.006032673642039299, 0.006384219974279404, 0.006735766306519508, 0.007087312638759613, 0.007438858970999718, 0.007790405303239822, 0.008141951635479927, 0.008493497967720032, 0.008845044299960136, 0.009196590632200241, 0.009548136964440346, 0.00989968329668045, 0.010251229628920555, 0.01060277596116066, 0.010954322293400764, 0.01130586862564087]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 8.0, 3.0, 4.0, 3.0, 13.0, 14.0, 11.0, 16.0, 18.0, 17.0, 27.0, 19.0, 20.0, 26.0, 24.0, 31.0, 43.0, 37.0, 41.0, 28.0, 45.0, 35.0, 37.0, 36.0, 48.0, 35.0, 39.0, 39.0, 39.0, 26.0, 25.0, 30.0, 20.0, 21.0, 23.0, 20.0, 21.0, 14.0, 7.0, 13.0, 9.0, 8.0, 3.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.326171875, -3.226409912109375, -3.12664794921875, -3.026885986328125, -2.9271240234375, -2.827362060546875, -2.72760009765625, -2.627838134765625, -2.528076171875, -2.428314208984375, -2.32855224609375, -2.228790283203125, -2.1290283203125, -2.029266357421875, -1.92950439453125, -1.829742431640625, -1.72998046875, -1.630218505859375, -1.53045654296875, -1.430694580078125, -1.3309326171875, -1.231170654296875, -1.13140869140625, -1.031646728515625, -0.931884765625, -0.832122802734375, -0.73236083984375, -0.632598876953125, -0.5328369140625, -0.433074951171875, -0.33331298828125, -0.233551025390625, -0.1337890625, -0.034027099609375, 0.06573486328125, 0.165496826171875, 0.2652587890625, 0.365020751953125, 0.46478271484375, 0.564544677734375, 0.664306640625, 0.764068603515625, 0.86383056640625, 0.963592529296875, 1.0633544921875, 1.163116455078125, 1.26287841796875, 1.362640380859375, 1.46240234375, 1.562164306640625, 1.66192626953125, 1.761688232421875, 1.8614501953125, 1.961212158203125, 2.06097412109375, 2.160736083984375, 2.260498046875, 2.360260009765625, 2.46002197265625, 2.559783935546875, 2.6595458984375, 2.759307861328125, 2.85906982421875, 2.958831787109375, 3.05859375]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 5.0, 7.0, 4.0, 5.0, 11.0, 15.0, 14.0, 23.0, 34.0, 50.0, 59.0, 74.0, 67.0, 123.0, 142.0, 190.0, 292.0, 450.0, 761.0, 1615.0, 4397.0, 12715.0, 36310.0, 139187.0, 634585.0, 156496.0, 38649.0, 13411.0, 4702.0, 1736.0, 812.0, 461.0, 307.0, 195.0, 146.0, 117.0, 91.0, 85.0, 57.0, 34.0, 41.0, 20.0, 21.0, 12.0, 12.0, 2.0, 8.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-6.9453125, -6.7318115234375, -6.518310546875, -6.3048095703125, -6.09130859375, -5.8778076171875, -5.664306640625, -5.4508056640625, -5.2373046875, -5.0238037109375, -4.810302734375, -4.5968017578125, -4.38330078125, -4.1697998046875, -3.956298828125, -3.7427978515625, -3.529296875, -3.3157958984375, -3.102294921875, -2.8887939453125, -2.67529296875, -2.4617919921875, -2.248291015625, -2.0347900390625, -1.8212890625, -1.6077880859375, -1.394287109375, -1.1807861328125, -0.96728515625, -0.7537841796875, -0.540283203125, -0.3267822265625, -0.11328125, 0.1002197265625, 0.313720703125, 0.5272216796875, 0.74072265625, 0.9542236328125, 1.167724609375, 1.3812255859375, 1.5947265625, 1.8082275390625, 2.021728515625, 2.2352294921875, 2.44873046875, 2.6622314453125, 2.875732421875, 3.0892333984375, 3.302734375, 3.5162353515625, 3.729736328125, 3.9432373046875, 4.15673828125, 4.3702392578125, 4.583740234375, 4.7972412109375, 5.0107421875, 5.2242431640625, 5.437744140625, 5.6512451171875, 5.86474609375, 6.0782470703125, 6.291748046875, 6.5052490234375, 6.71875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 7.0, 11.0, 13.0, 16.0, 17.0, 18.0, 15.0, 30.0, 33.0, 39.0, 49.0, 32.0, 44.0, 48.0, 77.0, 164.0, 1483.0, 351.0, 134.0, 69.0, 54.0, 45.0, 48.0, 45.0, 28.0, 33.0, 24.0, 19.0, 14.0, 14.0, 18.0, 11.0, 10.0, 9.0, 4.0, 4.0, 6.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.203125, -10.8720703125, -10.541015625, -10.2099609375, -9.87890625, -9.5478515625, -9.216796875, -8.8857421875, -8.5546875, -8.2236328125, -7.892578125, -7.5615234375, -7.23046875, -6.8994140625, -6.568359375, -6.2373046875, -5.90625, -5.5751953125, -5.244140625, -4.9130859375, -4.58203125, -4.2509765625, -3.919921875, -3.5888671875, -3.2578125, -2.9267578125, -2.595703125, -2.2646484375, -1.93359375, -1.6025390625, -1.271484375, -0.9404296875, -0.609375, -0.2783203125, 0.052734375, 0.3837890625, 0.71484375, 1.0458984375, 1.376953125, 1.7080078125, 2.0390625, 2.3701171875, 2.701171875, 3.0322265625, 3.36328125, 3.6943359375, 4.025390625, 4.3564453125, 4.6875, 5.0185546875, 5.349609375, 5.6806640625, 6.01171875, 6.3427734375, 6.673828125, 7.0048828125, 7.3359375, 7.6669921875, 7.998046875, 8.3291015625, 8.66015625, 8.9912109375, 9.322265625, 9.6533203125, 9.984375]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 8.0, 11.0, 9.0, 12.0, 20.0, 26.0, 23.0, 27.0, 33.0, 45.0, 67.0, 103.0, 121.0, 216.0, 470.0, 1406.0, 17178.0, 2902912.0, 217244.0, 4065.0, 773.0, 315.0, 154.0, 97.0, 91.0, 53.0, 50.0, 39.0, 23.0, 19.0, 9.0, 22.0, 12.0, 11.0, 8.0, 7.0, 3.0, 6.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.15625, -22.37841796875, -21.6005859375, -20.82275390625, -20.044921875, -19.26708984375, -18.4892578125, -17.71142578125, -16.93359375, -16.15576171875, -15.3779296875, -14.60009765625, -13.822265625, -13.04443359375, -12.2666015625, -11.48876953125, -10.7109375, -9.93310546875, -9.1552734375, -8.37744140625, -7.599609375, -6.82177734375, -6.0439453125, -5.26611328125, -4.48828125, -3.71044921875, -2.9326171875, -2.15478515625, -1.376953125, -0.59912109375, 0.1787109375, 0.95654296875, 1.734375, 2.51220703125, 3.2900390625, 4.06787109375, 4.845703125, 5.62353515625, 6.4013671875, 7.17919921875, 7.95703125, 8.73486328125, 9.5126953125, 10.29052734375, 11.068359375, 11.84619140625, 12.6240234375, 13.40185546875, 14.1796875, 14.95751953125, 15.7353515625, 16.51318359375, 17.291015625, 18.06884765625, 18.8466796875, 19.62451171875, 20.40234375, 21.18017578125, 21.9580078125, 22.73583984375, 23.513671875, 24.29150390625, 25.0693359375, 25.84716796875, 26.625]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 15.0, 258.0, 545.0, 187.0, 14.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-113.48046112060547, -111.2283706665039, -108.97628021240234, -106.72418975830078, -104.47209930419922, -102.22000122070312, -99.96791076660156, -97.7158203125, -95.46372985839844, -93.21163940429688, -90.95954895019531, -88.70745849609375, -86.45536804199219, -84.20327758789062, -81.95118713378906, -79.69908905029297, -77.44700622558594, -75.19491577148438, -72.94282531738281, -70.69073486328125, -68.43864440917969, -66.18655395507812, -63.9344596862793, -61.682369232177734, -59.430274963378906, -57.178184509277344, -54.92609405517578, -52.67400360107422, -50.42190933227539, -48.16981887817383, -45.917728424072266, -43.6656379699707, -41.413543701171875, -39.16145324707031, -36.90936279296875, -34.65727233886719, -32.40517807006836, -30.153087615966797, -27.900997161865234, -25.648906707763672, -23.396814346313477, -21.144723892211914, -18.89263153076172, -16.640541076660156, -14.388449668884277, -12.136358261108398, -9.884267807006836, -7.632176399230957, -5.380084991455078, -3.1279938220977783, -0.8759026527404785, 1.3761882781982422, 3.628279685974121, 5.88037109375, 8.132461547851562, 10.384552955627441, 12.63664436340332, 14.8887357711792, 17.140827178955078, 19.39291763305664, 21.645008087158203, 23.8971004486084, 26.14919090270996, 28.401283264160156, 30.65337371826172]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 4.0, 8.0, 9.0, 13.0, 10.0, 20.0, 10.0, 28.0, 16.0, 28.0, 30.0, 15.0, 35.0, 38.0, 26.0, 38.0, 44.0, 53.0, 43.0, 41.0, 36.0, 25.0, 36.0, 38.0, 30.0, 36.0, 36.0, 35.0, 37.0, 30.0, 31.0, 18.0, 18.0, 20.0, 12.0, 14.0, 8.0, 9.0, 5.0, 2.0, 6.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.002716064453125, -25.202999114990234, -24.403282165527344, -23.603565216064453, -22.803848266601562, -22.004131317138672, -21.20441436767578, -20.40469741821289, -19.60498046875, -18.80526351928711, -18.00554656982422, -17.205829620361328, -16.406112670898438, -15.606395721435547, -14.806678771972656, -14.006961822509766, -13.207244873046875, -12.407527923583984, -11.607810974121094, -10.808094024658203, -10.008377075195312, -9.208660125732422, -8.408943176269531, -7.609226226806641, -6.80950927734375, -6.009792327880859, -5.210075378417969, -4.410358428955078, -3.6106414794921875, -2.810924530029297, -2.0112075805664062, -1.2114906311035156, -0.4117717742919922, 0.38794517517089844, 1.187662124633789, 1.9873790740966797, 2.7870960235595703, 3.586812973022461, 4.386529922485352, 5.186246871948242, 5.985963821411133, 6.785680770874023, 7.585397720336914, 8.385114669799805, 9.184831619262695, 9.984548568725586, 10.784265518188477, 11.583982467651367, 12.383699417114258, 13.183416366577148, 13.983133316040039, 14.78285026550293, 15.58256721496582, 16.38228416442871, 17.1820011138916, 17.981718063354492, 18.781435012817383, 19.581151962280273, 20.380868911743164, 21.180585861206055, 21.980302810668945, 22.780019760131836, 23.579736709594727, 24.379453659057617, 25.179170608520508]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 4.0, 5.0, 2.0, 9.0, 16.0, 16.0, 19.0, 19.0, 22.0, 17.0, 23.0, 27.0, 33.0, 28.0, 33.0, 33.0, 45.0, 32.0, 32.0, 39.0, 44.0, 43.0, 38.0, 41.0, 40.0, 34.0, 45.0, 31.0, 35.0, 20.0, 28.0, 25.0, 24.0, 18.0, 14.0, 13.0, 15.0, 10.0, 7.0, 3.0, 6.0, 5.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0], "bins": [-3.779296875, -3.673583984375, -3.56787109375, -3.462158203125, -3.3564453125, -3.250732421875, -3.14501953125, -3.039306640625, -2.93359375, -2.827880859375, -2.72216796875, -2.616455078125, -2.5107421875, -2.405029296875, -2.29931640625, -2.193603515625, -2.087890625, -1.982177734375, -1.87646484375, -1.770751953125, -1.6650390625, -1.559326171875, -1.45361328125, -1.347900390625, -1.2421875, -1.136474609375, -1.03076171875, -0.925048828125, -0.8193359375, -0.713623046875, -0.60791015625, -0.502197265625, -0.396484375, -0.290771484375, -0.18505859375, -0.079345703125, 0.0263671875, 0.132080078125, 0.23779296875, 0.343505859375, 0.44921875, 0.554931640625, 0.66064453125, 0.766357421875, 0.8720703125, 0.977783203125, 1.08349609375, 1.189208984375, 1.294921875, 1.400634765625, 1.50634765625, 1.612060546875, 1.7177734375, 1.823486328125, 1.92919921875, 2.034912109375, 2.140625, 2.246337890625, 2.35205078125, 2.457763671875, 2.5634765625, 2.669189453125, 2.77490234375, 2.880615234375, 2.986328125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 6.0, 10.0, 4.0, 12.0, 6.0, 6.0, 20.0, 17.0, 22.0, 49.0, 50.0, 63.0, 115.0, 173.0, 300.0, 736.0, 1593.0, 4476.0, 14634.0, 51545.0, 198292.0, 761584.0, 1801572.0, 994937.0, 266519.0, 68447.0, 19065.0, 5874.0, 2184.0, 874.0, 453.0, 204.0, 139.0, 80.0, 60.0, 34.0, 25.0, 23.0, 15.0, 20.0, 7.0, 9.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.16015625, -4.0196533203125, -3.879150390625, -3.7386474609375, -3.59814453125, -3.4576416015625, -3.317138671875, -3.1766357421875, -3.0361328125, -2.8956298828125, -2.755126953125, -2.6146240234375, -2.47412109375, -2.3336181640625, -2.193115234375, -2.0526123046875, -1.912109375, -1.7716064453125, -1.631103515625, -1.4906005859375, -1.35009765625, -1.2095947265625, -1.069091796875, -0.9285888671875, -0.7880859375, -0.6475830078125, -0.507080078125, -0.3665771484375, -0.22607421875, -0.0855712890625, 0.054931640625, 0.1954345703125, 0.3359375, 0.4764404296875, 0.616943359375, 0.7574462890625, 0.89794921875, 1.0384521484375, 1.178955078125, 1.3194580078125, 1.4599609375, 1.6004638671875, 1.740966796875, 1.8814697265625, 2.02197265625, 2.1624755859375, 2.302978515625, 2.4434814453125, 2.583984375, 2.7244873046875, 2.864990234375, 3.0054931640625, 3.14599609375, 3.2864990234375, 3.427001953125, 3.5675048828125, 3.7080078125, 3.8485107421875, 3.989013671875, 4.1295166015625, 4.27001953125, 4.4105224609375, 4.551025390625, 4.6915283203125, 4.83203125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 5.0, 7.0, 5.0, 10.0, 16.0, 25.0, 33.0, 40.0, 47.0, 90.0, 103.0, 155.0, 235.0, 354.0, 445.0, 524.0, 527.0, 392.0, 295.0, 225.0, 171.0, 121.0, 74.0, 44.0, 44.0, 30.0, 19.0, 14.0, 16.0, 10.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.85528564453125, -3.6715087890625, -3.48773193359375, -3.303955078125, -3.12017822265625, -2.9364013671875, -2.75262451171875, -2.56884765625, -2.38507080078125, -2.2012939453125, -2.01751708984375, -1.833740234375, -1.64996337890625, -1.4661865234375, -1.28240966796875, -1.0986328125, -0.91485595703125, -0.7310791015625, -0.54730224609375, -0.363525390625, -0.17974853515625, 0.0040283203125, 0.18780517578125, 0.37158203125, 0.55535888671875, 0.7391357421875, 0.92291259765625, 1.106689453125, 1.29046630859375, 1.4742431640625, 1.65802001953125, 1.841796875, 2.02557373046875, 2.2093505859375, 2.39312744140625, 2.576904296875, 2.76068115234375, 2.9444580078125, 3.12823486328125, 3.31201171875, 3.49578857421875, 3.6795654296875, 3.86334228515625, 4.047119140625, 4.23089599609375, 4.4146728515625, 4.59844970703125, 4.7822265625, 4.96600341796875, 5.1497802734375, 5.33355712890625, 5.517333984375, 5.70111083984375, 5.8848876953125, 6.06866455078125, 6.25244140625, 6.43621826171875, 6.6199951171875, 6.80377197265625, 6.987548828125, 7.17132568359375, 7.3551025390625, 7.53887939453125, 7.72265625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 4.0, 2.0, 12.0, 15.0, 18.0, 32.0, 43.0, 55.0, 95.0, 163.0, 263.0, 455.0, 946.0, 4022.0, 53907.0, 2128473.0, 1950408.0, 49497.0, 3836.0, 909.0, 410.0, 231.0, 178.0, 93.0, 78.0, 45.0, 38.0, 18.0, 13.0, 11.0, 7.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 3.0], "bins": [-21.234375, -20.7286376953125, -20.222900390625, -19.7171630859375, -19.21142578125, -18.7056884765625, -18.199951171875, -17.6942138671875, -17.1884765625, -16.6827392578125, -16.177001953125, -15.6712646484375, -15.16552734375, -14.6597900390625, -14.154052734375, -13.6483154296875, -13.142578125, -12.6368408203125, -12.131103515625, -11.6253662109375, -11.11962890625, -10.6138916015625, -10.108154296875, -9.6024169921875, -9.0966796875, -8.5909423828125, -8.085205078125, -7.5794677734375, -7.07373046875, -6.5679931640625, -6.062255859375, -5.5565185546875, -5.05078125, -4.5450439453125, -4.039306640625, -3.5335693359375, -3.02783203125, -2.5220947265625, -2.016357421875, -1.5106201171875, -1.0048828125, -0.4991455078125, 0.006591796875, 0.5123291015625, 1.01806640625, 1.5238037109375, 2.029541015625, 2.5352783203125, 3.041015625, 3.5467529296875, 4.052490234375, 4.5582275390625, 5.06396484375, 5.5697021484375, 6.075439453125, 6.5811767578125, 7.0869140625, 7.5926513671875, 8.098388671875, 8.6041259765625, 9.10986328125, 9.6156005859375, 10.121337890625, 10.6270751953125, 11.1328125]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 14.0, 87.0, 216.0, 356.0, 241.0, 83.0, 16.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.1852798461914, -78.83224487304688, -76.47920227050781, -74.12616729736328, -71.77313232421875, -69.42008972167969, -67.06705474853516, -64.71401977539062, -62.36097717285156, -60.007938385009766, -57.65489959716797, -55.30186462402344, -52.94882583618164, -50.595787048339844, -48.24275207519531, -45.889713287353516, -43.53667449951172, -41.18363571166992, -38.830596923828125, -36.477561950683594, -34.1245231628418, -31.771484375, -29.418447494506836, -27.065410614013672, -24.712371826171875, -22.359333038330078, -20.006296157836914, -17.65325927734375, -15.300220489501953, -12.947182655334473, -10.594144821166992, -8.241107940673828, -5.8880615234375, -3.5350236892700195, -1.181985855102539, 1.1710519790649414, 3.524089813232422, 5.877127647399902, 8.230165481567383, 10.583202362060547, 12.936241149902344, 15.289278984069824, 17.642316818237305, 19.99535369873047, 22.348392486572266, 24.701431274414062, 27.054468154907227, 29.40750503540039, 31.760543823242188, 34.113582611083984, 36.46662139892578, 38.81965637207031, 41.17269515991211, 43.525733947753906, 45.87876892089844, 48.231807708740234, 50.58484649658203, 52.93788528442383, 55.290924072265625, 57.643959045410156, 59.99699783325195, 62.35003662109375, 64.70307159423828, 67.05610656738281, 69.40914916992188]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 0.0, 4.0, 8.0, 2.0, 2.0, 4.0, 7.0, 9.0, 10.0, 13.0, 19.0, 22.0, 27.0, 13.0, 32.0, 38.0, 40.0, 32.0, 41.0, 51.0, 39.0, 35.0, 45.0, 49.0, 60.0, 41.0, 40.0, 44.0, 36.0, 28.0, 29.0, 25.0, 22.0, 19.0, 27.0, 20.0, 15.0, 10.0, 10.0, 5.0, 10.0, 10.0, 3.0, 4.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.829551696777344, -18.26865577697754, -17.707761764526367, -17.146865844726562, -16.585969924926758, -16.025075912475586, -15.464179992675781, -14.903285026550293, -14.342390060424805, -13.781495094299316, -13.220599174499512, -12.659704208374023, -12.098809242248535, -11.537914276123047, -10.977018356323242, -10.416123390197754, -9.85522747039795, -9.294332504272461, -8.733436584472656, -8.172541618347168, -7.61164665222168, -7.050751209259033, -6.489855766296387, -5.928960800170898, -5.368065357208252, -4.8071699142456055, -4.246274948120117, -3.6853795051574707, -3.1244843006134033, -2.563589096069336, -2.0026936531066895, -1.441798448562622, -0.8809032440185547, -0.32000797986984253, 0.24088728427886963, 0.8017826080322266, 1.362677812576294, 1.9235730171203613, 2.484468460083008, 3.045363664627075, 3.6062588691711426, 4.167154312133789, 4.728049278259277, 5.288944721221924, 5.84984016418457, 6.410735130310059, 6.971630573272705, 7.532526016235352, 8.09342098236084, 8.654315948486328, 9.215211868286133, 9.776106834411621, 10.33700180053711, 10.897897720336914, 11.458792686462402, 12.01968765258789, 12.580583572387695, 13.141478538513184, 13.702374458312988, 14.263269424438477, 14.824164390563965, 15.385059356689453, 15.945955276489258, 16.506851196289062, 17.067745208740234]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 1.0, 2.0, 3.0, 3.0, 7.0, 13.0, 9.0, 10.0, 11.0, 14.0, 14.0, 16.0, 27.0, 24.0, 25.0, 30.0, 36.0, 41.0, 33.0, 35.0, 39.0, 33.0, 53.0, 48.0, 38.0, 35.0, 36.0, 37.0, 43.0, 26.0, 36.0, 19.0, 28.0, 33.0, 29.0, 15.0, 22.0, 11.0, 11.0, 12.0, 11.0, 9.0, 3.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.364349365234375, -3.25799560546875, -3.151641845703125, -3.0452880859375, -2.938934326171875, -2.83258056640625, -2.726226806640625, -2.619873046875, -2.513519287109375, -2.40716552734375, -2.300811767578125, -2.1944580078125, -2.088104248046875, -1.98175048828125, -1.875396728515625, -1.76904296875, -1.662689208984375, -1.55633544921875, -1.449981689453125, -1.3436279296875, -1.237274169921875, -1.13092041015625, -1.024566650390625, -0.918212890625, -0.811859130859375, -0.70550537109375, -0.599151611328125, -0.4927978515625, -0.386444091796875, -0.28009033203125, -0.173736572265625, -0.0673828125, 0.038970947265625, 0.14532470703125, 0.251678466796875, 0.3580322265625, 0.464385986328125, 0.57073974609375, 0.677093505859375, 0.783447265625, 0.889801025390625, 0.99615478515625, 1.102508544921875, 1.2088623046875, 1.315216064453125, 1.42156982421875, 1.527923583984375, 1.63427734375, 1.740631103515625, 1.84698486328125, 1.953338623046875, 2.0596923828125, 2.166046142578125, 2.27239990234375, 2.378753662109375, 2.485107421875, 2.591461181640625, 2.69781494140625, 2.804168701171875, 2.9105224609375, 3.016876220703125, 3.12322998046875, 3.229583740234375, 3.3359375]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 4.0, 21.0, 26.0, 26.0, 53.0, 74.0, 151.0, 229.0, 407.0, 646.0, 1116.0, 1897.0, 3238.0, 5441.0, 9317.0, 15498.0, 25680.0, 42363.0, 69383.0, 111652.0, 164797.0, 191471.0, 151907.0, 98741.0, 61108.0, 37344.0, 22649.0, 13637.0, 7872.0, 4884.0, 2822.0, 1622.0, 1039.0, 557.0, 343.0, 198.0, 118.0, 77.0, 64.0, 26.0, 23.0, 12.0, 3.0, 4.0, 4.0, 5.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2352294921875, -0.22693824768066406, -0.21864700317382812, -0.2103557586669922, -0.20206451416015625, -0.1937732696533203, -0.18548202514648438, -0.17719078063964844, -0.1688995361328125, -0.16060829162597656, -0.15231704711914062, -0.1440258026123047, -0.13573455810546875, -0.1274433135986328, -0.11915206909179688, -0.11086082458496094, -0.102569580078125, -0.09427833557128906, -0.08598709106445312, -0.07769584655761719, -0.06940460205078125, -0.06111335754394531, -0.052822113037109375, -0.04453086853027344, -0.0362396240234375, -0.027948379516601562, -0.019657135009765625, -0.011365890502929688, -0.00307464599609375, 0.0052165985107421875, 0.013507843017578125, 0.021799087524414062, 0.03009033203125, 0.03838157653808594, 0.046672821044921875, 0.05496406555175781, 0.06325531005859375, 0.07154655456542969, 0.07983779907226562, 0.08812904357910156, 0.0964202880859375, 0.10471153259277344, 0.11300277709960938, 0.12129402160644531, 0.12958526611328125, 0.1378765106201172, 0.14616775512695312, 0.15445899963378906, 0.162750244140625, 0.17104148864746094, 0.17933273315429688, 0.1876239776611328, 0.19591522216796875, 0.2042064666748047, 0.21249771118164062, 0.22078895568847656, 0.2290802001953125, 0.23737144470214844, 0.24566268920898438, 0.2539539337158203, 0.26224517822265625, 0.2705364227294922, 0.2788276672363281, 0.28711891174316406, 0.29541015625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 0.0, 3.0, 7.0, 3.0, 3.0, 10.0, 12.0, 9.0, 13.0, 14.0, 25.0, 21.0, 18.0, 23.0, 29.0, 43.0, 28.0, 47.0, 39.0, 37.0, 36.0, 42.0, 1070.0, 44.0, 39.0, 50.0, 43.0, 46.0, 29.0, 31.0, 28.0, 38.0, 19.0, 23.0, 18.0, 15.0, 9.0, 19.0, 13.0, 8.0, 5.0, 9.0, 0.0, 9.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.908203125, -2.8262939453125, -2.744384765625, -2.6624755859375, -2.58056640625, -2.4986572265625, -2.416748046875, -2.3348388671875, -2.2529296875, -2.1710205078125, -2.089111328125, -2.0072021484375, -1.92529296875, -1.8433837890625, -1.761474609375, -1.6795654296875, -1.59765625, -1.5157470703125, -1.433837890625, -1.3519287109375, -1.27001953125, -1.1881103515625, -1.106201171875, -1.0242919921875, -0.9423828125, -0.8604736328125, -0.778564453125, -0.6966552734375, -0.61474609375, -0.5328369140625, -0.450927734375, -0.3690185546875, -0.287109375, -0.2052001953125, -0.123291015625, -0.0413818359375, 0.04052734375, 0.1224365234375, 0.204345703125, 0.2862548828125, 0.3681640625, 0.4500732421875, 0.531982421875, 0.6138916015625, 0.69580078125, 0.7777099609375, 0.859619140625, 0.9415283203125, 1.0234375, 1.1053466796875, 1.187255859375, 1.2691650390625, 1.35107421875, 1.4329833984375, 1.514892578125, 1.5968017578125, 1.6787109375, 1.7606201171875, 1.842529296875, 1.9244384765625, 2.00634765625, 2.0882568359375, 2.170166015625, 2.2520751953125, 2.333984375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 6.0, 0.0, 3.0, 7.0, 13.0, 12.0, 21.0, 32.0, 57.0, 76.0, 101.0, 171.0, 239.0, 378.0, 614.0, 960.0, 1516.0, 2311.0, 3684.0, 5750.0, 8849.0, 13993.0, 21150.0, 33444.0, 51045.0, 76760.0, 109536.0, 146952.0, 1195802.0, 132506.0, 97682.0, 67411.0, 44768.0, 28988.0, 18551.0, 12026.0, 7863.0, 4869.0, 3181.0, 2062.0, 1311.0, 836.0, 593.0, 352.0, 230.0, 135.0, 101.0, 58.0, 45.0, 40.0, 17.0, 15.0, 8.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.142822265625, -0.13840484619140625, -0.1339874267578125, -0.12957000732421875, -0.125152587890625, -0.12073516845703125, -0.1163177490234375, -0.11190032958984375, -0.10748291015625, -0.10306549072265625, -0.0986480712890625, -0.09423065185546875, -0.089813232421875, -0.08539581298828125, -0.0809783935546875, -0.07656097412109375, -0.0721435546875, -0.06772613525390625, -0.0633087158203125, -0.05889129638671875, -0.054473876953125, -0.05005645751953125, -0.0456390380859375, -0.04122161865234375, -0.03680419921875, -0.03238677978515625, -0.0279693603515625, -0.02355194091796875, -0.019134521484375, -0.01471710205078125, -0.0102996826171875, -0.00588226318359375, -0.00146484375, 0.00295257568359375, 0.0073699951171875, 0.01178741455078125, 0.016204833984375, 0.02062225341796875, 0.0250396728515625, 0.02945709228515625, 0.03387451171875, 0.03829193115234375, 0.0427093505859375, 0.04712677001953125, 0.051544189453125, 0.05596160888671875, 0.0603790283203125, 0.06479644775390625, 0.0692138671875, 0.07363128662109375, 0.0780487060546875, 0.08246612548828125, 0.086883544921875, 0.09130096435546875, 0.0957183837890625, 0.10013580322265625, 0.10455322265625, 0.10897064208984375, 0.1133880615234375, 0.11780548095703125, 0.122222900390625, 0.12664031982421875, 0.1310577392578125, 0.13547515869140625, 0.139892578125]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 6.0, 9.0, 14.0, 10.0, 26.0, 27.0, 34.0, 49.0, 126.0, 177.0, 175.0, 110.0, 70.0, 36.0, 35.0, 22.0, 13.0, 16.0, 7.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009674072265625, -0.009352922439575195, -0.00903177261352539, -0.008710622787475586, -0.008389472961425781, -0.008068323135375977, -0.007747173309326172, -0.007426023483276367, -0.0071048736572265625, -0.006783723831176758, -0.006462574005126953, -0.0061414241790771484, -0.005820274353027344, -0.005499124526977539, -0.005177974700927734, -0.00485682487487793, -0.004535675048828125, -0.00421452522277832, -0.0038933753967285156, -0.003572225570678711, -0.0032510757446289062, -0.0029299259185791016, -0.002608776092529297, -0.002287626266479492, -0.0019664764404296875, -0.0016453266143798828, -0.0013241767883300781, -0.0010030269622802734, -0.0006818771362304688, -0.00036072731018066406, -3.9577484130859375e-05, 0.0002815723419189453, 0.00060272216796875, 0.0009238719940185547, 0.0012450218200683594, 0.001566171646118164, 0.0018873214721679688, 0.0022084712982177734, 0.002529621124267578, 0.002850770950317383, 0.0031719207763671875, 0.003493070602416992, 0.003814220428466797, 0.0041353702545166016, 0.004456520080566406, 0.004777669906616211, 0.005098819732666016, 0.00541996955871582, 0.005741119384765625, 0.00606226921081543, 0.006383419036865234, 0.006704568862915039, 0.007025718688964844, 0.0073468685150146484, 0.007668018341064453, 0.007989168167114258, 0.008310317993164062, 0.008631467819213867, 0.008952617645263672, 0.009273767471313477, 0.009594917297363281, 0.009916067123413086, 0.01023721694946289, 0.010558366775512695, 0.0108795166015625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 3.0, 5.0, 3.0, 7.0, 10.0, 10.0, 15.0, 19.0, 31.0, 41.0, 60.0, 89.0, 236.0, 703.0, 987129.0, 59241.0, 515.0, 178.0, 82.0, 64.0, 33.0, 21.0, 16.0, 17.0, 6.0, 5.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.23046875, -0.22366714477539062, -0.21686553955078125, -0.21006393432617188, -0.2032623291015625, -0.19646072387695312, -0.18965911865234375, -0.18285751342773438, -0.176055908203125, -0.16925430297851562, -0.16245269775390625, -0.15565109252929688, -0.1488494873046875, -0.14204788208007812, -0.13524627685546875, -0.12844467163085938, -0.12164306640625, -0.11484146118164062, -0.10803985595703125, -0.10123825073242188, -0.0944366455078125, -0.08763504028320312, -0.08083343505859375, -0.07403182983398438, -0.067230224609375, -0.060428619384765625, -0.05362701416015625, -0.046825408935546875, -0.0400238037109375, -0.033222198486328125, -0.02642059326171875, -0.019618988037109375, -0.0128173828125, -0.006015777587890625, 0.00078582763671875, 0.007587432861328125, 0.0143890380859375, 0.021190643310546875, 0.02799224853515625, 0.034793853759765625, 0.041595458984375, 0.048397064208984375, 0.05519866943359375, 0.062000274658203125, 0.0688018798828125, 0.07560348510742188, 0.08240509033203125, 0.08920669555664062, 0.09600830078125, 0.10280990600585938, 0.10961151123046875, 0.11641311645507812, 0.1232147216796875, 0.13001632690429688, 0.13681793212890625, 0.14361953735351562, 0.150421142578125, 0.15722274780273438, 0.16402435302734375, 0.17082595825195312, 0.1776275634765625, 0.18442916870117188, 0.19123077392578125, 0.19803237915039062, 0.204833984375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 23.0, 106.0, 589.0, 269.0, 25.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0663873627781868, -0.06521732360124588, -0.06404727697372437, -0.06287723779678345, -0.06170719116926193, -0.060537148267030716, -0.0593671053647995, -0.05819706246256828, -0.05702701956033707, -0.05585697665810585, -0.054686933755874634, -0.05351689085364342, -0.0523468479514122, -0.051176805049180984, -0.05000676214694977, -0.04883671924471855, -0.047666676342487335, -0.04649663344025612, -0.0453265905380249, -0.044156547635793686, -0.04298650473356247, -0.04181646183133125, -0.04064641892910004, -0.03947637602686882, -0.0383063368499279, -0.037136293947696686, -0.03596625104546547, -0.03479620814323425, -0.033626165241003036, -0.03245612233877182, -0.031286079436540604, -0.030116036534309387, -0.02894599549472332, -0.027775952592492104, -0.026605909690260887, -0.02543586678802967, -0.024265823885798454, -0.023095780983567238, -0.02192573994398117, -0.020755697041749954, -0.019585654139518738, -0.01841561123728752, -0.017245568335056305, -0.01607552543282509, -0.014905482530593872, -0.013735439628362656, -0.012565397657454014, -0.011395354755222797, -0.010225310921669006, -0.00905526801943779, -0.007885225117206573, -0.006715182680636644, -0.005545139778405428, -0.0043750968761742115, -0.0032050544396042824, -0.002035011537373066, -0.0008649686351418495, 0.0003050741506740451, 0.0014751169364899397, 0.0026451596058905125, 0.003815202508121729, 0.004985245410352945, 0.0061552878469228745, 0.007325330749154091, 0.008495373651385307]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 10.0, 8.0, 9.0, 9.0, 12.0, 17.0, 15.0, 23.0, 21.0, 30.0, 29.0, 28.0, 38.0, 41.0, 35.0, 50.0, 37.0, 34.0, 60.0, 41.0, 51.0, 52.0, 42.0, 40.0, 35.0, 46.0, 40.0, 27.0, 23.0, 23.0, 9.0, 16.0, 12.0, 16.0, 9.0, 5.0, 6.0, 3.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.005005240440368652, -0.004851999692618847, -0.0046987589448690414, -0.004545518197119236, -0.0043922774493694305, -0.004239036701619625, -0.00408579595386982, -0.003932555206120014, -0.0037793144583702087, -0.0036260737106204033, -0.003472832962870598, -0.0033195922151207924, -0.003166351467370987, -0.0030131107196211815, -0.002859869971871376, -0.0027066292241215706, -0.002553388476371765, -0.0024001477286219597, -0.0022469069808721542, -0.002093666233122349, -0.0019404254853725433, -0.0017871847376227379, -0.0016339439898729324, -0.001480703242123127, -0.0013274624943733215, -0.001174221746623516, -0.0010209809988737106, -0.0008677402511239052, -0.0007144995033740997, -0.0005612587556242943, -0.00040801800787448883, -0.0002547772601246834, -0.00010153651237487793, 5.170423537492752e-05, 0.00020494498312473297, 0.0003581857308745384, 0.0005114264786243439, 0.0006646672263741493, 0.0008179079741239548, 0.0009711487218737602, 0.0011243894696235657, 0.0012776302173733711, 0.0014308709651231766, 0.001584111712872982, 0.0017373524606227875, 0.001890593208372593, 0.0020438339561223984, 0.002197074703872204, 0.0023503154516220093, 0.0025035561993718147, 0.00265679694712162, 0.0028100376948714256, 0.002963278442621231, 0.0031165191903710365, 0.003269759938120842, 0.0034230006858706474, 0.003576241433620453, 0.0037294821813702583, 0.0038827229291200638, 0.004035963676869869, 0.004189204424619675, 0.00434244517236948, 0.004495685920119286, 0.004648926667869091, 0.0048021674156188965]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 6.0, 1.0, 2.0, 3.0, 3.0, 7.0, 13.0, 9.0, 10.0, 11.0, 14.0, 14.0, 16.0, 27.0, 24.0, 25.0, 30.0, 36.0, 41.0, 33.0, 35.0, 39.0, 34.0, 52.0, 48.0, 38.0, 35.0, 36.0, 37.0, 43.0, 26.0, 36.0, 19.0, 28.0, 33.0, 29.0, 15.0, 22.0, 11.0, 11.0, 12.0, 11.0, 9.0, 3.0, 9.0, 3.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.470703125, -3.364349365234375, -3.25799560546875, -3.151641845703125, -3.0452880859375, -2.938934326171875, -2.83258056640625, -2.726226806640625, -2.619873046875, -2.513519287109375, -2.40716552734375, -2.300811767578125, -2.1944580078125, -2.088104248046875, -1.98175048828125, -1.875396728515625, -1.76904296875, -1.662689208984375, -1.55633544921875, -1.449981689453125, -1.3436279296875, -1.237274169921875, -1.13092041015625, -1.024566650390625, -0.918212890625, -0.811859130859375, -0.70550537109375, -0.599151611328125, -0.4927978515625, -0.386444091796875, -0.28009033203125, -0.173736572265625, -0.0673828125, 0.038970947265625, 0.14532470703125, 0.251678466796875, 0.3580322265625, 0.464385986328125, 0.57073974609375, 0.677093505859375, 0.783447265625, 0.889801025390625, 0.99615478515625, 1.102508544921875, 1.2088623046875, 1.315216064453125, 1.42156982421875, 1.527923583984375, 1.63427734375, 1.740631103515625, 1.84698486328125, 1.953338623046875, 2.0596923828125, 2.166046142578125, 2.27239990234375, 2.378753662109375, 2.485107421875, 2.591461181640625, 2.69781494140625, 2.804168701171875, 2.9105224609375, 3.016876220703125, 3.12322998046875, 3.229583740234375, 3.3359375]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 8.0, 6.0, 8.0, 16.0, 25.0, 34.0, 53.0, 66.0, 109.0, 144.0, 226.0, 357.0, 684.0, 1272.0, 2425.0, 4932.0, 10173.0, 22392.0, 47917.0, 103988.0, 214517.0, 320888.0, 167842.0, 79886.0, 37287.0, 16902.0, 8170.0, 3778.0, 1939.0, 1001.0, 535.0, 333.0, 192.0, 147.0, 83.0, 65.0, 41.0, 31.0, 22.0, 17.0, 9.0, 8.0, 8.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.203125, -4.0731201171875, -3.943115234375, -3.8131103515625, -3.68310546875, -3.5531005859375, -3.423095703125, -3.2930908203125, -3.1630859375, -3.0330810546875, -2.903076171875, -2.7730712890625, -2.64306640625, -2.5130615234375, -2.383056640625, -2.2530517578125, -2.123046875, -1.9930419921875, -1.863037109375, -1.7330322265625, -1.60302734375, -1.4730224609375, -1.343017578125, -1.2130126953125, -1.0830078125, -0.9530029296875, -0.822998046875, -0.6929931640625, -0.56298828125, -0.4329833984375, -0.302978515625, -0.1729736328125, -0.04296875, 0.0870361328125, 0.217041015625, 0.3470458984375, 0.47705078125, 0.6070556640625, 0.737060546875, 0.8670654296875, 0.9970703125, 1.1270751953125, 1.257080078125, 1.3870849609375, 1.51708984375, 1.6470947265625, 1.777099609375, 1.9071044921875, 2.037109375, 2.1671142578125, 2.297119140625, 2.4271240234375, 2.55712890625, 2.6871337890625, 2.817138671875, 2.9471435546875, 3.0771484375, 3.2071533203125, 3.337158203125, 3.4671630859375, 3.59716796875, 3.7271728515625, 3.857177734375, 3.9871826171875, 4.1171875]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 10.0, 12.0, 11.0, 14.0, 22.0, 11.0, 25.0, 34.0, 27.0, 47.0, 44.0, 57.0, 72.0, 119.0, 177.0, 1365.0, 314.0, 178.0, 91.0, 61.0, 49.0, 54.0, 44.0, 26.0, 25.0, 18.0, 25.0, 22.0, 22.0, 9.0, 7.0, 8.0, 10.0, 7.0, 6.0, 4.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.6640625, -9.3182373046875, -8.972412109375, -8.6265869140625, -8.28076171875, -7.9349365234375, -7.589111328125, -7.2432861328125, -6.8974609375, -6.5516357421875, -6.205810546875, -5.8599853515625, -5.51416015625, -5.1683349609375, -4.822509765625, -4.4766845703125, -4.130859375, -3.7850341796875, -3.439208984375, -3.0933837890625, -2.74755859375, -2.4017333984375, -2.055908203125, -1.7100830078125, -1.3642578125, -1.0184326171875, -0.672607421875, -0.3267822265625, 0.01904296875, 0.3648681640625, 0.710693359375, 1.0565185546875, 1.40234375, 1.7481689453125, 2.093994140625, 2.4398193359375, 2.78564453125, 3.1314697265625, 3.477294921875, 3.8231201171875, 4.1689453125, 4.5147705078125, 4.860595703125, 5.2064208984375, 5.55224609375, 5.8980712890625, 6.243896484375, 6.5897216796875, 6.935546875, 7.2813720703125, 7.627197265625, 7.9730224609375, 8.31884765625, 8.6646728515625, 9.010498046875, 9.3563232421875, 9.7021484375, 10.0479736328125, 10.393798828125, 10.7396240234375, 11.08544921875, 11.4312744140625, 11.777099609375, 12.1229248046875, 12.46875]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 8.0, 5.0, 12.0, 13.0, 18.0, 23.0, 26.0, 36.0, 45.0, 64.0, 107.0, 133.0, 188.0, 288.0, 515.0, 1142.0, 6591.0, 86983.0, 2357182.0, 659138.0, 28280.0, 2899.0, 751.0, 381.0, 277.0, 169.0, 125.0, 97.0, 55.0, 41.0, 20.0, 24.0, 21.0, 11.0, 14.0, 9.0, 3.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.15625, -14.720703125, -14.28515625, -13.849609375, -13.4140625, -12.978515625, -12.54296875, -12.107421875, -11.671875, -11.236328125, -10.80078125, -10.365234375, -9.9296875, -9.494140625, -9.05859375, -8.623046875, -8.1875, -7.751953125, -7.31640625, -6.880859375, -6.4453125, -6.009765625, -5.57421875, -5.138671875, -4.703125, -4.267578125, -3.83203125, -3.396484375, -2.9609375, -2.525390625, -2.08984375, -1.654296875, -1.21875, -0.783203125, -0.34765625, 0.087890625, 0.5234375, 0.958984375, 1.39453125, 1.830078125, 2.265625, 2.701171875, 3.13671875, 3.572265625, 4.0078125, 4.443359375, 4.87890625, 5.314453125, 5.75, 6.185546875, 6.62109375, 7.056640625, 7.4921875, 7.927734375, 8.36328125, 8.798828125, 9.234375, 9.669921875, 10.10546875, 10.541015625, 10.9765625, 11.412109375, 11.84765625, 12.283203125, 12.71875]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 63.0, 510.0, 413.0, 31.0], "bins": [-202.80532836914062, -199.52784729003906, -196.2503662109375, -192.97288513183594, -189.69540405273438, -186.41790771484375, -183.14044189453125, -179.86294555664062, -176.58546447753906, -173.3079833984375, -170.03050231933594, -166.75302124023438, -163.4755401611328, -160.19805908203125, -156.92056274414062, -153.64308166503906, -150.3656005859375, -147.08811950683594, -143.81063842773438, -140.5331573486328, -137.25567626953125, -133.97817993164062, -130.70071411132812, -127.42322540283203, -124.145751953125, -120.86827087402344, -117.59078979492188, -114.31330871582031, -111.03582000732422, -107.75833892822266, -104.4808578491211, -101.20337677001953, -97.92588806152344, -94.64840698242188, -91.37092590332031, -88.09344482421875, -84.81595611572266, -81.5384750366211, -78.26099395751953, -74.98351287841797, -71.7060317993164, -68.42855072021484, -65.15106964111328, -61.87358474731445, -58.596099853515625, -55.31861877441406, -52.0411376953125, -48.76365661621094, -45.48617172241211, -42.20869064331055, -38.93120574951172, -35.653724670410156, -32.376243591308594, -29.098758697509766, -25.821277618408203, -22.543794631958008, -19.266311645507812, -15.988828659057617, -12.711346626281738, -9.43386459350586, -6.156381607055664, -2.8788986206054688, 0.39858245849609375, 3.676065444946289, 6.953549385070801]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 7.0, 7.0, 13.0, 10.0, 20.0, 12.0, 21.0, 28.0, 28.0, 35.0, 33.0, 33.0, 46.0, 32.0, 41.0, 35.0, 44.0, 55.0, 57.0, 44.0, 58.0, 41.0, 32.0, 51.0, 32.0, 30.0, 25.0, 25.0, 24.0, 18.0, 20.0, 10.0, 8.0, 10.0, 7.0, 5.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.668346405029297, -26.806684494018555, -25.945022583007812, -25.083358764648438, -24.221696853637695, -23.360034942626953, -22.498371124267578, -21.636709213256836, -20.775047302246094, -19.91338539123535, -19.05172348022461, -18.190059661865234, -17.328397750854492, -16.46673583984375, -15.605072975158691, -14.743410110473633, -13.88174819946289, -13.020086288452148, -12.15842342376709, -11.296760559082031, -10.435098648071289, -9.573436737060547, -8.711773872375488, -7.850111484527588, -6.9884490966796875, -6.126786708831787, -5.265124320983887, -4.403461933135986, -3.541799545288086, -2.6801371574401855, -1.8184747695922852, -0.9568123817443848, -0.09515190124511719, 0.7665104866027832, 1.6281728744506836, 2.489835262298584, 3.3514976501464844, 4.213160037994385, 5.074822425842285, 5.9364848136901855, 6.798147201538086, 7.659809589385986, 8.521471977233887, 9.383134841918945, 10.244796752929688, 11.10645866394043, 11.968121528625488, 12.829784393310547, 13.691446304321289, 14.553108215332031, 15.41477108001709, 16.27643394470215, 17.13809585571289, 17.999757766723633, 18.861419677734375, 19.72308349609375, 20.584745407104492, 21.446407318115234, 22.30807113647461, 23.16973304748535, 24.031394958496094, 24.893056869506836, 25.754718780517578, 26.616382598876953, 27.478044509887695]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 3.0, 4.0, 8.0, 10.0, 15.0, 14.0, 13.0, 12.0, 12.0, 25.0, 22.0, 27.0, 39.0, 26.0, 28.0, 37.0, 46.0, 39.0, 49.0, 50.0, 40.0, 49.0, 38.0, 38.0, 33.0, 49.0, 31.0, 19.0, 28.0, 26.0, 27.0, 19.0, 19.0, 23.0, 16.0, 14.0, 14.0, 6.0, 6.0, 3.0, 6.0, 4.0, 5.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0], "bins": [-4.00390625, -3.891143798828125, -3.77838134765625, -3.665618896484375, -3.5528564453125, -3.440093994140625, -3.32733154296875, -3.214569091796875, -3.101806640625, -2.989044189453125, -2.87628173828125, -2.763519287109375, -2.6507568359375, -2.537994384765625, -2.42523193359375, -2.312469482421875, -2.19970703125, -2.086944580078125, -1.97418212890625, -1.861419677734375, -1.7486572265625, -1.635894775390625, -1.52313232421875, -1.410369873046875, -1.297607421875, -1.184844970703125, -1.07208251953125, -0.959320068359375, -0.8465576171875, -0.733795166015625, -0.62103271484375, -0.508270263671875, -0.3955078125, -0.282745361328125, -0.16998291015625, -0.057220458984375, 0.0555419921875, 0.168304443359375, 0.28106689453125, 0.393829345703125, 0.506591796875, 0.619354248046875, 0.73211669921875, 0.844879150390625, 0.9576416015625, 1.070404052734375, 1.18316650390625, 1.295928955078125, 1.40869140625, 1.521453857421875, 1.63421630859375, 1.746978759765625, 1.8597412109375, 1.972503662109375, 2.08526611328125, 2.198028564453125, 2.310791015625, 2.423553466796875, 2.53631591796875, 2.649078369140625, 2.7618408203125, 2.874603271484375, 2.98736572265625, 3.100128173828125, 3.212890625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 3.0, 3.0, 8.0, 6.0, 16.0, 15.0, 17.0, 31.0, 56.0, 62.0, 75.0, 115.0, 195.0, 368.0, 663.0, 1213.0, 2642.0, 5927.0, 14212.0, 36485.0, 99146.0, 285433.0, 808193.0, 1532129.0, 901986.0, 323910.0, 112042.0, 40504.0, 15816.0, 6774.0, 3000.0, 1451.0, 725.0, 383.0, 218.0, 148.0, 89.0, 69.0, 35.0, 29.0, 19.0, 14.0, 13.0, 10.0, 11.0, 4.0, 5.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 5.0], "bins": [-3.8046875, -3.691314697265625, -3.57794189453125, -3.464569091796875, -3.3511962890625, -3.237823486328125, -3.12445068359375, -3.011077880859375, -2.897705078125, -2.784332275390625, -2.67095947265625, -2.557586669921875, -2.4442138671875, -2.330841064453125, -2.21746826171875, -2.104095458984375, -1.99072265625, -1.877349853515625, -1.76397705078125, -1.650604248046875, -1.5372314453125, -1.423858642578125, -1.31048583984375, -1.197113037109375, -1.083740234375, -0.970367431640625, -0.85699462890625, -0.743621826171875, -0.6302490234375, -0.516876220703125, -0.40350341796875, -0.290130615234375, -0.1767578125, -0.063385009765625, 0.04998779296875, 0.163360595703125, 0.2767333984375, 0.390106201171875, 0.50347900390625, 0.616851806640625, 0.730224609375, 0.843597412109375, 0.95697021484375, 1.070343017578125, 1.1837158203125, 1.297088623046875, 1.41046142578125, 1.523834228515625, 1.63720703125, 1.750579833984375, 1.86395263671875, 1.977325439453125, 2.0906982421875, 2.204071044921875, 2.31744384765625, 2.430816650390625, 2.544189453125, 2.657562255859375, 2.77093505859375, 2.884307861328125, 2.9976806640625, 3.111053466796875, 3.22442626953125, 3.337799072265625, 3.451171875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 2.0, 8.0, 13.0, 10.0, 25.0, 24.0, 32.0, 56.0, 55.0, 90.0, 116.0, 138.0, 224.0, 270.0, 367.0, 470.0, 486.0, 447.0, 362.0, 236.0, 160.0, 127.0, 90.0, 69.0, 47.0, 35.0, 30.0, 18.0, 14.0, 8.0, 12.0, 6.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.109375, -4.951171875, -4.79296875, -4.634765625, -4.4765625, -4.318359375, -4.16015625, -4.001953125, -3.84375, -3.685546875, -3.52734375, -3.369140625, -3.2109375, -3.052734375, -2.89453125, -2.736328125, -2.578125, -2.419921875, -2.26171875, -2.103515625, -1.9453125, -1.787109375, -1.62890625, -1.470703125, -1.3125, -1.154296875, -0.99609375, -0.837890625, -0.6796875, -0.521484375, -0.36328125, -0.205078125, -0.046875, 0.111328125, 0.26953125, 0.427734375, 0.5859375, 0.744140625, 0.90234375, 1.060546875, 1.21875, 1.376953125, 1.53515625, 1.693359375, 1.8515625, 2.009765625, 2.16796875, 2.326171875, 2.484375, 2.642578125, 2.80078125, 2.958984375, 3.1171875, 3.275390625, 3.43359375, 3.591796875, 3.75, 3.908203125, 4.06640625, 4.224609375, 4.3828125, 4.541015625, 4.69921875, 4.857421875, 5.015625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 5.0, 5.0, 10.0, 7.0, 13.0, 18.0, 32.0, 45.0, 55.0, 96.0, 191.0, 275.0, 553.0, 1278.0, 3528.0, 11450.0, 45140.0, 234681.0, 1667534.0, 1893138.0, 267642.0, 49802.0, 12154.0, 3774.0, 1397.0, 628.0, 303.0, 173.0, 114.0, 70.0, 46.0, 29.0, 14.0, 16.0, 16.0, 13.0, 10.0, 7.0, 9.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.21484375, -6.96636962890625, -6.7178955078125, -6.46942138671875, -6.220947265625, -5.97247314453125, -5.7239990234375, -5.47552490234375, -5.22705078125, -4.97857666015625, -4.7301025390625, -4.48162841796875, -4.233154296875, -3.98468017578125, -3.7362060546875, -3.48773193359375, -3.2392578125, -2.99078369140625, -2.7423095703125, -2.49383544921875, -2.245361328125, -1.99688720703125, -1.7484130859375, -1.49993896484375, -1.25146484375, -1.00299072265625, -0.7545166015625, -0.50604248046875, -0.257568359375, -0.00909423828125, 0.2393798828125, 0.48785400390625, 0.736328125, 0.98480224609375, 1.2332763671875, 1.48175048828125, 1.730224609375, 1.97869873046875, 2.2271728515625, 2.47564697265625, 2.72412109375, 2.97259521484375, 3.2210693359375, 3.46954345703125, 3.718017578125, 3.96649169921875, 4.2149658203125, 4.46343994140625, 4.7119140625, 4.96038818359375, 5.2088623046875, 5.45733642578125, 5.705810546875, 5.95428466796875, 6.2027587890625, 6.45123291015625, 6.69970703125, 6.94818115234375, 7.1966552734375, 7.44512939453125, 7.693603515625, 7.94207763671875, 8.1905517578125, 8.43902587890625, 8.6875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 141.0, 616.0, 241.0, 15.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.11626625061035, -25.602092742919922, -21.08791732788086, -16.57374382019043, -12.0595703125, -7.54539680480957, -3.031221389770508, 1.4829521179199219, 5.997125625610352, 10.511299133300781, 15.025473594665527, 19.539648056030273, 24.053821563720703, 28.567995071411133, 33.08216857910156, 37.596343994140625, 42.11051940917969, 46.62469482421875, 51.13886642456055, 55.65304183959961, 60.167213439941406, 64.68138885498047, 69.19556427001953, 73.7097396850586, 78.22390747070312, 82.73808288574219, 87.25225830078125, 91.76643371582031, 96.28060150146484, 100.7947769165039, 105.30895233154297, 109.82312774658203, 114.33729553222656, 118.85147094726562, 123.36564636230469, 127.87982177734375, 132.3939971923828, 136.90817260742188, 141.42233276367188, 145.93650817871094, 150.45068359375, 154.96485900878906, 159.47903442382812, 163.9932098388672, 168.50738525390625, 173.02154541015625, 177.53573608398438, 182.04989624023438, 186.5640869140625, 191.07826232910156, 195.59243774414062, 200.1066131591797, 204.62078857421875, 209.13494873046875, 213.64913940429688, 218.16329956054688, 222.67747497558594, 227.191650390625, 231.70582580566406, 236.22000122070312, 240.7341766357422, 245.24835205078125, 249.76251220703125, 254.2766876220703, 258.7908630371094]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 4.0, 7.0, 10.0, 17.0, 17.0, 24.0, 21.0, 15.0, 21.0, 27.0, 27.0, 35.0, 36.0, 22.0, 23.0, 38.0, 40.0, 34.0, 29.0, 31.0, 33.0, 46.0, 40.0, 32.0, 31.0, 39.0, 27.0, 21.0, 34.0, 28.0, 22.0, 24.0, 22.0, 20.0, 14.0, 18.0, 13.0, 11.0, 8.0, 7.0, 9.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-14.548486709594727, -14.05323600769043, -13.557984352111816, -13.06273365020752, -12.567481994628906, -12.07223129272461, -11.576980590820312, -11.0817289352417, -10.586478233337402, -10.091227531433105, -9.595975875854492, -9.100725173950195, -8.605473518371582, -8.110222816467285, -7.61497163772583, -7.119720458984375, -6.62446928024292, -6.129218101501465, -5.63396692276001, -5.138715744018555, -4.643465042114258, -4.148213863372803, -3.6529626846313477, -3.1577117443084717, -2.6624605655670166, -2.1672093868255615, -1.6719584465026855, -1.1767072677612305, -0.6814562082290649, -0.18620514869689941, 0.30904603004455566, 0.8042969703674316, 1.2995481491088867, 1.7947992086410522, 2.2900502681732178, 2.785301446914673, 3.280552387237549, 3.775803565979004, 4.271054744720459, 4.766305923461914, 5.261556625366211, 5.756807804107666, 6.252058982849121, 6.747309684753418, 7.242560863494873, 7.737812042236328, 8.233062744140625, 8.728314399719238, 9.223566055297852, 9.718816757202148, 10.214068412780762, 10.709319114685059, 11.204570770263672, 11.699821472167969, 12.195072174072266, 12.690323829650879, 13.185574531555176, 13.680825233459473, 14.176076889038086, 14.671327590942383, 15.166579246520996, 15.661829948425293, 16.157081604003906, 16.652332305908203, 17.1475830078125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 5.0, 7.0, 4.0, 9.0, 10.0, 13.0, 20.0, 13.0, 20.0, 24.0, 24.0, 17.0, 36.0, 31.0, 37.0, 34.0, 40.0, 31.0, 41.0, 46.0, 35.0, 48.0, 43.0, 39.0, 32.0, 44.0, 40.0, 38.0, 25.0, 27.0, 20.0, 23.0, 19.0, 19.0, 8.0, 12.0, 10.0, 13.0, 12.0, 9.0, 4.0, 1.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.58984375, -3.47991943359375, -3.3699951171875, -3.26007080078125, -3.150146484375, -3.04022216796875, -2.9302978515625, -2.82037353515625, -2.71044921875, -2.60052490234375, -2.4906005859375, -2.38067626953125, -2.270751953125, -2.16082763671875, -2.0509033203125, -1.94097900390625, -1.8310546875, -1.72113037109375, -1.6112060546875, -1.50128173828125, -1.391357421875, -1.28143310546875, -1.1715087890625, -1.06158447265625, -0.95166015625, -0.84173583984375, -0.7318115234375, -0.62188720703125, -0.511962890625, -0.40203857421875, -0.2921142578125, -0.18218994140625, -0.072265625, 0.03765869140625, 0.1475830078125, 0.25750732421875, 0.367431640625, 0.47735595703125, 0.5872802734375, 0.69720458984375, 0.80712890625, 0.91705322265625, 1.0269775390625, 1.13690185546875, 1.246826171875, 1.35675048828125, 1.4666748046875, 1.57659912109375, 1.6865234375, 1.79644775390625, 1.9063720703125, 2.01629638671875, 2.126220703125, 2.23614501953125, 2.3460693359375, 2.45599365234375, 2.56591796875, 2.67584228515625, 2.7857666015625, 2.89569091796875, 3.005615234375, 3.11553955078125, 3.2254638671875, 3.33538818359375, 3.4453125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 14.0, 19.0, 39.0, 35.0, 59.0, 111.0, 216.0, 286.0, 487.0, 718.0, 1093.0, 1754.0, 2945.0, 4734.0, 7461.0, 11699.0, 18870.0, 29976.0, 47367.0, 73074.0, 107884.0, 146508.0, 167342.0, 140190.0, 101154.0, 67948.0, 43339.0, 27379.0, 16887.0, 10808.0, 6805.0, 4245.0, 2642.0, 1619.0, 1072.0, 649.0, 417.0, 263.0, 157.0, 107.0, 77.0, 31.0, 25.0, 17.0, 8.0, 9.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.2430419921875, -0.2350482940673828, -0.22705459594726562, -0.21906089782714844, -0.21106719970703125, -0.20307350158691406, -0.19507980346679688, -0.1870861053466797, -0.1790924072265625, -0.1710987091064453, -0.16310501098632812, -0.15511131286621094, -0.14711761474609375, -0.13912391662597656, -0.13113021850585938, -0.12313652038574219, -0.115142822265625, -0.10714912414550781, -0.09915542602539062, -0.09116172790527344, -0.08316802978515625, -0.07517433166503906, -0.06718063354492188, -0.05918693542480469, -0.0511932373046875, -0.04319953918457031, -0.035205841064453125, -0.027212142944335938, -0.01921844482421875, -0.011224746704101562, -0.003231048583984375, 0.0047626495361328125, 0.01275634765625, 0.020750045776367188, 0.028743743896484375, 0.03673744201660156, 0.04473114013671875, 0.05272483825683594, 0.060718536376953125, 0.06871223449707031, 0.0767059326171875, 0.08469963073730469, 0.09269332885742188, 0.10068702697753906, 0.10868072509765625, 0.11667442321777344, 0.12466812133789062, 0.1326618194580078, 0.140655517578125, 0.1486492156982422, 0.15664291381835938, 0.16463661193847656, 0.17263031005859375, 0.18062400817871094, 0.18861770629882812, 0.1966114044189453, 0.2046051025390625, 0.2125988006591797, 0.22059249877929688, 0.22858619689941406, 0.23657989501953125, 0.24457359313964844, 0.2525672912597656, 0.2605609893798828, 0.2685546875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 6.0, 5.0, 11.0, 12.0, 13.0, 12.0, 14.0, 22.0, 24.0, 24.0, 20.0, 21.0, 28.0, 37.0, 30.0, 34.0, 44.0, 36.0, 31.0, 33.0, 1058.0, 43.0, 39.0, 39.0, 45.0, 30.0, 24.0, 43.0, 28.0, 34.0, 29.0, 23.0, 12.0, 18.0, 9.0, 15.0, 12.0, 10.0, 12.0, 9.0, 7.0, 7.0, 4.0, 3.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.4140625, -2.33953857421875, -2.2650146484375, -2.19049072265625, -2.115966796875, -2.04144287109375, -1.9669189453125, -1.89239501953125, -1.81787109375, -1.74334716796875, -1.6688232421875, -1.59429931640625, -1.519775390625, -1.44525146484375, -1.3707275390625, -1.29620361328125, -1.2216796875, -1.14715576171875, -1.0726318359375, -0.99810791015625, -0.923583984375, -0.84906005859375, -0.7745361328125, -0.70001220703125, -0.62548828125, -0.55096435546875, -0.4764404296875, -0.40191650390625, -0.327392578125, -0.25286865234375, -0.1783447265625, -0.10382080078125, -0.029296875, 0.04522705078125, 0.1197509765625, 0.19427490234375, 0.268798828125, 0.34332275390625, 0.4178466796875, 0.49237060546875, 0.56689453125, 0.64141845703125, 0.7159423828125, 0.79046630859375, 0.864990234375, 0.93951416015625, 1.0140380859375, 1.08856201171875, 1.1630859375, 1.23760986328125, 1.3121337890625, 1.38665771484375, 1.461181640625, 1.53570556640625, 1.6102294921875, 1.68475341796875, 1.75927734375, 1.83380126953125, 1.9083251953125, 1.98284912109375, 2.057373046875, 2.13189697265625, 2.2064208984375, 2.28094482421875, 2.35546875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 10.0, 7.0, 12.0, 17.0, 33.0, 43.0, 67.0, 102.0, 166.0, 236.0, 389.0, 563.0, 829.0, 1293.0, 2109.0, 3084.0, 4827.0, 7506.0, 11589.0, 18159.0, 27934.0, 42655.0, 64212.0, 93555.0, 128008.0, 1191685.0, 152979.0, 111847.0, 79153.0, 53647.0, 35454.0, 23048.0, 14897.0, 9678.0, 6105.0, 3897.0, 2566.0, 1687.0, 1091.0, 701.0, 417.0, 294.0, 189.0, 147.0, 89.0, 55.0, 39.0, 19.0, 20.0, 12.0, 3.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.1453857421875, -0.1408100128173828, -0.13623428344726562, -0.13165855407714844, -0.12708282470703125, -0.12250709533691406, -0.11793136596679688, -0.11335563659667969, -0.1087799072265625, -0.10420417785644531, -0.09962844848632812, -0.09505271911621094, -0.09047698974609375, -0.08590126037597656, -0.08132553100585938, -0.07674980163574219, -0.072174072265625, -0.06759834289550781, -0.06302261352539062, -0.05844688415527344, -0.05387115478515625, -0.04929542541503906, -0.044719696044921875, -0.04014396667480469, -0.0355682373046875, -0.030992507934570312, -0.026416778564453125, -0.021841049194335938, -0.01726531982421875, -0.012689590454101562, -0.008113861083984375, -0.0035381317138671875, 0.00103759765625, 0.0056133270263671875, 0.010189056396484375, 0.014764785766601562, 0.01934051513671875, 0.023916244506835938, 0.028491973876953125, 0.03306770324707031, 0.0376434326171875, 0.04221916198730469, 0.046794891357421875, 0.05137062072753906, 0.05594635009765625, 0.06052207946777344, 0.06509780883789062, 0.06967353820800781, 0.074249267578125, 0.07882499694824219, 0.08340072631835938, 0.08797645568847656, 0.09255218505859375, 0.09712791442871094, 0.10170364379882812, 0.10627937316894531, 0.1108551025390625, 0.11543083190917969, 0.12000656127929688, 0.12458229064941406, 0.12915802001953125, 0.13373374938964844, 0.13830947875976562, 0.1428852081298828, 0.1474609375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 3.0, 6.0, 1.0, 4.0, 7.0, 11.0, 7.0, 18.0, 15.0, 35.0, 43.0, 71.0, 113.0, 163.0, 166.0, 92.0, 74.0, 46.0, 35.0, 12.0, 17.0, 9.0, 5.0, 6.0, 5.0, 5.0, 6.0, 1.0, 4.0, 7.0, 4.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00754547119140625, -0.007310271263122559, -0.007075071334838867, -0.006839871406555176, -0.006604671478271484, -0.006369471549987793, -0.0061342716217041016, -0.00589907169342041, -0.005663871765136719, -0.005428671836853027, -0.005193471908569336, -0.0049582719802856445, -0.004723072052001953, -0.004487872123718262, -0.00425267219543457, -0.004017472267150879, -0.0037822723388671875, -0.003547072410583496, -0.0033118724822998047, -0.0030766725540161133, -0.002841472625732422, -0.0026062726974487305, -0.002371072769165039, -0.0021358728408813477, -0.0019006729125976562, -0.0016654729843139648, -0.0014302730560302734, -0.001195073127746582, -0.0009598731994628906, -0.0007246732711791992, -0.0004894733428955078, -0.0002542734146118164, -1.9073486328125e-05, 0.0002161264419555664, 0.0004513263702392578, 0.0006865262985229492, 0.0009217262268066406, 0.001156926155090332, 0.0013921260833740234, 0.0016273260116577148, 0.0018625259399414062, 0.0020977258682250977, 0.002332925796508789, 0.0025681257247924805, 0.002803325653076172, 0.0030385255813598633, 0.0032737255096435547, 0.003508925437927246, 0.0037441253662109375, 0.003979325294494629, 0.00421452522277832, 0.004449725151062012, 0.004684925079345703, 0.0049201250076293945, 0.005155324935913086, 0.005390524864196777, 0.005625724792480469, 0.00586092472076416, 0.0060961246490478516, 0.006331324577331543, 0.006566524505615234, 0.006801724433898926, 0.007036924362182617, 0.007272124290466309, 0.00750732421875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 3.0, 3.0, 4.0, 11.0, 7.0, 10.0, 10.0, 19.0, 31.0, 37.0, 70.0, 119.0, 242.0, 1326.0, 265400.0, 778831.0, 1765.0, 280.0, 141.0, 72.0, 39.0, 32.0, 21.0, 19.0, 12.0, 7.0, 6.0, 6.0, 6.0, 6.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1617431640625, -0.15653419494628906, -0.15132522583007812, -0.1461162567138672, -0.14090728759765625, -0.1356983184814453, -0.13048934936523438, -0.12528038024902344, -0.1200714111328125, -0.11486244201660156, -0.10965347290039062, -0.10444450378417969, -0.09923553466796875, -0.09402656555175781, -0.08881759643554688, -0.08360862731933594, -0.078399658203125, -0.07319068908691406, -0.06798171997070312, -0.06277275085449219, -0.05756378173828125, -0.05235481262207031, -0.047145843505859375, -0.04193687438964844, -0.0367279052734375, -0.03151893615722656, -0.026309967041015625, -0.021100997924804688, -0.01589202880859375, -0.010683059692382812, -0.005474090576171875, -0.0002651214599609375, 0.00494384765625, 0.010152816772460938, 0.015361785888671875, 0.020570755004882812, 0.02577972412109375, 0.030988693237304688, 0.036197662353515625, 0.04140663146972656, 0.0466156005859375, 0.05182456970214844, 0.057033538818359375, 0.06224250793457031, 0.06745147705078125, 0.07266044616699219, 0.07786941528320312, 0.08307838439941406, 0.088287353515625, 0.09349632263183594, 0.09870529174804688, 0.10391426086425781, 0.10912322998046875, 0.11433219909667969, 0.11954116821289062, 0.12475013732910156, 0.1299591064453125, 0.13516807556152344, 0.14037704467773438, 0.1455860137939453, 0.15079498291015625, 0.1560039520263672, 0.16121292114257812, 0.16642189025878906, 0.171630859375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 7.0, 4.0, 5.0, 9.0, 6.0, 9.0, 13.0, 23.0, 21.0, 42.0, 47.0, 95.0, 149.0, 172.0, 128.0, 85.0, 57.0, 35.0, 21.0, 14.0, 13.0, 10.0, 8.0, 5.0, 6.0, 5.0, 7.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.012497779913246632, -0.012055647559463978, -0.01161351427435875, -0.011171381920576096, -0.010729249566793442, -0.010287116281688213, -0.00984498392790556, -0.009402850642800331, -0.008960718289017677, -0.008518585935235023, -0.008076452650129795, -0.007634320296347141, -0.0071921874769032, -0.006750054657459259, -0.006307922303676605, -0.005865789484232664, -0.005423656664788723, -0.004981523845344782, -0.004539391025900841, -0.004097258672118187, -0.003655125852674246, -0.0032129930332303047, -0.0027708604466170073, -0.00232872786000371, -0.0018865950405597687, -0.0014444623375311494, -0.00100232963450253, -0.0005601969314739108, -0.00011806422844529152, 0.0003240685909986496, 0.0007662011776119471, 0.0012083337642252445, 0.0016504675149917603, 0.0020926003344357014, 0.002534732921048999, 0.0029768655076622963, 0.0034189983271062374, 0.0038611311465501785, 0.004303263500332832, 0.0047453963197767735, 0.005187529139220715, 0.005629661958664656, 0.006071794778108597, 0.006513927131891251, 0.006956059951335192, 0.007398192770779133, 0.007840325124561787, 0.008282458409667015, 0.008724590763449669, 0.009166723117232323, 0.009608856402337551, 0.010050988756120205, 0.010493122041225433, 0.010935254395008087, 0.011377386748790741, 0.011819519102573395, 0.012261652387678623, 0.012703784741461277, 0.013145918026566505, 0.01358805038034916, 0.014030182734131813, 0.014472316019237041, 0.014914448373019695, 0.015356581658124924, 0.015798714011907578]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 3.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 8.0, 10.0, 12.0, 12.0, 15.0, 20.0, 26.0, 22.0, 24.0, 31.0, 29.0, 39.0, 49.0, 45.0, 48.0, 46.0, 48.0, 52.0, 56.0, 44.0, 39.0, 35.0, 31.0, 31.0, 25.0, 31.0, 24.0, 27.0, 21.0, 23.0, 19.0, 9.0, 11.0, 6.0, 9.0, 3.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.003565371036529541, -0.0034372173249721527, -0.0033090636134147644, -0.003180909901857376, -0.003052756190299988, -0.0029246024787425995, -0.002796448767185211, -0.002668295055627823, -0.0025401413440704346, -0.0024119876325130463, -0.002283833920955658, -0.0021556802093982697, -0.0020275264978408813, -0.001899372786283493, -0.0017712190747261047, -0.0016430653631687164, -0.0015149116516113281, -0.0013867579400539398, -0.0012586042284965515, -0.0011304505169391632, -0.001002296805381775, -0.0008741430938243866, -0.0007459893822669983, -0.00061783567070961, -0.0004896819591522217, -0.0003615282475948334, -0.00023337453603744507, -0.00010522082448005676, 2.2932887077331543e-05, 0.00015108659863471985, 0.00027924031019210815, 0.00040739402174949646, 0.0005355477333068848, 0.0006637014448642731, 0.0007918551564216614, 0.0009200088679790497, 0.001048162579536438, 0.0011763162910938263, 0.0013044700026512146, 0.001432623714208603, 0.0015607774257659912, 0.0016889311373233795, 0.0018170848488807678, 0.0019452385604381561, 0.0020733922719955444, 0.0022015459835529327, 0.002329699695110321, 0.0024578534066677094, 0.0025860071182250977, 0.002714160829782486, 0.0028423145413398743, 0.0029704682528972626, 0.003098621964454651, 0.003226775676012039, 0.0033549293875694275, 0.003483083099126816, 0.003611236810684204, 0.0037393905222415924, 0.0038675442337989807, 0.003995697945356369, 0.004123851656913757, 0.004252005368471146, 0.004380159080028534, 0.004508312791585922, 0.0046364665031433105]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 6.0, 5.0, 7.0, 4.0, 9.0, 10.0, 13.0, 20.0, 13.0, 20.0, 24.0, 24.0, 17.0, 37.0, 30.0, 38.0, 34.0, 39.0, 33.0, 39.0, 46.0, 35.0, 48.0, 44.0, 38.0, 34.0, 42.0, 40.0, 38.0, 25.0, 27.0, 20.0, 24.0, 18.0, 19.0, 8.0, 12.0, 10.0, 13.0, 12.0, 9.0, 5.0, 1.0, 2.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-3.58984375, -3.479888916015625, -3.36993408203125, -3.259979248046875, -3.1500244140625, -3.040069580078125, -2.93011474609375, -2.820159912109375, -2.710205078125, -2.600250244140625, -2.49029541015625, -2.380340576171875, -2.2703857421875, -2.160430908203125, -2.05047607421875, -1.940521240234375, -1.83056640625, -1.720611572265625, -1.61065673828125, -1.500701904296875, -1.3907470703125, -1.280792236328125, -1.17083740234375, -1.060882568359375, -0.950927734375, -0.840972900390625, -0.73101806640625, -0.621063232421875, -0.5111083984375, -0.401153564453125, -0.29119873046875, -0.181243896484375, -0.0712890625, 0.038665771484375, 0.14862060546875, 0.258575439453125, 0.3685302734375, 0.478485107421875, 0.58843994140625, 0.698394775390625, 0.808349609375, 0.918304443359375, 1.02825927734375, 1.138214111328125, 1.2481689453125, 1.358123779296875, 1.46807861328125, 1.578033447265625, 1.68798828125, 1.797943115234375, 1.90789794921875, 2.017852783203125, 2.1278076171875, 2.237762451171875, 2.34771728515625, 2.457672119140625, 2.567626953125, 2.677581787109375, 2.78753662109375, 2.897491455078125, 3.0074462890625, 3.117401123046875, 3.22735595703125, 3.337310791015625, 3.447265625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 11.0, 14.0, 17.0, 9.0, 14.0, 30.0, 34.0, 48.0, 54.0, 79.0, 136.0, 192.0, 293.0, 486.0, 890.0, 1574.0, 3240.0, 6889.0, 14795.0, 31766.0, 67137.0, 149752.0, 356856.0, 234511.0, 94567.0, 45087.0, 20828.0, 9614.0, 4584.0, 2149.0, 1132.0, 633.0, 367.0, 233.0, 145.0, 98.0, 78.0, 50.0, 43.0, 31.0, 24.0, 16.0, 22.0, 10.0, 4.0, 7.0, 1.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.3828125, -4.24017333984375, -4.0975341796875, -3.95489501953125, -3.812255859375, -3.66961669921875, -3.5269775390625, -3.38433837890625, -3.24169921875, -3.09906005859375, -2.9564208984375, -2.81378173828125, -2.671142578125, -2.52850341796875, -2.3858642578125, -2.24322509765625, -2.1005859375, -1.95794677734375, -1.8153076171875, -1.67266845703125, -1.530029296875, -1.38739013671875, -1.2447509765625, -1.10211181640625, -0.95947265625, -0.81683349609375, -0.6741943359375, -0.53155517578125, -0.388916015625, -0.24627685546875, -0.1036376953125, 0.03900146484375, 0.181640625, 0.32427978515625, 0.4669189453125, 0.60955810546875, 0.752197265625, 0.89483642578125, 1.0374755859375, 1.18011474609375, 1.32275390625, 1.46539306640625, 1.6080322265625, 1.75067138671875, 1.893310546875, 2.03594970703125, 2.1785888671875, 2.32122802734375, 2.4638671875, 2.60650634765625, 2.7491455078125, 2.89178466796875, 3.034423828125, 3.17706298828125, 3.3197021484375, 3.46234130859375, 3.60498046875, 3.74761962890625, 3.8902587890625, 4.03289794921875, 4.175537109375, 4.31817626953125, 4.4608154296875, 4.60345458984375, 4.74609375]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 3.0, 6.0, 9.0, 6.0, 11.0, 11.0, 10.0, 16.0, 8.0, 20.0, 24.0, 18.0, 31.0, 25.0, 24.0, 41.0, 46.0, 58.0, 65.0, 101.0, 137.0, 286.0, 1329.0, 184.0, 101.0, 78.0, 50.0, 30.0, 37.0, 28.0, 44.0, 37.0, 26.0, 30.0, 25.0, 22.0, 13.0, 14.0, 10.0, 8.0, 7.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.78125, -8.5081787109375, -8.235107421875, -7.9620361328125, -7.68896484375, -7.4158935546875, -7.142822265625, -6.8697509765625, -6.5966796875, -6.3236083984375, -6.050537109375, -5.7774658203125, -5.50439453125, -5.2313232421875, -4.958251953125, -4.6851806640625, -4.412109375, -4.1390380859375, -3.865966796875, -3.5928955078125, -3.31982421875, -3.0467529296875, -2.773681640625, -2.5006103515625, -2.2275390625, -1.9544677734375, -1.681396484375, -1.4083251953125, -1.13525390625, -0.8621826171875, -0.589111328125, -0.3160400390625, -0.04296875, 0.2301025390625, 0.503173828125, 0.7762451171875, 1.04931640625, 1.3223876953125, 1.595458984375, 1.8685302734375, 2.1416015625, 2.4146728515625, 2.687744140625, 2.9608154296875, 3.23388671875, 3.5069580078125, 3.780029296875, 4.0531005859375, 4.326171875, 4.5992431640625, 4.872314453125, 5.1453857421875, 5.41845703125, 5.6915283203125, 5.964599609375, 6.2376708984375, 6.5107421875, 6.7838134765625, 7.056884765625, 7.3299560546875, 7.60302734375, 7.8760986328125, 8.149169921875, 8.4222412109375, 8.6953125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 8.0, 6.0, 11.0, 22.0, 18.0, 34.0, 42.0, 61.0, 102.0, 117.0, 155.0, 270.0, 326.0, 640.0, 1783.0, 13387.0, 230384.0, 2739852.0, 145673.0, 9721.0, 1411.0, 576.0, 327.0, 213.0, 140.0, 116.0, 83.0, 50.0, 52.0, 23.0, 20.0, 20.0, 12.0, 16.0, 10.0, 6.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.2265625, -12.7613525390625, -12.296142578125, -11.8309326171875, -11.36572265625, -10.9005126953125, -10.435302734375, -9.9700927734375, -9.5048828125, -9.0396728515625, -8.574462890625, -8.1092529296875, -7.64404296875, -7.1788330078125, -6.713623046875, -6.2484130859375, -5.783203125, -5.3179931640625, -4.852783203125, -4.3875732421875, -3.92236328125, -3.4571533203125, -2.991943359375, -2.5267333984375, -2.0615234375, -1.5963134765625, -1.131103515625, -0.6658935546875, -0.20068359375, 0.2645263671875, 0.729736328125, 1.1949462890625, 1.66015625, 2.1253662109375, 2.590576171875, 3.0557861328125, 3.52099609375, 3.9862060546875, 4.451416015625, 4.9166259765625, 5.3818359375, 5.8470458984375, 6.312255859375, 6.7774658203125, 7.24267578125, 7.7078857421875, 8.173095703125, 8.6383056640625, 9.103515625, 9.5687255859375, 10.033935546875, 10.4991455078125, 10.96435546875, 11.4295654296875, 11.894775390625, 12.3599853515625, 12.8251953125, 13.2904052734375, 13.755615234375, 14.2208251953125, 14.68603515625, 15.1512451171875, 15.616455078125, 16.0816650390625, 16.546875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 9.0, 43.0, 140.0, 314.0, 320.0, 149.0, 33.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.90700912475586, -22.191837310791016, -20.476667404174805, -18.76149559020996, -17.04632568359375, -15.331153869628906, -13.615982055664062, -11.900811195373535, -10.185640335083008, -8.47046947479248, -6.755298137664795, -5.040126800537109, -3.324955940246582, -1.6097850799560547, 0.10538673400878906, 1.8205575942993164, 3.5357284545898438, 5.250899314880371, 6.966070652008057, 8.681241989135742, 10.39641284942627, 12.111583709716797, 13.82675552368164, 15.541926383972168, 17.257097244262695, 18.97226905822754, 20.68743896484375, 22.402610778808594, 24.117782592773438, 25.83295249938965, 27.548124313354492, 29.263294219970703, 30.97846221923828, 32.693634033203125, 34.40880584716797, 36.12397766113281, 37.83914566040039, 39.554317474365234, 41.26948928833008, 42.98466110229492, 44.6998291015625, 46.415000915527344, 48.13017272949219, 49.84534454345703, 51.56051254272461, 53.27568435668945, 54.9908561706543, 56.70602798461914, 58.421199798583984, 60.13637161254883, 61.85154342651367, 63.56671142578125, 65.2818832397461, 66.99705505371094, 68.71222686767578, 70.42739868164062, 72.14257049560547, 73.85774230957031, 75.57291412353516, 77.2880859375, 79.00325775146484, 80.71842956542969, 82.43359375, 84.14876556396484, 85.86393737792969]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 6.0, 9.0, 7.0, 9.0, 15.0, 14.0, 11.0, 17.0, 15.0, 23.0, 16.0, 23.0, 31.0, 26.0, 34.0, 30.0, 33.0, 32.0, 37.0, 26.0, 40.0, 55.0, 52.0, 45.0, 37.0, 41.0, 33.0, 34.0, 35.0, 35.0, 21.0, 25.0, 16.0, 29.0, 18.0, 13.0, 12.0, 16.0, 7.0, 11.0, 2.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-23.315399169921875, -22.645105361938477, -21.974811553955078, -21.30451774597168, -20.63422393798828, -19.96392822265625, -19.29363441467285, -18.623340606689453, -17.953046798706055, -17.282752990722656, -16.612459182739258, -15.942164421081543, -15.271870613098145, -14.601576805114746, -13.931282043457031, -13.260988235473633, -12.590694427490234, -11.920400619506836, -11.250106811523438, -10.579812049865723, -9.909518241882324, -9.239224433898926, -8.568929672241211, -7.8986358642578125, -7.228342056274414, -6.558048248291016, -5.887753963470459, -5.217459678649902, -4.547165870666504, -3.8768718242645264, -3.206577777862549, -2.536283493041992, -1.8659896850585938, -1.1956956386566162, -0.5254015922546387, 0.14489245414733887, 0.8151865005493164, 1.485480546951294, 2.1557745933532715, 2.826068878173828, 3.4963626861572266, 4.166656494140625, 4.836950778961182, 5.507245063781738, 6.177538871765137, 6.847832679748535, 7.518126964569092, 8.188421249389648, 8.858715057373047, 9.529008865356445, 10.199302673339844, 10.869597434997559, 11.539891242980957, 12.210185050964355, 12.88047981262207, 13.550773620605469, 14.221067428588867, 14.891361236572266, 15.561655044555664, 16.231948852539062, 16.902244567871094, 17.572538375854492, 18.24283218383789, 18.91312599182129, 19.583419799804688]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 4.0, 2.0, 11.0, 8.0, 13.0, 15.0, 12.0, 12.0, 23.0, 22.0, 25.0, 25.0, 33.0, 33.0, 30.0, 39.0, 36.0, 40.0, 44.0, 44.0, 45.0, 47.0, 52.0, 44.0, 43.0, 32.0, 32.0, 33.0, 29.0, 20.0, 26.0, 18.0, 21.0, 16.0, 8.0, 11.0, 8.0, 13.0, 10.0, 4.0, 4.0, 3.0, 3.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.78515625, -3.66448974609375, -3.5438232421875, -3.42315673828125, -3.302490234375, -3.18182373046875, -3.0611572265625, -2.94049072265625, -2.81982421875, -2.69915771484375, -2.5784912109375, -2.45782470703125, -2.337158203125, -2.21649169921875, -2.0958251953125, -1.97515869140625, -1.8544921875, -1.73382568359375, -1.6131591796875, -1.49249267578125, -1.371826171875, -1.25115966796875, -1.1304931640625, -1.00982666015625, -0.88916015625, -0.76849365234375, -0.6478271484375, -0.52716064453125, -0.406494140625, -0.28582763671875, -0.1651611328125, -0.04449462890625, 0.076171875, 0.19683837890625, 0.3175048828125, 0.43817138671875, 0.558837890625, 0.67950439453125, 0.8001708984375, 0.92083740234375, 1.04150390625, 1.16217041015625, 1.2828369140625, 1.40350341796875, 1.524169921875, 1.64483642578125, 1.7655029296875, 1.88616943359375, 2.0068359375, 2.12750244140625, 2.2481689453125, 2.36883544921875, 2.489501953125, 2.61016845703125, 2.7308349609375, 2.85150146484375, 2.97216796875, 3.09283447265625, 3.2135009765625, 3.33416748046875, 3.454833984375, 3.57550048828125, 3.6961669921875, 3.81683349609375, 3.9375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 2.0, 4.0, 3.0, 7.0, 10.0, 10.0, 9.0, 21.0, 22.0, 14.0, 26.0, 40.0, 35.0, 62.0, 67.0, 97.0, 96.0, 168.0, 248.0, 302.0, 529.0, 4130.0, 2736048.0, 1447281.0, 3275.0, 538.0, 310.0, 233.0, 165.0, 112.0, 97.0, 58.0, 56.0, 41.0, 29.0, 31.0, 19.0, 10.0, 14.0, 17.0, 11.0, 3.0, 8.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-35.25, -34.2119140625, -33.173828125, -32.1357421875, -31.09765625, -30.0595703125, -29.021484375, -27.9833984375, -26.9453125, -25.9072265625, -24.869140625, -23.8310546875, -22.79296875, -21.7548828125, -20.716796875, -19.6787109375, -18.640625, -17.6025390625, -16.564453125, -15.5263671875, -14.48828125, -13.4501953125, -12.412109375, -11.3740234375, -10.3359375, -9.2978515625, -8.259765625, -7.2216796875, -6.18359375, -5.1455078125, -4.107421875, -3.0693359375, -2.03125, -0.9931640625, 0.044921875, 1.0830078125, 2.12109375, 3.1591796875, 4.197265625, 5.2353515625, 6.2734375, 7.3115234375, 8.349609375, 9.3876953125, 10.42578125, 11.4638671875, 12.501953125, 13.5400390625, 14.578125, 15.6162109375, 16.654296875, 17.6923828125, 18.73046875, 19.7685546875, 20.806640625, 21.8447265625, 22.8828125, 23.9208984375, 24.958984375, 25.9970703125, 27.03515625, 28.0732421875, 29.111328125, 30.1494140625, 31.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 6.0, 2.0, 4.0, 3.0, 4.0, 3.0, 6.0, 8.0, 5.0, 5.0, 15.0, 7.0, 11.0, 26.0, 37.0, 39.0, 39.0, 54.0, 94.0, 103.0, 119.0, 191.0, 263.0, 363.0, 452.0, 538.0, 410.0, 302.0, 233.0, 146.0, 121.0, 93.0, 87.0, 69.0, 44.0, 28.0, 24.0, 24.0, 26.0, 20.0, 6.0, 11.0, 10.0, 7.0, 6.0, 4.0, 7.0, 2.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-3.931640625, -3.782318115234375, -3.63299560546875, -3.483673095703125, -3.3343505859375, -3.185028076171875, -3.03570556640625, -2.886383056640625, -2.737060546875, -2.587738037109375, -2.43841552734375, -2.289093017578125, -2.1397705078125, -1.990447998046875, -1.84112548828125, -1.691802978515625, -1.54248046875, -1.393157958984375, -1.24383544921875, -1.094512939453125, -0.9451904296875, -0.795867919921875, -0.64654541015625, -0.497222900390625, -0.347900390625, -0.198577880859375, -0.04925537109375, 0.100067138671875, 0.2493896484375, 0.398712158203125, 0.54803466796875, 0.697357177734375, 0.8466796875, 0.996002197265625, 1.14532470703125, 1.294647216796875, 1.4439697265625, 1.593292236328125, 1.74261474609375, 1.891937255859375, 2.041259765625, 2.190582275390625, 2.33990478515625, 2.489227294921875, 2.6385498046875, 2.787872314453125, 2.93719482421875, 3.086517333984375, 3.23583984375, 3.385162353515625, 3.53448486328125, 3.683807373046875, 3.8331298828125, 3.982452392578125, 4.13177490234375, 4.281097412109375, 4.430419921875, 4.579742431640625, 4.72906494140625, 4.878387451171875, 5.0277099609375, 5.177032470703125, 5.32635498046875, 5.475677490234375, 5.625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 1.0, 7.0, 4.0, 7.0, 11.0, 15.0, 14.0, 26.0, 29.0, 42.0, 68.0, 115.0, 178.0, 444.0, 2117.0, 32434.0, 2608946.0, 1523379.0, 23728.0, 1852.0, 399.0, 174.0, 94.0, 54.0, 39.0, 28.0, 26.0, 16.0, 12.0, 11.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.421875, -19.739990234375, -19.05810546875, -18.376220703125, -17.6943359375, -17.012451171875, -16.33056640625, -15.648681640625, -14.966796875, -14.284912109375, -13.60302734375, -12.921142578125, -12.2392578125, -11.557373046875, -10.87548828125, -10.193603515625, -9.51171875, -8.829833984375, -8.14794921875, -7.466064453125, -6.7841796875, -6.102294921875, -5.42041015625, -4.738525390625, -4.056640625, -3.374755859375, -2.69287109375, -2.010986328125, -1.3291015625, -0.647216796875, 0.03466796875, 0.716552734375, 1.3984375, 2.080322265625, 2.76220703125, 3.444091796875, 4.1259765625, 4.807861328125, 5.48974609375, 6.171630859375, 6.853515625, 7.535400390625, 8.21728515625, 8.899169921875, 9.5810546875, 10.262939453125, 10.94482421875, 11.626708984375, 12.30859375, 12.990478515625, 13.67236328125, 14.354248046875, 15.0361328125, 15.718017578125, 16.39990234375, 17.081787109375, 17.763671875, 18.445556640625, 19.12744140625, 19.809326171875, 20.4912109375, 21.173095703125, 21.85498046875, 22.536865234375, 23.21875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 18.0, 58.0, 136.0, 264.0, 271.0, 156.0, 71.0, 27.0, 9.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.94752502441406, -79.23213958740234, -77.51675415039062, -75.80137634277344, -74.08599090576172, -72.37060546875, -70.65522003173828, -68.93983459472656, -67.22445678710938, -65.50907135009766, -63.7936897277832, -62.078304290771484, -60.36292266845703, -58.64753723144531, -56.932151794433594, -55.21677017211914, -53.50138473510742, -51.7859992980957, -50.07061767578125, -48.35523223876953, -46.63985061645508, -44.92446517944336, -43.209083557128906, -41.49369812011719, -39.77831268310547, -38.06292724609375, -36.3475456237793, -34.63216018676758, -32.916778564453125, -31.201393127441406, -29.48600959777832, -27.770626068115234, -26.055248260498047, -24.33986473083496, -22.624481201171875, -20.909095764160156, -19.193714141845703, -17.478328704833984, -15.762945175170898, -14.047561645507812, -12.332178115844727, -10.61679458618164, -8.901411056518555, -7.186026573181152, -5.470643043518066, -3.7552595138549805, -2.039875030517578, -0.3244915008544922, 1.3908920288085938, 3.106275796890259, 4.821659564971924, 6.537043571472168, 8.252427101135254, 9.96781063079834, 11.683195114135742, 13.398578643798828, 15.113962173461914, 16.829345703125, 18.544729232788086, 20.260112762451172, 21.97549819946289, 23.690879821777344, 25.406265258789062, 27.12164878845215, 28.837032318115234]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 1.0, 0.0, 3.0, 5.0, 6.0, 10.0, 11.0, 11.0, 13.0, 18.0, 12.0, 14.0, 19.0, 16.0, 16.0, 25.0, 25.0, 21.0, 39.0, 32.0, 30.0, 42.0, 36.0, 45.0, 31.0, 45.0, 31.0, 42.0, 39.0, 31.0, 39.0, 39.0, 28.0, 37.0, 18.0, 17.0, 25.0, 24.0, 15.0, 19.0, 19.0, 10.0, 9.0, 10.0, 7.0, 4.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.031299591064453, -17.490657806396484, -16.950016021728516, -16.409374237060547, -15.868732452392578, -15.32809066772461, -14.78744888305664, -14.246807098388672, -13.706165313720703, -13.165523529052734, -12.624881744384766, -12.084239959716797, -11.543598175048828, -11.00295639038086, -10.46231460571289, -9.921672821044922, -9.381031036376953, -8.840389251708984, -8.299747467041016, -7.759105682373047, -7.218463897705078, -6.677822113037109, -6.137180328369141, -5.596538543701172, -5.055896759033203, -4.515254974365234, -3.9746131896972656, -3.433971405029297, -2.893329620361328, -2.3526878356933594, -1.8120460510253906, -1.2714042663574219, -0.7307643890380859, -0.1901226043701172, 0.35051918029785156, 0.8911609649658203, 1.431802749633789, 1.9724445343017578, 2.5130863189697266, 3.0537281036376953, 3.594369888305664, 4.135011672973633, 4.675653457641602, 5.21629524230957, 5.756937026977539, 6.297578811645508, 6.838220596313477, 7.378862380981445, 7.919504165649414, 8.460145950317383, 9.000787734985352, 9.54142951965332, 10.082071304321289, 10.622713088989258, 11.163354873657227, 11.703996658325195, 12.244638442993164, 12.785280227661133, 13.325922012329102, 13.86656379699707, 14.407205581665039, 14.947847366333008, 15.488489151000977, 16.029130935668945, 16.569772720336914]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 11.0, 12.0, 19.0, 14.0, 25.0, 12.0, 22.0, 36.0, 34.0, 22.0, 33.0, 23.0, 29.0, 49.0, 41.0, 44.0, 49.0, 37.0, 56.0, 54.0, 39.0, 37.0, 39.0, 36.0, 23.0, 32.0, 18.0, 24.0, 12.0, 18.0, 17.0, 13.0, 10.0, 10.0, 12.0, 10.0, 2.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.85546875, -3.7384033203125, -3.621337890625, -3.5042724609375, -3.38720703125, -3.2701416015625, -3.153076171875, -3.0360107421875, -2.9189453125, -2.8018798828125, -2.684814453125, -2.5677490234375, -2.45068359375, -2.3336181640625, -2.216552734375, -2.0994873046875, -1.982421875, -1.8653564453125, -1.748291015625, -1.6312255859375, -1.51416015625, -1.3970947265625, -1.280029296875, -1.1629638671875, -1.0458984375, -0.9288330078125, -0.811767578125, -0.6947021484375, -0.57763671875, -0.4605712890625, -0.343505859375, -0.2264404296875, -0.109375, 0.0076904296875, 0.124755859375, 0.2418212890625, 0.35888671875, 0.4759521484375, 0.593017578125, 0.7100830078125, 0.8271484375, 0.9442138671875, 1.061279296875, 1.1783447265625, 1.29541015625, 1.4124755859375, 1.529541015625, 1.6466064453125, 1.763671875, 1.8807373046875, 1.997802734375, 2.1148681640625, 2.23193359375, 2.3489990234375, 2.466064453125, 2.5831298828125, 2.7001953125, 2.8172607421875, 2.934326171875, 3.0513916015625, 3.16845703125, 3.2855224609375, 3.402587890625, 3.5196533203125, 3.63671875]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 4.0, 6.0, 12.0, 4.0, 6.0, 19.0, 30.0, 48.0, 51.0, 78.0, 100.0, 168.0, 234.0, 403.0, 584.0, 948.0, 1427.0, 2299.0, 3846.0, 6215.0, 10024.0, 16886.0, 27853.0, 45251.0, 73542.0, 115444.0, 167392.0, 187164.0, 142700.0, 94426.0, 58532.0, 35894.0, 22062.0, 13396.0, 8205.0, 4930.0, 3104.0, 1880.0, 1180.0, 799.0, 483.0, 305.0, 198.0, 143.0, 96.0, 67.0, 42.0, 30.0, 15.0, 14.0, 9.0, 6.0, 3.0, 5.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3115234375, -0.30123138427734375, -0.2909393310546875, -0.28064727783203125, -0.270355224609375, -0.26006317138671875, -0.2497711181640625, -0.23947906494140625, -0.22918701171875, -0.21889495849609375, -0.2086029052734375, -0.19831085205078125, -0.188018798828125, -0.17772674560546875, -0.1674346923828125, -0.15714263916015625, -0.1468505859375, -0.13655853271484375, -0.1262664794921875, -0.11597442626953125, -0.105682373046875, -0.09539031982421875, -0.0850982666015625, -0.07480621337890625, -0.06451416015625, -0.05422210693359375, -0.0439300537109375, -0.03363800048828125, -0.023345947265625, -0.01305389404296875, -0.0027618408203125, 0.00753021240234375, 0.017822265625, 0.02811431884765625, 0.0384063720703125, 0.04869842529296875, 0.058990478515625, 0.06928253173828125, 0.0795745849609375, 0.08986663818359375, 0.10015869140625, 0.11045074462890625, 0.1207427978515625, 0.13103485107421875, 0.141326904296875, 0.15161895751953125, 0.1619110107421875, 0.17220306396484375, 0.1824951171875, 0.19278717041015625, 0.2030792236328125, 0.21337127685546875, 0.223663330078125, 0.23395538330078125, 0.2442474365234375, 0.25453948974609375, 0.26483154296875, 0.27512359619140625, 0.2854156494140625, 0.29570770263671875, 0.305999755859375, 0.31629180908203125, 0.3265838623046875, 0.33687591552734375, 0.34716796875]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 4.0, 4.0, 3.0, 9.0, 11.0, 11.0, 5.0, 16.0, 14.0, 21.0, 20.0, 21.0, 28.0, 33.0, 28.0, 41.0, 32.0, 43.0, 43.0, 44.0, 47.0, 1073.0, 35.0, 39.0, 51.0, 42.0, 36.0, 40.0, 31.0, 30.0, 36.0, 23.0, 11.0, 20.0, 20.0, 12.0, 7.0, 9.0, 8.0, 11.0, 5.0, 6.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.427734375, -2.342987060546875, -2.25823974609375, -2.173492431640625, -2.0887451171875, -2.003997802734375, -1.91925048828125, -1.834503173828125, -1.749755859375, -1.665008544921875, -1.58026123046875, -1.495513916015625, -1.4107666015625, -1.326019287109375, -1.24127197265625, -1.156524658203125, -1.07177734375, -0.987030029296875, -0.90228271484375, -0.817535400390625, -0.7327880859375, -0.648040771484375, -0.56329345703125, -0.478546142578125, -0.393798828125, -0.309051513671875, -0.22430419921875, -0.139556884765625, -0.0548095703125, 0.029937744140625, 0.11468505859375, 0.199432373046875, 0.2841796875, 0.368927001953125, 0.45367431640625, 0.538421630859375, 0.6231689453125, 0.707916259765625, 0.79266357421875, 0.877410888671875, 0.962158203125, 1.046905517578125, 1.13165283203125, 1.216400146484375, 1.3011474609375, 1.385894775390625, 1.47064208984375, 1.555389404296875, 1.64013671875, 1.724884033203125, 1.80963134765625, 1.894378662109375, 1.9791259765625, 2.063873291015625, 2.14862060546875, 2.233367919921875, 2.318115234375, 2.402862548828125, 2.48760986328125, 2.572357177734375, 2.6571044921875, 2.741851806640625, 2.82659912109375, 2.911346435546875, 2.99609375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 2.0, 7.0, 6.0, 11.0, 9.0, 19.0, 34.0, 44.0, 63.0, 85.0, 123.0, 186.0, 299.0, 438.0, 648.0, 945.0, 1387.0, 2154.0, 3258.0, 4867.0, 7402.0, 11228.0, 17220.0, 26360.0, 40104.0, 60871.0, 89774.0, 125391.0, 1119751.0, 225449.0, 116296.0, 81747.0, 55138.0, 36251.0, 23692.0, 15679.0, 10179.0, 6656.0, 4397.0, 2943.0, 2014.0, 1296.0, 903.0, 652.0, 386.0, 230.0, 180.0, 125.0, 74.0, 58.0, 36.0, 26.0, 17.0, 15.0, 8.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.149658203125, -0.14464950561523438, -0.13964080810546875, -0.13463211059570312, -0.1296234130859375, -0.12461471557617188, -0.11960601806640625, -0.11459732055664062, -0.109588623046875, -0.10457992553710938, -0.09957122802734375, -0.09456253051757812, -0.0895538330078125, -0.08454513549804688, -0.07953643798828125, -0.07452774047851562, -0.06951904296875, -0.06451034545898438, -0.05950164794921875, -0.054492950439453125, -0.0494842529296875, -0.044475555419921875, -0.03946685791015625, -0.034458160400390625, -0.029449462890625, -0.024440765380859375, -0.01943206787109375, -0.014423370361328125, -0.0094146728515625, -0.004405975341796875, 0.00060272216796875, 0.005611419677734375, 0.0106201171875, 0.015628814697265625, 0.02063751220703125, 0.025646209716796875, 0.0306549072265625, 0.035663604736328125, 0.04067230224609375, 0.045680999755859375, 0.050689697265625, 0.055698394775390625, 0.06070709228515625, 0.06571578979492188, 0.0707244873046875, 0.07573318481445312, 0.08074188232421875, 0.08575057983398438, 0.09075927734375, 0.09576797485351562, 0.10077667236328125, 0.10578536987304688, 0.1107940673828125, 0.11580276489257812, 0.12081146240234375, 0.12582015991210938, 0.130828857421875, 0.13583755493164062, 0.14084625244140625, 0.14585494995117188, 0.1508636474609375, 0.15587234497070312, 0.16088104248046875, 0.16588973999023438, 0.1708984375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 3.0, 4.0, 3.0, 7.0, 9.0, 7.0, 11.0, 14.0, 13.0, 27.0, 28.0, 32.0, 32.0, 51.0, 105.0, 124.0, 142.0, 108.0, 68.0, 29.0, 38.0, 24.0, 26.0, 21.0, 17.0, 12.0, 11.0, 10.0, 6.0, 7.0, 2.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00962066650390625, -0.009277701377868652, -0.008934736251831055, -0.008591771125793457, -0.00824880599975586, -0.007905840873718262, -0.007562875747680664, -0.007219910621643066, -0.006876945495605469, -0.006533980369567871, -0.0061910152435302734, -0.005848050117492676, -0.005505084991455078, -0.0051621198654174805, -0.004819154739379883, -0.004476189613342285, -0.0041332244873046875, -0.00379025936126709, -0.003447294235229492, -0.0031043291091918945, -0.002761363983154297, -0.0024183988571166992, -0.0020754337310791016, -0.001732468605041504, -0.0013895034790039062, -0.0010465383529663086, -0.0007035732269287109, -0.0003606081008911133, -1.7642974853515625e-05, 0.00032532215118408203, 0.0006682872772216797, 0.0010112524032592773, 0.001354217529296875, 0.0016971826553344727, 0.0020401477813720703, 0.002383112907409668, 0.0027260780334472656, 0.0030690431594848633, 0.003412008285522461, 0.0037549734115600586, 0.004097938537597656, 0.004440903663635254, 0.0047838687896728516, 0.005126833915710449, 0.005469799041748047, 0.0058127641677856445, 0.006155729293823242, 0.00649869441986084, 0.0068416595458984375, 0.007184624671936035, 0.007527589797973633, 0.00787055492401123, 0.008213520050048828, 0.008556485176086426, 0.008899450302124023, 0.009242415428161621, 0.009585380554199219, 0.009928345680236816, 0.010271310806274414, 0.010614275932312012, 0.01095724105834961, 0.011300206184387207, 0.011643171310424805, 0.011986136436462402, 0.0123291015625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 6.0, 6.0, 5.0, 9.0, 11.0, 13.0, 22.0, 29.0, 31.0, 54.0, 58.0, 91.0, 121.0, 209.0, 506.0, 2305.0, 801448.0, 240823.0, 1773.0, 404.0, 206.0, 128.0, 78.0, 60.0, 35.0, 26.0, 29.0, 12.0, 16.0, 11.0, 10.0, 6.0, 3.0, 4.0, 6.0, 6.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2308349609375, -0.2244129180908203, -0.21799087524414062, -0.21156883239746094, -0.20514678955078125, -0.19872474670410156, -0.19230270385742188, -0.1858806610107422, -0.1794586181640625, -0.1730365753173828, -0.16661453247070312, -0.16019248962402344, -0.15377044677734375, -0.14734840393066406, -0.14092636108398438, -0.1345043182373047, -0.128082275390625, -0.12166023254394531, -0.11523818969726562, -0.10881614685058594, -0.10239410400390625, -0.09597206115722656, -0.08955001831054688, -0.08312797546386719, -0.0767059326171875, -0.07028388977050781, -0.06386184692382812, -0.05743980407714844, -0.05101776123046875, -0.04459571838378906, -0.038173675537109375, -0.03175163269042969, -0.02532958984375, -0.018907546997070312, -0.012485504150390625, -0.0060634613037109375, 0.00035858154296875, 0.0067806243896484375, 0.013202667236328125, 0.019624710083007812, 0.0260467529296875, 0.03246879577636719, 0.038890838623046875, 0.04531288146972656, 0.05173492431640625, 0.05815696716308594, 0.06457901000976562, 0.07100105285644531, 0.077423095703125, 0.08384513854980469, 0.09026718139648438, 0.09668922424316406, 0.10311126708984375, 0.10953330993652344, 0.11595535278320312, 0.12237739562988281, 0.1287994384765625, 0.1352214813232422, 0.14164352416992188, 0.14806556701660156, 0.15448760986328125, 0.16090965270996094, 0.16733169555664062, 0.1737537384033203, 0.18017578125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 19.0, 41.0, 130.0, 438.0, 285.0, 57.0, 23.0, 9.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0812457874417305, -0.07951188832521439, -0.07777798920869827, -0.07604409009218216, -0.07431019097566605, -0.07257628440856934, -0.07084238529205322, -0.06910848617553711, -0.067374587059021, -0.06564068794250488, -0.06390678882598877, -0.06217288598418236, -0.060438986867666245, -0.05870508775115013, -0.05697118863463402, -0.055237285792827606, -0.05350338667631149, -0.05176948755979538, -0.050035588443279266, -0.048301685601472855, -0.04656778648495674, -0.04483388736844063, -0.043099988251924515, -0.0413660854101181, -0.03963219001889229, -0.037898290902376175, -0.03616439178586006, -0.03443048894405365, -0.03269658982753754, -0.030962690711021423, -0.02922879159450531, -0.027494890615344048, -0.025760989636182785, -0.024027090519666672, -0.02229318954050541, -0.020559290423989296, -0.018825389444828033, -0.01709149032831192, -0.015357590280473232, -0.013623690232634544, -0.011889790184795856, -0.010155890136957169, -0.00842199008911848, -0.00668809050694108, -0.004954190459102392, -0.0032202908769249916, -0.0014863908290863037, 0.0002475092187523842, 0.001981409266591072, 0.00371530931442976, 0.005449209362268448, 0.0071831089444458485, 0.008917009457945824, 0.010650908574461937, 0.012384808622300625, 0.014118708670139313, 0.015852607786655426, 0.01758650690317154, 0.019320407882332802, 0.021054306998848915, 0.022788207978010178, 0.02452210709452629, 0.026256006211042404, 0.027989907190203667, 0.02972380816936493]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 8.0, 3.0, 7.0, 13.0, 14.0, 20.0, 9.0, 17.0, 13.0, 28.0, 24.0, 23.0, 28.0, 27.0, 34.0, 47.0, 39.0, 45.0, 28.0, 40.0, 38.0, 27.0, 39.0, 32.0, 41.0, 33.0, 39.0, 29.0, 34.0, 24.0, 23.0, 17.0, 23.0, 20.0, 11.0, 23.0, 12.0, 10.0, 10.0, 7.0, 11.0, 7.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.010236263275146484, -0.009880892932415009, -0.009525522589683533, -0.009170152246952057, -0.008814781904220581, -0.008459411561489105, -0.00810404121875763, -0.0077486708760261536, -0.007393300533294678, -0.007037930190563202, -0.006682559847831726, -0.00632718950510025, -0.005971819162368774, -0.005616448819637299, -0.005261078476905823, -0.004905708134174347, -0.004550337791442871, -0.004194967448711395, -0.0038395971059799194, -0.0034842267632484436, -0.0031288564205169678, -0.002773486077785492, -0.002418115735054016, -0.0020627453923225403, -0.0017073750495910645, -0.0013520047068595886, -0.0009966343641281128, -0.000641264021396637, -0.00028589367866516113, 6.94766640663147e-05, 0.00042484700679779053, 0.0007802173495292664, 0.0011355876922607422, 0.001490958034992218, 0.0018463283777236938, 0.0022016987204551697, 0.0025570690631866455, 0.0029124394059181213, 0.003267809748649597, 0.003623180091381073, 0.003978550434112549, 0.004333920776844025, 0.0046892911195755005, 0.005044661462306976, 0.005400031805038452, 0.005755402147769928, 0.006110772490501404, 0.00646614283323288, 0.0068215131759643555, 0.007176883518695831, 0.007532253861427307, 0.007887624204158783, 0.008242994546890259, 0.008598364889621735, 0.00895373523235321, 0.009309105575084686, 0.009664475917816162, 0.010019846260547638, 0.010375216603279114, 0.01073058694601059, 0.011085957288742065, 0.011441327631473541, 0.011796697974205017, 0.012152068316936493, 0.012507438659667969]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 3.0, 3.0, 7.0, 6.0, 11.0, 12.0, 19.0, 14.0, 25.0, 12.0, 22.0, 36.0, 33.0, 24.0, 32.0, 23.0, 29.0, 49.0, 42.0, 43.0, 48.0, 38.0, 56.0, 54.0, 38.0, 38.0, 39.0, 36.0, 22.0, 33.0, 18.0, 24.0, 12.0, 18.0, 17.0, 13.0, 10.0, 10.0, 13.0, 9.0, 2.0, 4.0, 3.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.85546875, -3.7384033203125, -3.621337890625, -3.5042724609375, -3.38720703125, -3.2701416015625, -3.153076171875, -3.0360107421875, -2.9189453125, -2.8018798828125, -2.684814453125, -2.5677490234375, -2.45068359375, -2.3336181640625, -2.216552734375, -2.0994873046875, -1.982421875, -1.8653564453125, -1.748291015625, -1.6312255859375, -1.51416015625, -1.3970947265625, -1.280029296875, -1.1629638671875, -1.0458984375, -0.9288330078125, -0.811767578125, -0.6947021484375, -0.57763671875, -0.4605712890625, -0.343505859375, -0.2264404296875, -0.109375, 0.0076904296875, 0.124755859375, 0.2418212890625, 0.35888671875, 0.4759521484375, 0.593017578125, 0.7100830078125, 0.8271484375, 0.9442138671875, 1.061279296875, 1.1783447265625, 1.29541015625, 1.4124755859375, 1.529541015625, 1.6466064453125, 1.763671875, 1.8807373046875, 1.997802734375, 2.1148681640625, 2.23193359375, 2.3489990234375, 2.466064453125, 2.5831298828125, 2.7001953125, 2.8172607421875, 2.934326171875, 3.0513916015625, 3.16845703125, 3.2855224609375, 3.402587890625, 3.5196533203125, 3.63671875]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 10.0, 7.0, 10.0, 15.0, 12.0, 22.0, 34.0, 49.0, 76.0, 89.0, 122.0, 149.0, 218.0, 298.0, 407.0, 580.0, 841.0, 1464.0, 3168.0, 9210.0, 30911.0, 101406.0, 303187.0, 387527.0, 142034.0, 44494.0, 12966.0, 4169.0, 1803.0, 957.0, 674.0, 457.0, 303.0, 237.0, 171.0, 130.0, 94.0, 63.0, 53.0, 43.0, 27.0, 22.0, 14.0, 9.0, 8.0, 6.0, 2.0, 4.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.93359375, -6.72442626953125, -6.5152587890625, -6.30609130859375, -6.096923828125, -5.88775634765625, -5.6785888671875, -5.46942138671875, -5.26025390625, -5.05108642578125, -4.8419189453125, -4.63275146484375, -4.423583984375, -4.21441650390625, -4.0052490234375, -3.79608154296875, -3.5869140625, -3.37774658203125, -3.1685791015625, -2.95941162109375, -2.750244140625, -2.54107666015625, -2.3319091796875, -2.12274169921875, -1.91357421875, -1.70440673828125, -1.4952392578125, -1.28607177734375, -1.076904296875, -0.86773681640625, -0.6585693359375, -0.44940185546875, -0.240234375, -0.03106689453125, 0.1781005859375, 0.38726806640625, 0.596435546875, 0.80560302734375, 1.0147705078125, 1.22393798828125, 1.43310546875, 1.64227294921875, 1.8514404296875, 2.06060791015625, 2.269775390625, 2.47894287109375, 2.6881103515625, 2.89727783203125, 3.1064453125, 3.31561279296875, 3.5247802734375, 3.73394775390625, 3.943115234375, 4.15228271484375, 4.3614501953125, 4.57061767578125, 4.77978515625, 4.98895263671875, 5.1981201171875, 5.40728759765625, 5.616455078125, 5.82562255859375, 6.0347900390625, 6.24395751953125, 6.453125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 1.0, 5.0, 6.0, 6.0, 5.0, 11.0, 6.0, 13.0, 10.0, 19.0, 16.0, 20.0, 25.0, 37.0, 41.0, 48.0, 46.0, 64.0, 88.0, 126.0, 176.0, 1362.0, 232.0, 158.0, 97.0, 69.0, 71.0, 42.0, 44.0, 29.0, 35.0, 18.0, 20.0, 15.0, 23.0, 12.0, 10.0, 16.0, 10.0, 8.0, 2.0, 5.0, 2.0, 0.0, 4.0, 3.0, 0.0, 2.0, 2.0], "bins": [-10.46875, -10.18359375, -9.8984375, -9.61328125, -9.328125, -9.04296875, -8.7578125, -8.47265625, -8.1875, -7.90234375, -7.6171875, -7.33203125, -7.046875, -6.76171875, -6.4765625, -6.19140625, -5.90625, -5.62109375, -5.3359375, -5.05078125, -4.765625, -4.48046875, -4.1953125, -3.91015625, -3.625, -3.33984375, -3.0546875, -2.76953125, -2.484375, -2.19921875, -1.9140625, -1.62890625, -1.34375, -1.05859375, -0.7734375, -0.48828125, -0.203125, 0.08203125, 0.3671875, 0.65234375, 0.9375, 1.22265625, 1.5078125, 1.79296875, 2.078125, 2.36328125, 2.6484375, 2.93359375, 3.21875, 3.50390625, 3.7890625, 4.07421875, 4.359375, 4.64453125, 4.9296875, 5.21484375, 5.5, 5.78515625, 6.0703125, 6.35546875, 6.640625, 6.92578125, 7.2109375, 7.49609375, 7.78125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 6.0, 8.0, 12.0, 17.0, 16.0, 17.0, 26.0, 34.0, 38.0, 79.0, 113.0, 189.0, 270.0, 522.0, 967.0, 2363.0, 729239.0, 2406602.0, 2692.0, 1053.0, 565.0, 335.0, 166.0, 104.0, 76.0, 54.0, 38.0, 19.0, 20.0, 19.0, 14.0, 12.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.46875, -35.3310546875, -34.193359375, -33.0556640625, -31.91796875, -30.7802734375, -29.642578125, -28.5048828125, -27.3671875, -26.2294921875, -25.091796875, -23.9541015625, -22.81640625, -21.6787109375, -20.541015625, -19.4033203125, -18.265625, -17.1279296875, -15.990234375, -14.8525390625, -13.71484375, -12.5771484375, -11.439453125, -10.3017578125, -9.1640625, -8.0263671875, -6.888671875, -5.7509765625, -4.61328125, -3.4755859375, -2.337890625, -1.2001953125, -0.0625, 1.0751953125, 2.212890625, 3.3505859375, 4.48828125, 5.6259765625, 6.763671875, 7.9013671875, 9.0390625, 10.1767578125, 11.314453125, 12.4521484375, 13.58984375, 14.7275390625, 15.865234375, 17.0029296875, 18.140625, 19.2783203125, 20.416015625, 21.5537109375, 22.69140625, 23.8291015625, 24.966796875, 26.1044921875, 27.2421875, 28.3798828125, 29.517578125, 30.6552734375, 31.79296875, 32.9306640625, 34.068359375, 35.2060546875, 36.34375]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 8.0, 40.0, 56.0, 105.0, 169.0, 192.0, 168.0, 114.0, 81.0, 44.0, 15.0, 7.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.95806884765625, -33.95637512207031, -32.954681396484375, -31.95298957824707, -30.951295852661133, -29.949602127075195, -28.94791030883789, -27.946216583251953, -26.944522857666016, -25.942829132080078, -24.94113540649414, -23.939443588256836, -22.9377498626709, -21.93605613708496, -20.934364318847656, -19.93267059326172, -18.93097686767578, -17.929283142089844, -16.927589416503906, -15.925897598266602, -14.924203872680664, -13.922510147094727, -12.920817375183105, -11.919124603271484, -10.917430877685547, -9.91573715209961, -8.914044380187988, -7.912351131439209, -6.91065788269043, -5.90896463394165, -4.907271385192871, -3.905578136444092, -2.903881072998047, -1.9021878242492676, -0.9004945755004883, 0.10119867324829102, 1.1028919219970703, 2.1045851707458496, 3.106278419494629, 4.107971668243408, 5.1096649169921875, 6.111358165740967, 7.113051414489746, 8.114744186401367, 9.116437911987305, 10.118131637573242, 11.119824409484863, 12.121517181396484, 13.123210906982422, 14.12490463256836, 15.12659740447998, 16.1282901763916, 17.12998390197754, 18.131677627563477, 19.13336944580078, 20.13506317138672, 21.136756896972656, 22.138450622558594, 23.14014434814453, 24.141836166381836, 25.143529891967773, 26.14522361755371, 27.146915435791016, 28.148609161376953, 29.15030288696289]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 8.0, 5.0, 10.0, 18.0, 18.0, 15.0, 19.0, 21.0, 24.0, 27.0, 28.0, 37.0, 30.0, 42.0, 39.0, 36.0, 46.0, 40.0, 50.0, 45.0, 55.0, 39.0, 44.0, 43.0, 39.0, 18.0, 25.0, 23.0, 30.0, 21.0, 15.0, 24.0, 15.0, 13.0, 9.0, 9.0, 8.0, 3.0, 0.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.071399688720703, -26.234182357788086, -25.39696502685547, -24.559749603271484, -23.722532272338867, -22.88531494140625, -22.048097610473633, -21.210880279541016, -20.37366485595703, -19.536447525024414, -18.699230194091797, -17.862014770507812, -17.024797439575195, -16.187580108642578, -15.350362777709961, -14.513145446777344, -13.675928115844727, -12.83871078491211, -12.001494407653809, -11.164277076721191, -10.32706069946289, -9.489843368530273, -8.652626037597656, -7.815409183502197, -6.978192329406738, -6.140975475311279, -5.30375862121582, -4.466541290283203, -3.629324436187744, -2.792107582092285, -1.954890251159668, -1.117673397064209, -0.2804584503173828, 0.5567585229873657, 1.3939754962921143, 2.2311925888061523, 3.0684094429016113, 3.9056262969970703, 4.7428436279296875, 5.5800604820251465, 6.4172773361206055, 7.2544941902160645, 8.091711044311523, 8.92892837524414, 9.766145706176758, 10.603362083435059, 11.440579414367676, 12.277795791625977, 13.115013122558594, 13.952230453491211, 14.789446830749512, 15.626664161682129, 16.46388053894043, 17.301097869873047, 18.138315200805664, 18.97553253173828, 19.812747955322266, 20.649965286254883, 21.4871826171875, 22.324398040771484, 23.1616153717041, 23.99883270263672, 24.836050033569336, 25.673267364501953, 26.51048469543457]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 3.0, 2.0, 7.0, 6.0, 3.0, 6.0, 17.0, 20.0, 17.0, 25.0, 29.0, 17.0, 36.0, 23.0, 30.0, 31.0, 28.0, 51.0, 41.0, 45.0, 52.0, 49.0, 53.0, 36.0, 46.0, 42.0, 45.0, 32.0, 27.0, 32.0, 20.0, 24.0, 11.0, 22.0, 14.0, 8.0, 12.0, 11.0, 6.0, 8.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.96875, -3.84466552734375, -3.7205810546875, -3.59649658203125, -3.472412109375, -3.34832763671875, -3.2242431640625, -3.10015869140625, -2.97607421875, -2.85198974609375, -2.7279052734375, -2.60382080078125, -2.479736328125, -2.35565185546875, -2.2315673828125, -2.10748291015625, -1.9833984375, -1.85931396484375, -1.7352294921875, -1.61114501953125, -1.487060546875, -1.36297607421875, -1.2388916015625, -1.11480712890625, -0.99072265625, -0.86663818359375, -0.7425537109375, -0.61846923828125, -0.494384765625, -0.37030029296875, -0.2462158203125, -0.12213134765625, 0.001953125, 0.12603759765625, 0.2501220703125, 0.37420654296875, 0.498291015625, 0.62237548828125, 0.7464599609375, 0.87054443359375, 0.99462890625, 1.11871337890625, 1.2427978515625, 1.36688232421875, 1.490966796875, 1.61505126953125, 1.7391357421875, 1.86322021484375, 1.9873046875, 2.11138916015625, 2.2354736328125, 2.35955810546875, 2.483642578125, 2.60772705078125, 2.7318115234375, 2.85589599609375, 2.97998046875, 3.10406494140625, 3.2281494140625, 3.35223388671875, 3.476318359375, 3.60040283203125, 3.7244873046875, 3.84857177734375, 3.97265625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 0.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 5.0, 5.0, 12.0, 7.0, 21.0, 33.0, 33.0, 67.0, 80.0, 126.0, 202.0, 319.0, 573.0, 964.0, 1782.0, 3594.0, 8071.0, 22455.0, 85788.0, 415161.0, 1556559.0, 1558931.0, 415228.0, 85900.0, 22437.0, 8124.0, 3580.0, 1750.0, 949.0, 542.0, 327.0, 225.0, 142.0, 73.0, 62.0, 47.0, 35.0, 22.0, 15.0, 7.0, 6.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-5.60546875, -5.43560791015625, -5.2657470703125, -5.09588623046875, -4.926025390625, -4.75616455078125, -4.5863037109375, -4.41644287109375, -4.24658203125, -4.07672119140625, -3.9068603515625, -3.73699951171875, -3.567138671875, -3.39727783203125, -3.2274169921875, -3.05755615234375, -2.8876953125, -2.71783447265625, -2.5479736328125, -2.37811279296875, -2.208251953125, -2.03839111328125, -1.8685302734375, -1.69866943359375, -1.52880859375, -1.35894775390625, -1.1890869140625, -1.01922607421875, -0.849365234375, -0.67950439453125, -0.5096435546875, -0.33978271484375, -0.169921875, -6.103515625e-05, 0.1697998046875, 0.33966064453125, 0.509521484375, 0.67938232421875, 0.8492431640625, 1.01910400390625, 1.18896484375, 1.35882568359375, 1.5286865234375, 1.69854736328125, 1.868408203125, 2.03826904296875, 2.2081298828125, 2.37799072265625, 2.5478515625, 2.71771240234375, 2.8875732421875, 3.05743408203125, 3.227294921875, 3.39715576171875, 3.5670166015625, 3.73687744140625, 3.90673828125, 4.07659912109375, 4.2464599609375, 4.41632080078125, 4.586181640625, 4.75604248046875, 4.9259033203125, 5.09576416015625, 5.265625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 6.0, 11.0, 7.0, 17.0, 21.0, 39.0, 60.0, 54.0, 76.0, 87.0, 121.0, 164.0, 236.0, 313.0, 431.0, 518.0, 461.0, 361.0, 263.0, 206.0, 151.0, 97.0, 86.0, 54.0, 61.0, 38.0, 33.0, 26.0, 18.0, 12.0, 11.0, 11.0, 9.0, 4.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0, -4.8126220703125, -4.625244140625, -4.4378662109375, -4.25048828125, -4.0631103515625, -3.875732421875, -3.6883544921875, -3.5009765625, -3.3135986328125, -3.126220703125, -2.9388427734375, -2.75146484375, -2.5640869140625, -2.376708984375, -2.1893310546875, -2.001953125, -1.8145751953125, -1.627197265625, -1.4398193359375, -1.25244140625, -1.0650634765625, -0.877685546875, -0.6903076171875, -0.5029296875, -0.3155517578125, -0.128173828125, 0.0592041015625, 0.24658203125, 0.4339599609375, 0.621337890625, 0.8087158203125, 0.99609375, 1.1834716796875, 1.370849609375, 1.5582275390625, 1.74560546875, 1.9329833984375, 2.120361328125, 2.3077392578125, 2.4951171875, 2.6824951171875, 2.869873046875, 3.0572509765625, 3.24462890625, 3.4320068359375, 3.619384765625, 3.8067626953125, 3.994140625, 4.1815185546875, 4.368896484375, 4.5562744140625, 4.74365234375, 4.9310302734375, 5.118408203125, 5.3057861328125, 5.4931640625, 5.6805419921875, 5.867919921875, 6.0552978515625, 6.24267578125, 6.4300537109375, 6.617431640625, 6.8048095703125, 6.9921875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 3.0, 12.0, 14.0, 28.0, 35.0, 36.0, 79.0, 99.0, 155.0, 259.0, 377.0, 717.0, 1699.0, 5535.0, 34207.0, 329630.0, 2969072.0, 766827.0, 71165.0, 9766.0, 2494.0, 877.0, 460.0, 266.0, 151.0, 110.0, 70.0, 37.0, 32.0, 22.0, 11.0, 13.0, 9.0, 2.0, 5.0, 4.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.578125, -12.26104736328125, -11.9439697265625, -11.62689208984375, -11.309814453125, -10.99273681640625, -10.6756591796875, -10.35858154296875, -10.04150390625, -9.72442626953125, -9.4073486328125, -9.09027099609375, -8.773193359375, -8.45611572265625, -8.1390380859375, -7.82196044921875, -7.5048828125, -7.18780517578125, -6.8707275390625, -6.55364990234375, -6.236572265625, -5.91949462890625, -5.6024169921875, -5.28533935546875, -4.96826171875, -4.65118408203125, -4.3341064453125, -4.01702880859375, -3.699951171875, -3.38287353515625, -3.0657958984375, -2.74871826171875, -2.431640625, -2.11456298828125, -1.7974853515625, -1.48040771484375, -1.163330078125, -0.84625244140625, -0.5291748046875, -0.21209716796875, 0.10498046875, 0.42205810546875, 0.7391357421875, 1.05621337890625, 1.373291015625, 1.69036865234375, 2.0074462890625, 2.32452392578125, 2.6416015625, 2.95867919921875, 3.2757568359375, 3.59283447265625, 3.909912109375, 4.22698974609375, 4.5440673828125, 4.86114501953125, 5.17822265625, 5.49530029296875, 5.8123779296875, 6.12945556640625, 6.446533203125, 6.76361083984375, 7.0806884765625, 7.39776611328125, 7.71484375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 55.0, 286.0, 476.0, 155.0, 33.0, 5.0], "bins": [-199.4805450439453, -196.17225646972656, -192.8639678955078, -189.5556640625, -186.24737548828125, -182.9390869140625, -179.63079833984375, -176.322509765625, -173.0142059326172, -169.70591735839844, -166.3976287841797, -163.08932495117188, -159.78103637695312, -156.47274780273438, -153.16445922851562, -149.85617065429688, -146.54788208007812, -143.23959350585938, -139.93130493164062, -136.6230010986328, -133.31471252441406, -130.0064239501953, -126.69813537597656, -123.38983917236328, -120.08154296875, -116.77325439453125, -113.46495819091797, -110.15666961669922, -106.84837341308594, -103.54008483886719, -100.23179626464844, -96.92350006103516, -93.61520385742188, -90.30691528320312, -86.99861907958984, -83.6903305053711, -80.38203430175781, -77.07374572753906, -73.76545715332031, -70.45716094970703, -67.14886474609375, -63.840572357177734, -60.53227996826172, -57.22399139404297, -53.91569519042969, -50.60740661621094, -47.29911422729492, -43.990821838378906, -40.68252944946289, -37.374237060546875, -34.06594467163086, -30.757654190063477, -27.44936180114746, -24.141069412231445, -20.832778930664062, -17.524486541748047, -14.216195106506348, -10.907903671264648, -7.599611282348633, -4.291319847106934, -0.983027458190918, 2.3252649307250977, 5.6335554122924805, 8.941847801208496, 12.250140190124512]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 4.0, 9.0, 4.0, 5.0, 8.0, 15.0, 11.0, 14.0, 22.0, 14.0, 32.0, 15.0, 30.0, 27.0, 31.0, 32.0, 42.0, 35.0, 37.0, 50.0, 41.0, 47.0, 39.0, 52.0, 35.0, 45.0, 36.0, 28.0, 28.0, 42.0, 29.0, 29.0, 16.0, 16.0, 22.0, 11.0, 11.0, 12.0, 7.0, 7.0, 8.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-23.61215591430664, -22.91864776611328, -22.225139617919922, -21.531631469726562, -20.838123321533203, -20.14461326599121, -19.45110511779785, -18.757596969604492, -18.064088821411133, -17.370580673217773, -16.677072525024414, -15.983563423156738, -15.290055274963379, -14.59654712677002, -13.903038024902344, -13.209529876708984, -12.516021728515625, -11.822513580322266, -11.129005432128906, -10.43549633026123, -9.741988182067871, -9.048480033874512, -8.354970932006836, -7.661462783813477, -6.967954635620117, -6.274446487426758, -5.58093786239624, -4.887429237365723, -4.193921089172363, -3.500412702560425, -2.8069043159484863, -2.1133956909179688, -1.4198875427246094, -0.7263791561126709, -0.03287076950073242, 0.660637617111206, 1.3541460037231445, 2.047654390335083, 2.7411627769470215, 3.434671401977539, 4.128179550170898, 4.821687698364258, 5.515196323394775, 6.208704948425293, 6.902213096618652, 7.595721244812012, 8.289230346679688, 8.982738494873047, 9.676246643066406, 10.369754791259766, 11.063262939453125, 11.7567720413208, 12.45028018951416, 13.14378833770752, 13.837297439575195, 14.530805587768555, 15.224313735961914, 15.917821884155273, 16.611330032348633, 17.304838180541992, 17.998348236083984, 18.691856384277344, 19.385364532470703, 20.078872680664062, 20.772380828857422]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 4.0, 10.0, 9.0, 15.0, 12.0, 16.0, 15.0, 20.0, 33.0, 29.0, 38.0, 33.0, 37.0, 32.0, 47.0, 48.0, 44.0, 42.0, 49.0, 47.0, 46.0, 43.0, 44.0, 26.0, 31.0, 28.0, 40.0, 27.0, 29.0, 15.0, 15.0, 15.0, 17.0, 5.0, 8.0, 4.0, 5.0, 8.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923828125, -2.823486328125, -2.72314453125, -2.622802734375, -2.5224609375, -2.422119140625, -2.32177734375, -2.221435546875, -2.12109375, -2.020751953125, -1.92041015625, -1.820068359375, -1.7197265625, -1.619384765625, -1.51904296875, -1.418701171875, -1.318359375, -1.218017578125, -1.11767578125, -1.017333984375, -0.9169921875, -0.816650390625, -0.71630859375, -0.615966796875, -0.515625, -0.415283203125, -0.31494140625, -0.214599609375, -0.1142578125, -0.013916015625, 0.08642578125, 0.186767578125, 0.287109375, 0.387451171875, 0.48779296875, 0.588134765625, 0.6884765625, 0.788818359375, 0.88916015625, 0.989501953125, 1.08984375, 1.190185546875, 1.29052734375, 1.390869140625, 1.4912109375, 1.591552734375, 1.69189453125, 1.792236328125, 1.892578125, 1.992919921875, 2.09326171875, 2.193603515625, 2.2939453125, 2.394287109375, 2.49462890625, 2.594970703125, 2.6953125, 2.795654296875, 2.89599609375, 2.996337890625, 3.0966796875, 3.197021484375, 3.29736328125, 3.397705078125, 3.498046875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 7.0, 4.0, 4.0, 9.0, 8.0, 18.0, 23.0, 32.0, 65.0, 90.0, 142.0, 199.0, 327.0, 457.0, 824.0, 1262.0, 2028.0, 3145.0, 4825.0, 7979.0, 12162.0, 19261.0, 30004.0, 47052.0, 73129.0, 109007.0, 150527.0, 167385.0, 140350.0, 98881.0, 65295.0, 41286.0, 26410.0, 16805.0, 10662.0, 6768.0, 4377.0, 2746.0, 1812.0, 1166.0, 745.0, 435.0, 296.0, 199.0, 130.0, 77.0, 50.0, 41.0, 17.0, 23.0, 7.0, 4.0, 8.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.2391357421875, -0.23196792602539062, -0.22480010986328125, -0.21763229370117188, -0.2104644775390625, -0.20329666137695312, -0.19612884521484375, -0.18896102905273438, -0.181793212890625, -0.17462539672851562, -0.16745758056640625, -0.16028976440429688, -0.1531219482421875, -0.14595413208007812, -0.13878631591796875, -0.13161849975585938, -0.12445068359375, -0.11728286743164062, -0.11011505126953125, -0.10294723510742188, -0.0957794189453125, -0.08861160278320312, -0.08144378662109375, -0.07427597045898438, -0.067108154296875, -0.059940338134765625, -0.05277252197265625, -0.045604705810546875, -0.0384368896484375, -0.031269073486328125, -0.02410125732421875, -0.016933441162109375, -0.009765625, -0.002597808837890625, 0.00457000732421875, 0.011737823486328125, 0.0189056396484375, 0.026073455810546875, 0.03324127197265625, 0.040409088134765625, 0.047576904296875, 0.054744720458984375, 0.06191253662109375, 0.06908035278320312, 0.0762481689453125, 0.08341598510742188, 0.09058380126953125, 0.09775161743164062, 0.10491943359375, 0.11208724975585938, 0.11925506591796875, 0.12642288208007812, 0.1335906982421875, 0.14075851440429688, 0.14792633056640625, 0.15509414672851562, 0.162261962890625, 0.16942977905273438, 0.17659759521484375, 0.18376541137695312, 0.1909332275390625, 0.19810104370117188, 0.20526885986328125, 0.21243667602539062, 0.2196044921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 7.0, 4.0, 8.0, 10.0, 15.0, 21.0, 14.0, 25.0, 34.0, 34.0, 43.0, 28.0, 33.0, 46.0, 45.0, 45.0, 41.0, 1066.0, 55.0, 59.0, 54.0, 37.0, 48.0, 33.0, 38.0, 33.0, 23.0, 21.0, 26.0, 15.0, 17.0, 9.0, 10.0, 6.0, 6.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.240234375, -2.1591796875, -2.078125, -1.9970703125, -1.916015625, -1.8349609375, -1.75390625, -1.6728515625, -1.591796875, -1.5107421875, -1.4296875, -1.3486328125, -1.267578125, -1.1865234375, -1.10546875, -1.0244140625, -0.943359375, -0.8623046875, -0.78125, -0.7001953125, -0.619140625, -0.5380859375, -0.45703125, -0.3759765625, -0.294921875, -0.2138671875, -0.1328125, -0.0517578125, 0.029296875, 0.1103515625, 0.19140625, 0.2724609375, 0.353515625, 0.4345703125, 0.515625, 0.5966796875, 0.677734375, 0.7587890625, 0.83984375, 0.9208984375, 1.001953125, 1.0830078125, 1.1640625, 1.2451171875, 1.326171875, 1.4072265625, 1.48828125, 1.5693359375, 1.650390625, 1.7314453125, 1.8125, 1.8935546875, 1.974609375, 2.0556640625, 2.13671875, 2.2177734375, 2.298828125, 2.3798828125, 2.4609375, 2.5419921875, 2.623046875, 2.7041015625, 2.78515625, 2.8662109375, 2.947265625]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 6.0, 10.0, 6.0, 20.0, 29.0, 38.0, 68.0, 112.0, 155.0, 216.0, 385.0, 598.0, 905.0, 1418.0, 2143.0, 3312.0, 5052.0, 7930.0, 12291.0, 19802.0, 31036.0, 47993.0, 73392.0, 107013.0, 145071.0, 1207204.0, 138517.0, 100807.0, 68145.0, 45048.0, 28506.0, 18196.0, 11408.0, 7181.0, 4655.0, 3020.0, 1938.0, 1225.0, 838.0, 520.0, 330.0, 209.0, 139.0, 88.0, 50.0, 38.0, 23.0, 25.0, 15.0, 5.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.126220703125, -0.12177848815917969, -0.11733627319335938, -0.11289405822753906, -0.10845184326171875, -0.10400962829589844, -0.09956741333007812, -0.09512519836425781, -0.0906829833984375, -0.08624076843261719, -0.08179855346679688, -0.07735633850097656, -0.07291412353515625, -0.06847190856933594, -0.06402969360351562, -0.05958747863769531, -0.055145263671875, -0.05070304870605469, -0.046260833740234375, -0.04181861877441406, -0.03737640380859375, -0.03293418884277344, -0.028491973876953125, -0.024049758911132812, -0.0196075439453125, -0.015165328979492188, -0.010723114013671875, -0.0062808990478515625, -0.00183868408203125, 0.0026035308837890625, 0.007045745849609375, 0.011487960815429688, 0.01593017578125, 0.020372390747070312, 0.024814605712890625, 0.029256820678710938, 0.03369903564453125, 0.03814125061035156, 0.042583465576171875, 0.04702568054199219, 0.0514678955078125, 0.05591011047363281, 0.060352325439453125, 0.06479454040527344, 0.06923675537109375, 0.07367897033691406, 0.07812118530273438, 0.08256340026855469, 0.087005615234375, 0.09144783020019531, 0.09589004516601562, 0.10033226013183594, 0.10477447509765625, 0.10921669006347656, 0.11365890502929688, 0.11810111999511719, 0.1225433349609375, 0.1269855499267578, 0.13142776489257812, 0.13586997985839844, 0.14031219482421875, 0.14475440979003906, 0.14919662475585938, 0.1536388397216797, 0.1580810546875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 4.0, 3.0, 1.0, 4.0, 8.0, 4.0, 6.0, 8.0, 14.0, 14.0, 18.0, 25.0, 38.0, 41.0, 58.0, 62.0, 115.0, 169.0, 85.0, 83.0, 56.0, 41.0, 25.0, 27.0, 22.0, 16.0, 15.0, 6.0, 5.0, 4.0, 4.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00760650634765625, -0.007347226142883301, -0.0070879459381103516, -0.006828665733337402, -0.006569385528564453, -0.006310105323791504, -0.006050825119018555, -0.0057915449142456055, -0.005532264709472656, -0.005272984504699707, -0.005013704299926758, -0.004754424095153809, -0.004495143890380859, -0.00423586368560791, -0.003976583480834961, -0.0037173032760620117, -0.0034580230712890625, -0.0031987428665161133, -0.002939462661743164, -0.002680182456970215, -0.0024209022521972656, -0.0021616220474243164, -0.0019023418426513672, -0.001643061637878418, -0.0013837814331054688, -0.0011245012283325195, -0.0008652210235595703, -0.0006059408187866211, -0.0003466606140136719, -8.738040924072266e-05, 0.00017189979553222656, 0.0004311800003051758, 0.000690460205078125, 0.0009497404098510742, 0.0012090206146240234, 0.0014683008193969727, 0.0017275810241699219, 0.001986861228942871, 0.0022461414337158203, 0.0025054216384887695, 0.0027647018432617188, 0.003023982048034668, 0.003283262252807617, 0.0035425424575805664, 0.0038018226623535156, 0.004061102867126465, 0.004320383071899414, 0.004579663276672363, 0.0048389434814453125, 0.005098223686218262, 0.005357503890991211, 0.00561678409576416, 0.005876064300537109, 0.006135344505310059, 0.006394624710083008, 0.006653904914855957, 0.006913185119628906, 0.0071724653244018555, 0.007431745529174805, 0.007691025733947754, 0.007950305938720703, 0.008209586143493652, 0.008468866348266602, 0.00872814655303955, 0.0089874267578125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 6.0, 3.0, 2.0, 6.0, 12.0, 4.0, 13.0, 14.0, 16.0, 35.0, 44.0, 56.0, 83.0, 109.0, 211.0, 372.0, 1223.0, 107588.0, 934934.0, 2667.0, 467.0, 216.0, 144.0, 92.0, 60.0, 35.0, 27.0, 29.0, 12.0, 12.0, 12.0, 13.0, 6.0, 5.0, 6.0, 4.0, 3.0, 6.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.171142578125, -0.1662731170654297, -0.16140365600585938, -0.15653419494628906, -0.15166473388671875, -0.14679527282714844, -0.14192581176757812, -0.1370563507080078, -0.1321868896484375, -0.1273174285888672, -0.12244796752929688, -0.11757850646972656, -0.11270904541015625, -0.10783958435058594, -0.10297012329101562, -0.09810066223144531, -0.093231201171875, -0.08836174011230469, -0.08349227905273438, -0.07862281799316406, -0.07375335693359375, -0.06888389587402344, -0.06401443481445312, -0.05914497375488281, -0.0542755126953125, -0.04940605163574219, -0.044536590576171875, -0.03966712951660156, -0.03479766845703125, -0.029928207397460938, -0.025058746337890625, -0.020189285278320312, -0.01531982421875, -0.010450363159179688, -0.005580902099609375, -0.0007114410400390625, 0.00415802001953125, 0.009027481079101562, 0.013896942138671875, 0.018766403198242188, 0.0236358642578125, 0.028505325317382812, 0.033374786376953125, 0.03824424743652344, 0.04311370849609375, 0.04798316955566406, 0.052852630615234375, 0.05772209167480469, 0.062591552734375, 0.06746101379394531, 0.07233047485351562, 0.07719993591308594, 0.08206939697265625, 0.08693885803222656, 0.09180831909179688, 0.09667778015136719, 0.1015472412109375, 0.10641670227050781, 0.11128616333007812, 0.11615562438964844, 0.12102508544921875, 0.12589454650878906, 0.13076400756835938, 0.1356334686279297, 0.1405029296875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 7.0, 40.0, 483.0, 436.0, 34.0, 14.0, 1.0, 1.0], "bins": [-0.16378076374530792, -0.16100431978702545, -0.15822787582874298, -0.1554514318704605, -0.15267498791217804, -0.14989854395389557, -0.1471220999956131, -0.14434565603733063, -0.14156921207904816, -0.13879276812076569, -0.13601632416248322, -0.13323988020420074, -0.13046343624591827, -0.1276869922876358, -0.12491054832935333, -0.12213409692049026, -0.1193576455116272, -0.11658120155334473, -0.11380475759506226, -0.11102831363677979, -0.10825186967849731, -0.10547542572021484, -0.10269898176193237, -0.0999225303530693, -0.09714609384536743, -0.09436964988708496, -0.09159320592880249, -0.08881676197052002, -0.08604031801223755, -0.08326387405395508, -0.08048743009567261, -0.07771097868680954, -0.07493452727794647, -0.072158083319664, -0.06938163936138153, -0.06660519540309906, -0.06382875144481659, -0.06105230376124382, -0.05827585980296135, -0.05549941211938858, -0.05272297188639641, -0.04994652792811394, -0.04717008396983147, -0.0443936362862587, -0.04161719232797623, -0.038840748369693756, -0.036064304411411285, -0.033287860453128815, -0.030511414632201195, -0.027734970673918724, -0.024958524852991104, -0.022182080894708633, -0.019405636936426163, -0.016629191115498543, -0.013852747157216072, -0.011076301336288452, -0.008299857378005981, -0.005523412488400936, -0.002746968064457178, 2.9476359486579895e-05, 0.002805921249091625, 0.0055823661386966705, 0.008358810096979141, 0.011135255917906761, 0.013911699876189232]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 8.0, 4.0, 8.0, 10.0, 13.0, 13.0, 22.0, 29.0, 27.0, 31.0, 31.0, 33.0, 37.0, 43.0, 50.0, 61.0, 52.0, 50.0, 50.0, 50.0, 45.0, 46.0, 47.0, 33.0, 36.0, 42.0, 19.0, 17.0, 16.0, 19.0, 10.0, 13.0, 12.0, 9.0, 8.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.013729453086853027, -0.013248506933450699, -0.01276756078004837, -0.012286614626646042, -0.011805668473243713, -0.011324722319841385, -0.010843776166439056, -0.010362830013036728, -0.0098818838596344, -0.009400937706232071, -0.008919991552829742, -0.008439045399427414, -0.007958099246025085, -0.007477153092622757, -0.0069962069392204285, -0.0065152607858181, -0.0060343146324157715, -0.005553368479013443, -0.0050724223256111145, -0.004591476172208786, -0.0041105300188064575, -0.003629583865404129, -0.0031486377120018005, -0.002667691558599472, -0.0021867454051971436, -0.001705799251794815, -0.0012248530983924866, -0.0007439069449901581, -0.0002629607915878296, 0.0002179853618144989, 0.0006989315152168274, 0.0011798776686191559, 0.0016608238220214844, 0.002141769975423813, 0.0026227161288261414, 0.00310366228222847, 0.0035846084356307983, 0.004065554589033127, 0.004546500742435455, 0.005027446895837784, 0.005508393049240112, 0.005989339202642441, 0.006470285356044769, 0.006951231509447098, 0.007432177662849426, 0.007913123816251755, 0.008394069969654083, 0.008875016123056412, 0.00935596227645874, 0.009836908429861069, 0.010317854583263397, 0.010798800736665726, 0.011279746890068054, 0.011760693043470383, 0.012241639196872711, 0.01272258535027504, 0.013203531503677368, 0.013684477657079697, 0.014165423810482025, 0.014646369963884354, 0.015127316117286682, 0.01560826227068901, 0.01608920842409134, 0.016570154577493668, 0.017051100730895996]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 3.0, 4.0, 10.0, 10.0, 14.0, 12.0, 16.0, 15.0, 20.0, 33.0, 29.0, 38.0, 33.0, 37.0, 31.0, 48.0, 48.0, 46.0, 40.0, 49.0, 47.0, 46.0, 43.0, 44.0, 26.0, 31.0, 29.0, 38.0, 28.0, 29.0, 15.0, 16.0, 12.0, 19.0, 5.0, 8.0, 4.0, 5.0, 8.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.923828125, -2.823486328125, -2.72314453125, -2.622802734375, -2.5224609375, -2.422119140625, -2.32177734375, -2.221435546875, -2.12109375, -2.020751953125, -1.92041015625, -1.820068359375, -1.7197265625, -1.619384765625, -1.51904296875, -1.418701171875, -1.318359375, -1.218017578125, -1.11767578125, -1.017333984375, -0.9169921875, -0.816650390625, -0.71630859375, -0.615966796875, -0.515625, -0.415283203125, -0.31494140625, -0.214599609375, -0.1142578125, -0.013916015625, 0.08642578125, 0.186767578125, 0.287109375, 0.387451171875, 0.48779296875, 0.588134765625, 0.6884765625, 0.788818359375, 0.88916015625, 0.989501953125, 1.08984375, 1.190185546875, 1.29052734375, 1.390869140625, 1.4912109375, 1.591552734375, 1.69189453125, 1.792236328125, 1.892578125, 1.992919921875, 2.09326171875, 2.193603515625, 2.2939453125, 2.394287109375, 2.49462890625, 2.594970703125, 2.6953125, 2.795654296875, 2.89599609375, 2.996337890625, 3.0966796875, 3.197021484375, 3.29736328125, 3.397705078125, 3.498046875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 0.0, 10.0, 4.0, 14.0, 11.0, 19.0, 17.0, 46.0, 43.0, 61.0, 79.0, 120.0, 178.0, 240.0, 338.0, 515.0, 677.0, 1037.0, 1685.0, 2796.0, 6652.0, 25458.0, 146662.0, 625117.0, 188860.0, 31645.0, 7666.0, 3178.0, 1784.0, 1128.0, 744.0, 536.0, 389.0, 236.0, 167.0, 123.0, 70.0, 73.0, 46.0, 35.0, 36.0, 25.0, 11.0, 9.0, 2.0, 4.0, 3.0, 4.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.94921875, -7.70513916015625, -7.4610595703125, -7.21697998046875, -6.972900390625, -6.72882080078125, -6.4847412109375, -6.24066162109375, -5.99658203125, -5.75250244140625, -5.5084228515625, -5.26434326171875, -5.020263671875, -4.77618408203125, -4.5321044921875, -4.28802490234375, -4.0439453125, -3.79986572265625, -3.5557861328125, -3.31170654296875, -3.067626953125, -2.82354736328125, -2.5794677734375, -2.33538818359375, -2.09130859375, -1.84722900390625, -1.6031494140625, -1.35906982421875, -1.114990234375, -0.87091064453125, -0.6268310546875, -0.38275146484375, -0.138671875, 0.10540771484375, 0.3494873046875, 0.59356689453125, 0.837646484375, 1.08172607421875, 1.3258056640625, 1.56988525390625, 1.81396484375, 2.05804443359375, 2.3021240234375, 2.54620361328125, 2.790283203125, 3.03436279296875, 3.2784423828125, 3.52252197265625, 3.7666015625, 4.01068115234375, 4.2547607421875, 4.49884033203125, 4.742919921875, 4.98699951171875, 5.2310791015625, 5.47515869140625, 5.71923828125, 5.96331787109375, 6.2073974609375, 6.45147705078125, 6.695556640625, 6.93963623046875, 7.1837158203125, 7.42779541015625, 7.671875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 2.0, 8.0, 10.0, 12.0, 14.0, 19.0, 22.0, 17.0, 30.0, 31.0, 35.0, 45.0, 65.0, 98.0, 159.0, 353.0, 1452.0, 196.0, 105.0, 65.0, 50.0, 42.0, 34.0, 42.0, 18.0, 20.0, 19.0, 19.0, 9.0, 5.0, 10.0, 8.0, 7.0, 5.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-9.7734375, -9.4786376953125, -9.183837890625, -8.8890380859375, -8.59423828125, -8.2994384765625, -8.004638671875, -7.7098388671875, -7.4150390625, -7.1202392578125, -6.825439453125, -6.5306396484375, -6.23583984375, -5.9410400390625, -5.646240234375, -5.3514404296875, -5.056640625, -4.7618408203125, -4.467041015625, -4.1722412109375, -3.87744140625, -3.5826416015625, -3.287841796875, -2.9930419921875, -2.6982421875, -2.4034423828125, -2.108642578125, -1.8138427734375, -1.51904296875, -1.2242431640625, -0.929443359375, -0.6346435546875, -0.33984375, -0.0450439453125, 0.249755859375, 0.5445556640625, 0.83935546875, 1.1341552734375, 1.428955078125, 1.7237548828125, 2.0185546875, 2.3133544921875, 2.608154296875, 2.9029541015625, 3.19775390625, 3.4925537109375, 3.787353515625, 4.0821533203125, 4.376953125, 4.6717529296875, 4.966552734375, 5.2613525390625, 5.55615234375, 5.8509521484375, 6.145751953125, 6.4405517578125, 6.7353515625, 7.0301513671875, 7.324951171875, 7.6197509765625, 7.91455078125, 8.2093505859375, 8.504150390625, 8.7989501953125, 9.09375]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 4.0, 4.0, 9.0, 8.0, 9.0, 9.0, 14.0, 16.0, 15.0, 29.0, 33.0, 26.0, 36.0, 48.0, 77.0, 128.0, 164.0, 266.0, 479.0, 782.0, 1653.0, 6930.0, 3006193.0, 123077.0, 2882.0, 1075.0, 577.0, 353.0, 246.0, 134.0, 97.0, 79.0, 53.0, 37.0, 33.0, 34.0, 27.0, 20.0, 15.0, 9.0, 7.0, 6.0, 8.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-22.265625, -21.5419921875, -20.818359375, -20.0947265625, -19.37109375, -18.6474609375, -17.923828125, -17.2001953125, -16.4765625, -15.7529296875, -15.029296875, -14.3056640625, -13.58203125, -12.8583984375, -12.134765625, -11.4111328125, -10.6875, -9.9638671875, -9.240234375, -8.5166015625, -7.79296875, -7.0693359375, -6.345703125, -5.6220703125, -4.8984375, -4.1748046875, -3.451171875, -2.7275390625, -2.00390625, -1.2802734375, -0.556640625, 0.1669921875, 0.890625, 1.6142578125, 2.337890625, 3.0615234375, 3.78515625, 4.5087890625, 5.232421875, 5.9560546875, 6.6796875, 7.4033203125, 8.126953125, 8.8505859375, 9.57421875, 10.2978515625, 11.021484375, 11.7451171875, 12.46875, 13.1923828125, 13.916015625, 14.6396484375, 15.36328125, 16.0869140625, 16.810546875, 17.5341796875, 18.2578125, 18.9814453125, 19.705078125, 20.4287109375, 21.15234375, 21.8759765625, 22.599609375, 23.3232421875, 24.046875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 7.0, 13.0, 71.0, 270.0, 375.0, 201.0, 57.0, 14.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.8744010925293, -40.76940155029297, -38.66440200805664, -36.55940246582031, -34.45440673828125, -32.34940719604492, -30.244407653808594, -28.139408111572266, -26.03441047668457, -23.929410934448242, -21.824413299560547, -19.71941375732422, -17.61441421508789, -15.509416580200195, -13.404417037963867, -11.299418449401855, -9.194419860839844, -7.089421272277832, -4.984422206878662, -2.879423141479492, -0.7744245529174805, 1.3305740356445312, 3.4355735778808594, 5.540572166442871, 7.645570755004883, 9.750569343566895, 11.855567932128906, 13.960567474365234, 16.065567016601562, 18.170564651489258, 20.275564193725586, 22.38056182861328, 24.485565185546875, 26.590564727783203, 28.6955623626709, 30.800561904907227, 32.90555953979492, 35.01055908203125, 37.11555862426758, 39.220558166503906, 41.32555389404297, 43.4305534362793, 45.535552978515625, 47.64054870605469, 49.745548248291016, 51.850547790527344, 53.95554733276367, 56.060546875, 58.16554641723633, 60.270545959472656, 62.375545501708984, 64.48054504394531, 66.58554077148438, 68.69053649902344, 70.79553985595703, 72.9005355834961, 75.00553894042969, 77.11053466796875, 79.21553802490234, 81.3205337524414, 83.425537109375, 85.53053283691406, 87.63552856445312, 89.74053192138672, 91.84552764892578]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 8.0, 6.0, 7.0, 6.0, 18.0, 18.0, 21.0, 16.0, 24.0, 25.0, 36.0, 33.0, 34.0, 35.0, 39.0, 40.0, 46.0, 44.0, 57.0, 58.0, 50.0, 56.0, 45.0, 38.0, 29.0, 37.0, 23.0, 20.0, 27.0, 20.0, 15.0, 16.0, 17.0, 13.0, 4.0, 7.0, 3.0, 7.0, 2.0, 4.0, 0.0, 4.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.353858947753906, -20.564123153686523, -19.774389266967773, -18.98465347290039, -18.19491958618164, -17.405183792114258, -16.615447998046875, -15.825714111328125, -15.035979270935059, -14.246244430541992, -13.456509590148926, -12.66677474975586, -11.877038955688477, -11.087305068969727, -10.297569274902344, -9.507834434509277, -8.718099594116211, -7.9283647537231445, -7.138629913330078, -6.3488945960998535, -5.559159755706787, -4.769424915313721, -3.979689598083496, -3.1899547576904297, -2.4002199172973633, -1.6104849576950073, -0.8207499980926514, -0.03101491928100586, 0.7587199211120605, 1.548454761505127, 2.3381900787353516, 3.127924919128418, 3.9176597595214844, 4.707394599914551, 5.497129440307617, 6.286864757537842, 7.076599597930908, 7.866334438323975, 8.6560697555542, 9.445804595947266, 10.235539436340332, 11.025274276733398, 11.815009117126465, 12.604743957519531, 13.394479751586914, 14.184213638305664, 14.973949432373047, 15.763684272766113, 16.55341911315918, 17.343154907226562, 18.132888793945312, 18.922624588012695, 19.712358474731445, 20.502094268798828, 21.291828155517578, 22.08156394958496, 22.871299743652344, 23.661035537719727, 24.450769424438477, 25.24050521850586, 26.03023910522461, 26.819974899291992, 27.609710693359375, 28.399444580078125, 29.189178466796875]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 1.0, 6.0, 5.0, 2.0, 8.0, 5.0, 6.0, 13.0, 17.0, 15.0, 18.0, 37.0, 35.0, 29.0, 35.0, 29.0, 32.0, 33.0, 55.0, 48.0, 44.0, 54.0, 43.0, 39.0, 39.0, 41.0, 39.0, 29.0, 33.0, 27.0, 27.0, 26.0, 16.0, 19.0, 17.0, 17.0, 16.0, 16.0, 4.0, 10.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0234375, -2.918548583984375, -2.81365966796875, -2.708770751953125, -2.6038818359375, -2.498992919921875, -2.39410400390625, -2.289215087890625, -2.184326171875, -2.079437255859375, -1.97454833984375, -1.869659423828125, -1.7647705078125, -1.659881591796875, -1.55499267578125, -1.450103759765625, -1.34521484375, -1.240325927734375, -1.13543701171875, -1.030548095703125, -0.9256591796875, -0.820770263671875, -0.71588134765625, -0.610992431640625, -0.506103515625, -0.401214599609375, -0.29632568359375, -0.191436767578125, -0.0865478515625, 0.018341064453125, 0.12322998046875, 0.228118896484375, 0.3330078125, 0.437896728515625, 0.54278564453125, 0.647674560546875, 0.7525634765625, 0.857452392578125, 0.96234130859375, 1.067230224609375, 1.172119140625, 1.277008056640625, 1.38189697265625, 1.486785888671875, 1.5916748046875, 1.696563720703125, 1.80145263671875, 1.906341552734375, 2.01123046875, 2.116119384765625, 2.22100830078125, 2.325897216796875, 2.4307861328125, 2.535675048828125, 2.64056396484375, 2.745452880859375, 2.850341796875, 2.955230712890625, 3.06011962890625, 3.165008544921875, 3.2698974609375, 3.374786376953125, 3.47967529296875, 3.584564208984375, 3.689453125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 7.0, 11.0, 11.0, 24.0, 36.0, 55.0, 76.0, 123.0, 174.0, 253.0, 374.0, 567.0, 843.0, 1394.0, 2205.0, 3739.0, 7339.0, 15869.0, 46304.0, 211882.0, 935986.0, 1926891.0, 801629.0, 169364.0, 38793.0, 14037.0, 6860.0, 3697.0, 2005.0, 1348.0, 849.0, 500.0, 314.0, 218.0, 170.0, 101.0, 74.0, 48.0, 32.0, 28.0, 15.0, 12.0, 8.0, 8.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.833984375, -3.694244384765625, -3.55450439453125, -3.414764404296875, -3.2750244140625, -3.135284423828125, -2.99554443359375, -2.855804443359375, -2.716064453125, -2.576324462890625, -2.43658447265625, -2.296844482421875, -2.1571044921875, -2.017364501953125, -1.87762451171875, -1.737884521484375, -1.59814453125, -1.458404541015625, -1.31866455078125, -1.178924560546875, -1.0391845703125, -0.899444580078125, -0.75970458984375, -0.619964599609375, -0.480224609375, -0.340484619140625, -0.20074462890625, -0.061004638671875, 0.0787353515625, 0.218475341796875, 0.35821533203125, 0.497955322265625, 0.6376953125, 0.777435302734375, 0.91717529296875, 1.056915283203125, 1.1966552734375, 1.336395263671875, 1.47613525390625, 1.615875244140625, 1.755615234375, 1.895355224609375, 2.03509521484375, 2.174835205078125, 2.3145751953125, 2.454315185546875, 2.59405517578125, 2.733795166015625, 2.87353515625, 3.013275146484375, 3.15301513671875, 3.292755126953125, 3.4324951171875, 3.572235107421875, 3.71197509765625, 3.851715087890625, 3.991455078125, 4.131195068359375, 4.27093505859375, 4.410675048828125, 4.5504150390625, 4.690155029296875, 4.82989501953125, 4.969635009765625, 5.109375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 5.0, 3.0, 7.0, 7.0, 12.0, 22.0, 22.0, 39.0, 60.0, 91.0, 139.0, 188.0, 303.0, 343.0, 464.0, 571.0, 494.0, 387.0, 262.0, 193.0, 140.0, 86.0, 75.0, 49.0, 38.0, 25.0, 20.0, 9.0, 8.0, 5.0, 6.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.5625, -5.38604736328125, -5.2095947265625, -5.03314208984375, -4.856689453125, -4.68023681640625, -4.5037841796875, -4.32733154296875, -4.15087890625, -3.97442626953125, -3.7979736328125, -3.62152099609375, -3.445068359375, -3.26861572265625, -3.0921630859375, -2.91571044921875, -2.7392578125, -2.56280517578125, -2.3863525390625, -2.20989990234375, -2.033447265625, -1.85699462890625, -1.6805419921875, -1.50408935546875, -1.32763671875, -1.15118408203125, -0.9747314453125, -0.79827880859375, -0.621826171875, -0.44537353515625, -0.2689208984375, -0.09246826171875, 0.083984375, 0.26043701171875, 0.4368896484375, 0.61334228515625, 0.789794921875, 0.96624755859375, 1.1427001953125, 1.31915283203125, 1.49560546875, 1.67205810546875, 1.8485107421875, 2.02496337890625, 2.201416015625, 2.37786865234375, 2.5543212890625, 2.73077392578125, 2.9072265625, 3.08367919921875, 3.2601318359375, 3.43658447265625, 3.613037109375, 3.78948974609375, 3.9659423828125, 4.14239501953125, 4.31884765625, 4.49530029296875, 4.6717529296875, 4.84820556640625, 5.024658203125, 5.20111083984375, 5.3775634765625, 5.55401611328125, 5.73046875]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 7.0, 3.0, 9.0, 7.0, 13.0, 13.0, 28.0, 34.0, 61.0, 67.0, 132.0, 201.0, 364.0, 691.0, 1446.0, 5129.0, 61351.0, 2773793.0, 1315539.0, 29283.0, 3589.0, 1272.0, 579.0, 276.0, 155.0, 85.0, 60.0, 30.0, 24.0, 13.0, 12.0, 10.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.328125, -9.9825439453125, -9.636962890625, -9.2913818359375, -8.94580078125, -8.6002197265625, -8.254638671875, -7.9090576171875, -7.5634765625, -7.2178955078125, -6.872314453125, -6.5267333984375, -6.18115234375, -5.8355712890625, -5.489990234375, -5.1444091796875, -4.798828125, -4.4532470703125, -4.107666015625, -3.7620849609375, -3.41650390625, -3.0709228515625, -2.725341796875, -2.3797607421875, -2.0341796875, -1.6885986328125, -1.343017578125, -0.9974365234375, -0.65185546875, -0.3062744140625, 0.039306640625, 0.3848876953125, 0.73046875, 1.0760498046875, 1.421630859375, 1.7672119140625, 2.11279296875, 2.4583740234375, 2.803955078125, 3.1495361328125, 3.4951171875, 3.8406982421875, 4.186279296875, 4.5318603515625, 4.87744140625, 5.2230224609375, 5.568603515625, 5.9141845703125, 6.259765625, 6.6053466796875, 6.950927734375, 7.2965087890625, 7.64208984375, 7.9876708984375, 8.333251953125, 8.6788330078125, 9.0244140625, 9.3699951171875, 9.715576171875, 10.0611572265625, 10.40673828125, 10.7523193359375, 11.097900390625, 11.4434814453125, 11.7890625]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 12.0, 383.0, 574.0, 44.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-237.49899291992188, -232.7583465576172, -228.01771545410156, -223.27706909179688, -218.5364227294922, -213.79579162597656, -209.05514526367188, -204.31451416015625, -199.57386779785156, -194.83322143554688, -190.09259033203125, -185.35194396972656, -180.61129760742188, -175.87066650390625, -171.13002014160156, -166.38937377929688, -161.64874267578125, -156.90809631347656, -152.16746520996094, -147.42681884765625, -142.68617248535156, -137.94554138183594, -133.20489501953125, -128.46426391601562, -123.72360229492188, -118.98296356201172, -114.24231719970703, -109.50167846679688, -104.76103973388672, -100.02040100097656, -95.27975463867188, -90.53911590576172, -85.79847717285156, -81.0578384399414, -76.31719207763672, -71.57655334472656, -66.8359146118164, -62.095272064208984, -57.35462951660156, -52.613990783691406, -47.873348236083984, -43.13270568847656, -38.392066955566406, -33.651424407958984, -28.910783767700195, -24.170143127441406, -19.429500579833984, -14.688861846923828, -9.948219299316406, -5.207578182220459, -0.4669370651245117, 4.273704528808594, 9.014345169067383, 13.754985809326172, 18.495628356933594, 23.23626708984375, 27.976909637451172, 32.717552185058594, 37.45819091796875, 42.19883346557617, 46.939476013183594, 51.68011474609375, 56.42075729370117, 61.16139602661133, 65.90203857421875]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 4.0, 13.0, 6.0, 7.0, 8.0, 10.0, 10.0, 19.0, 16.0, 30.0, 21.0, 25.0, 42.0, 30.0, 34.0, 42.0, 46.0, 35.0, 37.0, 47.0, 36.0, 44.0, 50.0, 42.0, 38.0, 41.0, 38.0, 37.0, 28.0, 24.0, 26.0, 24.0, 18.0, 16.0, 13.0, 8.0, 12.0, 9.0, 5.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.504249572753906, -15.882972717285156, -15.261695861816406, -14.640419006347656, -14.01914119720459, -13.39786434173584, -12.77658748626709, -12.155309677124023, -11.534032821655273, -10.912755966186523, -10.291479110717773, -9.670202255249023, -9.048924446105957, -8.427647590637207, -7.806370735168457, -7.185093402862549, -6.563817024230957, -5.942540168762207, -5.321262836456299, -4.699985980987549, -4.078708648681641, -3.4574317932128906, -2.8361549377441406, -2.2148776054382324, -1.5936007499694824, -0.9723237156867981, -0.35104668140411377, 0.2702302932739258, 0.8915073871612549, 1.512784481048584, 2.134061336517334, 2.755338668823242, 3.376615524291992, 3.9978926181793213, 4.61916971206665, 5.2404465675354, 5.861723899841309, 6.483000755310059, 7.104277610778809, 7.725554943084717, 8.346832275390625, 8.968109130859375, 9.589385986328125, 10.210662841796875, 10.831940650939941, 11.453217506408691, 12.074494361877441, 12.695772171020508, 13.317048072814941, 13.938324928283691, 14.559601783752441, 15.180879592895508, 15.802156448364258, 16.423433303833008, 17.044710159301758, 17.665987014770508, 18.287263870239258, 18.908540725708008, 19.529817581176758, 20.151094436645508, 20.772371292114258, 21.39365005493164, 22.01492691040039, 22.63620376586914, 23.25748062133789]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 9.0, 3.0, 9.0, 4.0, 10.0, 12.0, 11.0, 12.0, 25.0, 24.0, 28.0, 39.0, 40.0, 35.0, 48.0, 36.0, 31.0, 52.0, 42.0, 41.0, 56.0, 45.0, 44.0, 41.0, 43.0, 31.0, 29.0, 24.0, 29.0, 32.0, 19.0, 19.0, 5.0, 14.0, 12.0, 8.0, 15.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.595703125, -2.510894775390625, -2.42608642578125, -2.341278076171875, -2.2564697265625, -2.171661376953125, -2.08685302734375, -2.002044677734375, -1.917236328125, -1.832427978515625, -1.74761962890625, -1.662811279296875, -1.5780029296875, -1.493194580078125, -1.40838623046875, -1.323577880859375, -1.23876953125, -1.153961181640625, -1.06915283203125, -0.984344482421875, -0.8995361328125, -0.814727783203125, -0.72991943359375, -0.645111083984375, -0.560302734375, -0.475494384765625, -0.39068603515625, -0.305877685546875, -0.2210693359375, -0.136260986328125, -0.05145263671875, 0.033355712890625, 0.1181640625, 0.202972412109375, 0.28778076171875, 0.372589111328125, 0.4573974609375, 0.542205810546875, 0.62701416015625, 0.711822509765625, 0.796630859375, 0.881439208984375, 0.96624755859375, 1.051055908203125, 1.1358642578125, 1.220672607421875, 1.30548095703125, 1.390289306640625, 1.47509765625, 1.559906005859375, 1.64471435546875, 1.729522705078125, 1.8143310546875, 1.899139404296875, 1.98394775390625, 2.068756103515625, 2.153564453125, 2.238372802734375, 2.32318115234375, 2.407989501953125, 2.4927978515625, 2.577606201171875, 2.66241455078125, 2.747222900390625, 2.83203125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 12.0, 10.0, 18.0, 25.0, 38.0, 61.0, 94.0, 158.0, 254.0, 432.0, 678.0, 1187.0, 1937.0, 3252.0, 5374.0, 9195.0, 15610.0, 26676.0, 46676.0, 79331.0, 130850.0, 186997.0, 192316.0, 139413.0, 86441.0, 50563.0, 29466.0, 17100.0, 9873.0, 5918.0, 3426.0, 2026.0, 1239.0, 744.0, 484.0, 280.0, 150.0, 89.0, 58.0, 43.0, 22.0, 17.0, 12.0, 9.0, 4.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.236328125, -0.22918319702148438, -0.22203826904296875, -0.21489334106445312, -0.2077484130859375, -0.20060348510742188, -0.19345855712890625, -0.18631362915039062, -0.179168701171875, -0.17202377319335938, -0.16487884521484375, -0.15773391723632812, -0.1505889892578125, -0.14344406127929688, -0.13629913330078125, -0.12915420532226562, -0.12200927734375, -0.11486434936523438, -0.10771942138671875, -0.10057449340820312, -0.0934295654296875, -0.08628463745117188, -0.07913970947265625, -0.07199478149414062, -0.064849853515625, -0.057704925537109375, -0.05055999755859375, -0.043415069580078125, -0.0362701416015625, -0.029125213623046875, -0.02198028564453125, -0.014835357666015625, -0.0076904296875, -0.000545501708984375, 0.00659942626953125, 0.013744354248046875, 0.0208892822265625, 0.028034210205078125, 0.03517913818359375, 0.042324066162109375, 0.049468994140625, 0.056613922119140625, 0.06375885009765625, 0.07090377807617188, 0.0780487060546875, 0.08519363403320312, 0.09233856201171875, 0.09948348999023438, 0.10662841796875, 0.11377334594726562, 0.12091827392578125, 0.12806320190429688, 0.1352081298828125, 0.14235305786132812, 0.14949798583984375, 0.15664291381835938, 0.163787841796875, 0.17093276977539062, 0.17807769775390625, 0.18522262573242188, 0.1923675537109375, 0.19951248168945312, 0.20665740966796875, 0.21380233764648438, 0.220947265625]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 0.0, 7.0, 1.0, 2.0, 12.0, 9.0, 17.0, 12.0, 11.0, 13.0, 13.0, 18.0, 20.0, 29.0, 22.0, 23.0, 28.0, 29.0, 33.0, 30.0, 29.0, 38.0, 33.0, 41.0, 1059.0, 36.0, 43.0, 38.0, 27.0, 32.0, 41.0, 36.0, 36.0, 30.0, 20.0, 20.0, 20.0, 24.0, 16.0, 14.0, 13.0, 10.0, 10.0, 7.0, 11.0, 5.0, 2.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.5107421875, -1.461639404296875, -1.41253662109375, -1.363433837890625, -1.3143310546875, -1.265228271484375, -1.21612548828125, -1.167022705078125, -1.117919921875, -1.068817138671875, -1.01971435546875, -0.970611572265625, -0.9215087890625, -0.872406005859375, -0.82330322265625, -0.774200439453125, -0.72509765625, -0.675994873046875, -0.62689208984375, -0.577789306640625, -0.5286865234375, -0.479583740234375, -0.43048095703125, -0.381378173828125, -0.332275390625, -0.283172607421875, -0.23406982421875, -0.184967041015625, -0.1358642578125, -0.086761474609375, -0.03765869140625, 0.011444091796875, 0.060546875, 0.109649658203125, 0.15875244140625, 0.207855224609375, 0.2569580078125, 0.306060791015625, 0.35516357421875, 0.404266357421875, 0.453369140625, 0.502471923828125, 0.55157470703125, 0.600677490234375, 0.6497802734375, 0.698883056640625, 0.74798583984375, 0.797088623046875, 0.84619140625, 0.895294189453125, 0.94439697265625, 0.993499755859375, 1.0426025390625, 1.091705322265625, 1.14080810546875, 1.189910888671875, 1.239013671875, 1.288116455078125, 1.33721923828125, 1.386322021484375, 1.4354248046875, 1.484527587890625, 1.53363037109375, 1.582733154296875, 1.6318359375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 4.0, 5.0, 5.0, 6.0, 16.0, 19.0, 14.0, 40.0, 44.0, 77.0, 98.0, 161.0, 244.0, 356.0, 576.0, 899.0, 1274.0, 2015.0, 3140.0, 4813.0, 7737.0, 12060.0, 18510.0, 29133.0, 44464.0, 67419.0, 96941.0, 129547.0, 1185977.0, 153433.0, 110547.0, 78284.0, 52735.0, 34466.0, 22190.0, 14441.0, 9060.0, 5808.0, 3790.0, 2347.0, 1570.0, 980.0, 669.0, 407.0, 263.0, 177.0, 129.0, 91.0, 56.0, 38.0, 24.0, 15.0, 9.0, 8.0, 6.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.11260986328125, -0.10894298553466797, -0.10527610778808594, -0.1016092300415039, -0.09794235229492188, -0.09427547454833984, -0.09060859680175781, -0.08694171905517578, -0.08327484130859375, -0.07960796356201172, -0.07594108581542969, -0.07227420806884766, -0.06860733032226562, -0.0649404525756836, -0.06127357482910156, -0.05760669708251953, -0.0539398193359375, -0.05027294158935547, -0.04660606384277344, -0.042939186096191406, -0.039272308349609375, -0.035605430603027344, -0.03193855285644531, -0.02827167510986328, -0.02460479736328125, -0.02093791961669922, -0.017271041870117188, -0.013604164123535156, -0.009937286376953125, -0.006270408630371094, -0.0026035308837890625, 0.0010633468627929688, 0.004730224609375, 0.008397102355957031, 0.012063980102539062, 0.015730857849121094, 0.019397735595703125, 0.023064613342285156, 0.026731491088867188, 0.03039836883544922, 0.03406524658203125, 0.03773212432861328, 0.04139900207519531, 0.045065879821777344, 0.048732757568359375, 0.052399635314941406, 0.05606651306152344, 0.05973339080810547, 0.0634002685546875, 0.06706714630126953, 0.07073402404785156, 0.0744009017944336, 0.07806777954101562, 0.08173465728759766, 0.08540153503417969, 0.08906841278076172, 0.09273529052734375, 0.09640216827392578, 0.10006904602050781, 0.10373592376708984, 0.10740280151367188, 0.1110696792602539, 0.11473655700683594, 0.11840343475341797, 0.1220703125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 3.0, 4.0, 4.0, 5.0, 6.0, 11.0, 5.0, 7.0, 12.0, 15.0, 14.0, 19.0, 15.0, 33.0, 27.0, 39.0, 34.0, 33.0, 67.0, 57.0, 70.0, 68.0, 69.0, 62.0, 37.0, 41.0, 42.0, 28.0, 19.0, 30.0, 14.0, 18.0, 13.0, 12.0, 8.0, 17.0, 11.0, 10.0, 4.0, 8.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0028018951416015625, -0.0027118325233459473, -0.002621769905090332, -0.002531707286834717, -0.0024416446685791016, -0.0023515820503234863, -0.002261519432067871, -0.002171456813812256, -0.0020813941955566406, -0.0019913315773010254, -0.0019012689590454102, -0.001811206340789795, -0.0017211437225341797, -0.0016310811042785645, -0.0015410184860229492, -0.001450955867767334, -0.0013608932495117188, -0.0012708306312561035, -0.0011807680130004883, -0.001090705394744873, -0.0010006427764892578, -0.0009105801582336426, -0.0008205175399780273, -0.0007304549217224121, -0.0006403923034667969, -0.0005503296852111816, -0.0004602670669555664, -0.00037020444869995117, -0.00028014183044433594, -0.0001900792121887207, -0.00010001659393310547, -9.953975677490234e-06, 8.0108642578125e-05, 0.00017017126083374023, 0.00026023387908935547, 0.0003502964973449707, 0.00044035911560058594, 0.0005304217338562012, 0.0006204843521118164, 0.0007105469703674316, 0.0008006095886230469, 0.0008906722068786621, 0.0009807348251342773, 0.0010707974433898926, 0.0011608600616455078, 0.001250922679901123, 0.0013409852981567383, 0.0014310479164123535, 0.0015211105346679688, 0.001611173152923584, 0.0017012357711791992, 0.0017912983894348145, 0.0018813610076904297, 0.001971423625946045, 0.00206148624420166, 0.0021515488624572754, 0.0022416114807128906, 0.002331674098968506, 0.002421736717224121, 0.0025117993354797363, 0.0026018619537353516, 0.002691924571990967, 0.002781987190246582, 0.0028720498085021973, 0.0029621124267578125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 6.0, 5.0, 8.0, 8.0, 9.0, 19.0, 23.0, 28.0, 39.0, 45.0, 38.0, 63.0, 72.0, 85.0, 116.0, 173.0, 229.0, 418.0, 1002.0, 3140.0, 14768.0, 113784.0, 817294.0, 80964.0, 11663.0, 2471.0, 805.0, 378.0, 196.0, 153.0, 102.0, 89.0, 69.0, 49.0, 45.0, 35.0, 31.0, 23.0, 23.0, 13.0, 11.0, 12.0, 11.0, 2.0, 10.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.053619384765625, -0.05191326141357422, -0.05020713806152344, -0.048501014709472656, -0.046794891357421875, -0.045088768005371094, -0.04338264465332031, -0.04167652130126953, -0.03997039794921875, -0.03826427459716797, -0.03655815124511719, -0.034852027893066406, -0.033145904541015625, -0.031439781188964844, -0.029733657836914062, -0.02802753448486328, -0.0263214111328125, -0.02461528778076172, -0.022909164428710938, -0.021203041076660156, -0.019496917724609375, -0.017790794372558594, -0.016084671020507812, -0.014378547668457031, -0.01267242431640625, -0.010966300964355469, -0.009260177612304688, -0.007554054260253906, -0.005847930908203125, -0.004141807556152344, -0.0024356842041015625, -0.0007295608520507812, 0.0009765625, 0.0026826858520507812, 0.0043888092041015625, 0.006094932556152344, 0.007801055908203125, 0.009507179260253906, 0.011213302612304688, 0.012919425964355469, 0.01462554931640625, 0.01633167266845703, 0.018037796020507812, 0.019743919372558594, 0.021450042724609375, 0.023156166076660156, 0.024862289428710938, 0.02656841278076172, 0.0282745361328125, 0.02998065948486328, 0.03168678283691406, 0.033392906188964844, 0.035099029541015625, 0.036805152893066406, 0.03851127624511719, 0.04021739959716797, 0.04192352294921875, 0.04362964630126953, 0.04533576965332031, 0.047041893005371094, 0.048748016357421875, 0.050454139709472656, 0.05216026306152344, 0.05386638641357422, 0.055572509765625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [6.0, 38.0, 463.0, 450.0, 45.0, 15.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0118210194632411, -0.007860962301492691, -0.003900904208421707, 5.915295332670212e-05, 0.004019211046397686, 0.00797926913946867, 0.011939325369894505, 0.015899382531642914, 0.019859440624713898, 0.02381949871778488, 0.027779556810855865, 0.03173961490392685, 0.03569967299699783, 0.03965973109006882, 0.0436197854578495, 0.047579843550920486, 0.05153990164399147, 0.055499959737062454, 0.05946001783013344, 0.06342007219791412, 0.06738013029098511, 0.07134018838405609, 0.07530024647712708, 0.07926030457019806, 0.08322036266326904, 0.08718042075634003, 0.09114047884941101, 0.095100536942482, 0.09906059503555298, 0.10302065312862396, 0.10698071122169495, 0.11094076931476593, 0.11490082740783691, 0.1188608855009079, 0.12282094359397888, 0.12678100168704987, 0.13074105978012085, 0.13470111787319183, 0.13866117596626282, 0.1426212340593338, 0.14658129215240479, 0.15054135024547577, 0.15450140833854675, 0.15846146643161774, 0.16242152452468872, 0.1663815826177597, 0.1703416407108307, 0.17430169880390167, 0.17826175689697266, 0.18222181499004364, 0.18618187308311462, 0.1901419311761856, 0.1941019892692566, 0.19806204736232758, 0.20202210545539856, 0.20598216354846954, 0.20994220674037933, 0.21390226483345032, 0.2178623229265213, 0.22182238101959229, 0.22578243911266327, 0.22974249720573425, 0.23370255529880524, 0.23766261339187622, 0.2416226714849472]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 4.0, 6.0, 9.0, 12.0, 27.0, 16.0, 23.0, 32.0, 28.0, 39.0, 42.0, 49.0, 61.0, 44.0, 46.0, 66.0, 60.0, 43.0, 60.0, 40.0, 41.0, 45.0, 24.0, 27.0, 18.0, 31.0, 28.0, 23.0, 18.0, 11.0, 10.0, 4.0, 4.0, 3.0, 6.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0056258440017700195, -0.005465121939778328, -0.005304399877786636, -0.005143677815794945, -0.004982955753803253, -0.004822233691811562, -0.00466151162981987, -0.004500789567828178, -0.004340067505836487, -0.004179345443844795, -0.004018623381853104, -0.003857901319861412, -0.0036971792578697205, -0.003536457195878029, -0.0033757351338863373, -0.0032150130718946457, -0.003054291009902954, -0.0028935689479112625, -0.002732846885919571, -0.0025721248239278793, -0.0024114027619361877, -0.002250680699944496, -0.0020899586379528046, -0.001929236575961113, -0.0017685145139694214, -0.0016077924519777298, -0.0014470703899860382, -0.0012863483279943466, -0.001125626266002655, -0.0009649042040109634, -0.0008041821420192719, -0.0006434600800275803, -0.00048273801803588867, -0.0003220159560441971, -0.0001612938940525055, -5.718320608139038e-07, 0.00016015022993087769, 0.0003208722919225693, 0.00048159435391426086, 0.0006423164159059525, 0.000803038477897644, 0.0009637605398893356, 0.0011244826018810272, 0.0012852046638727188, 0.0014459267258644104, 0.001606648787856102, 0.0017673708498477936, 0.0019280929118394852, 0.0020888149738311768, 0.0022495370358228683, 0.00241025909781456, 0.0025709811598062515, 0.002731703221797943, 0.0028924252837896347, 0.0030531473457813263, 0.003213869407773018, 0.0033745914697647095, 0.003535313531756401, 0.0036960355937480927, 0.0038567576557397842, 0.004017479717731476, 0.004178201779723167, 0.004338923841714859, 0.004499645903706551, 0.004660367965698242]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 4.0, 5.0, 9.0, 3.0, 9.0, 4.0, 10.0, 12.0, 11.0, 12.0, 25.0, 24.0, 28.0, 39.0, 40.0, 35.0, 48.0, 36.0, 31.0, 52.0, 42.0, 41.0, 56.0, 45.0, 44.0, 42.0, 42.0, 31.0, 29.0, 24.0, 29.0, 32.0, 19.0, 19.0, 5.0, 14.0, 12.0, 7.0, 16.0, 6.0, 5.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.595703125, -2.510894775390625, -2.42608642578125, -2.341278076171875, -2.2564697265625, -2.171661376953125, -2.08685302734375, -2.002044677734375, -1.917236328125, -1.832427978515625, -1.74761962890625, -1.662811279296875, -1.5780029296875, -1.493194580078125, -1.40838623046875, -1.323577880859375, -1.23876953125, -1.153961181640625, -1.06915283203125, -0.984344482421875, -0.8995361328125, -0.814727783203125, -0.72991943359375, -0.645111083984375, -0.560302734375, -0.475494384765625, -0.39068603515625, -0.305877685546875, -0.2210693359375, -0.136260986328125, -0.05145263671875, 0.033355712890625, 0.1181640625, 0.202972412109375, 0.28778076171875, 0.372589111328125, 0.4573974609375, 0.542205810546875, 0.62701416015625, 0.711822509765625, 0.796630859375, 0.881439208984375, 0.96624755859375, 1.051055908203125, 1.1358642578125, 1.220672607421875, 1.30548095703125, 1.390289306640625, 1.47509765625, 1.559906005859375, 1.64471435546875, 1.729522705078125, 1.8143310546875, 1.899139404296875, 1.98394775390625, 2.068756103515625, 2.153564453125, 2.238372802734375, 2.32318115234375, 2.407989501953125, 2.4927978515625, 2.577606201171875, 2.66241455078125, 2.747222900390625, 2.83203125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 3.0, 5.0, 15.0, 14.0, 21.0, 33.0, 42.0, 52.0, 56.0, 64.0, 101.0, 153.0, 175.0, 250.0, 360.0, 501.0, 750.0, 1243.0, 2352.0, 5296.0, 16914.0, 78457.0, 417038.0, 417686.0, 78633.0, 16772.0, 5304.0, 2422.0, 1249.0, 743.0, 504.0, 369.0, 244.0, 171.0, 143.0, 103.0, 75.0, 61.0, 57.0, 36.0, 27.0, 16.0, 17.0, 12.0, 8.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-4.2421875, -4.1053466796875, -3.968505859375, -3.8316650390625, -3.69482421875, -3.5579833984375, -3.421142578125, -3.2843017578125, -3.1474609375, -3.0106201171875, -2.873779296875, -2.7369384765625, -2.60009765625, -2.4632568359375, -2.326416015625, -2.1895751953125, -2.052734375, -1.9158935546875, -1.779052734375, -1.6422119140625, -1.50537109375, -1.3685302734375, -1.231689453125, -1.0948486328125, -0.9580078125, -0.8211669921875, -0.684326171875, -0.5474853515625, -0.41064453125, -0.2738037109375, -0.136962890625, -0.0001220703125, 0.13671875, 0.2735595703125, 0.410400390625, 0.5472412109375, 0.68408203125, 0.8209228515625, 0.957763671875, 1.0946044921875, 1.2314453125, 1.3682861328125, 1.505126953125, 1.6419677734375, 1.77880859375, 1.9156494140625, 2.052490234375, 2.1893310546875, 2.326171875, 2.4630126953125, 2.599853515625, 2.7366943359375, 2.87353515625, 3.0103759765625, 3.147216796875, 3.2840576171875, 3.4208984375, 3.5577392578125, 3.694580078125, 3.8314208984375, 3.96826171875, 4.1051025390625, 4.241943359375, 4.3787841796875, 4.515625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 3.0, 8.0, 8.0, 12.0, 13.0, 18.0, 20.0, 20.0, 26.0, 33.0, 40.0, 45.0, 67.0, 70.0, 127.0, 264.0, 1377.0, 307.0, 155.0, 88.0, 53.0, 60.0, 51.0, 39.0, 25.0, 21.0, 24.0, 16.0, 9.0, 9.0, 12.0, 8.0, 7.0, 5.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.94140625, -6.69097900390625, -6.4405517578125, -6.19012451171875, -5.939697265625, -5.68927001953125, -5.4388427734375, -5.18841552734375, -4.93798828125, -4.68756103515625, -4.4371337890625, -4.18670654296875, -3.936279296875, -3.68585205078125, -3.4354248046875, -3.18499755859375, -2.9345703125, -2.68414306640625, -2.4337158203125, -2.18328857421875, -1.932861328125, -1.68243408203125, -1.4320068359375, -1.18157958984375, -0.93115234375, -0.68072509765625, -0.4302978515625, -0.17987060546875, 0.070556640625, 0.32098388671875, 0.5714111328125, 0.82183837890625, 1.072265625, 1.32269287109375, 1.5731201171875, 1.82354736328125, 2.073974609375, 2.32440185546875, 2.5748291015625, 2.82525634765625, 3.07568359375, 3.32611083984375, 3.5765380859375, 3.82696533203125, 4.077392578125, 4.32781982421875, 4.5782470703125, 4.82867431640625, 5.0791015625, 5.32952880859375, 5.5799560546875, 5.83038330078125, 6.080810546875, 6.33123779296875, 6.5816650390625, 6.83209228515625, 7.08251953125, 7.33294677734375, 7.5833740234375, 7.83380126953125, 8.084228515625, 8.33465576171875, 8.5850830078125, 8.83551025390625, 9.0859375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 5.0, 7.0, 7.0, 16.0, 16.0, 25.0, 30.0, 52.0, 66.0, 81.0, 120.0, 197.0, 313.0, 602.0, 1692.0, 35118.0, 3091497.0, 13092.0, 1380.0, 470.0, 315.0, 190.0, 113.0, 72.0, 53.0, 47.0, 35.0, 22.0, 16.0, 15.0, 8.0, 7.0, 3.0, 3.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-19.609375, -19.0706787109375, -18.531982421875, -17.9932861328125, -17.45458984375, -16.9158935546875, -16.377197265625, -15.8385009765625, -15.2998046875, -14.7611083984375, -14.222412109375, -13.6837158203125, -13.14501953125, -12.6063232421875, -12.067626953125, -11.5289306640625, -10.990234375, -10.4515380859375, -9.912841796875, -9.3741455078125, -8.83544921875, -8.2967529296875, -7.758056640625, -7.2193603515625, -6.6806640625, -6.1419677734375, -5.603271484375, -5.0645751953125, -4.52587890625, -3.9871826171875, -3.448486328125, -2.9097900390625, -2.37109375, -1.8323974609375, -1.293701171875, -0.7550048828125, -0.21630859375, 0.3223876953125, 0.861083984375, 1.3997802734375, 1.9384765625, 2.4771728515625, 3.015869140625, 3.5545654296875, 4.09326171875, 4.6319580078125, 5.170654296875, 5.7093505859375, 6.248046875, 6.7867431640625, 7.325439453125, 7.8641357421875, 8.40283203125, 8.9415283203125, 9.480224609375, 10.0189208984375, 10.5576171875, 11.0963134765625, 11.635009765625, 12.1737060546875, 12.71240234375, 13.2510986328125, 13.789794921875, 14.3284912109375, 14.8671875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 16.0, 224.0, 649.0, 115.0, 9.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-99.40681457519531, -96.88101959228516, -94.35521697998047, -91.82942199707031, -89.30362701416016, -86.77783203125, -84.25202941894531, -81.72623443603516, -79.200439453125, -76.67464447021484, -74.14884185791016, -71.623046875, -69.09725189208984, -66.57145690917969, -64.045654296875, -61.519859313964844, -58.99406051635742, -56.46826171875, -53.942466735839844, -51.41666793823242, -48.890872955322266, -46.365074157714844, -43.83927917480469, -41.313480377197266, -38.787681579589844, -36.26188278198242, -33.736087799072266, -31.210289001464844, -28.684494018554688, -26.158695220947266, -23.632898330688477, -21.107101440429688, -18.581310272216797, -16.055513381958008, -13.529716491699219, -11.003918647766113, -8.478121757507324, -5.952324867248535, -3.4265270233154297, -0.9007301330566406, 1.6250667572021484, 4.1508636474609375, 6.676661014556885, 9.202458381652832, 11.728255271911621, 14.25405216217041, 16.779850006103516, 19.305646896362305, 21.831443786621094, 24.357240676879883, 26.883037567138672, 29.408836364746094, 31.93463134765625, 34.46043014526367, 36.986228942871094, 39.51202392578125, 42.037818908691406, 44.56361770629883, 47.089412689208984, 49.615211486816406, 52.14100646972656, 54.666805267333984, 57.192604064941406, 59.71839904785156, 62.244197845458984]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 5.0, 4.0, 5.0, 5.0, 4.0, 6.0, 6.0, 10.0, 8.0, 4.0, 8.0, 21.0, 17.0, 20.0, 19.0, 32.0, 25.0, 26.0, 26.0, 38.0, 42.0, 39.0, 37.0, 40.0, 27.0, 39.0, 39.0, 40.0, 37.0, 32.0, 41.0, 44.0, 34.0, 28.0, 26.0, 19.0, 29.0, 27.0, 17.0, 15.0, 16.0, 14.0, 6.0, 12.0, 4.0, 6.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.358322143554688, -14.883041381835938, -14.407760620117188, -13.932479858398438, -13.457200050354004, -12.981919288635254, -12.506638526916504, -12.031357765197754, -11.55607795715332, -11.08079719543457, -10.60551643371582, -10.13023567199707, -9.654955863952637, -9.179675102233887, -8.704394340515137, -8.229113578796387, -7.753832817077637, -7.278552055358887, -6.803271770477295, -6.327991008758545, -5.852710723876953, -5.377429962158203, -4.902149200439453, -4.426868438720703, -3.9515881538391113, -3.4763076305389404, -3.0010271072387695, -2.5257463455200195, -2.0504658222198486, -1.5751852989196777, -1.0999045372009277, -0.6246240139007568, -0.14934349060058594, 0.32593709230422974, 0.8012176752090454, 1.2764983177185059, 1.7517788410186768, 2.2270593643188477, 2.7023401260375977, 3.1776206493377686, 3.6529011726379395, 4.1281819343566895, 4.603462219238281, 5.078742980957031, 5.554023742675781, 6.029304027557373, 6.504584789276123, 6.979865074157715, 7.455145835876465, 7.930426597595215, 8.405707359313965, 8.880987167358398, 9.356267929077148, 9.831548690795898, 10.306829452514648, 10.782110214233398, 11.257390975952148, 11.732671737670898, 12.207952499389648, 12.683233261108398, 13.158513069152832, 13.633793830871582, 14.109074592590332, 14.584355354309082, 15.059635162353516]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 3.0, 7.0, 2.0, 12.0, 3.0, 13.0, 15.0, 13.0, 17.0, 16.0, 31.0, 24.0, 29.0, 31.0, 25.0, 28.0, 31.0, 41.0, 39.0, 42.0, 36.0, 33.0, 36.0, 30.0, 33.0, 30.0, 44.0, 38.0, 30.0, 31.0, 20.0, 29.0, 19.0, 11.0, 21.0, 21.0, 14.0, 15.0, 11.0, 15.0, 10.0, 11.0, 7.0, 4.0, 6.0, 2.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 3.0], "bins": [-2.494140625, -2.41497802734375, -2.3358154296875, -2.25665283203125, -2.177490234375, -2.09832763671875, -2.0191650390625, -1.94000244140625, -1.86083984375, -1.78167724609375, -1.7025146484375, -1.62335205078125, -1.544189453125, -1.46502685546875, -1.3858642578125, -1.30670166015625, -1.2275390625, -1.14837646484375, -1.0692138671875, -0.99005126953125, -0.910888671875, -0.83172607421875, -0.7525634765625, -0.67340087890625, -0.59423828125, -0.51507568359375, -0.4359130859375, -0.35675048828125, -0.277587890625, -0.19842529296875, -0.1192626953125, -0.04010009765625, 0.0390625, 0.11822509765625, 0.1973876953125, 0.27655029296875, 0.355712890625, 0.43487548828125, 0.5140380859375, 0.59320068359375, 0.67236328125, 0.75152587890625, 0.8306884765625, 0.90985107421875, 0.989013671875, 1.06817626953125, 1.1473388671875, 1.22650146484375, 1.3056640625, 1.38482666015625, 1.4639892578125, 1.54315185546875, 1.622314453125, 1.70147705078125, 1.7806396484375, 1.85980224609375, 1.93896484375, 2.01812744140625, 2.0972900390625, 2.17645263671875, 2.255615234375, 2.33477783203125, 2.4139404296875, 2.49310302734375, 2.572265625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 1.0, 8.0, 8.0, 6.0, 12.0, 15.0, 23.0, 29.0, 27.0, 42.0, 53.0, 82.0, 103.0, 126.0, 148.0, 212.0, 276.0, 338.0, 464.0, 677.0, 1216.0, 3182.0, 16196.0, 287198.0, 3111322.0, 730898.0, 32622.0, 4566.0, 1484.0, 777.0, 546.0, 372.0, 257.0, 210.0, 168.0, 143.0, 110.0, 92.0, 68.0, 53.0, 33.0, 29.0, 24.0, 18.0, 12.0, 7.0, 7.0, 5.0, 4.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0], "bins": [-11.6953125, -11.32568359375, -10.9560546875, -10.58642578125, -10.216796875, -9.84716796875, -9.4775390625, -9.10791015625, -8.73828125, -8.36865234375, -7.9990234375, -7.62939453125, -7.259765625, -6.89013671875, -6.5205078125, -6.15087890625, -5.78125, -5.41162109375, -5.0419921875, -4.67236328125, -4.302734375, -3.93310546875, -3.5634765625, -3.19384765625, -2.82421875, -2.45458984375, -2.0849609375, -1.71533203125, -1.345703125, -0.97607421875, -0.6064453125, -0.23681640625, 0.1328125, 0.50244140625, 0.8720703125, 1.24169921875, 1.611328125, 1.98095703125, 2.3505859375, 2.72021484375, 3.08984375, 3.45947265625, 3.8291015625, 4.19873046875, 4.568359375, 4.93798828125, 5.3076171875, 5.67724609375, 6.046875, 6.41650390625, 6.7861328125, 7.15576171875, 7.525390625, 7.89501953125, 8.2646484375, 8.63427734375, 9.00390625, 9.37353515625, 9.7431640625, 10.11279296875, 10.482421875, 10.85205078125, 11.2216796875, 11.59130859375, 11.9609375]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 10.0, 22.0, 33.0, 38.0, 80.0, 121.0, 181.0, 302.0, 366.0, 547.0, 575.0, 502.0, 427.0, 279.0, 215.0, 134.0, 79.0, 66.0, 35.0, 23.0, 17.0, 7.0, 6.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4609375, -9.24456787109375, -9.0281982421875, -8.81182861328125, -8.595458984375, -8.37908935546875, -8.1627197265625, -7.94635009765625, -7.72998046875, -7.51361083984375, -7.2972412109375, -7.08087158203125, -6.864501953125, -6.64813232421875, -6.4317626953125, -6.21539306640625, -5.9990234375, -5.78265380859375, -5.5662841796875, -5.34991455078125, -5.133544921875, -4.91717529296875, -4.7008056640625, -4.48443603515625, -4.26806640625, -4.05169677734375, -3.8353271484375, -3.61895751953125, -3.402587890625, -3.18621826171875, -2.9698486328125, -2.75347900390625, -2.537109375, -2.32073974609375, -2.1043701171875, -1.88800048828125, -1.671630859375, -1.45526123046875, -1.2388916015625, -1.02252197265625, -0.80615234375, -0.58978271484375, -0.3734130859375, -0.15704345703125, 0.059326171875, 0.27569580078125, 0.4920654296875, 0.70843505859375, 0.9248046875, 1.14117431640625, 1.3575439453125, 1.57391357421875, 1.790283203125, 2.00665283203125, 2.2230224609375, 2.43939208984375, 2.65576171875, 2.87213134765625, 3.0885009765625, 3.30487060546875, 3.521240234375, 3.73760986328125, 3.9539794921875, 4.17034912109375, 4.38671875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 2.0, 1.0, 4.0, 6.0, 7.0, 6.0, 14.0, 17.0, 40.0, 59.0, 139.0, 271.0, 573.0, 1501.0, 5171.0, 32526.0, 366271.0, 2730766.0, 965589.0, 77831.0, 9755.0, 2221.0, 765.0, 347.0, 163.0, 94.0, 50.0, 26.0, 23.0, 14.0, 9.0, 5.0, 2.0, 9.0, 1.0, 0.0, 3.0, 4.0], "bins": [-10.109375, -9.87799072265625, -9.6466064453125, -9.41522216796875, -9.183837890625, -8.95245361328125, -8.7210693359375, -8.48968505859375, -8.25830078125, -8.02691650390625, -7.7955322265625, -7.56414794921875, -7.332763671875, -7.10137939453125, -6.8699951171875, -6.63861083984375, -6.4072265625, -6.17584228515625, -5.9444580078125, -5.71307373046875, -5.481689453125, -5.25030517578125, -5.0189208984375, -4.78753662109375, -4.55615234375, -4.32476806640625, -4.0933837890625, -3.86199951171875, -3.630615234375, -3.39923095703125, -3.1678466796875, -2.93646240234375, -2.705078125, -2.47369384765625, -2.2423095703125, -2.01092529296875, -1.779541015625, -1.54815673828125, -1.3167724609375, -1.08538818359375, -0.85400390625, -0.62261962890625, -0.3912353515625, -0.15985107421875, 0.071533203125, 0.30291748046875, 0.5343017578125, 0.76568603515625, 0.9970703125, 1.22845458984375, 1.4598388671875, 1.69122314453125, 1.922607421875, 2.15399169921875, 2.3853759765625, 2.61676025390625, 2.84814453125, 3.07952880859375, 3.3109130859375, 3.54229736328125, 3.773681640625, 4.00506591796875, 4.2364501953125, 4.46783447265625, 4.69921875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 6.0, 1.0, 5.0, 4.0, 18.0, 12.0, 23.0, 34.0, 46.0, 53.0, 64.0, 70.0, 73.0, 87.0, 85.0, 79.0, 66.0, 57.0, 52.0, 44.0, 36.0, 30.0, 22.0, 12.0, 10.0, 6.0, 5.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.712732315063477, -28.638427734375, -27.564125061035156, -26.48982048034668, -25.415515899658203, -24.34121322631836, -23.266908645629883, -22.192604064941406, -21.118301391601562, -20.043996810913086, -18.969694137573242, -17.895389556884766, -16.82108497619629, -15.746781349182129, -14.672477722167969, -13.598173141479492, -12.523868560791016, -11.449564933776855, -10.375260353088379, -9.300956726074219, -8.226652145385742, -7.152348518371582, -6.078044891357422, -5.0037407875061035, -3.929436683654785, -2.855132579803467, -1.7808287143707275, -0.7065248489379883, 0.3677792549133301, 1.4420833587646484, 2.5163869857788086, 3.590691089630127, 4.6649932861328125, 5.739297389984131, 6.813601493835449, 7.887905120849609, 8.962209701538086, 10.036513328552246, 11.110816955566406, 12.185121536254883, 13.259425163269043, 14.333728790283203, 15.40803337097168, 16.482337951660156, 17.556640625, 18.630945205688477, 19.705249786376953, 20.779552459716797, 21.853857040405273, 22.92816162109375, 24.002464294433594, 25.07676887512207, 26.151073455810547, 27.22537612915039, 28.299680709838867, 29.373985290527344, 30.448287963867188, 31.522592544555664, 32.59689712524414, 33.671199798583984, 34.74550247192383, 35.81980895996094, 36.89411163330078, 37.968414306640625, 39.042720794677734]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 2.0, 6.0, 11.0, 4.0, 13.0, 11.0, 21.0, 13.0, 30.0, 22.0, 25.0, 31.0, 23.0, 31.0, 47.0, 36.0, 35.0, 64.0, 37.0, 49.0, 39.0, 35.0, 40.0, 29.0, 33.0, 35.0, 38.0, 34.0, 30.0, 28.0, 26.0, 24.0, 17.0, 14.0, 16.0, 10.0, 6.0, 8.0, 6.0, 9.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.350887298583984, -20.664461135864258, -19.9780330657959, -19.291606903076172, -18.605178833007812, -17.918752670288086, -17.23232650756836, -16.5458984375, -15.859472274780273, -15.17304515838623, -14.486618041992188, -13.800191879272461, -13.113764762878418, -12.427337646484375, -11.740911483764648, -11.054484367370605, -10.368057250976562, -9.68163013458252, -8.995203018188477, -8.30877685546875, -7.622349739074707, -6.935922622680664, -6.249495983123779, -5.5630693435668945, -4.876642227172852, -4.190215110778809, -3.503788471221924, -2.81736159324646, -2.130934715270996, -1.4445078372955322, -0.7580809593200684, -0.0716543197631836, 0.6147727966308594, 1.3011996746063232, 1.987626552581787, 2.674053430557251, 3.360480308532715, 4.046907424926758, 4.733334064483643, 5.419760704040527, 6.10618782043457, 6.792614936828613, 7.479041576385498, 8.165468215942383, 8.851895332336426, 9.538322448730469, 10.224748611450195, 10.911175727844238, 11.597602844238281, 12.284029960632324, 12.970457077026367, 13.656883239746094, 14.343310356140137, 15.02973747253418, 15.716163635253906, 16.402591705322266, 17.089017868041992, 17.77544403076172, 18.461872100830078, 19.148298263549805, 19.83472442626953, 20.52115249633789, 21.207578659057617, 21.894004821777344, 22.580432891845703]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 5.0, 3.0, 4.0, 5.0, 6.0, 9.0, 11.0, 16.0, 15.0, 24.0, 22.0, 21.0, 29.0, 33.0, 34.0, 38.0, 38.0, 48.0, 52.0, 48.0, 45.0, 35.0, 39.0, 35.0, 39.0, 38.0, 33.0, 40.0, 35.0, 36.0, 37.0, 27.0, 12.0, 13.0, 20.0, 9.0, 16.0, 12.0, 4.0, 6.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-43.53125, -42.1513671875, -40.771484375, -39.3916015625, -38.01171875, -36.6318359375, -35.251953125, -33.8720703125, -32.4921875, -31.1123046875, -29.732421875, -28.3525390625, -26.97265625, -25.5927734375, -24.212890625, -22.8330078125, -21.453125, -20.0732421875, -18.693359375, -17.3134765625, -15.93359375, -14.5537109375, -13.173828125, -11.7939453125, -10.4140625, -9.0341796875, -7.654296875, -6.2744140625, -4.89453125, -3.5146484375, -2.134765625, -0.7548828125, 0.625, 2.0048828125, 3.384765625, 4.7646484375, 6.14453125, 7.5244140625, 8.904296875, 10.2841796875, 11.6640625, 13.0439453125, 14.423828125, 15.8037109375, 17.18359375, 18.5634765625, 19.943359375, 21.3232421875, 22.703125, 24.0830078125, 25.462890625, 26.8427734375, 28.22265625, 29.6025390625, 30.982421875, 32.3623046875, 33.7421875, 35.1220703125, 36.501953125, 37.8818359375, 39.26171875, 40.6416015625, 42.021484375, 43.4013671875, 44.78125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 2.0, 9.0, 10.0, 17.0, 18.0, 24.0, 51.0, 68.0, 106.0, 149.0, 233.0, 363.0, 585.0, 843.0, 1336.0, 1996.0, 3205.0, 4761.0, 7430.0, 11725.0, 18303.0, 28831.0, 46347.0, 75125.0, 118750.0, 169856.0, 182206.0, 137152.0, 89198.0, 55448.0, 34498.0, 21486.0, 13692.0, 8585.0, 5714.0, 3612.0, 2405.0, 1543.0, 987.0, 639.0, 422.0, 280.0, 207.0, 121.0, 83.0, 54.0, 28.0, 24.0, 15.0, 4.0, 5.0, 4.0, 7.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.435546875, -2.352081298828125, -2.26861572265625, -2.185150146484375, -2.1016845703125, -2.018218994140625, -1.93475341796875, -1.851287841796875, -1.767822265625, -1.684356689453125, -1.60089111328125, -1.517425537109375, -1.4339599609375, -1.350494384765625, -1.26702880859375, -1.183563232421875, -1.10009765625, -1.016632080078125, -0.93316650390625, -0.849700927734375, -0.7662353515625, -0.682769775390625, -0.59930419921875, -0.515838623046875, -0.432373046875, -0.348907470703125, -0.26544189453125, -0.181976318359375, -0.0985107421875, -0.015045166015625, 0.06842041015625, 0.151885986328125, 0.2353515625, 0.318817138671875, 0.40228271484375, 0.485748291015625, 0.5692138671875, 0.652679443359375, 0.73614501953125, 0.819610595703125, 0.903076171875, 0.986541748046875, 1.07000732421875, 1.153472900390625, 1.2369384765625, 1.320404052734375, 1.40386962890625, 1.487335205078125, 1.57080078125, 1.654266357421875, 1.73773193359375, 1.821197509765625, 1.9046630859375, 1.988128662109375, 2.07159423828125, 2.155059814453125, 2.238525390625, 2.321990966796875, 2.40545654296875, 2.488922119140625, 2.5723876953125, 2.655853271484375, 2.73931884765625, 2.822784423828125, 2.90625]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 14.0, 13.0, 13.0, 21.0, 15.0, 18.0, 17.0, 23.0, 33.0, 23.0, 25.0, 35.0, 34.0, 26.0, 37.0, 44.0, 38.0, 42.0, 1063.0, 49.0, 36.0, 30.0, 33.0, 30.0, 34.0, 29.0, 24.0, 31.0, 27.0, 18.0, 18.0, 10.0, 23.0, 11.0, 17.0, 9.0, 14.0, 3.0, 5.0, 4.0, 6.0, 6.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0], "bins": [-26.78125, -25.96484375, -25.1484375, -24.33203125, -23.515625, -22.69921875, -21.8828125, -21.06640625, -20.25, -19.43359375, -18.6171875, -17.80078125, -16.984375, -16.16796875, -15.3515625, -14.53515625, -13.71875, -12.90234375, -12.0859375, -11.26953125, -10.453125, -9.63671875, -8.8203125, -8.00390625, -7.1875, -6.37109375, -5.5546875, -4.73828125, -3.921875, -3.10546875, -2.2890625, -1.47265625, -0.65625, 0.16015625, 0.9765625, 1.79296875, 2.609375, 3.42578125, 4.2421875, 5.05859375, 5.875, 6.69140625, 7.5078125, 8.32421875, 9.140625, 9.95703125, 10.7734375, 11.58984375, 12.40625, 13.22265625, 14.0390625, 14.85546875, 15.671875, 16.48828125, 17.3046875, 18.12109375, 18.9375, 19.75390625, 20.5703125, 21.38671875, 22.203125, 23.01953125, 23.8359375, 24.65234375, 25.46875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 6.0, 7.0, 9.0, 20.0, 22.0, 26.0, 46.0, 66.0, 93.0, 160.0, 231.0, 364.0, 612.0, 903.0, 1487.0, 2235.0, 3784.0, 6336.0, 10226.0, 17281.0, 28926.0, 48227.0, 78836.0, 123409.0, 174837.0, 1224025.0, 139888.0, 92127.0, 56852.0, 34589.0, 20547.0, 11903.0, 7297.0, 4382.0, 2743.0, 1622.0, 1114.0, 669.0, 420.0, 279.0, 174.0, 101.0, 81.0, 56.0, 39.0, 22.0, 25.0, 15.0, 6.0, 9.0, 7.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-1.9716796875, -1.9122314453125, -1.852783203125, -1.7933349609375, -1.73388671875, -1.6744384765625, -1.614990234375, -1.5555419921875, -1.49609375, -1.4366455078125, -1.377197265625, -1.3177490234375, -1.25830078125, -1.1988525390625, -1.139404296875, -1.0799560546875, -1.0205078125, -0.9610595703125, -0.901611328125, -0.8421630859375, -0.78271484375, -0.7232666015625, -0.663818359375, -0.6043701171875, -0.544921875, -0.4854736328125, -0.426025390625, -0.3665771484375, -0.30712890625, -0.2476806640625, -0.188232421875, -0.1287841796875, -0.0693359375, -0.0098876953125, 0.049560546875, 0.1090087890625, 0.16845703125, 0.2279052734375, 0.287353515625, 0.3468017578125, 0.40625, 0.4656982421875, 0.525146484375, 0.5845947265625, 0.64404296875, 0.7034912109375, 0.762939453125, 0.8223876953125, 0.8818359375, 0.9412841796875, 1.000732421875, 1.0601806640625, 1.11962890625, 1.1790771484375, 1.238525390625, 1.2979736328125, 1.357421875, 1.4168701171875, 1.476318359375, 1.5357666015625, 1.59521484375, 1.6546630859375, 1.714111328125, 1.7735595703125, 1.8330078125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 6.0, 1.0, 4.0, 9.0, 9.0, 8.0, 11.0, 11.0, 8.0, 8.0, 9.0, 13.0, 22.0, 16.0, 30.0, 40.0, 27.0, 41.0, 51.0, 70.0, 86.0, 73.0, 62.0, 62.0, 41.0, 42.0, 33.0, 40.0, 33.0, 29.0, 16.0, 11.0, 10.0, 12.0, 10.0, 8.0, 7.0, 6.0, 7.0, 6.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0220489501953125, -0.021314620971679688, -0.020580291748046875, -0.019845962524414062, -0.01911163330078125, -0.018377304077148438, -0.017642974853515625, -0.016908645629882812, -0.01617431640625, -0.015439987182617188, -0.014705657958984375, -0.013971328735351562, -0.01323699951171875, -0.012502670288085938, -0.011768341064453125, -0.011034011840820312, -0.0102996826171875, -0.009565353393554688, -0.008831024169921875, -0.008096694946289062, -0.00736236572265625, -0.0066280364990234375, -0.005893707275390625, -0.0051593780517578125, -0.004425048828125, -0.0036907196044921875, -0.002956390380859375, -0.0022220611572265625, -0.00148773193359375, -0.0007534027099609375, -1.9073486328125e-05, 0.0007152557373046875, 0.0014495849609375, 0.0021839141845703125, 0.002918243408203125, 0.0036525726318359375, 0.00438690185546875, 0.0051212310791015625, 0.005855560302734375, 0.0065898895263671875, 0.00732421875, 0.008058547973632812, 0.008792877197265625, 0.009527206420898438, 0.01026153564453125, 0.010995864868164062, 0.011730194091796875, 0.012464523315429688, 0.0131988525390625, 0.013933181762695312, 0.014667510986328125, 0.015401840209960938, 0.01613616943359375, 0.016870498657226562, 0.017604827880859375, 0.018339157104492188, 0.019073486328125, 0.019807815551757812, 0.020542144775390625, 0.021276473999023438, 0.02201080322265625, 0.022745132446289062, 0.023479461669921875, 0.024213790893554688, 0.0249481201171875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 6.0, 10.0, 11.0, 27.0, 19.0, 43.0, 53.0, 72.0, 116.0, 157.0, 238.0, 342.0, 569.0, 956.0, 1684.0, 3134.0, 6656.0, 15282.0, 40713.0, 136722.0, 476002.0, 256565.0, 66690.0, 23253.0, 9473.0, 4389.0, 2216.0, 1157.0, 714.0, 400.0, 269.0, 200.0, 108.0, 84.0, 60.0, 47.0, 43.0, 22.0, 13.0, 14.0, 5.0, 4.0, 5.0, 2.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1192626953125, -0.11561775207519531, -0.11197280883789062, -0.10832786560058594, -0.10468292236328125, -0.10103797912597656, -0.09739303588867188, -0.09374809265136719, -0.0901031494140625, -0.08645820617675781, -0.08281326293945312, -0.07916831970214844, -0.07552337646484375, -0.07187843322753906, -0.06823348999023438, -0.06458854675292969, -0.060943603515625, -0.05729866027832031, -0.053653717041015625, -0.05000877380371094, -0.04636383056640625, -0.04271888732910156, -0.039073944091796875, -0.03542900085449219, -0.0317840576171875, -0.028139114379882812, -0.024494171142578125, -0.020849227905273438, -0.01720428466796875, -0.013559341430664062, -0.009914398193359375, -0.0062694549560546875, -0.00262451171875, 0.0010204315185546875, 0.004665374755859375, 0.008310317993164062, 0.01195526123046875, 0.015600204467773438, 0.019245147705078125, 0.022890090942382812, 0.0265350341796875, 0.030179977416992188, 0.033824920654296875, 0.03746986389160156, 0.04111480712890625, 0.04475975036621094, 0.048404693603515625, 0.05204963684082031, 0.055694580078125, 0.05933952331542969, 0.06298446655273438, 0.06662940979003906, 0.07027435302734375, 0.07391929626464844, 0.07756423950195312, 0.08120918273925781, 0.0848541259765625, 0.08849906921386719, 0.09214401245117188, 0.09578895568847656, 0.09943389892578125, 0.10307884216308594, 0.10672378540039062, 0.11036872863769531, 0.114013671875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 9.0, 3.0, 5.0, 7.0, 7.0, 9.0, 10.0, 8.0, 16.0, 24.0, 19.0, 25.0, 30.0, 43.0, 58.0, 70.0, 96.0, 118.0, 118.0, 103.0, 70.0, 56.0, 27.0, 19.0, 6.0, 20.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.06797152012586594, -0.06644570827484131, -0.06491989642381668, -0.06339408457279205, -0.061868276447057724, -0.060342464596033096, -0.05881665274500847, -0.05729084089398384, -0.05576502904295921, -0.054239217191934586, -0.05271340534090996, -0.05118759721517563, -0.049661785364151, -0.04813597351312637, -0.046610161662101746, -0.04508434981107712, -0.04355853796005249, -0.04203272610902786, -0.040506914258003235, -0.03898110240697861, -0.03745529428124428, -0.03592948243021965, -0.03440367057919502, -0.032877858728170395, -0.031352050602436066, -0.029826238751411438, -0.02830042876303196, -0.026774616912007332, -0.025248805060982704, -0.023722995072603226, -0.022197183221578598, -0.02067137137055397, -0.019145561382174492, -0.017619749531149864, -0.016093939542770386, -0.014568127691745758, -0.01304231584072113, -0.011516504921019077, -0.009990694001317024, -0.008464882150292397, -0.0069390712305903435, -0.005413259845227003, -0.0038874486926943064, -0.0023616375401616096, -0.0008358261547982693, 0.0006899852305650711, 0.002215796150267124, 0.003741608001291752, 0.005267418920993805, 0.006793230306357145, 0.008319041691720486, 0.009844852611422539, 0.011370664462447166, 0.01289647538214922, 0.014422286301851273, 0.0159480981528759, 0.017473910003900528, 0.018999721854925156, 0.020525531843304634, 0.022051343694329262, 0.02357715554535389, 0.025102965533733368, 0.026628777384757996, 0.028154589235782623, 0.029680399224162102]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 6.0, 8.0, 10.0, 12.0, 18.0, 15.0, 11.0, 20.0, 20.0, 24.0, 30.0, 22.0, 37.0, 27.0, 24.0, 23.0, 26.0, 33.0, 41.0, 35.0, 29.0, 33.0, 41.0, 27.0, 45.0, 30.0, 24.0, 35.0, 25.0, 36.0, 30.0, 28.0, 35.0, 23.0, 10.0, 19.0, 21.0, 8.0, 6.0, 13.0, 13.0, 8.0, 7.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-0.035949885845184326, -0.03481030836701393, -0.033670730888843536, -0.03253115341067314, -0.03139157593250275, -0.03025199845433235, -0.029112420976161957, -0.027972843497991562, -0.026833266019821167, -0.025693688541650772, -0.024554111063480377, -0.023414533585309982, -0.022274956107139587, -0.021135378628969193, -0.019995801150798798, -0.018856223672628403, -0.017716646194458008, -0.016577068716287613, -0.015437491238117218, -0.014297913759946823, -0.013158336281776428, -0.012018758803606033, -0.010879181325435638, -0.009739603847265244, -0.008600026369094849, -0.007460448890924454, -0.006320871412754059, -0.005181293934583664, -0.004041716456413269, -0.002902138978242874, -0.0017625615000724792, -0.0006229840219020844, 0.0005165934562683105, 0.0016561709344387054, 0.0027957484126091003, 0.003935325890779495, 0.00507490336894989, 0.006214480847120285, 0.00735405832529068, 0.008493635803461075, 0.00963321328163147, 0.010772790759801865, 0.01191236823797226, 0.013051945716142654, 0.01419152319431305, 0.015331100672483444, 0.01647067815065384, 0.017610255628824234, 0.01874983310699463, 0.019889410585165024, 0.02102898806333542, 0.022168565541505814, 0.02330814301967621, 0.024447720497846603, 0.025587297976017, 0.026726875454187393, 0.027866452932357788, 0.029006030410528183, 0.030145607888698578, 0.03128518536686897, 0.03242476284503937, 0.03356434032320976, 0.03470391780138016, 0.03584349527955055, 0.03698307275772095]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 5.0, 3.0, 4.0, 6.0, 5.0, 9.0, 12.0, 15.0, 16.0, 22.0, 24.0, 21.0, 26.0, 35.0, 35.0, 38.0, 39.0, 46.0, 53.0, 45.0, 43.0, 39.0, 39.0, 34.0, 41.0, 36.0, 36.0, 37.0, 36.0, 36.0, 38.0, 26.0, 12.0, 14.0, 19.0, 8.0, 17.0, 12.0, 4.0, 6.0, 7.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-43.53125, -42.1513671875, -40.771484375, -39.3916015625, -38.01171875, -36.6318359375, -35.251953125, -33.8720703125, -32.4921875, -31.1123046875, -29.732421875, -28.3525390625, -26.97265625, -25.5927734375, -24.212890625, -22.8330078125, -21.453125, -20.0732421875, -18.693359375, -17.3134765625, -15.93359375, -14.5537109375, -13.173828125, -11.7939453125, -10.4140625, -9.0341796875, -7.654296875, -6.2744140625, -4.89453125, -3.5146484375, -2.134765625, -0.7548828125, 0.625, 2.0048828125, 3.384765625, 4.7646484375, 6.14453125, 7.5244140625, 8.904296875, 10.2841796875, 11.6640625, 13.0439453125, 14.423828125, 15.8037109375, 17.18359375, 18.5634765625, 19.943359375, 21.3232421875, 22.703125, 24.0830078125, 25.462890625, 26.8427734375, 28.22265625, 29.6025390625, 30.982421875, 32.3623046875, 33.7421875, 35.1220703125, 36.501953125, 37.8818359375, 39.26171875, 40.6416015625, 42.021484375, 43.4013671875, 44.78125]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 5.0, 8.0, 14.0, 11.0, 17.0, 27.0, 35.0, 32.0, 54.0, 90.0, 161.0, 254.0, 561.0, 1377.0, 5070.0, 29319.0, 225798.0, 605714.0, 153528.0, 20374.0, 3828.0, 1146.0, 469.0, 218.0, 137.0, 81.0, 61.0, 34.0, 25.0, 19.0, 20.0, 16.0, 12.0, 6.0, 6.0, 6.0, 9.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.234375, -7.97216796875, -7.7099609375, -7.44775390625, -7.185546875, -6.92333984375, -6.6611328125, -6.39892578125, -6.13671875, -5.87451171875, -5.6123046875, -5.35009765625, -5.087890625, -4.82568359375, -4.5634765625, -4.30126953125, -4.0390625, -3.77685546875, -3.5146484375, -3.25244140625, -2.990234375, -2.72802734375, -2.4658203125, -2.20361328125, -1.94140625, -1.67919921875, -1.4169921875, -1.15478515625, -0.892578125, -0.63037109375, -0.3681640625, -0.10595703125, 0.15625, 0.41845703125, 0.6806640625, 0.94287109375, 1.205078125, 1.46728515625, 1.7294921875, 1.99169921875, 2.25390625, 2.51611328125, 2.7783203125, 3.04052734375, 3.302734375, 3.56494140625, 3.8271484375, 4.08935546875, 4.3515625, 4.61376953125, 4.8759765625, 5.13818359375, 5.400390625, 5.66259765625, 5.9248046875, 6.18701171875, 6.44921875, 6.71142578125, 6.9736328125, 7.23583984375, 7.498046875, 7.76025390625, 8.0224609375, 8.28466796875, 8.546875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 10.0, 8.0, 16.0, 30.0, 33.0, 45.0, 74.0, 75.0, 107.0, 2131.0, 130.0, 104.0, 79.0, 71.0, 43.0, 34.0, 24.0, 11.0, 5.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-122.5625, -118.5791015625, -114.595703125, -110.6123046875, -106.62890625, -102.6455078125, -98.662109375, -94.6787109375, -90.6953125, -86.7119140625, -82.728515625, -78.7451171875, -74.76171875, -70.7783203125, -66.794921875, -62.8115234375, -58.828125, -54.8447265625, -50.861328125, -46.8779296875, -42.89453125, -38.9111328125, -34.927734375, -30.9443359375, -26.9609375, -22.9775390625, -18.994140625, -15.0107421875, -11.02734375, -7.0439453125, -3.060546875, 0.9228515625, 4.90625, 8.8896484375, 12.873046875, 16.8564453125, 20.83984375, 24.8232421875, 28.806640625, 32.7900390625, 36.7734375, 40.7568359375, 44.740234375, 48.7236328125, 52.70703125, 56.6904296875, 60.673828125, 64.6572265625, 68.640625, 72.6240234375, 76.607421875, 80.5908203125, 84.57421875, 88.5576171875, 92.541015625, 96.5244140625, 100.5078125, 104.4912109375, 108.474609375, 112.4580078125, 116.44140625, 120.4248046875, 124.408203125, 128.3916015625, 132.375]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 10.0, 20.0, 22.0, 31.0, 56.0, 76.0, 155.0, 275.0, 666.0, 1592.0, 7743.0, 514397.0, 2608206.0, 9376.0, 1707.0, 654.0, 322.0, 168.0, 85.0, 54.0, 34.0, 21.0, 9.0, 4.0, 8.0, 4.0, 2.0, 0.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.875, -18.3511962890625, -17.827392578125, -17.3035888671875, -16.77978515625, -16.2559814453125, -15.732177734375, -15.2083740234375, -14.6845703125, -14.1607666015625, -13.636962890625, -13.1131591796875, -12.58935546875, -12.0655517578125, -11.541748046875, -11.0179443359375, -10.494140625, -9.9703369140625, -9.446533203125, -8.9227294921875, -8.39892578125, -7.8751220703125, -7.351318359375, -6.8275146484375, -6.3037109375, -5.7799072265625, -5.256103515625, -4.7322998046875, -4.20849609375, -3.6846923828125, -3.160888671875, -2.6370849609375, -2.11328125, -1.5894775390625, -1.065673828125, -0.5418701171875, -0.01806640625, 0.5057373046875, 1.029541015625, 1.5533447265625, 2.0771484375, 2.6009521484375, 3.124755859375, 3.6485595703125, 4.17236328125, 4.6961669921875, 5.219970703125, 5.7437744140625, 6.267578125, 6.7913818359375, 7.315185546875, 7.8389892578125, 8.36279296875, 8.8865966796875, 9.410400390625, 9.9342041015625, 10.4580078125, 10.9818115234375, 11.505615234375, 12.0294189453125, 12.55322265625, 13.0770263671875, 13.600830078125, 14.1246337890625, 14.6484375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 5.0, 11.0, 22.0, 27.0, 70.0, 145.0, 182.0, 207.0, 127.0, 88.0, 47.0, 17.0, 16.0, 10.0, 3.0, 9.0, 7.0, 3.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-105.78873443603516, -102.1515121459961, -98.51429748535156, -94.8770751953125, -91.23986053466797, -87.6026382446289, -83.96542358398438, -80.32820129394531, -76.69097900390625, -73.05375671386719, -69.41654205322266, -65.7793197631836, -62.1421012878418, -58.5048828125, -54.8676643371582, -51.230445861816406, -47.59322738647461, -43.95600891113281, -40.318790435791016, -36.68157196044922, -33.044349670410156, -29.40713119506836, -25.769912719726562, -22.132692337036133, -18.495473861694336, -14.858254432678223, -11.22103500366211, -7.5838165283203125, -3.946597099304199, -0.30937767028808594, 3.327840805053711, 6.965061187744141, 10.602279663085938, 14.23949909210205, 17.876718521118164, 21.51393699645996, 25.15115737915039, 28.788375854492188, 32.425594329833984, 36.06281280517578, 39.700035095214844, 43.33725357055664, 46.97447204589844, 50.6116943359375, 54.2489128112793, 57.886131286621094, 61.52334976196289, 65.16056823730469, 68.79779052734375, 72.43501281738281, 76.07222747802734, 79.7094497680664, 83.34666442871094, 86.98388671875, 90.62110900878906, 94.2583236694336, 97.89553833007812, 101.53276062011719, 105.16997528076172, 108.80719757080078, 112.44441223144531, 116.08163452148438, 119.71885681152344, 123.35607147216797, 126.99329376220703]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 6.0, 10.0, 11.0, 6.0, 6.0, 18.0, 14.0, 17.0, 18.0, 26.0, 25.0, 33.0, 27.0, 28.0, 38.0, 36.0, 39.0, 44.0, 37.0, 49.0, 41.0, 44.0, 39.0, 44.0, 29.0, 38.0, 18.0, 38.0, 26.0, 30.0, 19.0, 24.0, 27.0, 25.0, 12.0, 10.0, 14.0, 8.0, 10.0, 4.0, 2.0, 2.0, 3.0, 3.0, 6.0, 2.0, 2.0], "bins": [-87.40695190429688, -85.05265045166016, -82.69834899902344, -80.34403991699219, -77.98973846435547, -75.63543701171875, -73.28113555908203, -70.92683410644531, -68.5725326538086, -66.21823120117188, -63.86392593383789, -61.50962448120117, -59.15532302856445, -56.80101776123047, -54.44671630859375, -52.09241485595703, -49.73810958862305, -47.38380813598633, -45.029502868652344, -42.675201416015625, -40.320899963378906, -37.96659851074219, -35.6122932434082, -33.257991790771484, -30.903688430786133, -28.54938507080078, -26.195083618164062, -23.84078025817871, -21.48647689819336, -19.13217544555664, -16.77787208557129, -14.42357063293457, -12.069267272949219, -9.714964866638184, -7.36066198348999, -5.006359100341797, -2.6520566940307617, -0.29775428771972656, 2.056549072265625, 4.410850524902344, 6.765153884887695, 9.11945629119873, 11.473758697509766, 13.828062057495117, 16.18236541748047, 18.536666870117188, 20.89097023010254, 23.245271682739258, 25.59957504272461, 27.95387840270996, 30.30817985534668, 32.66248321533203, 35.01678466796875, 37.37108612060547, 39.72539138793945, 42.07969284057617, 44.433998107910156, 46.788299560546875, 49.14260482788086, 51.49690628051758, 53.8512077331543, 56.20551300048828, 58.559814453125, 60.91411590576172, 63.26841735839844]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 7.0, 6.0, 19.0, 28.0, 40.0, 69.0, 135.0, 179.0, 276.0, 426.0, 631.0, 934.0, 1359.0, 2017.0, 2714.0, 4145.0, 1019597.0, 5253.0, 3427.0, 2286.0, 1652.0, 1095.0, 770.0, 521.0, 345.0, 246.0, 139.0, 88.0, 57.0, 38.0, 26.0, 16.0, 11.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.536247253417969, -10.980578422546387, -10.424909591674805, -9.869240760803223, -9.31357192993164, -8.757904052734375, -8.202235221862793, -7.646566390991211, -7.090897560119629, -6.535228729248047, -5.979559898376465, -5.423891544342041, -4.868222713470459, -4.312553882598877, -3.756885290145874, -3.201216697692871, -2.645547866821289, -2.089879035949707, -1.534210443496704, -0.9785417318344116, -0.42287302017211914, 0.1327958106994629, 0.6884644031524658, 1.2441329956054688, 1.7998018264770508, 2.355470657348633, 2.9111392498016357, 3.4668078422546387, 4.022476673126221, 4.578145503997803, 5.133813858032227, 5.689482688903809, 6.245151519775391, 6.800820350646973, 7.356489181518555, 7.9121575355529785, 8.467826843261719, 9.023494720458984, 9.579163551330566, 10.134832382202148, 10.69050121307373, 11.246170043945312, 11.801838874816895, 12.357507705688477, 12.913175582885742, 13.46884536743164, 14.024513244628906, 14.580182075500488, 15.13585090637207, 15.691519737243652, 16.247188568115234, 16.8028564453125, 17.3585262298584, 17.914194107055664, 18.469863891601562, 19.025531768798828, 19.581199645996094, 20.13686752319336, 20.692537307739258, 21.248205184936523, 21.803874969482422, 22.359542846679688, 22.915212631225586, 23.47088050842285, 24.02655029296875]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 5.0, 7.0, 6.0, 11.0, 15.0, 24.0, 39.0, 47.0, 73.0, 154.0, 1410.0, 51460580.0, 554.0, 74.0, 36.0, 34.0, 13.0, 10.0, 10.0, 1.0, 4.0, 3.0, 7.0, 4.0, 4.0, 9.0, 4.0, 2.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-942.0, -906.3271484375, -870.654296875, -834.9814453125, -799.3086547851562, -763.6358032226562, -727.9629516601562, -692.2901000976562, -656.6173095703125, -620.9444580078125, -585.2716064453125, -549.5987548828125, -513.9259643554688, -478.25311279296875, -442.58026123046875, -406.90740966796875, -371.23455810546875, -335.56170654296875, -299.8888854980469, -264.2160339355469, -228.54319763183594, -192.870361328125, -157.197509765625, -121.52467346191406, -85.85183715820312, -50.17899703979492, -14.506156921386719, 21.16668701171875, 56.83952331542969, 92.51235961914062, 128.18521118164062, 163.85804748535156, 199.5308837890625, 235.20372009277344, 270.8765563964844, 306.5494079589844, 342.22222900390625, 377.89508056640625, 413.56793212890625, 449.24078369140625, 484.9136047363281, 520.58642578125, 556.25927734375, 591.93212890625, 627.60498046875, 663.27783203125, 698.95068359375, 734.6234741210938, 770.2963256835938, 805.9691772460938, 841.6420288085938, 877.3148193359375, 912.9876708984375, 948.6605224609375, 984.3333740234375, 1020.0062255859375, 1055.6790771484375, 1091.3519287109375, 1127.0247802734375, 1162.6976318359375, 1198.3704833984375, 1234.043212890625, 1269.716064453125, 1305.388916015625, 1341.061767578125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [2.0, 5.0, 5.0, 3.0, 8.0, 14.0, 17.0, 41.0, 60.0, 73.0, 108.0, 117.0, 188.0, 275.0, 394.0, 523.0, 788.0, 1166.0, 1801.0, 2526.0, 3605.0, 5584.0, 8408.0, 12116.0, 18405.0, 27819.0, 43242.0, 67953.0, 107407.0, 171177.0, 269500.0, 401150.0, 3434373.0, 704499.0, 357825.0, 235642.0, 148806.0, 93648.0, 58995.0, 38543.0, 24615.0, 16575.0, 10784.0, 7067.0, 4735.0, 3390.0, 2329.0, 1567.0, 1077.0, 738.0, 531.0, 370.0, 245.0, 190.0, 132.0, 86.0, 68.0, 44.0, 28.0, 40.0, 20.0, 8.0, 2.0, 4.0], "bins": [-0.900390625, -0.8729782104492188, -0.8455657958984375, -0.8181533813476562, -0.790740966796875, -0.7633285522460938, -0.7359161376953125, -0.7085037231445312, -0.68109130859375, -0.6536788940429688, -0.6262664794921875, -0.5988540649414062, -0.571441650390625, -0.5440292358398438, -0.5166168212890625, -0.48920440673828125, -0.4617919921875, -0.43437957763671875, -0.4069671630859375, -0.37955474853515625, -0.352142333984375, -0.32472991943359375, -0.2973175048828125, -0.26990509033203125, -0.24249267578125, -0.21508026123046875, -0.1876678466796875, -0.16025543212890625, -0.132843017578125, -0.10543060302734375, -0.0780181884765625, -0.05060577392578125, -0.023193359375, 0.00421905517578125, 0.0316314697265625, 0.05904388427734375, 0.086456298828125, 0.11386871337890625, 0.1412811279296875, 0.16869354248046875, 0.19610595703125, 0.22351837158203125, 0.2509307861328125, 0.27834320068359375, 0.305755615234375, 0.33316802978515625, 0.3605804443359375, 0.38799285888671875, 0.4154052734375, 0.44281768798828125, 0.4702301025390625, 0.49764251708984375, 0.525054931640625, 0.5524673461914062, 0.5798797607421875, 0.6072921752929688, 0.63470458984375, 0.6621170043945312, 0.6895294189453125, 0.7169418334960938, 0.744354248046875, 0.7717666625976562, 0.7991790771484375, 0.8265914916992188, 0.85400390625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 2.0, 8.0, 14.0, 8.0, 12.0, 15.0, 14.0, 28.0, 26.0, 36.0, 35.0, 36.0, 31.0, 34.0, 42.0, 39.0, 41.0, 42.0, 63.0, 1041.0, 38.0, 47.0, 40.0, 37.0, 37.0, 36.0, 29.0, 35.0, 29.0, 16.0, 20.0, 18.0, 20.0, 12.0, 13.0, 15.0, 7.0, 5.0, 1.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.6875, -22.98046875, -22.2734375, -21.56640625, -20.859375, -20.15234375, -19.4453125, -18.73828125, -18.03125, -17.32421875, -16.6171875, -15.91015625, -15.203125, -14.49609375, -13.7890625, -13.08203125, -12.375, -11.66796875, -10.9609375, -10.25390625, -9.546875, -8.83984375, -8.1328125, -7.42578125, -6.71875, -6.01171875, -5.3046875, -4.59765625, -3.890625, -3.18359375, -2.4765625, -1.76953125, -1.0625, -0.35546875, 0.3515625, 1.05859375, 1.765625, 2.47265625, 3.1796875, 3.88671875, 4.59375, 5.30078125, 6.0078125, 6.71484375, 7.421875, 8.12890625, 8.8359375, 9.54296875, 10.25, 10.95703125, 11.6640625, 12.37109375, 13.078125, 13.78515625, 14.4921875, 15.19921875, 15.90625, 16.61328125, 17.3203125, 18.02734375, 18.734375, 19.44140625, 20.1484375, 20.85546875, 21.5625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [4.0, 4.0, 5.0, 6.0, 9.0, 9.0, 19.0, 17.0, 49.0, 55.0, 91.0, 104.0, 175.0, 255.0, 370.0, 589.0, 824.0, 1312.0, 1905.0, 2810.0, 4126.0, 6218.0, 9384.0, 14072.0, 21352.0, 33659.0, 53062.0, 86348.0, 145753.0, 253435.0, 438102.0, 3612784.0, 719055.0, 360782.0, 206959.0, 118538.0, 71414.0, 44453.0, 28621.0, 18359.0, 12056.0, 8076.0, 5261.0, 3514.0, 2460.0, 1663.0, 1048.0, 790.0, 514.0, 332.0, 217.0, 151.0, 103.0, 53.0, 53.0, 21.0, 23.0, 10.0, 9.0, 5.0, 2.0, 4.0, 1.0, 2.0], "bins": [-1.087890625, -1.0536956787109375, -1.019500732421875, -0.9853057861328125, -0.95111083984375, -0.9169158935546875, -0.882720947265625, -0.8485260009765625, -0.8143310546875, -0.7801361083984375, -0.745941162109375, -0.7117462158203125, -0.67755126953125, -0.6433563232421875, -0.609161376953125, -0.5749664306640625, -0.540771484375, -0.5065765380859375, -0.472381591796875, -0.4381866455078125, -0.40399169921875, -0.3697967529296875, -0.335601806640625, -0.3014068603515625, -0.2672119140625, -0.2330169677734375, -0.198822021484375, -0.1646270751953125, -0.13043212890625, -0.0962371826171875, -0.062042236328125, -0.0278472900390625, 0.00634765625, 0.0405426025390625, 0.074737548828125, 0.1089324951171875, 0.14312744140625, 0.1773223876953125, 0.211517333984375, 0.2457122802734375, 0.2799072265625, 0.3141021728515625, 0.348297119140625, 0.3824920654296875, 0.41668701171875, 0.4508819580078125, 0.485076904296875, 0.5192718505859375, 0.553466796875, 0.5876617431640625, 0.621856689453125, 0.6560516357421875, 0.69024658203125, 0.7244415283203125, 0.758636474609375, 0.7928314208984375, 0.8270263671875, 0.8612213134765625, 0.895416259765625, 0.9296112060546875, 0.96380615234375, 0.9980010986328125, 1.032196044921875, 1.0663909912109375, 1.1005859375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 8.0, 8.0, 2.0, 3.0, 6.0, 6.0, 12.0, 16.0, 11.0, 20.0, 25.0, 23.0, 29.0, 23.0, 35.0, 31.0, 30.0, 45.0, 41.0, 51.0, 53.0, 1069.0, 42.0, 46.0, 39.0, 47.0, 28.0, 37.0, 43.0, 30.0, 28.0, 24.0, 22.0, 22.0, 21.0, 18.0, 7.0, 5.0, 4.0, 8.0, 7.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.828125, -25.890869140625, -24.95361328125, -24.016357421875, -23.0791015625, -22.141845703125, -21.20458984375, -20.267333984375, -19.330078125, -18.392822265625, -17.45556640625, -16.518310546875, -15.5810546875, -14.643798828125, -13.70654296875, -12.769287109375, -11.83203125, -10.894775390625, -9.95751953125, -9.020263671875, -8.0830078125, -7.145751953125, -6.20849609375, -5.271240234375, -4.333984375, -3.396728515625, -2.45947265625, -1.522216796875, -0.5849609375, 0.352294921875, 1.28955078125, 2.226806640625, 3.1640625, 4.101318359375, 5.03857421875, 5.975830078125, 6.9130859375, 7.850341796875, 8.78759765625, 9.724853515625, 10.662109375, 11.599365234375, 12.53662109375, 13.473876953125, 14.4111328125, 15.348388671875, 16.28564453125, 17.222900390625, 18.16015625, 19.097412109375, 20.03466796875, 20.971923828125, 21.9091796875, 22.846435546875, 23.78369140625, 24.720947265625, 25.658203125, 26.595458984375, 27.53271484375, 28.469970703125, 29.4072265625, 30.344482421875, 31.28173828125, 32.218994140625, 33.15625]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 6.0, 7.0, 13.0, 10.0, 16.0, 17.0, 30.0, 53.0, 66.0, 70.0, 92.0, 99.0, 149.0, 175.0, 228.0, 330.0, 497.0, 606.0, 1042.0, 2022.0, 4125.0, 9861.0, 31066.0, 149463.0, 5932661.0, 115361.0, 25964.0, 8473.0, 3698.0, 1831.0, 1039.0, 678.0, 456.0, 330.0, 217.0, 184.0, 122.0, 103.0, 61.0, 73.0, 52.0, 26.0, 26.0, 19.0, 6.0, 4.0, 6.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.1484375, -7.88916015625, -7.6298828125, -7.37060546875, -7.111328125, -6.85205078125, -6.5927734375, -6.33349609375, -6.07421875, -5.81494140625, -5.5556640625, -5.29638671875, -5.037109375, -4.77783203125, -4.5185546875, -4.25927734375, -4.0, -3.74072265625, -3.4814453125, -3.22216796875, -2.962890625, -2.70361328125, -2.4443359375, -2.18505859375, -1.92578125, -1.66650390625, -1.4072265625, -1.14794921875, -0.888671875, -0.62939453125, -0.3701171875, -0.11083984375, 0.1484375, 0.40771484375, 0.6669921875, 0.92626953125, 1.185546875, 1.44482421875, 1.7041015625, 1.96337890625, 2.22265625, 2.48193359375, 2.7412109375, 3.00048828125, 3.259765625, 3.51904296875, 3.7783203125, 4.03759765625, 4.296875, 4.55615234375, 4.8154296875, 5.07470703125, 5.333984375, 5.59326171875, 5.8525390625, 6.11181640625, 6.37109375, 6.63037109375, 6.8896484375, 7.14892578125, 7.408203125, 7.66748046875, 7.9267578125, 8.18603515625, 8.4453125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 2.0, 8.0, 4.0, 7.0, 8.0, 9.0, 8.0, 9.0, 12.0, 17.0, 13.0, 24.0, 24.0, 27.0, 26.0, 33.0, 28.0, 48.0, 40.0, 50.0, 46.0, 44.0, 1058.0, 45.0, 50.0, 37.0, 30.0, 42.0, 36.0, 31.0, 26.0, 28.0, 22.0, 23.0, 19.0, 15.0, 16.0, 12.0, 11.0, 8.0, 7.0, 6.0, 6.0, 2.0, 8.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-35.65625, -34.62158203125, -33.5869140625, -32.55224609375, -31.517578125, -30.48291015625, -29.4482421875, -28.41357421875, -27.37890625, -26.34423828125, -25.3095703125, -24.27490234375, -23.240234375, -22.20556640625, -21.1708984375, -20.13623046875, -19.1015625, -18.06689453125, -17.0322265625, -15.99755859375, -14.962890625, -13.92822265625, -12.8935546875, -11.85888671875, -10.82421875, -9.78955078125, -8.7548828125, -7.72021484375, -6.685546875, -5.65087890625, -4.6162109375, -3.58154296875, -2.546875, -1.51220703125, -0.4775390625, 0.55712890625, 1.591796875, 2.62646484375, 3.6611328125, 4.69580078125, 5.73046875, 6.76513671875, 7.7998046875, 8.83447265625, 9.869140625, 10.90380859375, 11.9384765625, 12.97314453125, 14.0078125, 15.04248046875, 16.0771484375, 17.11181640625, 18.146484375, 19.18115234375, 20.2158203125, 21.25048828125, 22.28515625, 23.31982421875, 24.3544921875, 25.38916015625, 26.423828125, 27.45849609375, 28.4931640625, 29.52783203125, 30.5625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 9.0, 32.0, 149.0, 623.0, 146.0, 25.0, 15.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-188.030517578125, -184.3090362548828, -180.58755493164062, -176.86607360839844, -173.14459228515625, -169.42312622070312, -165.70164489746094, -161.98016357421875, -158.25868225097656, -154.53720092773438, -150.8157196044922, -147.09423828125, -143.37277221679688, -139.6512908935547, -135.9298095703125, -132.2083282470703, -128.48684692382812, -124.76536560058594, -121.04388427734375, -117.3224105834961, -113.6009292602539, -109.87944793701172, -106.15797424316406, -102.43649291992188, -98.71501159667969, -94.9935302734375, -91.27204895019531, -87.55057525634766, -83.82909393310547, -80.10761260986328, -76.38613891601562, -72.66465759277344, -68.94317626953125, -65.22169494628906, -61.50021743774414, -57.77873992919922, -54.05725860595703, -50.335777282714844, -46.61429977416992, -42.892822265625, -39.17133712768555, -35.449859619140625, -31.728378295898438, -28.006898880004883, -24.285419464111328, -20.563940048217773, -16.84246063232422, -13.120981216430664, -9.39950180053711, -5.678022384643555, -1.95654296875, 1.7649364471435547, 5.486415863037109, 9.207895278930664, 12.929374694824219, 16.650854110717773, 20.372333526611328, 24.093812942504883, 27.815292358398438, 31.536771774291992, 35.25825119018555, 38.97972869873047, 42.701210021972656, 46.422691345214844, 50.144168853759766]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 4.0, 9.0, 5.0, 1.0, 8.0, 12.0, 14.0, 22.0, 40.0, 66.0, 103.0, 123.0, 157.0, 134.0, 103.0, 84.0, 31.0, 31.0, 14.0, 10.0, 9.0, 6.0, 7.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-176.2576141357422, -172.0342254638672, -167.81082153320312, -163.58743286132812, -159.36404418945312, -155.14065551757812, -150.91725158691406, -146.69386291503906, -142.470458984375, -138.2470703125, -134.02366638183594, -129.80027770996094, -125.57688903808594, -121.3534927368164, -117.13009643554688, -112.90670776367188, -108.68331909179688, -104.45992279052734, -100.23653411865234, -96.01313781738281, -91.78974914550781, -87.56635284423828, -83.34295654296875, -79.11956787109375, -74.89617156982422, -70.67277526855469, -66.44938659667969, -62.225990295410156, -58.00259780883789, -53.779205322265625, -49.555809020996094, -45.33241653442383, -41.10901641845703, -36.885623931884766, -32.6622314453125, -28.43883514404297, -24.215442657470703, -19.992050170898438, -15.768655776977539, -11.54526138305664, -7.321868896484375, -3.098475456237793, 1.124917984008789, 5.348311424255371, 9.571704864501953, 13.795097351074219, 18.018491744995117, 22.241886138916016, 26.46527862548828, 30.688671112060547, 34.91206359863281, 39.135459899902344, 43.35885238647461, 47.582244873046875, 51.805641174316406, 56.02903366088867, 60.25242614746094, 64.47582244873047, 68.69921112060547, 72.922607421875, 77.14599609375, 81.36939239501953, 85.59278869628906, 89.81617736816406, 94.0395736694336]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 4.0, 4.0, 8.0, 11.0, 15.0, 25.0, 22.0, 29.0, 38.0, 33.0, 52.0, 62.0, 102.0, 94.0, 139.0, 213.0, 332.0, 506.0, 859.0, 1511.0, 2935.0, 6391.0, 29522.0, 3889579.0, 234993.0, 18125.0, 4412.0, 1949.0, 907.0, 507.0, 271.0, 187.0, 144.0, 107.0, 55.0, 31.0, 21.0, 17.0, 21.0, 14.0, 8.0, 6.0, 14.0, 7.0, 3.0, 4.0], "bins": [-0.364013671875, -0.3553142547607422, -0.3466148376464844, -0.33791542053222656, -0.32921600341796875, -0.32051658630371094, -0.3118171691894531, -0.3031177520751953, -0.2944183349609375, -0.2857189178466797, -0.2770195007324219, -0.26832008361816406, -0.25962066650390625, -0.25092124938964844, -0.24222183227539062, -0.2335224151611328, -0.224822998046875, -0.2161235809326172, -0.20742416381835938, -0.19872474670410156, -0.19002532958984375, -0.18132591247558594, -0.17262649536132812, -0.1639270782470703, -0.1552276611328125, -0.1465282440185547, -0.13782882690429688, -0.12912940979003906, -0.12042999267578125, -0.11173057556152344, -0.10303115844726562, -0.09433174133300781, -0.08563232421875, -0.07693290710449219, -0.06823348999023438, -0.05953407287597656, -0.05083465576171875, -0.04213523864746094, -0.033435821533203125, -0.024736404418945312, -0.0160369873046875, -0.0073375701904296875, 0.001361846923828125, 0.010061264038085938, 0.01876068115234375, 0.027460098266601562, 0.036159515380859375, 0.04485893249511719, 0.053558349609375, 0.06225776672363281, 0.07095718383789062, 0.07965660095214844, 0.08835601806640625, 0.09705543518066406, 0.10575485229492188, 0.11445426940917969, 0.1231536865234375, 0.1318531036376953, 0.14055252075195312, 0.14925193786621094, 0.15795135498046875, 0.16665077209472656, 0.17535018920898438, 0.1840496063232422, 0.1927490234375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 1.0, 1.0, 3.0, 5.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 5.0, 8.0, 12.0, 7.0, 18.0, 17.0, 21.0, 241.0, 554.0, 15.0, 15.0, 12.0, 6.0, 6.0, 7.0, 7.0, 4.0, 11.0, 6.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.4287109375, -0.4184436798095703, -0.4081764221191406, -0.39790916442871094, -0.38764190673828125, -0.37737464904785156, -0.3671073913574219, -0.3568401336669922, -0.3465728759765625, -0.3363056182861328, -0.3260383605957031, -0.31577110290527344, -0.30550384521484375, -0.29523658752441406, -0.2849693298339844, -0.2747020721435547, -0.264434814453125, -0.2541675567626953, -0.24390029907226562, -0.23363304138183594, -0.22336578369140625, -0.21309852600097656, -0.20283126831054688, -0.1925640106201172, -0.1822967529296875, -0.1720294952392578, -0.16176223754882812, -0.15149497985839844, -0.14122772216796875, -0.13096046447753906, -0.12069320678710938, -0.11042594909667969, -0.10015869140625, -0.08989143371582031, -0.07962417602539062, -0.06935691833496094, -0.05908966064453125, -0.04882240295410156, -0.038555145263671875, -0.028287887573242188, -0.0180206298828125, -0.0077533721923828125, 0.002513885498046875, 0.012781143188476562, 0.02304840087890625, 0.03331565856933594, 0.043582916259765625, 0.05385017395019531, 0.064117431640625, 0.07438468933105469, 0.08465194702148438, 0.09491920471191406, 0.10518646240234375, 0.11545372009277344, 0.12572097778320312, 0.1359882354736328, 0.1462554931640625, 0.1565227508544922, 0.16679000854492188, 0.17705726623535156, 0.18732452392578125, 0.19759178161621094, 0.20785903930664062, 0.2181262969970703, 0.2283935546875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 6.0, 6.0, 15.0, 12.0, 16.0, 23.0, 23.0, 33.0, 68.0, 90.0, 113.0, 197.0, 298.0, 457.0, 791.0, 1354.0, 2626.0, 6030.0, 16661.0, 85600.0, 3799525.0, 229169.0, 30970.0, 10085.0, 4360.0, 2295.0, 1237.0, 749.0, 510.0, 266.0, 181.0, 142.0, 91.0, 70.0, 31.0, 39.0, 27.0, 19.0, 22.0, 9.0, 9.0, 9.0, 11.0, 8.0, 9.0, 4.0, 5.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.251953125, -0.24345779418945312, -0.23496246337890625, -0.22646713256835938, -0.2179718017578125, -0.20947647094726562, -0.20098114013671875, -0.19248580932617188, -0.183990478515625, -0.17549514770507812, -0.16699981689453125, -0.15850448608398438, -0.1500091552734375, -0.14151382446289062, -0.13301849365234375, -0.12452316284179688, -0.11602783203125, -0.10753250122070312, -0.09903717041015625, -0.09054183959960938, -0.0820465087890625, -0.07355117797851562, -0.06505584716796875, -0.056560516357421875, -0.048065185546875, -0.039569854736328125, -0.03107452392578125, -0.022579193115234375, -0.0140838623046875, -0.005588531494140625, 0.00290679931640625, 0.011402130126953125, 0.0198974609375, 0.028392791748046875, 0.03688812255859375, 0.045383453369140625, 0.0538787841796875, 0.062374114990234375, 0.07086944580078125, 0.07936477661132812, 0.087860107421875, 0.09635543823242188, 0.10485076904296875, 0.11334609985351562, 0.1218414306640625, 0.13033676147460938, 0.13883209228515625, 0.14732742309570312, 0.15582275390625, 0.16431808471679688, 0.17281341552734375, 0.18130874633789062, 0.1898040771484375, 0.19829940795898438, 0.20679473876953125, 0.21529006958007812, 0.223785400390625, 0.23228073120117188, 0.24077606201171875, 0.24927139282226562, 0.2577667236328125, 0.2662620544433594, 0.27475738525390625, 0.2832527160644531, 0.291748046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 4.0, 2.0, 7.0, 10.0, 9.0, 9.0, 16.0, 21.0, 50.0, 65.0, 178.0, 788.0, 2093.0, 425.0, 127.0, 72.0, 57.0, 28.0, 19.0, 21.0, 17.0, 10.0, 5.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 5.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.182861328125, -0.17701148986816406, -0.17116165161132812, -0.1653118133544922, -0.15946197509765625, -0.1536121368408203, -0.14776229858398438, -0.14191246032714844, -0.1360626220703125, -0.13021278381347656, -0.12436294555664062, -0.11851310729980469, -0.11266326904296875, -0.10681343078613281, -0.10096359252929688, -0.09511375427246094, -0.089263916015625, -0.08341407775878906, -0.07756423950195312, -0.07171440124511719, -0.06586456298828125, -0.06001472473144531, -0.054164886474609375, -0.04831504821777344, -0.0424652099609375, -0.03661537170410156, -0.030765533447265625, -0.024915695190429688, -0.01906585693359375, -0.013216018676757812, -0.007366180419921875, -0.0015163421630859375, 0.00433349609375, 0.010183334350585938, 0.016033172607421875, 0.021883010864257812, 0.02773284912109375, 0.03358268737792969, 0.039432525634765625, 0.04528236389160156, 0.0511322021484375, 0.05698204040527344, 0.06283187866210938, 0.06868171691894531, 0.07453155517578125, 0.08038139343261719, 0.08623123168945312, 0.09208106994628906, 0.097930908203125, 0.10378074645996094, 0.10963058471679688, 0.11548042297363281, 0.12133026123046875, 0.1271800994873047, 0.13302993774414062, 0.13887977600097656, 0.1447296142578125, 0.15057945251464844, 0.15642929077148438, 0.1622791290283203, 0.16812896728515625, 0.1739788055419922, 0.17982864379882812, 0.18567848205566406, 0.1915283203125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 2.0, 15.0, 46.0, 389.0, 425.0, 65.0, 31.0, 12.0, 7.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.1205768585205078, -1.0668493509292603, -1.0131218433380127, -0.9593943357467651, -0.9056668281555176, -0.85193932056427, -0.7982118129730225, -0.7444843053817749, -0.6907567977905273, -0.6370292901992798, -0.5833017826080322, -0.5295742750167847, -0.4758467674255371, -0.42211928963661194, -0.3683917820453644, -0.3146642744541168, -0.26093679666519165, -0.2072092890739441, -0.15348178148269653, -0.09975428879261017, -0.04602678120136261, 0.007700711488723755, 0.061428219079971313, 0.11515572667121887, 0.16888323426246643, 0.222610741853714, 0.27633824944496155, 0.3300657272338867, 0.3837932348251343, 0.43752074241638184, 0.4912482500076294, 0.544975757598877, 0.5987032651901245, 0.6524307727813721, 0.7061582803726196, 0.7598857879638672, 0.8136132955551147, 0.8673408031463623, 0.9210683107376099, 0.9747958183288574, 1.028523325920105, 1.0822508335113525, 1.1359783411026, 1.1897058486938477, 1.2434333562850952, 1.2971608638763428, 1.3508883714675903, 1.404615879058838, 1.458343267440796, 1.5120707750320435, 1.565798282623291, 1.6195257902145386, 1.6732532978057861, 1.7269808053970337, 1.7807083129882812, 1.8344358205795288, 1.8881633281707764, 1.941890835762024, 1.9956183433532715, 2.0493457317352295, 2.1030733585357666, 2.1568007469177246, 2.2105283737182617, 2.2642557621002197, 2.317983388900757]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 10.0, 10.0, 15.0, 25.0, 24.0, 29.0, 38.0, 40.0, 55.0, 66.0, 68.0, 69.0, 60.0, 72.0, 58.0, 70.0, 47.0, 44.0, 37.0, 34.0, 23.0, 22.0, 15.0, 19.0, 11.0, 8.0, 7.0, 2.0, 9.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7763159275054932, -0.7511367201805115, -0.7259575128555298, -0.7007783055305481, -0.6755990982055664, -0.6504198908805847, -0.625240683555603, -0.6000614762306213, -0.5748822689056396, -0.549703061580658, -0.5245238542556763, -0.4993446469306946, -0.4741654396057129, -0.4489862322807312, -0.4238070249557495, -0.3986278176307678, -0.37344858050346375, -0.34826937317848206, -0.32309016585350037, -0.2979109585285187, -0.272731751203537, -0.2475525289773941, -0.22237332165241241, -0.19719411432743073, -0.17201490700244904, -0.14683569967746735, -0.12165649235248566, -0.09647727757692337, -0.07129807025194168, -0.046118855476379395, -0.020939648151397705, 0.004239559173583984, 0.029418766498565674, 0.05459797382354736, 0.07977718114852905, 0.10495639592409134, 0.13013559579849243, 0.15531481802463531, 0.180494025349617, 0.2056732326745987, 0.23085243999958038, 0.25603166222572327, 0.28121086955070496, 0.30639007687568665, 0.33156928420066833, 0.35674849152565, 0.3819276988506317, 0.4071069061756134, 0.4322861135005951, 0.4574653208255768, 0.48264452815055847, 0.5078237652778625, 0.5330029726028442, 0.5581821799278259, 0.5833613872528076, 0.6085405945777893, 0.633719801902771, 0.6588990092277527, 0.6840782165527344, 0.7092574238777161, 0.7344366312026978, 0.7596158385276794, 0.7847950458526611, 0.8099742531776428, 0.8351534605026245]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 6.0, 2.0, 6.0, 10.0, 3.0, 23.0, 25.0, 34.0, 49.0, 68.0, 105.0, 173.0, 250.0, 440.0, 788.0, 1198.0, 1949.0, 3308.0, 6346.0, 12932.0, 35879.0, 912190.0, 42389.0, 14564.0, 6838.0, 3634.0, 2087.0, 1196.0, 775.0, 488.0, 233.0, 181.0, 118.0, 88.0, 57.0, 38.0, 30.0, 18.0, 13.0, 10.0, 3.0, 2.0, 2.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-1.5576171875, -1.5049285888671875, -1.452239990234375, -1.3995513916015625, -1.34686279296875, -1.2941741943359375, -1.241485595703125, -1.1887969970703125, -1.1361083984375, -1.0834197998046875, -1.030731201171875, -0.9780426025390625, -0.92535400390625, -0.8726654052734375, -0.819976806640625, -0.7672882080078125, -0.714599609375, -0.6619110107421875, -0.609222412109375, -0.5565338134765625, -0.50384521484375, -0.4511566162109375, -0.398468017578125, -0.3457794189453125, -0.2930908203125, -0.2404022216796875, -0.187713623046875, -0.1350250244140625, -0.08233642578125, -0.0296478271484375, 0.023040771484375, 0.0757293701171875, 0.12841796875, 0.1811065673828125, 0.233795166015625, 0.2864837646484375, 0.33917236328125, 0.3918609619140625, 0.444549560546875, 0.4972381591796875, 0.5499267578125, 0.6026153564453125, 0.655303955078125, 0.7079925537109375, 0.76068115234375, 0.8133697509765625, 0.866058349609375, 0.9187469482421875, 0.971435546875, 1.0241241455078125, 1.076812744140625, 1.1295013427734375, 1.18218994140625, 1.2348785400390625, 1.287567138671875, 1.3402557373046875, 1.3929443359375, 1.4456329345703125, 1.498321533203125, 1.5510101318359375, 1.60369873046875, 1.6563873291015625, 1.709075927734375, 1.7617645263671875, 1.814453125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 7.0, 0.0, 3.0, 2.0, 4.0, 4.0, 3.0, 6.0, 10.0, 7.0, 12.0, 12.0, 18.0, 24.0, 57.0, 739.0, 12.0, 15.0, 16.0, 6.0, 6.0, 3.0, 11.0, 4.0, 8.0, 9.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.421630859375, -0.4113349914550781, -0.40103912353515625, -0.3907432556152344, -0.3804473876953125, -0.3701515197753906, -0.35985565185546875, -0.3495597839355469, -0.339263916015625, -0.3289680480957031, -0.31867218017578125, -0.3083763122558594, -0.2980804443359375, -0.2877845764160156, -0.27748870849609375, -0.2671928405761719, -0.25689697265625, -0.24660110473632812, -0.23630523681640625, -0.22600936889648438, -0.2157135009765625, -0.20541763305664062, -0.19512176513671875, -0.18482589721679688, -0.174530029296875, -0.16423416137695312, -0.15393829345703125, -0.14364242553710938, -0.1333465576171875, -0.12305068969726562, -0.11275482177734375, -0.10245895385742188, -0.0921630859375, -0.08186721801757812, -0.07157135009765625, -0.061275482177734375, -0.0509796142578125, -0.040683746337890625, -0.03038787841796875, -0.020092010498046875, -0.009796142578125, 0.000499725341796875, 0.01079559326171875, 0.021091461181640625, 0.0313873291015625, 0.041683197021484375, 0.05197906494140625, 0.062274932861328125, 0.07257080078125, 0.08286666870117188, 0.09316253662109375, 0.10345840454101562, 0.1137542724609375, 0.12405014038085938, 0.13434600830078125, 0.14464187622070312, 0.154937744140625, 0.16523361206054688, 0.17552947998046875, 0.18582534790039062, 0.1961212158203125, 0.20641708374023438, 0.21671295166015625, 0.22700881958007812, 0.2373046875]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 5.0, 10.0, 10.0, 17.0, 18.0, 27.0, 23.0, 49.0, 49.0, 66.0, 77.0, 106.0, 148.0, 172.0, 250.0, 398.0, 567.0, 1097.0, 2037.0, 4608.0, 11370.0, 32614.0, 119312.0, 585066.0, 212493.0, 49233.0, 15938.0, 6274.0, 2790.0, 1354.0, 747.0, 412.0, 307.0, 196.0, 170.0, 117.0, 85.0, 75.0, 59.0, 54.0, 32.0, 31.0, 19.0, 14.0, 16.0, 14.0, 7.0, 6.0, 7.0, 6.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.64501953125, -0.6246566772460938, -0.6042938232421875, -0.5839309692382812, -0.563568115234375, -0.5432052612304688, -0.5228424072265625, -0.5024795532226562, -0.48211669921875, -0.46175384521484375, -0.4413909912109375, -0.42102813720703125, -0.400665283203125, -0.38030242919921875, -0.3599395751953125, -0.33957672119140625, -0.3192138671875, -0.29885101318359375, -0.2784881591796875, -0.25812530517578125, -0.237762451171875, -0.21739959716796875, -0.1970367431640625, -0.17667388916015625, -0.15631103515625, -0.13594818115234375, -0.1155853271484375, -0.09522247314453125, -0.074859619140625, -0.05449676513671875, -0.0341339111328125, -0.01377105712890625, 0.006591796875, 0.02695465087890625, 0.0473175048828125, 0.06768035888671875, 0.088043212890625, 0.10840606689453125, 0.1287689208984375, 0.14913177490234375, 0.16949462890625, 0.18985748291015625, 0.2102203369140625, 0.23058319091796875, 0.250946044921875, 0.27130889892578125, 0.2916717529296875, 0.31203460693359375, 0.3323974609375, 0.35276031494140625, 0.3731231689453125, 0.39348602294921875, 0.413848876953125, 0.43421173095703125, 0.4545745849609375, 0.47493743896484375, 0.49530029296875, 0.5156631469726562, 0.5360260009765625, 0.5563888549804688, 0.576751708984375, 0.5971145629882812, 0.6174774169921875, 0.6378402709960938, 0.658203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 8.0, 6.0, 10.0, 9.0, 10.0, 7.0, 8.0, 24.0, 18.0, 19.0, 21.0, 37.0, 34.0, 30.0, 41.0, 42.0, 43.0, 44.0, 41.0, 40.0, 48.0, 35.0, 36.0, 46.0, 32.0, 40.0, 32.0, 29.0, 27.0, 37.0, 21.0, 15.0, 28.0, 11.0, 19.0, 11.0, 11.0, 8.0, 4.0, 7.0, 2.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.84326171875, -0.8143844604492188, -0.7855072021484375, -0.7566299438476562, -0.727752685546875, -0.6988754272460938, -0.6699981689453125, -0.6411209106445312, -0.61224365234375, -0.5833663940429688, -0.5544891357421875, -0.5256118774414062, -0.496734619140625, -0.46785736083984375, -0.4389801025390625, -0.41010284423828125, -0.3812255859375, -0.35234832763671875, -0.3234710693359375, -0.29459381103515625, -0.265716552734375, -0.23683929443359375, -0.2079620361328125, -0.17908477783203125, -0.15020751953125, -0.12133026123046875, -0.0924530029296875, -0.06357574462890625, -0.034698486328125, -0.00582122802734375, 0.0230560302734375, 0.05193328857421875, 0.080810546875, 0.10968780517578125, 0.1385650634765625, 0.16744232177734375, 0.196319580078125, 0.22519683837890625, 0.2540740966796875, 0.28295135498046875, 0.31182861328125, 0.34070587158203125, 0.3695831298828125, 0.39846038818359375, 0.427337646484375, 0.45621490478515625, 0.4850921630859375, 0.5139694213867188, 0.5428466796875, 0.5717239379882812, 0.6006011962890625, 0.6294784545898438, 0.658355712890625, 0.6872329711914062, 0.7161102294921875, 0.7449874877929688, 0.77386474609375, 0.8027420043945312, 0.8316192626953125, 0.8604965209960938, 0.889373779296875, 0.9182510375976562, 0.9471282958984375, 0.9760055541992188, 1.0048828125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 0.0, 6.0, 4.0, 5.0, 7.0, 10.0, 25.0, 25.0, 38.0, 49.0, 81.0, 123.0, 208.0, 477.0, 1070.0, 3383.0, 21332.0, 986032.0, 29417.0, 4001.0, 1166.0, 474.0, 216.0, 146.0, 69.0, 50.0, 32.0, 27.0, 14.0, 19.0, 5.0, 7.0, 4.0, 6.0, 5.0, 10.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8095703125, -0.781219482421875, -0.75286865234375, -0.724517822265625, -0.6961669921875, -0.667816162109375, -0.63946533203125, -0.611114501953125, -0.582763671875, -0.554412841796875, -0.52606201171875, -0.497711181640625, -0.4693603515625, -0.441009521484375, -0.41265869140625, -0.384307861328125, -0.35595703125, -0.327606201171875, -0.29925537109375, -0.270904541015625, -0.2425537109375, -0.214202880859375, -0.18585205078125, -0.157501220703125, -0.129150390625, -0.100799560546875, -0.07244873046875, -0.044097900390625, -0.0157470703125, 0.012603759765625, 0.04095458984375, 0.069305419921875, 0.09765625, 0.126007080078125, 0.15435791015625, 0.182708740234375, 0.2110595703125, 0.239410400390625, 0.26776123046875, 0.296112060546875, 0.324462890625, 0.352813720703125, 0.38116455078125, 0.409515380859375, 0.4378662109375, 0.466217041015625, 0.49456787109375, 0.522918701171875, 0.55126953125, 0.579620361328125, 0.60797119140625, 0.636322021484375, 0.6646728515625, 0.693023681640625, 0.72137451171875, 0.749725341796875, 0.778076171875, 0.806427001953125, 0.83477783203125, 0.863128662109375, 0.8914794921875, 0.919830322265625, 0.94818115234375, 0.976531982421875, 1.0048828125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 12.0, 16.0, 44.0, 107.0, 139.0, 206.0, 196.0, 125.0, 63.0, 42.0, 25.0, 9.0, 9.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8775463104248047e-05, -1.7412006855010986e-05, -1.6048550605773926e-05, -1.4685094356536865e-05, -1.3321638107299805e-05, -1.1958181858062744e-05, -1.0594725608825684e-05, -9.231269359588623e-06, -7.867813110351562e-06, -6.504356861114502e-06, -5.140900611877441e-06, -3.777444362640381e-06, -2.4139881134033203e-06, -1.0505318641662598e-06, 3.129243850708008e-07, 1.6763806343078613e-06, 3.039836883544922e-06, 4.403293132781982e-06, 5.766749382019043e-06, 7.1302056312561035e-06, 8.493661880493164e-06, 9.857118129730225e-06, 1.1220574378967285e-05, 1.2584030628204346e-05, 1.3947486877441406e-05, 1.5310943126678467e-05, 1.6674399375915527e-05, 1.8037855625152588e-05, 1.940131187438965e-05, 2.076476812362671e-05, 2.212822437286377e-05, 2.349168062210083e-05, 2.485513687133789e-05, 2.621859312057495e-05, 2.7582049369812012e-05, 2.8945505619049072e-05, 3.0308961868286133e-05, 3.167241811752319e-05, 3.3035874366760254e-05, 3.4399330615997314e-05, 3.5762786865234375e-05, 3.7126243114471436e-05, 3.8489699363708496e-05, 3.985315561294556e-05, 4.121661186218262e-05, 4.258006811141968e-05, 4.394352436065674e-05, 4.53069806098938e-05, 4.667043685913086e-05, 4.803389310836792e-05, 4.939734935760498e-05, 5.076080560684204e-05, 5.21242618560791e-05, 5.348771810531616e-05, 5.485117435455322e-05, 5.621463060379028e-05, 5.7578086853027344e-05, 5.8941543102264404e-05, 6.0304999351501465e-05, 6.166845560073853e-05, 6.303191184997559e-05, 6.439536809921265e-05, 6.575882434844971e-05, 6.712228059768677e-05, 6.848573684692383e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 5.0, 1.0, 2.0, 7.0, 3.0, 8.0, 10.0, 15.0, 20.0, 32.0, 70.0, 117.0, 179.0, 377.0, 794.0, 2037.0, 7991.0, 94816.0, 907881.0, 27359.0, 4154.0, 1396.0, 608.0, 272.0, 163.0, 82.0, 50.0, 20.0, 21.0, 22.0, 8.0, 5.0, 11.0, 2.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.578125, -0.5596542358398438, -0.5411834716796875, -0.5227127075195312, -0.504241943359375, -0.48577117919921875, -0.4673004150390625, -0.44882965087890625, -0.43035888671875, -0.41188812255859375, -0.3934173583984375, -0.37494659423828125, -0.356475830078125, -0.33800506591796875, -0.3195343017578125, -0.30106353759765625, -0.2825927734375, -0.26412200927734375, -0.2456512451171875, -0.22718048095703125, -0.208709716796875, -0.19023895263671875, -0.1717681884765625, -0.15329742431640625, -0.13482666015625, -0.11635589599609375, -0.0978851318359375, -0.07941436767578125, -0.060943603515625, -0.04247283935546875, -0.0240020751953125, -0.00553131103515625, 0.012939453125, 0.03141021728515625, 0.0498809814453125, 0.06835174560546875, 0.086822509765625, 0.10529327392578125, 0.1237640380859375, 0.14223480224609375, 0.16070556640625, 0.17917633056640625, 0.1976470947265625, 0.21611785888671875, 0.234588623046875, 0.25305938720703125, 0.2715301513671875, 0.29000091552734375, 0.3084716796875, 0.32694244384765625, 0.3454132080078125, 0.36388397216796875, 0.382354736328125, 0.40082550048828125, 0.4192962646484375, 0.43776702880859375, 0.45623779296875, 0.47470855712890625, 0.4931793212890625, 0.5116500854492188, 0.530120849609375, 0.5485916137695312, 0.5670623779296875, 0.5855331420898438, 0.60400390625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 13.0, 9.0, 16.0, 24.0, 28.0, 52.0, 78.0, 131.0, 196.0, 162.0, 102.0, 63.0, 44.0, 27.0, 14.0, 6.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5615234375, -0.538818359375, -0.51611328125, -0.493408203125, -0.470703125, -0.447998046875, -0.42529296875, -0.402587890625, -0.3798828125, -0.357177734375, -0.33447265625, -0.311767578125, -0.2890625, -0.266357421875, -0.24365234375, -0.220947265625, -0.1982421875, -0.175537109375, -0.15283203125, -0.130126953125, -0.107421875, -0.084716796875, -0.06201171875, -0.039306640625, -0.0166015625, 0.006103515625, 0.02880859375, 0.051513671875, 0.07421875, 0.096923828125, 0.11962890625, 0.142333984375, 0.1650390625, 0.187744140625, 0.21044921875, 0.233154296875, 0.255859375, 0.278564453125, 0.30126953125, 0.323974609375, 0.3466796875, 0.369384765625, 0.39208984375, 0.414794921875, 0.4375, 0.460205078125, 0.48291015625, 0.505615234375, 0.5283203125, 0.551025390625, 0.57373046875, 0.596435546875, 0.619140625, 0.641845703125, 0.66455078125, 0.687255859375, 0.7099609375, 0.732666015625, 0.75537109375, 0.778076171875, 0.80078125, 0.823486328125, 0.84619140625, 0.868896484375, 0.8916015625]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 6.0, 14.0, 25.0, 64.0, 333.0, 417.0, 93.0, 33.0, 13.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.647161483764648, -9.228052139282227, -8.808941841125488, -8.389832496643066, -7.970722675323486, -7.551612854003906, -7.132503509521484, -6.713393688201904, -6.294283866882324, -5.875174045562744, -5.456064701080322, -5.036954879760742, -4.617845058441162, -4.198735237121582, -3.77962589263916, -3.36051607131958, -2.941406726837158, -2.5222971439361572, -2.103187322616577, -1.6840777397155762, -1.2649680376052856, -0.8458583354949951, -0.42674875259399414, -0.0076389312744140625, 0.4114706516265869, 0.8305803537368774, 1.249690055847168, 1.668799638748169, 2.08790922164917, 2.50701904296875, 2.926128625869751, 3.345238447189331, 3.764348030090332, 4.183457851409912, 4.602567195892334, 5.021677017211914, 5.440786838531494, 5.859896659851074, 6.279006004333496, 6.698115825653076, 7.117225646972656, 7.536335468292236, 7.955444812774658, 8.374554634094238, 8.79366397857666, 9.212774276733398, 9.63188362121582, 10.050992965698242, 10.470102310180664, 10.889211654663086, 11.308321952819824, 11.727431297302246, 12.146540641784668, 12.565650939941406, 12.984760284423828, 13.40386962890625, 13.822979927062988, 14.24208927154541, 14.661199569702148, 15.08030891418457, 15.499418258666992, 15.91852855682373, 16.33763885498047, 16.75674819946289, 17.175857543945312]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 5.0, 5.0, 0.0, 2.0, 1.0, 5.0, 5.0, 6.0, 4.0, 8.0, 10.0, 15.0, 27.0, 46.0, 71.0, 114.0, 125.0, 143.0, 107.0, 80.0, 61.0, 42.0, 32.0, 21.0, 10.0, 10.0, 5.0, 6.0, 8.0, 1.0, 4.0, 4.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.54543685913086, -14.034297943115234, -13.52315902709961, -13.012019157409668, -12.500880241394043, -11.989741325378418, -11.478601455688477, -10.967462539672852, -10.456323623657227, -9.945184707641602, -9.434045791625977, -8.922905921936035, -8.41176700592041, -7.900628089904785, -7.389488697052002, -6.878349304199219, -6.367210388183594, -5.856071472167969, -5.3449320793151855, -4.833792686462402, -4.322653770446777, -3.8115146160125732, -3.300375461578369, -2.789236307144165, -2.278097152709961, -1.7669579982757568, -1.2558188438415527, -0.7446796894073486, -0.23354053497314453, 0.27759861946105957, 0.7887377738952637, 1.2998769283294678, 1.8110160827636719, 2.322155237197876, 2.83329439163208, 3.344433546066284, 3.8555727005004883, 4.366711616516113, 4.8778510093688965, 5.38899040222168, 5.900129318237305, 6.41126823425293, 6.922407627105713, 7.433547019958496, 7.944685935974121, 8.455824851989746, 8.966964721679688, 9.478103637695312, 9.989242553710938, 10.500381469726562, 11.011520385742188, 11.522660255432129, 12.033799171447754, 12.544938087463379, 13.05607795715332, 13.567216873168945, 14.07835578918457, 14.589494705200195, 15.10063362121582, 15.611773490905762, 16.122913360595703, 16.634052276611328, 17.145191192626953, 17.656330108642578, 18.167469024658203]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 6.0, 1.0, 11.0, 10.0, 9.0, 7.0, 23.0, 35.0, 53.0, 89.0, 120.0, 221.0, 412.0, 919.0, 2349.0, 7713.0, 46062.0, 4056023.0, 67072.0, 9524.0, 2394.0, 771.0, 269.0, 88.0, 48.0, 29.0, 9.0, 8.0, 5.0, 4.0, 4.0, 0.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.6015625, -4.493499755859375, -4.38543701171875, -4.277374267578125, -4.1693115234375, -4.061248779296875, -3.95318603515625, -3.845123291015625, -3.737060546875, -3.628997802734375, -3.52093505859375, -3.412872314453125, -3.3048095703125, -3.196746826171875, -3.08868408203125, -2.980621337890625, -2.87255859375, -2.764495849609375, -2.65643310546875, -2.548370361328125, -2.4403076171875, -2.332244873046875, -2.22418212890625, -2.116119384765625, -2.008056640625, -1.899993896484375, -1.79193115234375, -1.683868408203125, -1.5758056640625, -1.467742919921875, -1.35968017578125, -1.251617431640625, -1.1435546875, -1.035491943359375, -0.92742919921875, -0.819366455078125, -0.7113037109375, -0.603240966796875, -0.49517822265625, -0.387115478515625, -0.279052734375, -0.170989990234375, -0.06292724609375, 0.045135498046875, 0.1531982421875, 0.261260986328125, 0.36932373046875, 0.477386474609375, 0.58544921875, 0.693511962890625, 0.80157470703125, 0.909637451171875, 1.0177001953125, 1.125762939453125, 1.23382568359375, 1.341888427734375, 1.449951171875, 1.558013916015625, 1.66607666015625, 1.774139404296875, 1.8822021484375, 1.990264892578125, 2.09832763671875, 2.206390380859375, 2.314453125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 8.0, 11.0, 11.0, 14.0, 13.0, 18.0, 31.0, 227.0, 496.0, 71.0, 16.0, 17.0, 12.0, 13.0, 4.0, 7.0, 7.0, 5.0, 6.0, 2.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.403076171875, -0.3937339782714844, -0.38439178466796875, -0.3750495910644531, -0.3657073974609375, -0.3563652038574219, -0.34702301025390625, -0.3376808166503906, -0.328338623046875, -0.3189964294433594, -0.30965423583984375, -0.3003120422363281, -0.2909698486328125, -0.2816276550292969, -0.27228546142578125, -0.2629432678222656, -0.25360107421875, -0.24425888061523438, -0.23491668701171875, -0.22557449340820312, -0.2162322998046875, -0.20689010620117188, -0.19754791259765625, -0.18820571899414062, -0.178863525390625, -0.16952133178710938, -0.16017913818359375, -0.15083694458007812, -0.1414947509765625, -0.13215255737304688, -0.12281036376953125, -0.11346817016601562, -0.1041259765625, -0.09478378295898438, -0.08544158935546875, -0.07609939575195312, -0.0667572021484375, -0.057415008544921875, -0.04807281494140625, -0.038730621337890625, -0.029388427734375, -0.020046234130859375, -0.01070404052734375, -0.001361846923828125, 0.0079803466796875, 0.017322540283203125, 0.02666473388671875, 0.036006927490234375, 0.04534912109375, 0.054691314697265625, 0.06403350830078125, 0.07337570190429688, 0.0827178955078125, 0.09206008911132812, 0.10140228271484375, 0.11074447631835938, 0.120086669921875, 0.12942886352539062, 0.13877105712890625, 0.14811325073242188, 0.1574554443359375, 0.16679763793945312, 0.17613983154296875, 0.18548202514648438, 0.19482421875]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 6.0, 2.0, 4.0, 7.0, 14.0, 20.0, 20.0, 29.0, 37.0, 50.0, 81.0, 100.0, 163.0, 254.0, 427.0, 780.0, 1702.0, 4261.0, 13124.0, 66617.0, 3319394.0, 725166.0, 45371.0, 10003.0, 3356.0, 1422.0, 728.0, 400.0, 242.0, 156.0, 113.0, 59.0, 51.0, 27.0, 32.0, 17.0, 21.0, 8.0, 6.0, 11.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83740234375, -0.8111343383789062, -0.7848663330078125, -0.7585983276367188, -0.732330322265625, -0.7060623168945312, -0.6797943115234375, -0.6535263061523438, -0.62725830078125, -0.6009902954101562, -0.5747222900390625, -0.5484542846679688, -0.522186279296875, -0.49591827392578125, -0.4696502685546875, -0.44338226318359375, -0.4171142578125, -0.39084625244140625, -0.3645782470703125, -0.33831024169921875, -0.312042236328125, -0.28577423095703125, -0.2595062255859375, -0.23323822021484375, -0.20697021484375, -0.18070220947265625, -0.1544342041015625, -0.12816619873046875, -0.101898193359375, -0.07563018798828125, -0.0493621826171875, -0.02309417724609375, 0.003173828125, 0.02944183349609375, 0.0557098388671875, 0.08197784423828125, 0.108245849609375, 0.13451385498046875, 0.1607818603515625, 0.18704986572265625, 0.21331787109375, 0.23958587646484375, 0.2658538818359375, 0.29212188720703125, 0.318389892578125, 0.34465789794921875, 0.3709259033203125, 0.39719390869140625, 0.4234619140625, 0.44972991943359375, 0.4759979248046875, 0.5022659301757812, 0.528533935546875, 0.5548019409179688, 0.5810699462890625, 0.6073379516601562, 0.63360595703125, 0.6598739624023438, 0.6861419677734375, 0.7124099731445312, 0.738677978515625, 0.7649459838867188, 0.7912139892578125, 0.8174819946289062, 0.84375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 3.0, 6.0, 7.0, 11.0, 8.0, 15.0, 9.0, 19.0, 21.0, 31.0, 55.0, 70.0, 94.0, 191.0, 490.0, 1574.0, 613.0, 289.0, 182.0, 122.0, 50.0, 57.0, 41.0, 29.0, 25.0, 17.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-0.2186279296875, -0.21263885498046875, -0.2066497802734375, -0.20066070556640625, -0.194671630859375, -0.18868255615234375, -0.1826934814453125, -0.17670440673828125, -0.17071533203125, -0.16472625732421875, -0.1587371826171875, -0.15274810791015625, -0.146759033203125, -0.14076995849609375, -0.1347808837890625, -0.12879180908203125, -0.122802734375, -0.11681365966796875, -0.1108245849609375, -0.10483551025390625, -0.098846435546875, -0.09285736083984375, -0.0868682861328125, -0.08087921142578125, -0.07489013671875, -0.06890106201171875, -0.0629119873046875, -0.05692291259765625, -0.050933837890625, -0.04494476318359375, -0.0389556884765625, -0.03296661376953125, -0.0269775390625, -0.02098846435546875, -0.0149993896484375, -0.00901031494140625, -0.003021240234375, 0.00296783447265625, 0.0089569091796875, 0.01494598388671875, 0.02093505859375, 0.02692413330078125, 0.0329132080078125, 0.03890228271484375, 0.044891357421875, 0.05088043212890625, 0.0568695068359375, 0.06285858154296875, 0.06884765625, 0.07483673095703125, 0.0808258056640625, 0.08681488037109375, 0.092803955078125, 0.09879302978515625, 0.1047821044921875, 0.11077117919921875, 0.11676025390625, 0.12274932861328125, 0.1287384033203125, 0.13472747802734375, 0.140716552734375, 0.14670562744140625, 0.1526947021484375, 0.15868377685546875, 0.1646728515625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 36.0, 697.0, 198.0, 36.0, 16.0, 4.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.570474624633789, -3.4181900024414062, -3.2659051418304443, -3.1136205196380615, -2.9613356590270996, -2.809051036834717, -2.656766414642334, -2.504481792449951, -2.3521969318389893, -2.1999123096466064, -2.0476274490356445, -1.8953428268432617, -1.7430580854415894, -1.590773344039917, -1.4384887218475342, -1.2862039804458618, -1.1339192390441895, -0.9816344976425171, -0.8293498158454895, -0.6770651340484619, -0.5247803926467896, -0.3724956512451172, -0.2202109694480896, -0.06792628765106201, 0.08435845375061035, 0.23664316534996033, 0.3889278769493103, 0.5412125587463379, 0.6934973001480103, 0.8457820415496826, 0.9980667233467102, 1.1503514051437378, 1.3026361465454102, 1.4549208879470825, 1.6072056293487549, 1.7594902515411377, 1.91177499294281, 2.0640597343444824, 2.2163443565368652, 2.368628978729248, 2.52091383934021, 2.6731984615325928, 2.8254833221435547, 2.9777679443359375, 3.1300525665283203, 3.2823374271392822, 3.434622049331665, 3.586906909942627, 3.7391915321350098, 3.8914761543273926, 4.043760776519775, 4.196045875549316, 4.348330497741699, 4.500615119934082, 4.652899742126465, 4.805184364318848, 4.9574689865112305, 5.109753608703613, 5.262038230895996, 5.414323329925537, 5.56660795211792, 5.718892574310303, 5.8711771965026855, 6.023461818695068, 6.175746917724609]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 7.0, 3.0, 4.0, 6.0, 8.0, 16.0, 16.0, 24.0, 20.0, 26.0, 42.0, 49.0, 60.0, 74.0, 73.0, 79.0, 65.0, 56.0, 60.0, 65.0, 53.0, 55.0, 37.0, 23.0, 17.0, 12.0, 17.0, 7.0, 15.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7649224996566772, -1.7162357568740845, -1.6675491333007812, -1.6188623905181885, -1.5701756477355957, -1.521488904953003, -1.4728021621704102, -1.424115538597107, -1.3754287958145142, -1.3267420530319214, -1.2780554294586182, -1.2293686866760254, -1.1806819438934326, -1.1319952011108398, -1.083308458328247, -1.0346218347549438, -0.9859350919723511, -0.9372483491897583, -0.8885616660118103, -0.8398749828338623, -0.7911882400512695, -0.7425014972686768, -0.6938148140907288, -0.6451281309127808, -0.596441388130188, -0.5477546453475952, -0.4990679621696472, -0.45038124918937683, -0.40169453620910645, -0.35300782322883606, -0.3043211102485657, -0.2556343972682953, -0.2069476842880249, -0.15826097130775452, -0.10957425832748413, -0.060887545347213745, -0.01220083236694336, 0.036485880613327026, 0.08517259359359741, 0.1338593065738678, 0.18254601955413818, 0.23123273253440857, 0.27991944551467896, 0.32860615849494934, 0.3772928714752197, 0.4259795844554901, 0.4746662974357605, 0.5233529806137085, 0.5720397233963013, 0.620726466178894, 0.669413149356842, 0.71809983253479, 0.7667865753173828, 0.8154733180999756, 0.8641600012779236, 0.9128466844558716, 0.9615334272384644, 1.0102201700210571, 1.0589067935943604, 1.1075935363769531, 1.156280279159546, 1.2049670219421387, 1.2536537647247314, 1.3023403882980347, 1.3510271310806274]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 2.0, 3.0, 5.0, 8.0, 9.0, 15.0, 13.0, 26.0, 33.0, 73.0, 75.0, 136.0, 264.0, 505.0, 1129.0, 2787.0, 8185.0, 32777.0, 907229.0, 75336.0, 12835.0, 3997.0, 1594.0, 671.0, 368.0, 172.0, 107.0, 61.0, 44.0, 27.0, 21.0, 19.0, 18.0, 9.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.521484375, -2.446624755859375, -2.37176513671875, -2.296905517578125, -2.2220458984375, -2.147186279296875, -2.07232666015625, -1.997467041015625, -1.922607421875, -1.847747802734375, -1.77288818359375, -1.698028564453125, -1.6231689453125, -1.548309326171875, -1.47344970703125, -1.398590087890625, -1.32373046875, -1.248870849609375, -1.17401123046875, -1.099151611328125, -1.0242919921875, -0.949432373046875, -0.87457275390625, -0.799713134765625, -0.724853515625, -0.649993896484375, -0.57513427734375, -0.500274658203125, -0.4254150390625, -0.350555419921875, -0.27569580078125, -0.200836181640625, -0.1259765625, -0.051116943359375, 0.02374267578125, 0.098602294921875, 0.1734619140625, 0.248321533203125, 0.32318115234375, 0.398040771484375, 0.472900390625, 0.547760009765625, 0.62261962890625, 0.697479248046875, 0.7723388671875, 0.847198486328125, 0.92205810546875, 0.996917724609375, 1.07177734375, 1.146636962890625, 1.22149658203125, 1.296356201171875, 1.3712158203125, 1.446075439453125, 1.52093505859375, 1.595794677734375, 1.670654296875, 1.745513916015625, 1.82037353515625, 1.895233154296875, 1.9700927734375, 2.044952392578125, 2.11981201171875, 2.194671630859375, 2.26953125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 5.0, 4.0, 7.0, 8.0, 16.0, 17.0, 14.0, 34.0, 107.0, 315.0, 291.0, 83.0, 31.0, 13.0, 10.0, 12.0, 4.0, 10.0, 6.0, 7.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.401123046875, -0.39218902587890625, -0.3832550048828125, -0.37432098388671875, -0.365386962890625, -0.35645294189453125, -0.3475189208984375, -0.33858489990234375, -0.32965087890625, -0.32071685791015625, -0.3117828369140625, -0.30284881591796875, -0.293914794921875, -0.28498077392578125, -0.2760467529296875, -0.26711273193359375, -0.2581787109375, -0.24924468994140625, -0.2403106689453125, -0.23137664794921875, -0.222442626953125, -0.21350860595703125, -0.2045745849609375, -0.19564056396484375, -0.18670654296875, -0.17777252197265625, -0.1688385009765625, -0.15990447998046875, -0.150970458984375, -0.14203643798828125, -0.1331024169921875, -0.12416839599609375, -0.115234375, -0.10630035400390625, -0.0973663330078125, -0.08843231201171875, -0.079498291015625, -0.07056427001953125, -0.0616302490234375, -0.05269622802734375, -0.04376220703125, -0.03482818603515625, -0.0258941650390625, -0.01696014404296875, -0.008026123046875, 0.00090789794921875, 0.0098419189453125, 0.01877593994140625, 0.0277099609375, 0.03664398193359375, 0.0455780029296875, 0.05451202392578125, 0.063446044921875, 0.07238006591796875, 0.0813140869140625, 0.09024810791015625, 0.09918212890625, 0.10811614990234375, 0.1170501708984375, 0.12598419189453125, 0.134918212890625, 0.14385223388671875, 0.1527862548828125, 0.16172027587890625, 0.170654296875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 7.0, 9.0, 8.0, 7.0, 12.0, 20.0, 26.0, 19.0, 32.0, 53.0, 81.0, 90.0, 163.0, 265.0, 666.0, 1956.0, 8707.0, 61611.0, 763725.0, 187745.0, 18268.0, 3164.0, 960.0, 386.0, 206.0, 106.0, 59.0, 63.0, 31.0, 24.0, 20.0, 17.0, 17.0, 11.0, 12.0, 10.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1748046875, -1.136566162109375, -1.09832763671875, -1.060089111328125, -1.0218505859375, -0.983612060546875, -0.94537353515625, -0.907135009765625, -0.868896484375, -0.830657958984375, -0.79241943359375, -0.754180908203125, -0.7159423828125, -0.677703857421875, -0.63946533203125, -0.601226806640625, -0.56298828125, -0.524749755859375, -0.48651123046875, -0.448272705078125, -0.4100341796875, -0.371795654296875, -0.33355712890625, -0.295318603515625, -0.257080078125, -0.218841552734375, -0.18060302734375, -0.142364501953125, -0.1041259765625, -0.065887451171875, -0.02764892578125, 0.010589599609375, 0.048828125, 0.087066650390625, 0.12530517578125, 0.163543701171875, 0.2017822265625, 0.240020751953125, 0.27825927734375, 0.316497802734375, 0.354736328125, 0.392974853515625, 0.43121337890625, 0.469451904296875, 0.5076904296875, 0.545928955078125, 0.58416748046875, 0.622406005859375, 0.66064453125, 0.698883056640625, 0.73712158203125, 0.775360107421875, 0.8135986328125, 0.851837158203125, 0.89007568359375, 0.928314208984375, 0.966552734375, 1.004791259765625, 1.04302978515625, 1.081268310546875, 1.1195068359375, 1.157745361328125, 1.19598388671875, 1.234222412109375, 1.2724609375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 7.0, 13.0, 17.0, 15.0, 18.0, 21.0, 31.0, 33.0, 24.0, 23.0, 35.0, 40.0, 32.0, 42.0, 41.0, 46.0, 65.0, 49.0, 48.0, 47.0, 50.0, 30.0, 44.0, 34.0, 28.0, 28.0, 33.0, 16.0, 19.0, 14.0, 9.0, 12.0, 9.0, 5.0, 9.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54931640625, -0.5286407470703125, -0.507965087890625, -0.4872894287109375, -0.46661376953125, -0.4459381103515625, -0.425262451171875, -0.4045867919921875, -0.3839111328125, -0.3632354736328125, -0.342559814453125, -0.3218841552734375, -0.30120849609375, -0.2805328369140625, -0.259857177734375, -0.2391815185546875, -0.218505859375, -0.1978302001953125, -0.177154541015625, -0.1564788818359375, -0.13580322265625, -0.1151275634765625, -0.094451904296875, -0.0737762451171875, -0.0531005859375, -0.0324249267578125, -0.011749267578125, 0.0089263916015625, 0.02960205078125, 0.0502777099609375, 0.070953369140625, 0.0916290283203125, 0.1123046875, 0.1329803466796875, 0.153656005859375, 0.1743316650390625, 0.19500732421875, 0.2156829833984375, 0.236358642578125, 0.2570343017578125, 0.2777099609375, 0.2983856201171875, 0.319061279296875, 0.3397369384765625, 0.36041259765625, 0.3810882568359375, 0.401763916015625, 0.4224395751953125, 0.443115234375, 0.4637908935546875, 0.484466552734375, 0.5051422119140625, 0.52581787109375, 0.5464935302734375, 0.567169189453125, 0.5878448486328125, 0.6085205078125, 0.6291961669921875, 0.649871826171875, 0.6705474853515625, 0.69122314453125, 0.7118988037109375, 0.732574462890625, 0.7532501220703125, 0.77392578125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 8.0, 13.0, 28.0, 37.0, 113.0, 270.0, 1145.0, 21271.0, 1021258.0, 3538.0, 508.0, 210.0, 56.0, 43.0, 20.0, 8.0, 8.0, 3.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.83984375, -4.725311279296875, -4.61077880859375, -4.496246337890625, -4.3817138671875, -4.267181396484375, -4.15264892578125, -4.038116455078125, -3.923583984375, -3.809051513671875, -3.69451904296875, -3.579986572265625, -3.4654541015625, -3.350921630859375, -3.23638916015625, -3.121856689453125, -3.00732421875, -2.892791748046875, -2.77825927734375, -2.663726806640625, -2.5491943359375, -2.434661865234375, -2.32012939453125, -2.205596923828125, -2.091064453125, -1.976531982421875, -1.86199951171875, -1.747467041015625, -1.6329345703125, -1.518402099609375, -1.40386962890625, -1.289337158203125, -1.1748046875, -1.060272216796875, -0.94573974609375, -0.831207275390625, -0.7166748046875, -0.602142333984375, -0.48760986328125, -0.373077392578125, -0.258544921875, -0.144012451171875, -0.02947998046875, 0.085052490234375, 0.1995849609375, 0.314117431640625, 0.42864990234375, 0.543182373046875, 0.65771484375, 0.772247314453125, 0.88677978515625, 1.001312255859375, 1.1158447265625, 1.230377197265625, 1.34490966796875, 1.459442138671875, 1.573974609375, 1.688507080078125, 1.80303955078125, 1.917572021484375, 2.0321044921875, 2.146636962890625, 2.26116943359375, 2.375701904296875, 2.490234375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 2.0, 7.0, 6.0, 15.0, 16.0, 26.0, 63.0, 123.0, 261.0, 237.0, 120.0, 53.0, 21.0, 16.0, 8.0, 6.0, 5.0, 5.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.37905502319336e-05, -7.179565727710724e-05, -6.980076432228088e-05, -6.780587136745453e-05, -6.581097841262817e-05, -6.381608545780182e-05, -6.182119250297546e-05, -5.982629954814911e-05, -5.7831406593322754e-05, -5.58365136384964e-05, -5.3841620683670044e-05, -5.184672772884369e-05, -4.9851834774017334e-05, -4.785694181919098e-05, -4.5862048864364624e-05, -4.386715590953827e-05, -4.1872262954711914e-05, -3.987736999988556e-05, -3.7882477045059204e-05, -3.588758409023285e-05, -3.3892691135406494e-05, -3.189779818058014e-05, -2.9902905225753784e-05, -2.790801227092743e-05, -2.5913119316101074e-05, -2.391822636127472e-05, -2.1923333406448364e-05, -1.992844045162201e-05, -1.7933547496795654e-05, -1.59386545419693e-05, -1.3943761587142944e-05, -1.194886863231659e-05, -9.953975677490234e-06, -7.95908272266388e-06, -5.964189767837524e-06, -3.9692968130111694e-06, -1.9744038581848145e-06, 2.0489096641540527e-08, 2.0153820514678955e-06, 4.0102750062942505e-06, 6.0051679611206055e-06, 8.00006091594696e-06, 9.994953870773315e-06, 1.198984682559967e-05, 1.3984739780426025e-05, 1.597963273525238e-05, 1.7974525690078735e-05, 1.996941864490509e-05, 2.1964311599731445e-05, 2.39592045545578e-05, 2.5954097509384155e-05, 2.794899046421051e-05, 2.9943883419036865e-05, 3.193877637386322e-05, 3.3933669328689575e-05, 3.592856228351593e-05, 3.7923455238342285e-05, 3.991834819316864e-05, 4.1913241147994995e-05, 4.390813410282135e-05, 4.5903027057647705e-05, 4.789792001247406e-05, 4.9892812967300415e-05, 5.188770592212677e-05, 5.3882598876953125e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 14.0, 29.0, 45.0, 88.0, 194.0, 566.0, 3359.0, 544387.0, 495471.0, 3412.0, 629.0, 193.0, 75.0, 31.0, 19.0, 12.0, 13.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6484375, -2.5787353515625, -2.509033203125, -2.4393310546875, -2.36962890625, -2.2999267578125, -2.230224609375, -2.1605224609375, -2.0908203125, -2.0211181640625, -1.951416015625, -1.8817138671875, -1.81201171875, -1.7423095703125, -1.672607421875, -1.6029052734375, -1.533203125, -1.4635009765625, -1.393798828125, -1.3240966796875, -1.25439453125, -1.1846923828125, -1.114990234375, -1.0452880859375, -0.9755859375, -0.9058837890625, -0.836181640625, -0.7664794921875, -0.69677734375, -0.6270751953125, -0.557373046875, -0.4876708984375, -0.41796875, -0.3482666015625, -0.278564453125, -0.2088623046875, -0.13916015625, -0.0694580078125, 0.000244140625, 0.0699462890625, 0.1396484375, 0.2093505859375, 0.279052734375, 0.3487548828125, 0.41845703125, 0.4881591796875, 0.557861328125, 0.6275634765625, 0.697265625, 0.7669677734375, 0.836669921875, 0.9063720703125, 0.97607421875, 1.0457763671875, 1.115478515625, 1.1851806640625, 1.2548828125, 1.3245849609375, 1.394287109375, 1.4639892578125, 1.53369140625, 1.6033935546875, 1.673095703125, 1.7427978515625, 1.8125]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 11.0, 5.0, 11.0, 18.0, 45.0, 105.0, 234.0, 290.0, 151.0, 72.0, 23.0, 12.0, 7.0, 6.0, 4.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.58984375, -1.5481719970703125, -1.506500244140625, -1.4648284912109375, -1.42315673828125, -1.3814849853515625, -1.339813232421875, -1.2981414794921875, -1.2564697265625, -1.2147979736328125, -1.173126220703125, -1.1314544677734375, -1.08978271484375, -1.0481109619140625, -1.006439208984375, -0.9647674560546875, -0.923095703125, -0.8814239501953125, -0.839752197265625, -0.7980804443359375, -0.75640869140625, -0.7147369384765625, -0.673065185546875, -0.6313934326171875, -0.5897216796875, -0.5480499267578125, -0.506378173828125, -0.4647064208984375, -0.42303466796875, -0.3813629150390625, -0.339691162109375, -0.2980194091796875, -0.25634765625, -0.2146759033203125, -0.173004150390625, -0.1313323974609375, -0.08966064453125, -0.0479888916015625, -0.006317138671875, 0.0353546142578125, 0.0770263671875, 0.1186981201171875, 0.160369873046875, 0.2020416259765625, 0.24371337890625, 0.2853851318359375, 0.327056884765625, 0.3687286376953125, 0.410400390625, 0.4520721435546875, 0.493743896484375, 0.5354156494140625, 0.57708740234375, 0.6187591552734375, 0.660430908203125, 0.7021026611328125, 0.7437744140625, 0.7854461669921875, 0.827117919921875, 0.8687896728515625, 0.91046142578125, 0.9521331787109375, 0.993804931640625, 1.0354766845703125, 1.0771484375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 24.0, 377.0, 569.0, 30.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.51348876953125, -16.719120025634766, -15.924751281738281, -15.130382537841797, -14.336012840270996, -13.541644096374512, -12.747275352478027, -11.952905654907227, -11.158536911010742, -10.364168167114258, -9.569799423217773, -8.775430679321289, -7.981060981750488, -7.186692237854004, -6.3923234939575195, -5.597954273223877, -4.803586006164551, -4.009217262268066, -3.214848041534424, -2.4204792976379395, -1.626110315322876, -0.8317413330078125, -0.037372589111328125, 0.7569966316223145, 1.5513653755187988, 2.3457343578338623, 3.140103340148926, 3.93447208404541, 4.7288408279418945, 5.523210048675537, 6.3175787925720215, 7.111948013305664, 7.906316757202148, 8.700685501098633, 9.495054244995117, 10.289422988891602, 11.083792686462402, 11.878161430358887, 12.672530174255371, 13.466899871826172, 14.261268615722656, 15.05563735961914, 15.850006103515625, 16.64437484741211, 17.438743591308594, 18.233112335205078, 19.027481079101562, 19.82185173034668, 20.61621856689453, 21.410587310791016, 22.2049560546875, 22.999324798583984, 23.79369354248047, 24.588062286376953, 25.382431030273438, 26.176801681518555, 26.97117042541504, 27.765539169311523, 28.559907913208008, 29.354276657104492, 30.148645401000977, 30.943016052246094, 31.737384796142578, 32.53175354003906, 33.32612228393555]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 3.0, 4.0, 7.0, 6.0, 8.0, 8.0, 11.0, 5.0, 22.0, 24.0, 39.0, 58.0, 72.0, 90.0, 126.0, 99.0, 83.0, 57.0, 74.0, 61.0, 35.0, 25.0, 24.0, 17.0, 12.0, 9.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.278552055358887, -9.018057823181152, -8.757563591003418, -8.497069358825684, -8.23657512664795, -7.976080894470215, -7.715586185455322, -7.455091953277588, -7.1945977210998535, -6.934103488922119, -6.673609256744385, -6.41311502456665, -6.152620315551758, -5.892126083374023, -5.631631851196289, -5.371137619018555, -5.11064338684082, -4.850149154663086, -4.589654922485352, -4.329160690307617, -4.068666458129883, -3.8081719875335693, -3.547677516937256, -3.2871832847595215, -3.026689052581787, -2.7661948204040527, -2.5057005882263184, -2.245206117630005, -1.9847118854522705, -1.7242176532745361, -1.4637233018875122, -1.2032289505004883, -0.9427356719970703, -0.6822413802146912, -0.421747088432312, -0.16125279664993286, 0.09924149513244629, 0.35973572731018066, 0.6202300786972046, 0.8807244300842285, 1.141218662261963, 1.4017128944396973, 1.6622072458267212, 1.9227015972137451, 2.1831958293914795, 2.443690061569214, 2.7041845321655273, 2.9646787643432617, 3.225172996520996, 3.4856672286987305, 3.746161460876465, 4.006655693054199, 4.267149925231934, 4.527644157409668, 4.7881388664245605, 5.048633098602295, 5.309127330780029, 5.569621562957764, 5.830115795135498, 6.090610027313232, 6.351104736328125, 6.611598968505859, 6.872093200683594, 7.132587432861328, 7.3930816650390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 6.0, 7.0, 14.0, 8.0, 12.0, 18.0, 21.0, 25.0, 53.0, 56.0, 72.0, 112.0, 175.0, 290.0, 568.0, 1424.0, 5267.0, 152700.0, 4023343.0, 7243.0, 1653.0, 641.0, 271.0, 120.0, 77.0, 40.0, 24.0, 14.0, 10.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.875, -9.6510009765625, -9.427001953125, -9.2030029296875, -8.97900390625, -8.7550048828125, -8.531005859375, -8.3070068359375, -8.0830078125, -7.8590087890625, -7.635009765625, -7.4110107421875, -7.18701171875, -6.9630126953125, -6.739013671875, -6.5150146484375, -6.291015625, -6.0670166015625, -5.843017578125, -5.6190185546875, -5.39501953125, -5.1710205078125, -4.947021484375, -4.7230224609375, -4.4990234375, -4.2750244140625, -4.051025390625, -3.8270263671875, -3.60302734375, -3.3790283203125, -3.155029296875, -2.9310302734375, -2.70703125, -2.4830322265625, -2.259033203125, -2.0350341796875, -1.81103515625, -1.5870361328125, -1.363037109375, -1.1390380859375, -0.9150390625, -0.6910400390625, -0.467041015625, -0.2430419921875, -0.01904296875, 0.2049560546875, 0.428955078125, 0.6529541015625, 0.876953125, 1.1009521484375, 1.324951171875, 1.5489501953125, 1.77294921875, 1.9969482421875, 2.220947265625, 2.4449462890625, 2.6689453125, 2.8929443359375, 3.116943359375, 3.3409423828125, 3.56494140625, 3.7889404296875, 4.012939453125, 4.2369384765625, 4.4609375]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 5.0, 2.0, 2.0, 7.0, 13.0, 18.0, 25.0, 67.0, 215.0, 327.0, 180.0, 68.0, 35.0, 13.0, 9.0, 11.0, 3.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.436767578125, -0.42693138122558594, -0.4170951843261719, -0.4072589874267578, -0.39742279052734375, -0.3875865936279297, -0.3777503967285156, -0.36791419982910156, -0.3580780029296875, -0.34824180603027344, -0.3384056091308594, -0.3285694122314453, -0.31873321533203125, -0.3088970184326172, -0.2990608215332031, -0.28922462463378906, -0.279388427734375, -0.26955223083496094, -0.2597160339355469, -0.2498798370361328, -0.24004364013671875, -0.2302074432373047, -0.22037124633789062, -0.21053504943847656, -0.2006988525390625, -0.19086265563964844, -0.18102645874023438, -0.1711902618408203, -0.16135406494140625, -0.1515178680419922, -0.14168167114257812, -0.13184547424316406, -0.12200927734375, -0.11217308044433594, -0.10233688354492188, -0.09250068664550781, -0.08266448974609375, -0.07282829284667969, -0.06299209594726562, -0.05315589904785156, -0.0433197021484375, -0.03348350524902344, -0.023647308349609375, -0.013811111450195312, -0.00397491455078125, 0.0058612823486328125, 0.015697479248046875, 0.025533676147460938, 0.035369873046875, 0.04520606994628906, 0.055042266845703125, 0.06487846374511719, 0.07471466064453125, 0.08455085754394531, 0.09438705444335938, 0.10422325134277344, 0.1140594482421875, 0.12389564514160156, 0.13373184204101562, 0.1435680389404297, 0.15340423583984375, 0.1632404327392578, 0.17307662963867188, 0.18291282653808594, 0.1927490234375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 5.0, 6.0, 2.0, 5.0, 4.0, 14.0, 22.0, 40.0, 71.0, 200.0, 659.0, 4762.0, 2153076.0, 2029319.0, 4960.0, 715.0, 202.0, 90.0, 50.0, 29.0, 13.0, 10.0, 7.0, 1.0, 3.0, 6.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.615234375, -3.490570068359375, -3.36590576171875, -3.241241455078125, -3.1165771484375, -2.991912841796875, -2.86724853515625, -2.742584228515625, -2.617919921875, -2.493255615234375, -2.36859130859375, -2.243927001953125, -2.1192626953125, -1.994598388671875, -1.86993408203125, -1.745269775390625, -1.62060546875, -1.495941162109375, -1.37127685546875, -1.246612548828125, -1.1219482421875, -0.997283935546875, -0.87261962890625, -0.747955322265625, -0.623291015625, -0.498626708984375, -0.37396240234375, -0.249298095703125, -0.1246337890625, 3.0517578125e-05, 0.12469482421875, 0.249359130859375, 0.3740234375, 0.498687744140625, 0.62335205078125, 0.748016357421875, 0.8726806640625, 0.997344970703125, 1.12200927734375, 1.246673583984375, 1.371337890625, 1.496002197265625, 1.62066650390625, 1.745330810546875, 1.8699951171875, 1.994659423828125, 2.11932373046875, 2.243988037109375, 2.36865234375, 2.493316650390625, 2.61798095703125, 2.742645263671875, 2.8673095703125, 2.991973876953125, 3.11663818359375, 3.241302490234375, 3.365966796875, 3.490631103515625, 3.61529541015625, 3.739959716796875, 3.8646240234375, 3.989288330078125, 4.11395263671875, 4.238616943359375, 4.36328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 2.0, 4.0, 5.0, 5.0, 9.0, 12.0, 24.0, 32.0, 64.0, 160.0, 520.0, 2500.0, 427.0, 121.0, 67.0, 30.0, 26.0, 12.0, 12.0, 9.0, 4.0, 3.0, 5.0, 1.0, 5.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3857421875, -0.3745231628417969, -0.36330413818359375, -0.3520851135253906, -0.3408660888671875, -0.3296470642089844, -0.31842803955078125, -0.3072090148925781, -0.295989990234375, -0.2847709655761719, -0.27355194091796875, -0.2623329162597656, -0.2511138916015625, -0.23989486694335938, -0.22867584228515625, -0.21745681762695312, -0.20623779296875, -0.19501876831054688, -0.18379974365234375, -0.17258071899414062, -0.1613616943359375, -0.15014266967773438, -0.13892364501953125, -0.12770462036132812, -0.116485595703125, -0.10526657104492188, -0.09404754638671875, -0.08282852172851562, -0.0716094970703125, -0.060390472412109375, -0.04917144775390625, -0.037952423095703125, -0.0267333984375, -0.015514373779296875, -0.00429534912109375, 0.006923675537109375, 0.0181427001953125, 0.029361724853515625, 0.04058074951171875, 0.051799774169921875, 0.063018798828125, 0.07423782348632812, 0.08545684814453125, 0.09667587280273438, 0.1078948974609375, 0.11911392211914062, 0.13033294677734375, 0.14155197143554688, 0.15277099609375, 0.16399002075195312, 0.17520904541015625, 0.18642807006835938, 0.1976470947265625, 0.20886611938476562, 0.22008514404296875, 0.23130416870117188, 0.242523193359375, 0.2537422180175781, 0.26496124267578125, 0.2761802673339844, 0.2873992919921875, 0.2986183166503906, 0.30983734130859375, 0.3210563659667969, 0.332275390625]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 8.0, 8.0, 30.0, 54.0, 97.0, 399.0, 308.0, 64.0, 19.0, 11.0, 6.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.0048153400421143, -1.9438722133636475, -1.8829290866851807, -1.8219859600067139, -1.761042833328247, -1.7000997066497803, -1.6391565799713135, -1.5782135725021362, -1.5172704458236694, -1.4563273191452026, -1.3953841924667358, -1.334441065788269, -1.2734979391098022, -1.212554931640625, -1.1516118049621582, -1.0906686782836914, -1.0297255516052246, -0.9687824249267578, -0.907839298248291, -0.8468961715698242, -0.7859531044960022, -0.7250099778175354, -0.6640668511390686, -0.6031237840652466, -0.5421805381774902, -0.48123741149902344, -0.42029431462287903, -0.35935118794441223, -0.2984080910682678, -0.23746496438980103, -0.17652183771133423, -0.11557874083518982, -0.05463564395904541, 0.006307471543550491, 0.06725058704614639, 0.1281937062740326, 0.1891368180513382, 0.2500799298286438, 0.3110230565071106, 0.371966153383255, 0.4329092800617218, 0.4938524067401886, 0.554795503616333, 0.6157386302947998, 0.6766817569732666, 0.7376248836517334, 0.7985680103302002, 0.8595110774040222, 0.920454204082489, 0.9813973307609558, 1.0423403978347778, 1.1032835245132446, 1.1642266511917114, 1.2251697778701782, 1.286112904548645, 1.3470560312271118, 1.4079991579055786, 1.4689422845840454, 1.5298854112625122, 1.590828537940979, 1.6517716646194458, 1.712714672088623, 1.7736577987670898, 1.8346009254455566, 1.8955440521240234]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 8.0, 6.0, 3.0, 8.0, 11.0, 8.0, 13.0, 16.0, 17.0, 28.0, 27.0, 34.0, 48.0, 69.0, 71.0, 62.0, 68.0, 69.0, 73.0, 77.0, 63.0, 48.0, 43.0, 36.0, 24.0, 22.0, 17.0, 6.0, 4.0, 11.0, 6.0, 1.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1247484683990479, -1.0869015455245972, -1.0490546226501465, -1.0112075805664062, -0.9733606576919556, -0.9355137348175049, -0.8976668119430542, -0.8598198294639587, -0.8219728469848633, -0.7841259241104126, -0.7462789416313171, -0.7084320187568665, -0.670585036277771, -0.6327381134033203, -0.5948911905288696, -0.5570442080497742, -0.5191972851753235, -0.4813503324985504, -0.44350337982177734, -0.40565645694732666, -0.3678094744682312, -0.3299625515937805, -0.29211559891700745, -0.2542686462402344, -0.2164216935634613, -0.17857474088668823, -0.14072778820991516, -0.10288085043430328, -0.06503389775753021, -0.02718694508075714, 0.010659992694854736, 0.04850694537162781, 0.08635389804840088, 0.12420085072517395, 0.16204780340194702, 0.1998947411775589, 0.23774169385433197, 0.27558863162994385, 0.3134355843067169, 0.35128253698349, 0.38912948966026306, 0.42697644233703613, 0.4648233950138092, 0.5026703476905823, 0.540517270565033, 0.5783642530441284, 0.6162111759185791, 0.6540580987930298, 0.6919050812721252, 0.7297520041465759, 0.7675989866256714, 0.8054459095001221, 0.8432928919792175, 0.8811398148536682, 0.9189867973327637, 0.9568337202072144, 0.994680643081665, 1.0325275659561157, 1.0703744888305664, 1.1082215309143066, 1.1460684537887573, 1.183915376663208, 1.2217622995376587, 1.2596092224121094, 1.2974562644958496]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 5.0, 7.0, 7.0, 19.0, 26.0, 33.0, 36.0, 66.0, 91.0, 180.0, 301.0, 591.0, 1369.0, 4694.0, 56979.0, 962422.0, 16682.0, 2877.0, 1025.0, 470.0, 226.0, 172.0, 81.0, 53.0, 37.0, 16.0, 30.0, 20.0, 14.0, 6.0, 2.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.427734375, -2.3502197265625, -2.272705078125, -2.1951904296875, -2.11767578125, -2.0401611328125, -1.962646484375, -1.8851318359375, -1.8076171875, -1.7301025390625, -1.652587890625, -1.5750732421875, -1.49755859375, -1.4200439453125, -1.342529296875, -1.2650146484375, -1.1875, -1.1099853515625, -1.032470703125, -0.9549560546875, -0.87744140625, -0.7999267578125, -0.722412109375, -0.6448974609375, -0.5673828125, -0.4898681640625, -0.412353515625, -0.3348388671875, -0.25732421875, -0.1798095703125, -0.102294921875, -0.0247802734375, 0.052734375, 0.1302490234375, 0.207763671875, 0.2852783203125, 0.36279296875, 0.4403076171875, 0.517822265625, 0.5953369140625, 0.6728515625, 0.7503662109375, 0.827880859375, 0.9053955078125, 0.98291015625, 1.0604248046875, 1.137939453125, 1.2154541015625, 1.29296875, 1.3704833984375, 1.447998046875, 1.5255126953125, 1.60302734375, 1.6805419921875, 1.758056640625, 1.8355712890625, 1.9130859375, 1.9906005859375, 2.068115234375, 2.1456298828125, 2.22314453125, 2.3006591796875, 2.378173828125, 2.4556884765625, 2.533203125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 17.0, 23.0, 67.0, 210.0, 342.0, 208.0, 70.0, 24.0, 12.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41259765625, -0.40329742431640625, -0.3939971923828125, -0.38469696044921875, -0.375396728515625, -0.36609649658203125, -0.3567962646484375, -0.34749603271484375, -0.33819580078125, -0.32889556884765625, -0.3195953369140625, -0.31029510498046875, -0.300994873046875, -0.29169464111328125, -0.2823944091796875, -0.27309417724609375, -0.2637939453125, -0.25449371337890625, -0.2451934814453125, -0.23589324951171875, -0.226593017578125, -0.21729278564453125, -0.2079925537109375, -0.19869232177734375, -0.18939208984375, -0.18009185791015625, -0.1707916259765625, -0.16149139404296875, -0.152191162109375, -0.14289093017578125, -0.1335906982421875, -0.12429046630859375, -0.114990234375, -0.10569000244140625, -0.0963897705078125, -0.08708953857421875, -0.077789306640625, -0.06848907470703125, -0.0591888427734375, -0.04988861083984375, -0.04058837890625, -0.03128814697265625, -0.0219879150390625, -0.01268768310546875, -0.003387451171875, 0.00591278076171875, 0.0152130126953125, 0.02451324462890625, 0.0338134765625, 0.04311370849609375, 0.0524139404296875, 0.06171417236328125, 0.071014404296875, 0.08031463623046875, 0.0896148681640625, 0.09891510009765625, 0.10821533203125, 0.11751556396484375, 0.1268157958984375, 0.13611602783203125, 0.145416259765625, 0.15471649169921875, 0.1640167236328125, 0.17331695556640625, 0.1826171875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 5.0, 11.0, 25.0, 20.0, 39.0, 44.0, 63.0, 79.0, 128.0, 205.0, 310.0, 561.0, 1445.0, 5274.0, 36461.0, 758562.0, 224662.0, 15591.0, 2882.0, 960.0, 431.0, 245.0, 150.0, 125.0, 95.0, 63.0, 24.0, 33.0, 12.0, 8.0, 9.0, 9.0, 9.0, 6.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4580078125, -1.41839599609375, -1.3787841796875, -1.33917236328125, -1.299560546875, -1.25994873046875, -1.2203369140625, -1.18072509765625, -1.14111328125, -1.10150146484375, -1.0618896484375, -1.02227783203125, -0.982666015625, -0.94305419921875, -0.9034423828125, -0.86383056640625, -0.82421875, -0.78460693359375, -0.7449951171875, -0.70538330078125, -0.665771484375, -0.62615966796875, -0.5865478515625, -0.54693603515625, -0.50732421875, -0.46771240234375, -0.4281005859375, -0.38848876953125, -0.348876953125, -0.30926513671875, -0.2696533203125, -0.23004150390625, -0.1904296875, -0.15081787109375, -0.1112060546875, -0.07159423828125, -0.031982421875, 0.00762939453125, 0.0472412109375, 0.08685302734375, 0.12646484375, 0.16607666015625, 0.2056884765625, 0.24530029296875, 0.284912109375, 0.32452392578125, 0.3641357421875, 0.40374755859375, 0.443359375, 0.48297119140625, 0.5225830078125, 0.56219482421875, 0.601806640625, 0.64141845703125, 0.6810302734375, 0.72064208984375, 0.76025390625, 0.79986572265625, 0.8394775390625, 0.87908935546875, 0.918701171875, 0.95831298828125, 0.9979248046875, 1.03753662109375, 1.0771484375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 11.0, 9.0, 9.0, 9.0, 14.0, 17.0, 26.0, 23.0, 31.0, 33.0, 28.0, 33.0, 39.0, 48.0, 56.0, 50.0, 50.0, 40.0, 56.0, 41.0, 58.0, 41.0, 23.0, 42.0, 34.0, 35.0, 25.0, 10.0, 20.0, 19.0, 16.0, 7.0, 8.0, 11.0, 5.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.64013671875, -0.6218948364257812, -0.6036529541015625, -0.5854110717773438, -0.567169189453125, -0.5489273071289062, -0.5306854248046875, -0.5124435424804688, -0.49420166015625, -0.47595977783203125, -0.4577178955078125, -0.43947601318359375, -0.421234130859375, -0.40299224853515625, -0.3847503662109375, -0.36650848388671875, -0.3482666015625, -0.33002471923828125, -0.3117828369140625, -0.29354095458984375, -0.275299072265625, -0.25705718994140625, -0.2388153076171875, -0.22057342529296875, -0.20233154296875, -0.18408966064453125, -0.1658477783203125, -0.14760589599609375, -0.129364013671875, -0.11112213134765625, -0.0928802490234375, -0.07463836669921875, -0.056396484375, -0.03815460205078125, -0.0199127197265625, -0.00167083740234375, 0.016571044921875, 0.03481292724609375, 0.0530548095703125, 0.07129669189453125, 0.08953857421875, 0.10778045654296875, 0.1260223388671875, 0.14426422119140625, 0.162506103515625, 0.18074798583984375, 0.1989898681640625, 0.21723175048828125, 0.2354736328125, 0.25371551513671875, 0.2719573974609375, 0.29019927978515625, 0.308441162109375, 0.32668304443359375, 0.3449249267578125, 0.36316680908203125, 0.38140869140625, 0.39965057373046875, 0.4178924560546875, 0.43613433837890625, 0.454376220703125, 0.47261810302734375, 0.4908599853515625, 0.5091018676757812, 0.52734375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 8.0, 10.0, 14.0, 30.0, 34.0, 75.0, 133.0, 304.0, 902.0, 5068.0, 474096.0, 560843.0, 5365.0, 983.0, 310.0, 155.0, 91.0, 41.0, 29.0, 19.0, 15.0, 4.0, 11.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.8251953125, -0.800933837890625, -0.77667236328125, -0.752410888671875, -0.7281494140625, -0.703887939453125, -0.67962646484375, -0.655364990234375, -0.631103515625, -0.606842041015625, -0.58258056640625, -0.558319091796875, -0.5340576171875, -0.509796142578125, -0.48553466796875, -0.461273193359375, -0.43701171875, -0.412750244140625, -0.38848876953125, -0.364227294921875, -0.3399658203125, -0.315704345703125, -0.29144287109375, -0.267181396484375, -0.242919921875, -0.218658447265625, -0.19439697265625, -0.170135498046875, -0.1458740234375, -0.121612548828125, -0.09735107421875, -0.073089599609375, -0.048828125, -0.024566650390625, -0.00030517578125, 0.023956298828125, 0.0482177734375, 0.072479248046875, 0.09674072265625, 0.121002197265625, 0.145263671875, 0.169525146484375, 0.19378662109375, 0.218048095703125, 0.2423095703125, 0.266571044921875, 0.29083251953125, 0.315093994140625, 0.33935546875, 0.363616943359375, 0.38787841796875, 0.412139892578125, 0.4364013671875, 0.460662841796875, 0.48492431640625, 0.509185791015625, 0.533447265625, 0.557708740234375, 0.58197021484375, 0.606231689453125, 0.6304931640625, 0.654754638671875, 0.67901611328125, 0.703277587890625, 0.7275390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 4.0, 7.0, 8.0, 17.0, 18.0, 32.0, 42.0, 57.0, 47.0, 84.0, 81.0, 131.0, 112.0, 98.0, 69.0, 48.0, 40.0, 25.0, 27.0, 23.0, 5.0, 7.0, 7.0, 1.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014150142669677734, -0.0001376476138830185, -0.00013379380106925964, -0.0001299399882555008, -0.00012608617544174194, -0.0001222323626279831, -0.00011837854981422424, -0.00011452473700046539, -0.00011067092418670654, -0.00010681711137294769, -0.00010296329855918884, -9.910948574542999e-05, -9.525567293167114e-05, -9.140186011791229e-05, -8.754804730415344e-05, -8.369423449039459e-05, -7.984042167663574e-05, -7.598660886287689e-05, -7.213279604911804e-05, -6.827898323535919e-05, -6.442517042160034e-05, -6.057135760784149e-05, -5.671754479408264e-05, -5.286373198032379e-05, -4.900991916656494e-05, -4.515610635280609e-05, -4.130229353904724e-05, -3.744848072528839e-05, -3.359466791152954e-05, -2.974085509777069e-05, -2.588704228401184e-05, -2.203322947025299e-05, -1.817941665649414e-05, -1.432560384273529e-05, -1.047179102897644e-05, -6.61797821521759e-06, -2.7641654014587402e-06, 1.0896474123001099e-06, 4.94346022605896e-06, 8.79727303981781e-06, 1.265108585357666e-05, 1.650489866733551e-05, 2.035871148109436e-05, 2.421252429485321e-05, 2.806633710861206e-05, 3.192014992237091e-05, 3.577396273612976e-05, 3.962777554988861e-05, 4.348158836364746e-05, 4.733540117740631e-05, 5.118921399116516e-05, 5.504302680492401e-05, 5.889683961868286e-05, 6.275065243244171e-05, 6.660446524620056e-05, 7.045827805995941e-05, 7.431209087371826e-05, 7.816590368747711e-05, 8.201971650123596e-05, 8.587352931499481e-05, 8.972734212875366e-05, 9.358115494251251e-05, 9.743496775627136e-05, 0.00010128878057003021, 0.00010514259338378906]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 7.0, 9.0, 13.0, 21.0, 31.0, 50.0, 109.0, 257.0, 737.0, 3439.0, 120090.0, 913112.0, 8758.0, 1228.0, 381.0, 142.0, 67.0, 39.0, 28.0, 11.0, 11.0, 8.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4384765625, -1.4043807983398438, -1.3702850341796875, -1.3361892700195312, -1.302093505859375, -1.2679977416992188, -1.2339019775390625, -1.1998062133789062, -1.16571044921875, -1.1316146850585938, -1.0975189208984375, -1.0634231567382812, -1.029327392578125, -0.9952316284179688, -0.9611358642578125, -0.9270401000976562, -0.8929443359375, -0.8588485717773438, -0.8247528076171875, -0.7906570434570312, -0.756561279296875, -0.7224655151367188, -0.6883697509765625, -0.6542739868164062, -0.62017822265625, -0.5860824584960938, -0.5519866943359375, -0.5178909301757812, -0.483795166015625, -0.44969940185546875, -0.4156036376953125, -0.38150787353515625, -0.347412109375, -0.31331634521484375, -0.2792205810546875, -0.24512481689453125, -0.211029052734375, -0.17693328857421875, -0.1428375244140625, -0.10874176025390625, -0.07464599609375, -0.04055023193359375, -0.0064544677734375, 0.02764129638671875, 0.061737060546875, 0.09583282470703125, 0.1299285888671875, 0.16402435302734375, 0.1981201171875, 0.23221588134765625, 0.2663116455078125, 0.30040740966796875, 0.334503173828125, 0.36859893798828125, 0.4026947021484375, 0.43679046630859375, 0.47088623046875, 0.5049819946289062, 0.5390777587890625, 0.5731735229492188, 0.607269287109375, 0.6413650512695312, 0.6754608154296875, 0.7095565795898438, 0.74365234375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 9.0, 10.0, 11.0, 9.0, 14.0, 21.0, 20.0, 52.0, 52.0, 101.0, 128.0, 139.0, 112.0, 91.0, 63.0, 42.0, 43.0, 22.0, 15.0, 12.0, 9.0, 4.0, 4.0, 8.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3154296875, -0.3035888671875, -0.291748046875, -0.2799072265625, -0.26806640625, -0.2562255859375, -0.244384765625, -0.2325439453125, -0.220703125, -0.2088623046875, -0.197021484375, -0.1851806640625, -0.17333984375, -0.1614990234375, -0.149658203125, -0.1378173828125, -0.1259765625, -0.1141357421875, -0.102294921875, -0.0904541015625, -0.07861328125, -0.0667724609375, -0.054931640625, -0.0430908203125, -0.03125, -0.0194091796875, -0.007568359375, 0.0042724609375, 0.01611328125, 0.0279541015625, 0.039794921875, 0.0516357421875, 0.0634765625, 0.0753173828125, 0.087158203125, 0.0989990234375, 0.11083984375, 0.1226806640625, 0.134521484375, 0.1463623046875, 0.158203125, 0.1700439453125, 0.181884765625, 0.1937255859375, 0.20556640625, 0.2174072265625, 0.229248046875, 0.2410888671875, 0.2529296875, 0.2647705078125, 0.276611328125, 0.2884521484375, 0.30029296875, 0.3121337890625, 0.323974609375, 0.3358154296875, 0.34765625, 0.3594970703125, 0.371337890625, 0.3831787109375, 0.39501953125, 0.4068603515625, 0.418701171875, 0.4305419921875, 0.4423828125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 8.0, 17.0, 25.0, 109.0, 524.0, 247.0, 49.0, 16.0, 9.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-13.821868896484375, -13.473261833190918, -13.124654769897461, -12.776047706604004, -12.427440643310547, -12.07883358001709, -11.730226516723633, -11.381619453430176, -11.033012390136719, -10.684405326843262, -10.335798263549805, -9.987191200256348, -9.63858413696289, -9.289977073669434, -8.941370010375977, -8.59276294708252, -8.244155883789062, -7.8955488204956055, -7.546941757202148, -7.198334693908691, -6.849727630615234, -6.501120567321777, -6.15251350402832, -5.803906440734863, -5.45529842376709, -5.106691360473633, -4.758084297180176, -4.409477233886719, -4.060870170593262, -3.7122631072998047, -3.3636558055877686, -3.0150487422943115, -2.6664419174194336, -2.3178348541259766, -1.9692277908325195, -1.620620608329773, -1.272013545036316, -0.9234064817428589, -0.5747992992401123, -0.22619223594665527, 0.12241482734680176, 0.4710219204425812, 0.8196290135383606, 1.1682361364364624, 1.5168431997299194, 1.8654502630233765, 2.214057445526123, 2.56266450881958, 2.911271572113037, 3.259878635406494, 3.608485698699951, 3.957092761993408, 4.305699825286865, 4.654306888580322, 5.0029144287109375, 5.3515214920043945, 5.700128555297852, 6.048735618591309, 6.397342681884766, 6.745949745178223, 7.09455680847168, 7.443163871765137, 7.791770935058594, 8.14037799835205, 8.488985061645508]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 6.0, 7.0, 9.0, 7.0, 10.0, 11.0, 14.0, 24.0, 21.0, 25.0, 35.0, 45.0, 45.0, 52.0, 65.0, 68.0, 63.0, 59.0, 65.0, 68.0, 50.0, 50.0, 38.0, 42.0, 25.0, 31.0, 18.0, 12.0, 16.0, 6.0, 2.0, 4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.809298992156982, -5.6386823654174805, -5.4680657386779785, -5.297449111938477, -5.126832962036133, -4.956216335296631, -4.785599708557129, -4.614983081817627, -4.444366455078125, -4.273749828338623, -4.103133201599121, -3.9325168132781982, -3.7619001865386963, -3.5912835597991943, -3.4206671714782715, -3.2500505447387695, -3.0794339179992676, -2.9088172912597656, -2.7382006645202637, -2.567584276199341, -2.396967649459839, -2.226351022720337, -2.055734634399414, -1.885118007659912, -1.7145013809204102, -1.5438847541809082, -1.3732682466506958, -1.2026517391204834, -1.0320351123809814, -0.8614185452461243, -0.6908019781112671, -0.5201854705810547, -0.34956836700439453, -0.17895179986953735, -0.008335232734680176, 0.162281334400177, 0.3328979015350342, 0.5035144686698914, 0.6741310358047485, 0.8447475433349609, 1.015364170074463, 1.1859807968139648, 1.3565973043441772, 1.5272138118743896, 1.6978304386138916, 1.8684470653533936, 2.0390634536743164, 2.2096800804138184, 2.3802967071533203, 2.5509133338928223, 2.721529960632324, 2.892146348953247, 3.062762975692749, 3.233379602432251, 3.403995990753174, 3.574612617492676, 3.7452292442321777, 3.9158458709716797, 4.086462497711182, 4.257079124450684, 4.427695274353027, 4.598311901092529, 4.768928527832031, 4.939545154571533, 5.110161781311035]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 6.0, 19.0, 37.0, 55.0, 185.0, 596.0, 7185.0, 4184660.0, 1235.0, 208.0, 62.0, 15.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.625, -20.1700439453125, -19.715087890625, -19.2601318359375, -18.80517578125, -18.3502197265625, -17.895263671875, -17.4403076171875, -16.9853515625, -16.5303955078125, -16.075439453125, -15.6204833984375, -15.16552734375, -14.7105712890625, -14.255615234375, -13.8006591796875, -13.345703125, -12.8907470703125, -12.435791015625, -11.9808349609375, -11.52587890625, -11.0709228515625, -10.615966796875, -10.1610107421875, -9.7060546875, -9.2510986328125, -8.796142578125, -8.3411865234375, -7.88623046875, -7.4312744140625, -6.976318359375, -6.5213623046875, -6.06640625, -5.6114501953125, -5.156494140625, -4.7015380859375, -4.24658203125, -3.7916259765625, -3.336669921875, -2.8817138671875, -2.4267578125, -1.9718017578125, -1.516845703125, -1.0618896484375, -0.60693359375, -0.1519775390625, 0.302978515625, 0.7579345703125, 1.212890625, 1.6678466796875, 2.122802734375, 2.5777587890625, 3.03271484375, 3.4876708984375, 3.942626953125, 4.3975830078125, 4.8525390625, 5.3074951171875, 5.762451171875, 6.2174072265625, 6.67236328125, 7.1273193359375, 7.582275390625, 8.0372314453125, 8.4921875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 19.0, 41.0, 101.0, 211.0, 274.0, 199.0, 89.0, 39.0, 10.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50341796875, -0.4923057556152344, -0.48119354248046875, -0.4700813293457031, -0.4589691162109375, -0.4478569030761719, -0.43674468994140625, -0.4256324768066406, -0.414520263671875, -0.4034080505371094, -0.39229583740234375, -0.3811836242675781, -0.3700714111328125, -0.3589591979980469, -0.34784698486328125, -0.3367347717285156, -0.32562255859375, -0.3145103454589844, -0.30339813232421875, -0.2922859191894531, -0.2811737060546875, -0.2700614929199219, -0.25894927978515625, -0.24783706665039062, -0.236724853515625, -0.22561264038085938, -0.21450042724609375, -0.20338821411132812, -0.1922760009765625, -0.18116378784179688, -0.17005157470703125, -0.15893936157226562, -0.1478271484375, -0.13671493530273438, -0.12560272216796875, -0.11449050903320312, -0.1033782958984375, -0.09226608276367188, -0.08115386962890625, -0.07004165649414062, -0.058929443359375, -0.047817230224609375, -0.03670501708984375, -0.025592803955078125, -0.0144805908203125, -0.003368377685546875, 0.00774383544921875, 0.018856048583984375, 0.02996826171875, 0.041080474853515625, 0.05219268798828125, 0.06330490112304688, 0.0744171142578125, 0.08552932739257812, 0.09664154052734375, 0.10775375366210938, 0.118865966796875, 0.12997817993164062, 0.14109039306640625, 0.15220260620117188, 0.1633148193359375, 0.17442703247070312, 0.18553924560546875, 0.19665145874023438, 0.207763671875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 3.0, 7.0, 6.0, 18.0, 12.0, 22.0, 27.0, 63.0, 61.0, 109.0, 169.0, 382.0, 909.0, 3045.0, 16391.0, 567715.0, 3575565.0, 23972.0, 3895.0, 1010.0, 400.0, 176.0, 103.0, 66.0, 52.0, 25.0, 24.0, 21.0, 12.0, 6.0, 10.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.8662109375, -1.822906494140625, -1.77960205078125, -1.736297607421875, -1.6929931640625, -1.649688720703125, -1.60638427734375, -1.563079833984375, -1.519775390625, -1.476470947265625, -1.43316650390625, -1.389862060546875, -1.3465576171875, -1.303253173828125, -1.25994873046875, -1.216644287109375, -1.17333984375, -1.130035400390625, -1.08673095703125, -1.043426513671875, -1.0001220703125, -0.956817626953125, -0.91351318359375, -0.870208740234375, -0.826904296875, -0.783599853515625, -0.74029541015625, -0.696990966796875, -0.6536865234375, -0.610382080078125, -0.56707763671875, -0.523773193359375, -0.48046875, -0.437164306640625, -0.39385986328125, -0.350555419921875, -0.3072509765625, -0.263946533203125, -0.22064208984375, -0.177337646484375, -0.134033203125, -0.090728759765625, -0.04742431640625, -0.004119873046875, 0.0391845703125, 0.082489013671875, 0.12579345703125, 0.169097900390625, 0.21240234375, 0.255706787109375, 0.29901123046875, 0.342315673828125, 0.3856201171875, 0.428924560546875, 0.47222900390625, 0.515533447265625, 0.558837890625, 0.602142333984375, 0.64544677734375, 0.688751220703125, 0.7320556640625, 0.775360107421875, 0.81866455078125, 0.861968994140625, 0.9052734375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 6.0, 10.0, 12.0, 16.0, 25.0, 37.0, 66.0, 138.0, 467.0, 2256.0, 677.0, 181.0, 56.0, 51.0, 20.0, 18.0, 11.0, 5.0, 4.0, 3.0, 6.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-0.4619140625, -0.4517860412597656, -0.44165802001953125, -0.4315299987792969, -0.4214019775390625, -0.4112739562988281, -0.40114593505859375, -0.3910179138183594, -0.380889892578125, -0.3707618713378906, -0.36063385009765625, -0.3505058288574219, -0.3403778076171875, -0.3302497863769531, -0.32012176513671875, -0.3099937438964844, -0.29986572265625, -0.2897377014160156, -0.27960968017578125, -0.2694816589355469, -0.2593536376953125, -0.24922561645507812, -0.23909759521484375, -0.22896957397460938, -0.218841552734375, -0.20871353149414062, -0.19858551025390625, -0.18845748901367188, -0.1783294677734375, -0.16820144653320312, -0.15807342529296875, -0.14794540405273438, -0.1378173828125, -0.12768936157226562, -0.11756134033203125, -0.10743331909179688, -0.0973052978515625, -0.08717727661132812, -0.07704925537109375, -0.06692123413085938, -0.056793212890625, -0.046665191650390625, -0.03653717041015625, -0.026409149169921875, -0.0162811279296875, -0.006153106689453125, 0.00397491455078125, 0.014102935791015625, 0.02423095703125, 0.034358978271484375, 0.04448699951171875, 0.054615020751953125, 0.0647430419921875, 0.07487106323242188, 0.08499908447265625, 0.09512710571289062, 0.105255126953125, 0.11538314819335938, 0.12551116943359375, 0.13563919067382812, 0.1457672119140625, 0.15589523315429688, 0.16602325439453125, 0.17615127563476562, 0.186279296875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 10.0, 24.0, 55.0, 117.0, 334.0, 300.0, 101.0, 37.0, 13.0, 11.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.654769778251648, -1.6088402271270752, -1.562910795211792, -1.5169812440872192, -1.471051812171936, -1.4251222610473633, -1.37919282913208, -1.3332632780075073, -1.2873337268829346, -1.2414041757583618, -1.1954747438430786, -1.1495451927185059, -1.1036157608032227, -1.05768620967865, -1.0117566585540771, -0.965827226638794, -0.9198977947235107, -0.8739683032035828, -0.8280388116836548, -0.782109260559082, -0.7361798286437988, -0.6902502775192261, -0.6443207859992981, -0.5983912944793701, -0.5524618029594421, -0.5065323114395142, -0.4606028199195862, -0.4146732985973358, -0.36874380707740784, -0.32281431555747986, -0.2768847942352295, -0.2309553027153015, -0.18502581119537354, -0.13909631967544556, -0.09316681325435638, -0.04723730683326721, -0.0013078153133392334, 0.044621676206588745, 0.09055119752883911, 0.1364806890487671, 0.18241018056869507, 0.22833967208862305, 0.274269163608551, 0.3201986849308014, 0.36612817645072937, 0.41205766797065735, 0.4579871892929077, 0.5039166808128357, 0.5498461723327637, 0.5957756638526917, 0.6417051553726196, 0.6876347064971924, 0.7335641384124756, 0.7794936895370483, 0.8254231810569763, 0.8713526725769043, 0.9172821640968323, 0.9632116556167603, 1.009141206741333, 1.0550706386566162, 1.101000189781189, 1.1469296216964722, 1.192859172821045, 1.2387886047363281, 1.2847181558609009]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 2.0, 10.0, 8.0, 14.0, 15.0, 34.0, 26.0, 26.0, 42.0, 44.0, 40.0, 66.0, 69.0, 67.0, 67.0, 57.0, 48.0, 51.0, 48.0, 42.0, 39.0, 36.0, 35.0, 38.0, 15.0, 15.0, 15.0, 8.0, 8.0, 2.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7691313028335571, -0.7409932613372803, -0.7128552794456482, -0.6847172379493713, -0.6565792560577393, -0.6284412145614624, -0.6003031730651855, -0.5721651911735535, -0.5440271496772766, -0.5158891081809998, -0.4877511262893677, -0.4596130847930908, -0.43147507309913635, -0.4033370614051819, -0.3751990497112274, -0.34706103801727295, -0.3189230263233185, -0.290785014629364, -0.26264700293540955, -0.23450897634029388, -0.20637094974517822, -0.17823293805122375, -0.1500949263572693, -0.12195689976215363, -0.09381888806819916, -0.06568086892366409, -0.03754285350441933, -0.00940483808517456, 0.018733181059360504, 0.04687120020389557, 0.07500921189785004, 0.1031472384929657, 0.13128525018692017, 0.15942326188087463, 0.1875612884759903, 0.21569930016994476, 0.24383732676506042, 0.2719753384590149, 0.30011335015296936, 0.32825136184692383, 0.3563894033432007, 0.38452741503715515, 0.4126654267311096, 0.4408034682273865, 0.46894147992134094, 0.4970794916152954, 0.5252175331115723, 0.5533555150032043, 0.5814934968948364, 0.6096315383911133, 0.6377695202827454, 0.6659075617790222, 0.6940455436706543, 0.7221835851669312, 0.750321626663208, 0.7784596085548401, 0.8065976500511169, 0.8347356915473938, 0.8628736734390259, 0.8910117149353027, 0.9191496968269348, 0.9472877383232117, 0.9754257202148438, 1.0035637617111206, 1.0317018032073975]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 5.0, 5.0, 6.0, 17.0, 18.0, 26.0, 38.0, 54.0, 134.0, 233.0, 538.0, 1471.0, 6761.0, 853269.0, 179629.0, 4301.0, 1093.0, 457.0, 208.0, 95.0, 69.0, 40.0, 28.0, 25.0, 9.0, 12.0, 6.0, 3.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.537109375, -2.4599609375, -2.3828125, -2.3056640625, -2.228515625, -2.1513671875, -2.07421875, -1.9970703125, -1.919921875, -1.8427734375, -1.765625, -1.6884765625, -1.611328125, -1.5341796875, -1.45703125, -1.3798828125, -1.302734375, -1.2255859375, -1.1484375, -1.0712890625, -0.994140625, -0.9169921875, -0.83984375, -0.7626953125, -0.685546875, -0.6083984375, -0.53125, -0.4541015625, -0.376953125, -0.2998046875, -0.22265625, -0.1455078125, -0.068359375, 0.0087890625, 0.0859375, 0.1630859375, 0.240234375, 0.3173828125, 0.39453125, 0.4716796875, 0.548828125, 0.6259765625, 0.703125, 0.7802734375, 0.857421875, 0.9345703125, 1.01171875, 1.0888671875, 1.166015625, 1.2431640625, 1.3203125, 1.3974609375, 1.474609375, 1.5517578125, 1.62890625, 1.7060546875, 1.783203125, 1.8603515625, 1.9375, 2.0146484375, 2.091796875, 2.1689453125, 2.24609375, 2.3232421875, 2.400390625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 5.0, 17.0, 25.0, 80.0, 197.0, 287.0, 240.0, 89.0, 36.0, 13.0, 3.0, 6.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.47900390625, -0.46846771240234375, -0.4579315185546875, -0.44739532470703125, -0.436859130859375, -0.42632293701171875, -0.4157867431640625, -0.40525054931640625, -0.39471435546875, -0.38417816162109375, -0.3736419677734375, -0.36310577392578125, -0.352569580078125, -0.34203338623046875, -0.3314971923828125, -0.32096099853515625, -0.3104248046875, -0.29988861083984375, -0.2893524169921875, -0.27881622314453125, -0.268280029296875, -0.25774383544921875, -0.2472076416015625, -0.23667144775390625, -0.22613525390625, -0.21559906005859375, -0.2050628662109375, -0.19452667236328125, -0.183990478515625, -0.17345428466796875, -0.1629180908203125, -0.15238189697265625, -0.141845703125, -0.13130950927734375, -0.1207733154296875, -0.11023712158203125, -0.099700927734375, -0.08916473388671875, -0.0786285400390625, -0.06809234619140625, -0.05755615234375, -0.04701995849609375, -0.0364837646484375, -0.02594757080078125, -0.015411376953125, -0.00487518310546875, 0.0056610107421875, 0.01619720458984375, 0.0267333984375, 0.03726959228515625, 0.0478057861328125, 0.05834197998046875, 0.068878173828125, 0.07941436767578125, 0.0899505615234375, 0.10048675537109375, 0.11102294921875, 0.12155914306640625, 0.1320953369140625, 0.14263153076171875, 0.153167724609375, 0.16370391845703125, 0.1742401123046875, 0.18477630615234375, 0.1953125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 5.0, 9.0, 7.0, 11.0, 19.0, 15.0, 15.0, 52.0, 61.0, 88.0, 131.0, 186.0, 316.0, 599.0, 1327.0, 4716.0, 26507.0, 338088.0, 620302.0, 45796.0, 6739.0, 1751.0, 716.0, 394.0, 256.0, 148.0, 95.0, 61.0, 44.0, 31.0, 18.0, 15.0, 11.0, 6.0, 7.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.8681640625, -0.84027099609375, -0.8123779296875, -0.78448486328125, -0.756591796875, -0.72869873046875, -0.7008056640625, -0.67291259765625, -0.64501953125, -0.61712646484375, -0.5892333984375, -0.56134033203125, -0.533447265625, -0.50555419921875, -0.4776611328125, -0.44976806640625, -0.421875, -0.39398193359375, -0.3660888671875, -0.33819580078125, -0.310302734375, -0.28240966796875, -0.2545166015625, -0.22662353515625, -0.19873046875, -0.17083740234375, -0.1429443359375, -0.11505126953125, -0.087158203125, -0.05926513671875, -0.0313720703125, -0.00347900390625, 0.0244140625, 0.05230712890625, 0.0802001953125, 0.10809326171875, 0.135986328125, 0.16387939453125, 0.1917724609375, 0.21966552734375, 0.24755859375, 0.27545166015625, 0.3033447265625, 0.33123779296875, 0.359130859375, 0.38702392578125, 0.4149169921875, 0.44281005859375, 0.470703125, 0.49859619140625, 0.5264892578125, 0.55438232421875, 0.582275390625, 0.61016845703125, 0.6380615234375, 0.66595458984375, 0.69384765625, 0.72174072265625, 0.7496337890625, 0.77752685546875, 0.805419921875, 0.83331298828125, 0.8612060546875, 0.88909912109375, 0.9169921875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 6.0, 3.0, 11.0, 10.0, 13.0, 13.0, 25.0, 20.0, 17.0, 31.0, 30.0, 37.0, 44.0, 49.0, 47.0, 43.0, 45.0, 55.0, 53.0, 63.0, 44.0, 52.0, 43.0, 41.0, 27.0, 37.0, 26.0, 28.0, 18.0, 11.0, 16.0, 9.0, 9.0, 3.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.6337890625, -0.6136856079101562, -0.5935821533203125, -0.5734786987304688, -0.553375244140625, -0.5332717895507812, -0.5131683349609375, -0.49306488037109375, -0.47296142578125, -0.45285797119140625, -0.4327545166015625, -0.41265106201171875, -0.392547607421875, -0.37244415283203125, -0.3523406982421875, -0.33223724365234375, -0.3121337890625, -0.29203033447265625, -0.2719268798828125, -0.25182342529296875, -0.231719970703125, -0.21161651611328125, -0.1915130615234375, -0.17140960693359375, -0.15130615234375, -0.13120269775390625, -0.1110992431640625, -0.09099578857421875, -0.070892333984375, -0.05078887939453125, -0.0306854248046875, -0.01058197021484375, 0.009521484375, 0.02962493896484375, 0.0497283935546875, 0.06983184814453125, 0.089935302734375, 0.11003875732421875, 0.1301422119140625, 0.15024566650390625, 0.17034912109375, 0.19045257568359375, 0.2105560302734375, 0.23065948486328125, 0.250762939453125, 0.27086639404296875, 0.2909698486328125, 0.31107330322265625, 0.3311767578125, 0.35128021240234375, 0.3713836669921875, 0.39148712158203125, 0.411590576171875, 0.43169403076171875, 0.4517974853515625, 0.47190093994140625, 0.49200439453125, 0.5121078491210938, 0.5322113037109375, 0.5523147583007812, 0.572418212890625, 0.5925216674804688, 0.6126251220703125, 0.6327285766601562, 0.65283203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 11.0, 17.0, 24.0, 72.0, 129.0, 409.0, 10088.0, 1035439.0, 1914.0, 270.0, 98.0, 40.0, 20.0, 11.0, 2.0, 10.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.58203125, -2.5224151611328125, -2.462799072265625, -2.4031829833984375, -2.34356689453125, -2.2839508056640625, -2.224334716796875, -2.1647186279296875, -2.1051025390625, -2.0454864501953125, -1.985870361328125, -1.9262542724609375, -1.86663818359375, -1.8070220947265625, -1.747406005859375, -1.6877899169921875, -1.628173828125, -1.5685577392578125, -1.508941650390625, -1.4493255615234375, -1.38970947265625, -1.3300933837890625, -1.270477294921875, -1.2108612060546875, -1.1512451171875, -1.0916290283203125, -1.032012939453125, -0.9723968505859375, -0.91278076171875, -0.8531646728515625, -0.793548583984375, -0.7339324951171875, -0.67431640625, -0.6147003173828125, -0.555084228515625, -0.4954681396484375, -0.43585205078125, -0.3762359619140625, -0.316619873046875, -0.2570037841796875, -0.1973876953125, -0.1377716064453125, -0.078155517578125, -0.0185394287109375, 0.04107666015625, 0.1006927490234375, 0.160308837890625, 0.2199249267578125, 0.279541015625, 0.3391571044921875, 0.398773193359375, 0.4583892822265625, 0.51800537109375, 0.5776214599609375, 0.637237548828125, 0.6968536376953125, 0.7564697265625, 0.8160858154296875, 0.875701904296875, 0.9353179931640625, 0.99493408203125, 1.0545501708984375, 1.114166259765625, 1.1737823486328125, 1.2333984375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 12.0, 17.0, 22.0, 13.0, 23.0, 21.0, 27.0, 31.0, 38.0, 59.0, 90.0, 124.0, 136.0, 83.0, 64.0, 53.0, 35.0, 29.0, 22.0, 25.0, 16.0, 13.0, 8.0, 2.0, 7.0, 9.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-9.393692016601562e-05, -9.109638631343842e-05, -8.82558524608612e-05, -8.5415318608284e-05, -8.257478475570679e-05, -7.973425090312958e-05, -7.689371705055237e-05, -7.405318319797516e-05, -7.121264934539795e-05, -6.837211549282074e-05, -6.553158164024353e-05, -6.269104778766632e-05, -5.985051393508911e-05, -5.70099800825119e-05, -5.416944622993469e-05, -5.132891237735748e-05, -4.8488378524780273e-05, -4.5647844672203064e-05, -4.2807310819625854e-05, -3.9966776967048645e-05, -3.7126243114471436e-05, -3.4285709261894226e-05, -3.1445175409317017e-05, -2.8604641556739807e-05, -2.5764107704162598e-05, -2.2923573851585388e-05, -2.008303999900818e-05, -1.724250614643097e-05, -1.440197229385376e-05, -1.156143844127655e-05, -8.72090458869934e-06, -5.880370736122131e-06, -3.039836883544922e-06, -1.993030309677124e-07, 2.641230821609497e-06, 5.4817646741867065e-06, 8.322298526763916e-06, 1.1162832379341125e-05, 1.4003366231918335e-05, 1.6843900084495544e-05, 1.9684433937072754e-05, 2.2524967789649963e-05, 2.5365501642227173e-05, 2.8206035494804382e-05, 3.104656934738159e-05, 3.38871031999588e-05, 3.672763705253601e-05, 3.956817090511322e-05, 4.240870475769043e-05, 4.524923861026764e-05, 4.808977246284485e-05, 5.093030631542206e-05, 5.377084016799927e-05, 5.661137402057648e-05, 5.9451907873153687e-05, 6.22924417257309e-05, 6.51329755783081e-05, 6.797350943088531e-05, 7.081404328346252e-05, 7.365457713603973e-05, 7.649511098861694e-05, 7.933564484119415e-05, 8.217617869377136e-05, 8.501671254634857e-05, 8.785724639892578e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 5.0, 2.0, 1.0, 8.0, 8.0, 4.0, 7.0, 12.0, 8.0, 17.0, 22.0, 46.0, 110.0, 283.0, 649.0, 2230.0, 10693.0, 758266.0, 265745.0, 7513.0, 1853.0, 557.0, 235.0, 111.0, 58.0, 26.0, 22.0, 15.0, 15.0, 8.0, 5.0, 4.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.662109375, -0.6391983032226562, -0.6162872314453125, -0.5933761596679688, -0.570465087890625, -0.5475540161132812, -0.5246429443359375, -0.5017318725585938, -0.47882080078125, -0.45590972900390625, -0.4329986572265625, -0.41008758544921875, -0.387176513671875, -0.36426544189453125, -0.3413543701171875, -0.31844329833984375, -0.2955322265625, -0.27262115478515625, -0.2497100830078125, -0.22679901123046875, -0.203887939453125, -0.18097686767578125, -0.1580657958984375, -0.13515472412109375, -0.11224365234375, -0.08933258056640625, -0.0664215087890625, -0.04351043701171875, -0.020599365234375, 0.00231170654296875, 0.0252227783203125, 0.04813385009765625, 0.071044921875, 0.09395599365234375, 0.1168670654296875, 0.13977813720703125, 0.162689208984375, 0.18560028076171875, 0.2085113525390625, 0.23142242431640625, 0.25433349609375, 0.27724456787109375, 0.3001556396484375, 0.32306671142578125, 0.345977783203125, 0.36888885498046875, 0.3917999267578125, 0.41471099853515625, 0.4376220703125, 0.46053314208984375, 0.4834442138671875, 0.5063552856445312, 0.529266357421875, 0.5521774291992188, 0.5750885009765625, 0.5979995727539062, 0.62091064453125, 0.6438217163085938, 0.6667327880859375, 0.6896438598632812, 0.712554931640625, 0.7354660034179688, 0.7583770751953125, 0.7812881469726562, 0.80419921875]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 0.0, 3.0, 6.0, 11.0, 26.0, 35.0, 43.0, 84.0, 130.0, 203.0, 152.0, 121.0, 69.0, 47.0, 17.0, 11.0, 10.0, 5.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.404296875, -0.39067840576171875, -0.3770599365234375, -0.36344146728515625, -0.349822998046875, -0.33620452880859375, -0.3225860595703125, -0.30896759033203125, -0.29534912109375, -0.28173065185546875, -0.2681121826171875, -0.25449371337890625, -0.240875244140625, -0.22725677490234375, -0.2136383056640625, -0.20001983642578125, -0.1864013671875, -0.17278289794921875, -0.1591644287109375, -0.14554595947265625, -0.131927490234375, -0.11830902099609375, -0.1046905517578125, -0.09107208251953125, -0.07745361328125, -0.06383514404296875, -0.0502166748046875, -0.03659820556640625, -0.022979736328125, -0.00936126708984375, 0.0042572021484375, 0.01787567138671875, 0.031494140625, 0.04511260986328125, 0.0587310791015625, 0.07234954833984375, 0.085968017578125, 0.09958648681640625, 0.1132049560546875, 0.12682342529296875, 0.14044189453125, 0.15406036376953125, 0.1676788330078125, 0.18129730224609375, 0.194915771484375, 0.20853424072265625, 0.2221527099609375, 0.23577117919921875, 0.2493896484375, 0.26300811767578125, 0.2766265869140625, 0.29024505615234375, 0.303863525390625, 0.31748199462890625, 0.3311004638671875, 0.34471893310546875, 0.35833740234375, 0.37195587158203125, 0.3855743408203125, 0.39919281005859375, 0.412811279296875, 0.42642974853515625, 0.4400482177734375, 0.45366668701171875, 0.46728515625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 58.0, 887.0, 63.0, 6.0, 0.0, 0.0, 2.0], "bins": [-49.01736068725586, -48.179256439208984, -47.341156005859375, -46.5030517578125, -45.66495132446289, -44.826847076416016, -43.988746643066406, -43.15064239501953, -42.312538146972656, -41.47443389892578, -40.63633346557617, -39.7982292175293, -38.96012878417969, -38.12202453613281, -37.28392028808594, -36.44581985473633, -35.60771942138672, -34.769615173339844, -33.931514739990234, -33.09341049194336, -32.25531005859375, -31.417205810546875, -30.579103469848633, -29.74100112915039, -28.902896881103516, -28.064794540405273, -27.22669219970703, -26.388587951660156, -25.550485610961914, -24.712383270263672, -23.87428092956543, -23.036178588867188, -22.198076248168945, -21.359973907470703, -20.52187156677246, -19.68376922607422, -18.845664978027344, -18.0075626373291, -17.16946029663086, -16.331357955932617, -15.493255615234375, -14.655153274536133, -13.817049980163574, -12.978947639465332, -12.14084529876709, -11.302742004394531, -10.464639663696289, -9.626537322998047, -8.788434982299805, -7.950332164764404, -7.112229824066162, -6.274127006530762, -5.4360246658325195, -4.597921848297119, -3.7598190307617188, -2.9217166900634766, -2.083613395690918, -1.2455108165740967, -0.40740811824798584, 0.430694580078125, 1.2687971591949463, 2.1068997383117676, 2.945002555847168, 3.78310489654541, 4.6212077140808105]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 2.0, 1.0, 3.0, 11.0, 10.0, 11.0, 16.0, 18.0, 18.0, 17.0, 19.0, 24.0, 29.0, 29.0, 36.0, 23.0, 28.0, 37.0, 31.0, 31.0, 43.0, 44.0, 45.0, 41.0, 42.0, 34.0, 41.0, 35.0, 40.0, 34.0, 35.0, 30.0, 18.0, 18.0, 16.0, 14.0, 15.0, 14.0, 7.0, 12.0, 6.0, 4.0, 4.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0], "bins": [-3.4280717372894287, -3.323141098022461, -3.218210458755493, -3.1132798194885254, -3.0083491802215576, -2.90341854095459, -2.798487663269043, -2.6935572624206543, -2.5886263847351074, -2.4836957454681396, -2.378765106201172, -2.273834466934204, -2.1689038276672363, -2.0639731884002686, -1.9590424299240112, -1.8541117906570435, -1.7491812705993652, -1.6442506313323975, -1.5393199920654297, -1.434389352798462, -1.3294587135314941, -1.2245280742645264, -1.119597315788269, -1.0146666765213013, -0.9097360372543335, -0.8048053979873657, -0.699874758720398, -0.5949440598487854, -0.4900134205818176, -0.38508278131484985, -0.2801520824432373, -0.17522144317626953, -0.07029104232788086, 0.03463961184024811, 0.13957026600837708, 0.24450093507766724, 0.349431574344635, 0.4543622136116028, 0.5592929124832153, 0.6642235517501831, 0.7691541910171509, 0.8740848302841187, 0.9790154695510864, 1.0839462280273438, 1.1888768672943115, 1.2938075065612793, 1.398738145828247, 1.5036687850952148, 1.6085994243621826, 1.7135300636291504, 1.8184607028961182, 1.923391342163086, 2.0283219814300537, 2.1332526206970215, 2.2381834983825684, 2.343113899230957, 2.448044776916504, 2.5529754161834717, 2.6579060554504395, 2.7628366947174072, 2.867767333984375, 2.9726979732513428, 3.0776286125183105, 3.1825594902038574, 3.287489891052246]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 3.0, 5.0, 1.0, 2.0, 7.0, 10.0, 10.0, 5.0, 22.0, 25.0, 48.0, 36.0, 54.0, 109.0, 183.0, 391.0, 777.0, 2353.0, 17214.0, 4134906.0, 34503.0, 2482.0, 669.0, 248.0, 111.0, 42.0, 15.0, 15.0, 6.0, 6.0, 8.0, 5.0, 7.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-3.55078125, -3.4729156494140625, -3.395050048828125, -3.3171844482421875, -3.23931884765625, -3.1614532470703125, -3.083587646484375, -3.0057220458984375, -2.9278564453125, -2.8499908447265625, -2.772125244140625, -2.6942596435546875, -2.61639404296875, -2.5385284423828125, -2.460662841796875, -2.3827972412109375, -2.304931640625, -2.2270660400390625, -2.149200439453125, -2.0713348388671875, -1.99346923828125, -1.9156036376953125, -1.837738037109375, -1.7598724365234375, -1.6820068359375, -1.6041412353515625, -1.526275634765625, -1.4484100341796875, -1.37054443359375, -1.2926788330078125, -1.214813232421875, -1.1369476318359375, -1.05908203125, -0.9812164306640625, -0.903350830078125, -0.8254852294921875, -0.74761962890625, -0.6697540283203125, -0.591888427734375, -0.5140228271484375, -0.4361572265625, -0.3582916259765625, -0.280426025390625, -0.2025604248046875, -0.12469482421875, -0.0468292236328125, 0.031036376953125, 0.1089019775390625, 0.186767578125, 0.2646331787109375, 0.342498779296875, 0.4203643798828125, 0.49822998046875, 0.5760955810546875, 0.653961181640625, 0.7318267822265625, 0.8096923828125, 0.8875579833984375, 0.965423583984375, 1.0432891845703125, 1.12115478515625, 1.1990203857421875, 1.276885986328125, 1.3547515869140625, 1.4326171875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 9.0, 23.0, 27.0, 84.0, 149.0, 226.0, 215.0, 135.0, 74.0, 34.0, 13.0, 8.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50146484375, -0.4902801513671875, -0.479095458984375, -0.4679107666015625, -0.45672607421875, -0.4455413818359375, -0.434356689453125, -0.4231719970703125, -0.4119873046875, -0.4008026123046875, -0.389617919921875, -0.3784332275390625, -0.36724853515625, -0.3560638427734375, -0.344879150390625, -0.3336944580078125, -0.322509765625, -0.3113250732421875, -0.300140380859375, -0.2889556884765625, -0.27777099609375, -0.2665863037109375, -0.255401611328125, -0.2442169189453125, -0.2330322265625, -0.2218475341796875, -0.210662841796875, -0.1994781494140625, -0.18829345703125, -0.1771087646484375, -0.165924072265625, -0.1547393798828125, -0.1435546875, -0.1323699951171875, -0.121185302734375, -0.1100006103515625, -0.09881591796875, -0.0876312255859375, -0.076446533203125, -0.0652618408203125, -0.0540771484375, -0.0428924560546875, -0.031707763671875, -0.0205230712890625, -0.00933837890625, 0.0018463134765625, 0.013031005859375, 0.0242156982421875, 0.035400390625, 0.0465850830078125, 0.057769775390625, 0.0689544677734375, 0.08013916015625, 0.0913238525390625, 0.102508544921875, 0.1136932373046875, 0.1248779296875, 0.1360626220703125, 0.147247314453125, 0.1584320068359375, 0.16961669921875, 0.1808013916015625, 0.191986083984375, 0.2031707763671875, 0.21435546875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 5.0, 5.0, 3.0, 5.0, 12.0, 10.0, 17.0, 16.0, 29.0, 59.0, 77.0, 181.0, 352.0, 787.0, 2040.0, 8647.0, 127848.0, 4011417.0, 35306.0, 4747.0, 1413.0, 586.0, 285.0, 156.0, 86.0, 54.0, 35.0, 32.0, 17.0, 13.0, 12.0, 8.0, 4.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.86181640625, -0.8302688598632812, -0.7987213134765625, -0.7671737670898438, -0.735626220703125, -0.7040786743164062, -0.6725311279296875, -0.6409835815429688, -0.60943603515625, -0.5778884887695312, -0.5463409423828125, -0.5147933959960938, -0.483245849609375, -0.45169830322265625, -0.4201507568359375, -0.38860321044921875, -0.3570556640625, -0.32550811767578125, -0.2939605712890625, -0.26241302490234375, -0.230865478515625, -0.19931793212890625, -0.1677703857421875, -0.13622283935546875, -0.10467529296875, -0.07312774658203125, -0.0415802001953125, -0.01003265380859375, 0.021514892578125, 0.05306243896484375, 0.0846099853515625, 0.11615753173828125, 0.147705078125, 0.17925262451171875, 0.2108001708984375, 0.24234771728515625, 0.273895263671875, 0.30544281005859375, 0.3369903564453125, 0.36853790283203125, 0.40008544921875, 0.43163299560546875, 0.4631805419921875, 0.49472808837890625, 0.526275634765625, 0.5578231811523438, 0.5893707275390625, 0.6209182739257812, 0.6524658203125, 0.6840133666992188, 0.7155609130859375, 0.7471084594726562, 0.778656005859375, 0.8102035522460938, 0.8417510986328125, 0.8732986450195312, 0.90484619140625, 0.9363937377929688, 0.9679412841796875, 0.9994888305664062, 1.031036376953125, 1.0625839233398438, 1.0941314697265625, 1.1256790161132812, 1.1572265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 5.0, 6.0, 14.0, 22.0, 45.0, 64.0, 153.0, 681.0, 2434.0, 425.0, 103.0, 45.0, 34.0, 14.0, 9.0, 7.0, 5.0, 8.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2320556640625, -0.22209739685058594, -0.21213912963867188, -0.2021808624267578, -0.19222259521484375, -0.1822643280029297, -0.17230606079101562, -0.16234779357910156, -0.1523895263671875, -0.14243125915527344, -0.13247299194335938, -0.12251472473144531, -0.11255645751953125, -0.10259819030761719, -0.09263992309570312, -0.08268165588378906, -0.072723388671875, -0.06276512145996094, -0.052806854248046875, -0.04284858703613281, -0.03289031982421875, -0.022932052612304688, -0.012973785400390625, -0.0030155181884765625, 0.0069427490234375, 0.016901016235351562, 0.026859283447265625, 0.03681755065917969, 0.04677581787109375, 0.05673408508300781, 0.06669235229492188, 0.07665061950683594, 0.08660888671875, 0.09656715393066406, 0.10652542114257812, 0.11648368835449219, 0.12644195556640625, 0.1364002227783203, 0.14635848999023438, 0.15631675720214844, 0.1662750244140625, 0.17623329162597656, 0.18619155883789062, 0.1961498260498047, 0.20610809326171875, 0.2160663604736328, 0.22602462768554688, 0.23598289489746094, 0.245941162109375, 0.25589942932128906, 0.2658576965332031, 0.2758159637451172, 0.28577423095703125, 0.2957324981689453, 0.3056907653808594, 0.31564903259277344, 0.3256072998046875, 0.33556556701660156, 0.3455238342285156, 0.3554821014404297, 0.36544036865234375, 0.3753986358642578, 0.3853569030761719, 0.39531517028808594, 0.4052734375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 13.0, 24.0, 43.0, 91.0, 164.0, 253.0, 201.0, 87.0, 59.0, 28.0, 14.0, 9.0, 6.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0305263996124268, -1.0068774223327637, -0.9832285642623901, -0.9595796465873718, -0.9359307289123535, -0.9122818112373352, -0.8886328935623169, -0.8649839758872986, -0.8413350582122803, -0.817686140537262, -0.7940372228622437, -0.7703883051872253, -0.746739387512207, -0.7230904698371887, -0.6994415521621704, -0.6757926344871521, -0.6521437168121338, -0.6284947991371155, -0.6048458814620972, -0.5811969637870789, -0.5575480461120605, -0.5338991284370422, -0.5102502107620239, -0.4866012930870056, -0.4629523754119873, -0.439303457736969, -0.4156545400619507, -0.3920056223869324, -0.36835670471191406, -0.34470778703689575, -0.32105886936187744, -0.29740995168685913, -0.2737610340118408, -0.2501121163368225, -0.2264631986618042, -0.2028142809867859, -0.17916536331176758, -0.15551644563674927, -0.13186752796173096, -0.10821861028671265, -0.08456969261169434, -0.060920774936676025, -0.037271857261657715, -0.013622939586639404, 0.010025978088378906, 0.03367489576339722, 0.05732381343841553, 0.08097273111343384, 0.10462164878845215, 0.12827056646347046, 0.15191948413848877, 0.17556840181350708, 0.1992173194885254, 0.2228662371635437, 0.246515154838562, 0.2701640725135803, 0.29381299018859863, 0.31746190786361694, 0.34111082553863525, 0.36475974321365356, 0.3884086608886719, 0.4120575785636902, 0.4357064962387085, 0.4593554139137268, 0.4830043315887451]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 8.0, 8.0, 16.0, 11.0, 22.0, 27.0, 39.0, 42.0, 38.0, 63.0, 52.0, 71.0, 70.0, 62.0, 56.0, 60.0, 52.0, 68.0, 58.0, 42.0, 38.0, 16.0, 18.0, 20.0, 15.0, 12.0, 2.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.7511234283447266, -0.7293632626533508, -0.7076030373573303, -0.6858428716659546, -0.6640826463699341, -0.6423224806785583, -0.6205623149871826, -0.5988020896911621, -0.5770419239997864, -0.5552817583084106, -0.5335215330123901, -0.5117613673210144, -0.4900011718273163, -0.46824097633361816, -0.44648078083992004, -0.4247205853462219, -0.4029603898525238, -0.3812001943588257, -0.35943999886512756, -0.33767980337142944, -0.3159196376800537, -0.2941594421863556, -0.27239924669265747, -0.25063908100128174, -0.22887887060642242, -0.2071186751127243, -0.18535849452018738, -0.16359829902648926, -0.14183810353279114, -0.12007792294025421, -0.09831772744655609, -0.07655754685401917, -0.054797351360321045, -0.03303716331720352, -0.0112769715487957, 0.010483220219612122, 0.032243408262729645, 0.05400359630584717, 0.07576379179954529, 0.09752397239208221, 0.11928416788578033, 0.14104436337947845, 0.16280454397201538, 0.1845647394657135, 0.20632493495941162, 0.22808511555194855, 0.24984531104564667, 0.2716054916381836, 0.2933656871318817, 0.31512588262557983, 0.33688607811927795, 0.3586462736129761, 0.3804064393043518, 0.4021666347980499, 0.42392683029174805, 0.4456869959831238, 0.4674472212791443, 0.4892074167728424, 0.5109676122665405, 0.5327277779579163, 0.5544880032539368, 0.5762481689453125, 0.598008394241333, 0.6197685599327087, 0.6415287256240845]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 6.0, 6.0, 7.0, 8.0, 13.0, 16.0, 14.0, 29.0, 39.0, 61.0, 82.0, 144.0, 267.0, 452.0, 990.0, 2726.0, 15503.0, 648713.0, 363978.0, 11191.0, 2265.0, 896.0, 471.0, 212.0, 160.0, 108.0, 60.0, 43.0, 35.0, 11.0, 12.0, 9.0, 7.0, 13.0, 4.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.994140625, -0.95977783203125, -0.9254150390625, -0.89105224609375, -0.856689453125, -0.82232666015625, -0.7879638671875, -0.75360107421875, -0.71923828125, -0.68487548828125, -0.6505126953125, -0.61614990234375, -0.581787109375, -0.54742431640625, -0.5130615234375, -0.47869873046875, -0.4443359375, -0.40997314453125, -0.3756103515625, -0.34124755859375, -0.306884765625, -0.27252197265625, -0.2381591796875, -0.20379638671875, -0.16943359375, -0.13507080078125, -0.1007080078125, -0.06634521484375, -0.031982421875, 0.00238037109375, 0.0367431640625, 0.07110595703125, 0.10546875, 0.13983154296875, 0.1741943359375, 0.20855712890625, 0.242919921875, 0.27728271484375, 0.3116455078125, 0.34600830078125, 0.38037109375, 0.41473388671875, 0.4490966796875, 0.48345947265625, 0.517822265625, 0.55218505859375, 0.5865478515625, 0.62091064453125, 0.6552734375, 0.68963623046875, 0.7239990234375, 0.75836181640625, 0.792724609375, 0.82708740234375, 0.8614501953125, 0.89581298828125, 0.93017578125, 0.96453857421875, 0.9989013671875, 1.03326416015625, 1.067626953125, 1.10198974609375, 1.1363525390625, 1.17071533203125, 1.205078125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 2.0, 5.0, 12.0, 21.0, 50.0, 92.0, 174.0, 255.0, 193.0, 98.0, 63.0, 23.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.498779296875, -0.4878120422363281, -0.47684478759765625, -0.4658775329589844, -0.4549102783203125, -0.4439430236816406, -0.43297576904296875, -0.4220085144042969, -0.411041259765625, -0.4000740051269531, -0.38910675048828125, -0.3781394958496094, -0.3671722412109375, -0.3562049865722656, -0.34523773193359375, -0.3342704772949219, -0.32330322265625, -0.3123359680175781, -0.30136871337890625, -0.2904014587402344, -0.2794342041015625, -0.2684669494628906, -0.25749969482421875, -0.24653244018554688, -0.235565185546875, -0.22459793090820312, -0.21363067626953125, -0.20266342163085938, -0.1916961669921875, -0.18072891235351562, -0.16976165771484375, -0.15879440307617188, -0.1478271484375, -0.13685989379882812, -0.12589263916015625, -0.11492538452148438, -0.1039581298828125, -0.09299087524414062, -0.08202362060546875, -0.07105636596679688, -0.060089111328125, -0.049121856689453125, -0.03815460205078125, -0.027187347412109375, -0.0162200927734375, -0.005252838134765625, 0.00571441650390625, 0.016681671142578125, 0.02764892578125, 0.038616180419921875, 0.04958343505859375, 0.060550689697265625, 0.0715179443359375, 0.08248519897460938, 0.09345245361328125, 0.10441970825195312, 0.115386962890625, 0.12635421752929688, 0.13732147216796875, 0.14828872680664062, 0.1592559814453125, 0.17022323608398438, 0.18119049072265625, 0.19215774536132812, 0.203125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 11.0, 13.0, 17.0, 18.0, 18.0, 31.0, 48.0, 56.0, 82.0, 106.0, 174.0, 286.0, 465.0, 1145.0, 3687.0, 15613.0, 90810.0, 674176.0, 222113.0, 30144.0, 6320.0, 1704.0, 623.0, 300.0, 170.0, 113.0, 63.0, 55.0, 48.0, 29.0, 21.0, 17.0, 11.0, 18.0, 8.0, 7.0, 4.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.607421875, -0.5869674682617188, -0.5665130615234375, -0.5460586547851562, -0.525604248046875, -0.5051498413085938, -0.4846954345703125, -0.46424102783203125, -0.44378662109375, -0.42333221435546875, -0.4028778076171875, -0.38242340087890625, -0.361968994140625, -0.34151458740234375, -0.3210601806640625, -0.30060577392578125, -0.2801513671875, -0.25969696044921875, -0.2392425537109375, -0.21878814697265625, -0.198333740234375, -0.17787933349609375, -0.1574249267578125, -0.13697052001953125, -0.11651611328125, -0.09606170654296875, -0.0756072998046875, -0.05515289306640625, -0.034698486328125, -0.01424407958984375, 0.0062103271484375, 0.02666473388671875, 0.047119140625, 0.06757354736328125, 0.0880279541015625, 0.10848236083984375, 0.128936767578125, 0.14939117431640625, 0.1698455810546875, 0.19029998779296875, 0.21075439453125, 0.23120880126953125, 0.2516632080078125, 0.27211761474609375, 0.292572021484375, 0.31302642822265625, 0.3334808349609375, 0.35393524169921875, 0.3743896484375, 0.39484405517578125, 0.4152984619140625, 0.43575286865234375, 0.456207275390625, 0.47666168212890625, 0.4971160888671875, 0.5175704956054688, 0.53802490234375, 0.5584793090820312, 0.5789337158203125, 0.5993881225585938, 0.619842529296875, 0.6402969360351562, 0.6607513427734375, 0.6812057495117188, 0.70166015625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 8.0, 5.0, 7.0, 5.0, 5.0, 5.0, 10.0, 18.0, 11.0, 15.0, 18.0, 29.0, 25.0, 21.0, 28.0, 38.0, 40.0, 41.0, 41.0, 53.0, 56.0, 42.0, 56.0, 45.0, 37.0, 45.0, 45.0, 47.0, 31.0, 23.0, 33.0, 18.0, 14.0, 19.0, 11.0, 15.0, 12.0, 6.0, 9.0, 9.0, 2.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50390625, -0.48404693603515625, -0.4641876220703125, -0.44432830810546875, -0.424468994140625, -0.40460968017578125, -0.3847503662109375, -0.36489105224609375, -0.34503173828125, -0.32517242431640625, -0.3053131103515625, -0.28545379638671875, -0.265594482421875, -0.24573516845703125, -0.2258758544921875, -0.20601654052734375, -0.1861572265625, -0.16629791259765625, -0.1464385986328125, -0.12657928466796875, -0.106719970703125, -0.08686065673828125, -0.0670013427734375, -0.04714202880859375, -0.02728271484375, -0.00742340087890625, 0.0124359130859375, 0.03229522705078125, 0.052154541015625, 0.07201385498046875, 0.0918731689453125, 0.11173248291015625, 0.131591796875, 0.15145111083984375, 0.1713104248046875, 0.19116973876953125, 0.211029052734375, 0.23088836669921875, 0.2507476806640625, 0.27060699462890625, 0.29046630859375, 0.31032562255859375, 0.3301849365234375, 0.35004425048828125, 0.369903564453125, 0.38976287841796875, 0.4096221923828125, 0.42948150634765625, 0.4493408203125, 0.46920013427734375, 0.4890594482421875, 0.5089187622070312, 0.528778076171875, 0.5486373901367188, 0.5684967041015625, 0.5883560180664062, 0.60821533203125, 0.6280746459960938, 0.6479339599609375, 0.6677932739257812, 0.687652587890625, 0.7075119018554688, 0.7273712158203125, 0.7472305297851562, 0.76708984375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 3.0, 3.0, 9.0, 12.0, 24.0, 49.0, 77.0, 198.0, 542.0, 2870.0, 145013.0, 892397.0, 6028.0, 825.0, 263.0, 122.0, 43.0, 26.0, 20.0, 10.0, 5.0, 6.0, 3.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62646484375, -0.6100425720214844, -0.5936203002929688, -0.5771980285644531, -0.5607757568359375, -0.5443534851074219, -0.5279312133789062, -0.5115089416503906, -0.495086669921875, -0.4786643981933594, -0.46224212646484375, -0.4458198547363281, -0.4293975830078125, -0.4129753112792969, -0.39655303955078125, -0.3801307678222656, -0.36370849609375, -0.3472862243652344, -0.33086395263671875, -0.3144416809082031, -0.2980194091796875, -0.2815971374511719, -0.26517486572265625, -0.24875259399414062, -0.232330322265625, -0.21590805053710938, -0.19948577880859375, -0.18306350708007812, -0.1666412353515625, -0.15021896362304688, -0.13379669189453125, -0.11737442016601562, -0.1009521484375, -0.08452987670898438, -0.06810760498046875, -0.051685333251953125, -0.0352630615234375, -0.018840789794921875, -0.00241851806640625, 0.014003753662109375, 0.030426025390625, 0.046848297119140625, 0.06327056884765625, 0.07969284057617188, 0.0961151123046875, 0.11253738403320312, 0.12895965576171875, 0.14538192749023438, 0.16180419921875, 0.17822647094726562, 0.19464874267578125, 0.21107101440429688, 0.2274932861328125, 0.24391555786132812, 0.26033782958984375, 0.2767601013183594, 0.293182373046875, 0.3096046447753906, 0.32602691650390625, 0.3424491882324219, 0.3588714599609375, 0.3752937316894531, 0.39171600341796875, 0.4081382751464844, 0.424560546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 13.0, 7.0, 12.0, 27.0, 35.0, 44.0, 62.0, 108.0, 171.0, 170.0, 122.0, 80.0, 45.0, 31.0, 23.0, 15.0, 14.0, 10.0, 8.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00015044212341308594, -0.0001461505889892578, -0.0001418590545654297, -0.00013756752014160156, -0.00013327598571777344, -0.0001289844512939453, -0.0001246929168701172, -0.00012040138244628906, -0.00011610984802246094, -0.00011181831359863281, -0.00010752677917480469, -0.00010323524475097656, -9.894371032714844e-05, -9.465217590332031e-05, -9.036064147949219e-05, -8.606910705566406e-05, -8.177757263183594e-05, -7.748603820800781e-05, -7.319450378417969e-05, -6.890296936035156e-05, -6.461143493652344e-05, -6.031990051269531e-05, -5.602836608886719e-05, -5.173683166503906e-05, -4.744529724121094e-05, -4.315376281738281e-05, -3.886222839355469e-05, -3.457069396972656e-05, -3.0279159545898438e-05, -2.5987625122070312e-05, -2.1696090698242188e-05, -1.7404556274414062e-05, -1.3113021850585938e-05, -8.821487426757812e-06, -4.5299530029296875e-06, -2.384185791015625e-07, 4.0531158447265625e-06, 8.344650268554688e-06, 1.2636184692382812e-05, 1.6927719116210938e-05, 2.1219253540039062e-05, 2.5510787963867188e-05, 2.9802322387695312e-05, 3.409385681152344e-05, 3.838539123535156e-05, 4.267692565917969e-05, 4.696846008300781e-05, 5.125999450683594e-05, 5.555152893066406e-05, 5.984306335449219e-05, 6.413459777832031e-05, 6.842613220214844e-05, 7.271766662597656e-05, 7.700920104980469e-05, 8.130073547363281e-05, 8.559226989746094e-05, 8.988380432128906e-05, 9.417533874511719e-05, 9.846687316894531e-05, 0.00010275840759277344, 0.00010704994201660156, 0.00011134147644042969, 0.00011563301086425781, 0.00011992454528808594, 0.00012421607971191406]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 5.0, 5.0, 9.0, 11.0, 9.0, 11.0, 23.0, 42.0, 56.0, 86.0, 168.0, 342.0, 679.0, 1403.0, 3082.0, 10103.0, 122002.0, 865796.0, 34430.0, 6081.0, 2191.0, 948.0, 459.0, 241.0, 124.0, 77.0, 61.0, 27.0, 14.0, 8.0, 13.0, 6.0, 2.0, 6.0, 5.0, 7.0, 4.0, 5.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.3427734375, -0.3330650329589844, -0.32335662841796875, -0.3136482238769531, -0.3039398193359375, -0.2942314147949219, -0.28452301025390625, -0.2748146057128906, -0.265106201171875, -0.2553977966308594, -0.24568939208984375, -0.23598098754882812, -0.2262725830078125, -0.21656417846679688, -0.20685577392578125, -0.19714736938476562, -0.18743896484375, -0.17773056030273438, -0.16802215576171875, -0.15831375122070312, -0.1486053466796875, -0.13889694213867188, -0.12918853759765625, -0.11948013305664062, -0.109771728515625, -0.10006332397460938, -0.09035491943359375, -0.08064651489257812, -0.0709381103515625, -0.061229705810546875, -0.05152130126953125, -0.041812896728515625, -0.0321044921875, -0.022396087646484375, -0.01268768310546875, -0.002979278564453125, 0.0067291259765625, 0.016437530517578125, 0.02614593505859375, 0.035854339599609375, 0.045562744140625, 0.055271148681640625, 0.06497955322265625, 0.07468795776367188, 0.0843963623046875, 0.09410476684570312, 0.10381317138671875, 0.11352157592773438, 0.12322998046875, 0.13293838500976562, 0.14264678955078125, 0.15235519409179688, 0.1620635986328125, 0.17177200317382812, 0.18148040771484375, 0.19118881225585938, 0.200897216796875, 0.21060562133789062, 0.22031402587890625, 0.23002243041992188, 0.2397308349609375, 0.24943923950195312, 0.25914764404296875, 0.2688560485839844, 0.278564453125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 2.0, 6.0, 7.0, 12.0, 27.0, 35.0, 61.0, 93.0, 188.0, 232.0, 145.0, 77.0, 38.0, 21.0, 11.0, 12.0, 7.0, 3.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42236328125, -0.41040802001953125, -0.3984527587890625, -0.38649749755859375, -0.374542236328125, -0.36258697509765625, -0.3506317138671875, -0.33867645263671875, -0.32672119140625, -0.31476593017578125, -0.3028106689453125, -0.29085540771484375, -0.278900146484375, -0.26694488525390625, -0.2549896240234375, -0.24303436279296875, -0.2310791015625, -0.21912384033203125, -0.2071685791015625, -0.19521331787109375, -0.183258056640625, -0.17130279541015625, -0.1593475341796875, -0.14739227294921875, -0.13543701171875, -0.12348175048828125, -0.1115264892578125, -0.09957122802734375, -0.087615966796875, -0.07566070556640625, -0.0637054443359375, -0.05175018310546875, -0.039794921875, -0.02783966064453125, -0.0158843994140625, -0.00392913818359375, 0.008026123046875, 0.01998138427734375, 0.0319366455078125, 0.04389190673828125, 0.05584716796875, 0.06780242919921875, 0.0797576904296875, 0.09171295166015625, 0.103668212890625, 0.11562347412109375, 0.1275787353515625, 0.13953399658203125, 0.1514892578125, 0.16344451904296875, 0.1753997802734375, 0.18735504150390625, 0.199310302734375, 0.21126556396484375, 0.2232208251953125, 0.23517608642578125, 0.24713134765625, 0.25908660888671875, 0.2710418701171875, 0.28299713134765625, 0.294952392578125, 0.30690765380859375, 0.3188629150390625, 0.33081817626953125, 0.3427734375]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 7.0, 20.0, 42.0, 189.0, 462.0, 207.0, 57.0, 12.0, 9.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.559015274047852, -8.311469078063965, -8.063922882080078, -7.816376686096191, -7.568830966949463, -7.321284770965576, -7.0737385749816895, -6.826192378997803, -6.578646659851074, -6.3311004638671875, -6.083554267883301, -5.836008071899414, -5.5884623527526855, -5.340916156768799, -5.093369960784912, -4.845823764801025, -4.598277568817139, -4.350731372833252, -4.103185176849365, -3.8556392192840576, -3.60809326171875, -3.3605470657348633, -3.1130008697509766, -2.86545467376709, -2.6179087162017822, -2.3703625202178955, -2.122816562652588, -1.8752703666687012, -1.627724289894104, -1.3801782131195068, -1.1326320171356201, -0.885085940361023, -0.637540340423584, -0.38999423384666443, -0.14244812726974487, 0.10509800910949707, 0.35264408588409424, 0.6001901626586914, 0.8477363586425781, 1.0952824354171753, 1.3428285121917725, 1.5903745889663696, 1.8379206657409668, 2.0854668617248535, 2.3330130577087402, 2.580559015274048, 2.8281052112579346, 3.075651168823242, 3.323197364807129, 3.5707435607910156, 3.8182895183563232, 4.065835952758789, 4.313381671905518, 4.560927867889404, 4.808474063873291, 5.056020259857178, 5.303565979003906, 5.551112174987793, 5.79865837097168, 6.046204566955566, 6.293750286102295, 6.541296482086182, 6.788842678070068, 7.036388874053955, 7.283935070037842]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 5.0, 3.0, 11.0, 15.0, 11.0, 18.0, 20.0, 30.0, 29.0, 46.0, 46.0, 42.0, 44.0, 41.0, 53.0, 47.0, 47.0, 60.0, 40.0, 48.0, 49.0, 56.0, 41.0, 33.0, 30.0, 30.0, 24.0, 17.0, 13.0, 15.0, 9.0, 6.0, 5.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.446514129638672, -4.315009117126465, -4.183504581451416, -4.052000045776367, -3.92049503326416, -3.7889902591705322, -3.6574854850769043, -3.5259807109832764, -3.3944759368896484, -3.2629711627960205, -3.1314663887023926, -2.9999616146087646, -2.8684568405151367, -2.736952066421509, -2.605447292327881, -2.473942518234253, -2.342437744140625, -2.210932970046997, -2.079428195953369, -1.9479234218597412, -1.8164186477661133, -1.6849138736724854, -1.5534090995788574, -1.4219043254852295, -1.2903995513916016, -1.1588947772979736, -1.0273900032043457, -0.8958852291107178, -0.7643804550170898, -0.6328756809234619, -0.501370906829834, -0.36986613273620605, -0.23836088180541992, -0.10685610771179199, 0.024648666381835938, 0.15615344047546387, 0.2876582145690918, 0.4191629886627197, 0.5506677627563477, 0.6821725368499756, 0.8136773109436035, 0.9451820850372314, 1.0766868591308594, 1.2081916332244873, 1.3396964073181152, 1.4712011814117432, 1.602705955505371, 1.734210729598999, 1.865715503692627, 1.9972202777862549, 2.128725051879883, 2.2602298259735107, 2.3917346000671387, 2.5232393741607666, 2.6547441482543945, 2.7862489223480225, 2.9177536964416504, 3.0492584705352783, 3.1807632446289062, 3.312268018722534, 3.443772792816162, 3.57527756690979, 3.706782341003418, 3.838287115097046, 3.969791889190674]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 1.0, 2.0, 4.0, 4.0, 15.0, 24.0, 27.0, 55.0, 122.0, 273.0, 779.0, 6936.0, 4167458.0, 17432.0, 818.0, 192.0, 84.0, 34.0, 15.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.392578125, -3.3182220458984375, -3.243865966796875, -3.1695098876953125, -3.09515380859375, -3.0207977294921875, -2.946441650390625, -2.8720855712890625, -2.7977294921875, -2.7233734130859375, -2.649017333984375, -2.5746612548828125, -2.50030517578125, -2.4259490966796875, -2.351593017578125, -2.2772369384765625, -2.202880859375, -2.1285247802734375, -2.054168701171875, -1.9798126220703125, -1.90545654296875, -1.8311004638671875, -1.756744384765625, -1.6823883056640625, -1.6080322265625, -1.5336761474609375, -1.459320068359375, -1.3849639892578125, -1.31060791015625, -1.2362518310546875, -1.161895751953125, -1.0875396728515625, -1.01318359375, -0.9388275146484375, -0.864471435546875, -0.7901153564453125, -0.71575927734375, -0.6414031982421875, -0.567047119140625, -0.4926910400390625, -0.4183349609375, -0.3439788818359375, -0.269622802734375, -0.1952667236328125, -0.12091064453125, -0.0465545654296875, 0.027801513671875, 0.1021575927734375, 0.176513671875, 0.2508697509765625, 0.325225830078125, 0.3995819091796875, 0.47393798828125, 0.5482940673828125, 0.622650146484375, 0.6970062255859375, 0.7713623046875, 0.8457183837890625, 0.920074462890625, 0.9944305419921875, 1.06878662109375, 1.1431427001953125, 1.217498779296875, 1.2918548583984375, 1.3662109375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 14.0, 10.0, 41.0, 76.0, 103.0, 182.0, 199.0, 151.0, 108.0, 68.0, 25.0, 11.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.470703125, -0.4600658416748047, -0.4494285583496094, -0.43879127502441406, -0.42815399169921875, -0.41751670837402344, -0.4068794250488281, -0.3962421417236328, -0.3856048583984375, -0.3749675750732422, -0.3643302917480469, -0.35369300842285156, -0.34305572509765625, -0.33241844177246094, -0.3217811584472656, -0.3111438751220703, -0.300506591796875, -0.2898693084716797, -0.2792320251464844, -0.26859474182128906, -0.25795745849609375, -0.24732017517089844, -0.23668289184570312, -0.2260456085205078, -0.2154083251953125, -0.2047710418701172, -0.19413375854492188, -0.18349647521972656, -0.17285919189453125, -0.16222190856933594, -0.15158462524414062, -0.1409473419189453, -0.13031005859375, -0.11967277526855469, -0.10903549194335938, -0.09839820861816406, -0.08776092529296875, -0.07712364196777344, -0.06648635864257812, -0.05584907531738281, -0.0452117919921875, -0.03457450866699219, -0.023937225341796875, -0.013299942016601562, -0.00266265869140625, 0.007974624633789062, 0.018611907958984375, 0.029249191284179688, 0.039886474609375, 0.05052375793457031, 0.061161041259765625, 0.07179832458496094, 0.08243560791015625, 0.09307289123535156, 0.10371017456054688, 0.11434745788574219, 0.1249847412109375, 0.1356220245361328, 0.14625930786132812, 0.15689659118652344, 0.16753387451171875, 0.17817115783691406, 0.18880844116210938, 0.1994457244873047, 0.2100830078125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 5.0, 14.0, 24.0, 33.0, 57.0, 91.0, 204.0, 553.0, 2350.0, 17534.0, 3906976.0, 256151.0, 7929.0, 1413.0, 442.0, 188.0, 97.0, 69.0, 49.0, 33.0, 18.0, 21.0, 8.0, 8.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.61669921875, -0.5918655395507812, -0.5670318603515625, -0.5421981811523438, -0.517364501953125, -0.49253082275390625, -0.4676971435546875, -0.44286346435546875, -0.41802978515625, -0.39319610595703125, -0.3683624267578125, -0.34352874755859375, -0.318695068359375, -0.29386138916015625, -0.2690277099609375, -0.24419403076171875, -0.2193603515625, -0.19452667236328125, -0.1696929931640625, -0.14485931396484375, -0.120025634765625, -0.09519195556640625, -0.0703582763671875, -0.04552459716796875, -0.02069091796875, 0.00414276123046875, 0.0289764404296875, 0.05381011962890625, 0.078643798828125, 0.10347747802734375, 0.1283111572265625, 0.15314483642578125, 0.177978515625, 0.20281219482421875, 0.2276458740234375, 0.25247955322265625, 0.277313232421875, 0.30214691162109375, 0.3269805908203125, 0.35181427001953125, 0.37664794921875, 0.40148162841796875, 0.4263153076171875, 0.45114898681640625, 0.475982666015625, 0.5008163452148438, 0.5256500244140625, 0.5504837036132812, 0.5753173828125, 0.6001510620117188, 0.6249847412109375, 0.6498184204101562, 0.674652099609375, 0.6994857788085938, 0.7243194580078125, 0.7491531372070312, 0.77398681640625, 0.7988204956054688, 0.8236541748046875, 0.8484878540039062, 0.873321533203125, 0.8981552124023438, 0.9229888916015625, 0.9478225708007812, 0.97265625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 13.0, 19.0, 20.0, 54.0, 118.0, 412.0, 2547.0, 621.0, 147.0, 48.0, 21.0, 18.0, 13.0, 6.0, 6.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12939453125, -0.12242889404296875, -0.1154632568359375, -0.10849761962890625, -0.101531982421875, -0.09456634521484375, -0.0876007080078125, -0.08063507080078125, -0.07366943359375, -0.06670379638671875, -0.0597381591796875, -0.05277252197265625, -0.045806884765625, -0.03884124755859375, -0.0318756103515625, -0.02490997314453125, -0.0179443359375, -0.01097869873046875, -0.0040130615234375, 0.00295257568359375, 0.009918212890625, 0.01688385009765625, 0.0238494873046875, 0.03081512451171875, 0.03778076171875, 0.04474639892578125, 0.0517120361328125, 0.05867767333984375, 0.065643310546875, 0.07260894775390625, 0.0795745849609375, 0.08654022216796875, 0.093505859375, 0.10047149658203125, 0.1074371337890625, 0.11440277099609375, 0.121368408203125, 0.12833404541015625, 0.1352996826171875, 0.14226531982421875, 0.14923095703125, 0.15619659423828125, 0.1631622314453125, 0.17012786865234375, 0.177093505859375, 0.18405914306640625, 0.1910247802734375, 0.19799041748046875, 0.2049560546875, 0.21192169189453125, 0.2188873291015625, 0.22585296630859375, 0.232818603515625, 0.23978424072265625, 0.2467498779296875, 0.25371551513671875, 0.26068115234375, 0.26764678955078125, 0.2746124267578125, 0.28157806396484375, 0.288543701171875, 0.29550933837890625, 0.3024749755859375, 0.30944061279296875, 0.31640625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 9.0, 32.0, 150.0, 452.0, 276.0, 66.0, 18.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09638249874115, -1.0567069053649902, -1.0170314311981201, -0.9773558974266052, -0.9376803636550903, -0.8980048298835754, -0.8583292961120605, -0.8186537623405457, -0.7789782285690308, -0.7393026947975159, -0.699627161026001, -0.6599516272544861, -0.6202760934829712, -0.5806005597114563, -0.5409250259399414, -0.5012494921684265, -0.4615739583969116, -0.42189842462539673, -0.38222289085388184, -0.34254735708236694, -0.30287182331085205, -0.26319628953933716, -0.22352075576782227, -0.18384522199630737, -0.14416968822479248, -0.10449415445327759, -0.0648186206817627, -0.025143086910247803, 0.01453244686126709, 0.05420798063278198, 0.09388351440429688, 0.13355904817581177, 0.1732344627380371, 0.212909996509552, 0.2525855302810669, 0.2922610640525818, 0.3319365978240967, 0.3716121315956116, 0.41128766536712646, 0.45096319913864136, 0.49063873291015625, 0.5303142666816711, 0.569989800453186, 0.6096653342247009, 0.6493408679962158, 0.6890164017677307, 0.7286919355392456, 0.7683674693107605, 0.8080430030822754, 0.8477185368537903, 0.8873940706253052, 0.9270696043968201, 0.966745138168335, 1.006420612335205, 1.0460962057113647, 1.0857717990875244, 1.1254472732543945, 1.1651227474212646, 1.2047983407974243, 1.244473934173584, 1.284149408340454, 1.3238248825073242, 1.3635004758834839, 1.4031760692596436, 1.4428515434265137]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 5.0, 3.0, 12.0, 5.0, 21.0, 18.0, 18.0, 25.0, 24.0, 26.0, 49.0, 41.0, 48.0, 43.0, 48.0, 60.0, 58.0, 47.0, 49.0, 37.0, 55.0, 49.0, 34.0, 42.0, 28.0, 33.0, 27.0, 20.0, 15.0, 12.0, 14.0, 7.0, 8.0, 3.0, 8.0, 4.0, 1.0, 1.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4704965353012085, -0.45749393105506897, -0.44449129700660706, -0.43148869276046753, -0.4184860587120056, -0.4054834544658661, -0.39248085021972656, -0.37947821617126465, -0.3664756119251251, -0.3534730076789856, -0.3404703736305237, -0.32746776938438416, -0.31446516513824463, -0.3014625310897827, -0.2884599268436432, -0.27545732259750366, -0.26245468854904175, -0.24945206940174103, -0.2364494502544403, -0.22344684600830078, -0.21044422686100006, -0.19744160771369934, -0.18443900346755981, -0.1714363843202591, -0.15843376517295837, -0.14543114602565765, -0.13242852687835693, -0.11942592263221741, -0.10642330348491669, -0.09342068433761597, -0.08041807264089584, -0.06741546094417572, -0.054412841796875, -0.04141022637486458, -0.028407610952854156, -0.015404995530843735, -0.002402380108833313, 0.010600239038467407, 0.02360285073518753, 0.036605462431907654, 0.049608081579208374, 0.0626107007265091, 0.07561331242322922, 0.08861592411994934, 0.10161854326725006, 0.11462116241455078, 0.1276237666606903, 0.14062638580799103, 0.15362900495529175, 0.16663162410259247, 0.1796342432498932, 0.19263684749603271, 0.20563946664333344, 0.21864208579063416, 0.23164469003677368, 0.2446473091840744, 0.2576499283313751, 0.27065253257751465, 0.28365516662597656, 0.2966577708721161, 0.3096603751182556, 0.32266300916671753, 0.33566561341285706, 0.3486682176589966, 0.3616708517074585]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 7.0, 11.0, 26.0, 29.0, 37.0, 63.0, 117.0, 192.0, 460.0, 1019.0, 3526.0, 33590.0, 924625.0, 77275.0, 5179.0, 1318.0, 504.0, 243.0, 139.0, 56.0, 45.0, 31.0, 13.0, 16.0, 9.0, 8.0, 6.0, 6.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4453125, -1.4078826904296875, -1.370452880859375, -1.3330230712890625, -1.29559326171875, -1.2581634521484375, -1.220733642578125, -1.1833038330078125, -1.1458740234375, -1.1084442138671875, -1.071014404296875, -1.0335845947265625, -0.99615478515625, -0.9587249755859375, -0.921295166015625, -0.8838653564453125, -0.846435546875, -0.8090057373046875, -0.771575927734375, -0.7341461181640625, -0.69671630859375, -0.6592864990234375, -0.621856689453125, -0.5844268798828125, -0.5469970703125, -0.5095672607421875, -0.472137451171875, -0.4347076416015625, -0.39727783203125, -0.3598480224609375, -0.322418212890625, -0.2849884033203125, -0.24755859375, -0.2101287841796875, -0.172698974609375, -0.1352691650390625, -0.09783935546875, -0.0604095458984375, -0.022979736328125, 0.0144500732421875, 0.0518798828125, 0.0893096923828125, 0.126739501953125, 0.1641693115234375, 0.20159912109375, 0.2390289306640625, 0.276458740234375, 0.3138885498046875, 0.351318359375, 0.3887481689453125, 0.426177978515625, 0.4636077880859375, 0.50103759765625, 0.5384674072265625, 0.575897216796875, 0.6133270263671875, 0.6507568359375, 0.6881866455078125, 0.725616455078125, 0.7630462646484375, 0.80047607421875, 0.8379058837890625, 0.875335693359375, 0.9127655029296875, 0.9501953125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 9.0, 17.0, 45.0, 79.0, 124.0, 190.0, 186.0, 154.0, 103.0, 47.0, 22.0, 10.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.462646484375, -0.4521465301513672, -0.4416465759277344, -0.43114662170410156, -0.42064666748046875, -0.41014671325683594, -0.3996467590332031, -0.3891468048095703, -0.3786468505859375, -0.3681468963623047, -0.3576469421386719, -0.34714698791503906, -0.33664703369140625, -0.32614707946777344, -0.3156471252441406, -0.3051471710205078, -0.294647216796875, -0.2841472625732422, -0.2736473083496094, -0.26314735412597656, -0.25264739990234375, -0.24214744567871094, -0.23164749145507812, -0.2211475372314453, -0.2106475830078125, -0.2001476287841797, -0.18964767456054688, -0.17914772033691406, -0.16864776611328125, -0.15814781188964844, -0.14764785766601562, -0.1371479034423828, -0.12664794921875, -0.11614799499511719, -0.10564804077148438, -0.09514808654785156, -0.08464813232421875, -0.07414817810058594, -0.06364822387695312, -0.05314826965332031, -0.0426483154296875, -0.03214836120605469, -0.021648406982421875, -0.011148452758789062, -0.00064849853515625, 0.009851455688476562, 0.020351409912109375, 0.030851364135742188, 0.041351318359375, 0.05185127258300781, 0.062351226806640625, 0.07285118103027344, 0.08335113525390625, 0.09385108947753906, 0.10435104370117188, 0.11485099792480469, 0.1253509521484375, 0.1358509063720703, 0.14635086059570312, 0.15685081481933594, 0.16735076904296875, 0.17785072326660156, 0.18835067749023438, 0.1988506317138672, 0.2093505859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 5.0, 6.0, 11.0, 9.0, 8.0, 23.0, 20.0, 19.0, 30.0, 49.0, 54.0, 66.0, 100.0, 178.0, 192.0, 350.0, 646.0, 1390.0, 3430.0, 10413.0, 40064.0, 230341.0, 609479.0, 115832.0, 23918.0, 6953.0, 2459.0, 948.0, 543.0, 311.0, 204.0, 119.0, 110.0, 68.0, 56.0, 45.0, 37.0, 27.0, 17.0, 4.0, 13.0, 6.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.440185546875, -0.4251747131347656, -0.41016387939453125, -0.3951530456542969, -0.3801422119140625, -0.3651313781738281, -0.35012054443359375, -0.3351097106933594, -0.320098876953125, -0.3050880432128906, -0.29007720947265625, -0.2750663757324219, -0.2600555419921875, -0.24504470825195312, -0.23003387451171875, -0.21502304077148438, -0.20001220703125, -0.18500137329101562, -0.16999053955078125, -0.15497970581054688, -0.1399688720703125, -0.12495803833007812, -0.10994720458984375, -0.09493637084960938, -0.079925537109375, -0.06491470336914062, -0.04990386962890625, -0.034893035888671875, -0.0198822021484375, -0.004871368408203125, 0.01013946533203125, 0.025150299072265625, 0.0401611328125, 0.055171966552734375, 0.07018280029296875, 0.08519363403320312, 0.1002044677734375, 0.11521530151367188, 0.13022613525390625, 0.14523696899414062, 0.160247802734375, 0.17525863647460938, 0.19026947021484375, 0.20528030395507812, 0.2202911376953125, 0.23530197143554688, 0.25031280517578125, 0.2653236389160156, 0.28033447265625, 0.2953453063964844, 0.31035614013671875, 0.3253669738769531, 0.3403778076171875, 0.3553886413574219, 0.37039947509765625, 0.3854103088378906, 0.400421142578125, 0.4154319763183594, 0.43044281005859375, 0.4454536437988281, 0.4604644775390625, 0.4754753112792969, 0.49048614501953125, 0.5054969787597656, 0.5205078125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 6.0, 2.0, 3.0, 10.0, 5.0, 9.0, 14.0, 5.0, 23.0, 11.0, 19.0, 10.0, 25.0, 25.0, 40.0, 29.0, 44.0, 32.0, 49.0, 56.0, 45.0, 61.0, 47.0, 38.0, 31.0, 45.0, 35.0, 35.0, 33.0, 35.0, 21.0, 26.0, 19.0, 14.0, 19.0, 17.0, 18.0, 11.0, 8.0, 10.0, 5.0, 4.0, 3.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.62109375, -0.603271484375, -0.58544921875, -0.567626953125, -0.5498046875, -0.531982421875, -0.51416015625, -0.496337890625, -0.478515625, -0.460693359375, -0.44287109375, -0.425048828125, -0.4072265625, -0.389404296875, -0.37158203125, -0.353759765625, -0.3359375, -0.318115234375, -0.30029296875, -0.282470703125, -0.2646484375, -0.246826171875, -0.22900390625, -0.211181640625, -0.193359375, -0.175537109375, -0.15771484375, -0.139892578125, -0.1220703125, -0.104248046875, -0.08642578125, -0.068603515625, -0.05078125, -0.032958984375, -0.01513671875, 0.002685546875, 0.0205078125, 0.038330078125, 0.05615234375, 0.073974609375, 0.091796875, 0.109619140625, 0.12744140625, 0.145263671875, 0.1630859375, 0.180908203125, 0.19873046875, 0.216552734375, 0.234375, 0.252197265625, 0.27001953125, 0.287841796875, 0.3056640625, 0.323486328125, 0.34130859375, 0.359130859375, 0.376953125, 0.394775390625, 0.41259765625, 0.430419921875, 0.4482421875, 0.466064453125, 0.48388671875, 0.501708984375, 0.51953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 5.0, 13.0, 23.0, 32.0, 69.0, 167.0, 403.0, 1699.0, 43630.0, 989378.0, 11574.0, 1022.0, 290.0, 128.0, 61.0, 29.0, 20.0, 7.0, 8.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3759765625, -0.3617095947265625, -0.347442626953125, -0.3331756591796875, -0.31890869140625, -0.3046417236328125, -0.290374755859375, -0.2761077880859375, -0.2618408203125, -0.2475738525390625, -0.233306884765625, -0.2190399169921875, -0.20477294921875, -0.1905059814453125, -0.176239013671875, -0.1619720458984375, -0.147705078125, -0.1334381103515625, -0.119171142578125, -0.1049041748046875, -0.09063720703125, -0.0763702392578125, -0.062103271484375, -0.0478363037109375, -0.0335693359375, -0.0193023681640625, -0.005035400390625, 0.0092315673828125, 0.02349853515625, 0.0377655029296875, 0.052032470703125, 0.0662994384765625, 0.08056640625, 0.0948333740234375, 0.109100341796875, 0.1233673095703125, 0.13763427734375, 0.1519012451171875, 0.166168212890625, 0.1804351806640625, 0.1947021484375, 0.2089691162109375, 0.223236083984375, 0.2375030517578125, 0.25177001953125, 0.2660369873046875, 0.280303955078125, 0.2945709228515625, 0.308837890625, 0.3231048583984375, 0.337371826171875, 0.3516387939453125, 0.36590576171875, 0.3801727294921875, 0.394439697265625, 0.4087066650390625, 0.4229736328125, 0.4372406005859375, 0.451507568359375, 0.4657745361328125, 0.48004150390625, 0.4943084716796875, 0.508575439453125, 0.5228424072265625, 0.537109375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 5.0, 7.0, 6.0, 11.0, 8.0, 14.0, 22.0, 36.0, 40.0, 41.0, 53.0, 72.0, 105.0, 122.0, 112.0, 99.0, 63.0, 37.0, 31.0, 33.0, 17.0, 13.0, 12.0, 15.0, 6.0, 5.0, 7.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.902217864990234e-05, -6.609782576560974e-05, -6.317347288131714e-05, -6.0249119997024536e-05, -5.7324767112731934e-05, -5.440041422843933e-05, -5.147606134414673e-05, -4.8551708459854126e-05, -4.5627355575561523e-05, -4.270300269126892e-05, -3.977864980697632e-05, -3.6854296922683716e-05, -3.392994403839111e-05, -3.100559115409851e-05, -2.8081238269805908e-05, -2.5156885385513306e-05, -2.2232532501220703e-05, -1.93081796169281e-05, -1.6383826732635498e-05, -1.3459473848342896e-05, -1.0535120964050293e-05, -7.6107680797576904e-06, -4.686415195465088e-06, -1.7620623111724854e-06, 1.1622905731201172e-06, 4.08664345741272e-06, 7.010996341705322e-06, 9.935349225997925e-06, 1.2859702110290527e-05, 1.578405499458313e-05, 1.8708407878875732e-05, 2.1632760763168335e-05, 2.4557113647460938e-05, 2.748146653175354e-05, 3.0405819416046143e-05, 3.3330172300338745e-05, 3.625452518463135e-05, 3.917887806892395e-05, 4.210323095321655e-05, 4.5027583837509155e-05, 4.795193672180176e-05, 5.087628960609436e-05, 5.380064249038696e-05, 5.6724995374679565e-05, 5.964934825897217e-05, 6.257370114326477e-05, 6.549805402755737e-05, 6.842240691184998e-05, 7.134675979614258e-05, 7.427111268043518e-05, 7.719546556472778e-05, 8.011981844902039e-05, 8.304417133331299e-05, 8.596852421760559e-05, 8.88928771018982e-05, 9.18172299861908e-05, 9.47415828704834e-05, 9.7665935754776e-05, 0.0001005902886390686, 0.0001035146415233612, 0.00010643899440765381, 0.00010936334729194641, 0.00011228770017623901, 0.00011521205306053162, 0.00011813640594482422]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 6.0, 9.0, 12.0, 15.0, 18.0, 31.0, 65.0, 87.0, 188.0, 378.0, 908.0, 2663.0, 11351.0, 121143.0, 843586.0, 57108.0, 7593.0, 1951.0, 758.0, 307.0, 152.0, 77.0, 42.0, 28.0, 25.0, 14.0, 10.0, 8.0, 6.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2315673828125, -0.22368431091308594, -0.21580123901367188, -0.2079181671142578, -0.20003509521484375, -0.1921520233154297, -0.18426895141601562, -0.17638587951660156, -0.1685028076171875, -0.16061973571777344, -0.15273666381835938, -0.1448535919189453, -0.13697052001953125, -0.1290874481201172, -0.12120437622070312, -0.11332130432128906, -0.105438232421875, -0.09755516052246094, -0.08967208862304688, -0.08178901672363281, -0.07390594482421875, -0.06602287292480469, -0.058139801025390625, -0.05025672912597656, -0.0423736572265625, -0.03449058532714844, -0.026607513427734375, -0.018724441528320312, -0.01084136962890625, -0.0029582977294921875, 0.004924774169921875, 0.012807846069335938, 0.02069091796875, 0.028573989868164062, 0.036457061767578125, 0.04434013366699219, 0.05222320556640625, 0.06010627746582031, 0.06798934936523438, 0.07587242126464844, 0.0837554931640625, 0.09163856506347656, 0.09952163696289062, 0.10740470886230469, 0.11528778076171875, 0.12317085266113281, 0.13105392456054688, 0.13893699645996094, 0.146820068359375, 0.15470314025878906, 0.16258621215820312, 0.1704692840576172, 0.17835235595703125, 0.1862354278564453, 0.19411849975585938, 0.20200157165527344, 0.2098846435546875, 0.21776771545410156, 0.22565078735351562, 0.2335338592529297, 0.24141693115234375, 0.2493000030517578, 0.2571830749511719, 0.26506614685058594, 0.27294921875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 4.0, 6.0, 3.0, 8.0, 8.0, 14.0, 14.0, 21.0, 26.0, 47.0, 62.0, 96.0, 129.0, 123.0, 134.0, 92.0, 58.0, 43.0, 35.0, 19.0, 9.0, 10.0, 13.0, 5.0, 4.0, 5.0, 4.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.2467041015625, -0.2399139404296875, -0.233123779296875, -0.2263336181640625, -0.21954345703125, -0.2127532958984375, -0.205963134765625, -0.1991729736328125, -0.1923828125, -0.1855926513671875, -0.178802490234375, -0.1720123291015625, -0.16522216796875, -0.1584320068359375, -0.151641845703125, -0.1448516845703125, -0.1380615234375, -0.1312713623046875, -0.124481201171875, -0.1176910400390625, -0.11090087890625, -0.1041107177734375, -0.097320556640625, -0.0905303955078125, -0.083740234375, -0.0769500732421875, -0.070159912109375, -0.0633697509765625, -0.05657958984375, -0.0497894287109375, -0.042999267578125, -0.0362091064453125, -0.0294189453125, -0.0226287841796875, -0.015838623046875, -0.0090484619140625, -0.00225830078125, 0.0045318603515625, 0.011322021484375, 0.0181121826171875, 0.02490234375, 0.0316925048828125, 0.038482666015625, 0.0452728271484375, 0.05206298828125, 0.0588531494140625, 0.065643310546875, 0.0724334716796875, 0.0792236328125, 0.0860137939453125, 0.092803955078125, 0.0995941162109375, 0.10638427734375, 0.1131744384765625, 0.119964599609375, 0.1267547607421875, 0.133544921875, 0.1403350830078125, 0.147125244140625, 0.1539154052734375, 0.16070556640625, 0.1674957275390625, 0.174285888671875, 0.1810760498046875, 0.1878662109375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 15.0, 56.0, 407.0, 472.0, 49.0, 6.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.608110427856445, -16.24764060974121, -15.88716983795166, -15.52669906616211, -15.166229248046875, -14.805758476257324, -14.44528865814209, -14.084817886352539, -13.724348068237305, -13.363877296447754, -13.00340747833252, -12.642936706542969, -12.282466888427734, -11.921996116638184, -11.56152629852295, -11.201055526733398, -10.840585708618164, -10.480114936828613, -10.119645118713379, -9.759174346923828, -9.398704528808594, -9.038233757019043, -8.677763938903809, -8.317293167114258, -7.956822395324707, -7.5963521003723145, -7.235881805419922, -6.875411510467529, -6.514941215515137, -6.154470920562744, -5.794000625610352, -5.433529853820801, -5.073060035705566, -4.712589740753174, -4.352119445800781, -3.9916491508483887, -3.631178855895996, -3.2707085609436035, -2.910238027572632, -2.5497677326202393, -2.1892974376678467, -1.828827142715454, -1.4683568477630615, -1.1078864336013794, -0.7474161386489868, -0.38694584369659424, -0.02647542953491211, 0.33399486541748047, 0.694465160369873, 1.0549354553222656, 1.4154057502746582, 1.7758761644363403, 2.1363463401794434, 2.496816635131836, 2.8572871685028076, 3.2177574634552, 3.5782277584075928, 3.9386980533599854, 4.299168586730957, 4.65963888168335, 5.020109176635742, 5.380579471588135, 5.741049766540527, 6.10152006149292, 6.4619903564453125]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 5.0, 8.0, 7.0, 13.0, 10.0, 16.0, 24.0, 26.0, 23.0, 29.0, 37.0, 28.0, 30.0, 60.0, 57.0, 65.0, 63.0, 78.0, 59.0, 46.0, 54.0, 47.0, 37.0, 28.0, 26.0, 35.0, 27.0, 13.0, 13.0, 15.0, 6.0, 4.0, 3.0, 5.0, 3.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.099729537963867, -3.962186813354492, -3.824644088745117, -3.687101125717163, -3.549558401107788, -3.412015676498413, -3.274472713470459, -3.136929988861084, -2.999387264251709, -2.861844539642334, -2.724301815032959, -2.586758852005005, -2.44921612739563, -2.311673402786255, -2.174130439758301, -2.036587715148926, -1.8990449905395508, -1.7615022659301758, -1.6239594221115112, -1.4864165782928467, -1.3488738536834717, -1.2113311290740967, -1.0737882852554321, -0.9362455010414124, -0.7987027168273926, -0.6611599326133728, -0.523617148399353, -0.38607436418533325, -0.24853157997131348, -0.1109887957572937, 0.026553988456726074, 0.16409677267074585, 0.30164003372192383, 0.4391828179359436, 0.5767256021499634, 0.7142683863639832, 0.8518111705780029, 0.9893539547920227, 1.1268967390060425, 1.264439582824707, 1.401982307434082, 1.539525032043457, 1.6770678758621216, 1.8146107196807861, 1.9521534442901611, 2.089696168899536, 2.2272391319274902, 2.3647818565368652, 2.5023245811462402, 2.6398673057556152, 2.7774100303649902, 2.9149529933929443, 3.0524957180023193, 3.1900384426116943, 3.3275814056396484, 3.4651241302490234, 3.6026668548583984, 3.7402095794677734, 3.8777523040771484, 4.015295028686523, 4.152837753295898, 4.290380954742432, 4.427923679351807, 4.565466403961182, 4.703009128570557]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 4.0, 3.0, 10.0, 10.0, 13.0, 15.0, 15.0, 23.0, 45.0, 59.0, 71.0, 161.0, 289.0, 610.0, 1573.0, 5831.0, 85088.0, 4074733.0, 21114.0, 3025.0, 921.0, 325.0, 133.0, 70.0, 42.0, 30.0, 17.0, 11.0, 14.0, 10.0, 5.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-1.8271484375, -1.7859115600585938, -1.7446746826171875, -1.7034378051757812, -1.662200927734375, -1.6209640502929688, -1.5797271728515625, -1.5384902954101562, -1.49725341796875, -1.4560165405273438, -1.4147796630859375, -1.3735427856445312, -1.332305908203125, -1.2910690307617188, -1.2498321533203125, -1.2085952758789062, -1.1673583984375, -1.1261215209960938, -1.0848846435546875, -1.0436477661132812, -1.002410888671875, -0.9611740112304688, -0.9199371337890625, -0.8787002563476562, -0.83746337890625, -0.7962265014648438, -0.7549896240234375, -0.7137527465820312, -0.672515869140625, -0.6312789916992188, -0.5900421142578125, -0.5488052368164062, -0.507568359375, -0.46633148193359375, -0.4250946044921875, -0.38385772705078125, -0.342620849609375, -0.30138397216796875, -0.2601470947265625, -0.21891021728515625, -0.17767333984375, -0.13643646240234375, -0.0951995849609375, -0.05396270751953125, -0.012725830078125, 0.02851104736328125, 0.0697479248046875, 0.11098480224609375, 0.1522216796875, 0.19345855712890625, 0.2346954345703125, 0.27593231201171875, 0.317169189453125, 0.35840606689453125, 0.3996429443359375, 0.44087982177734375, 0.48211669921875, 0.5233535766601562, 0.5645904541015625, 0.6058273315429688, 0.647064208984375, 0.6883010864257812, 0.7295379638671875, 0.7707748413085938, 0.81201171875]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 3.0, 17.0, 22.0, 30.0, 70.0, 104.0, 164.0, 194.0, 141.0, 122.0, 73.0, 36.0, 11.0, 9.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.46044921875, -0.4498462677001953, -0.4392433166503906, -0.42864036560058594, -0.41803741455078125, -0.40743446350097656, -0.3968315124511719, -0.3862285614013672, -0.3756256103515625, -0.3650226593017578, -0.3544197082519531, -0.34381675720214844, -0.33321380615234375, -0.32261085510253906, -0.3120079040527344, -0.3014049530029297, -0.290802001953125, -0.2801990509033203, -0.2695960998535156, -0.25899314880371094, -0.24839019775390625, -0.23778724670410156, -0.22718429565429688, -0.2165813446044922, -0.2059783935546875, -0.1953754425048828, -0.18477249145507812, -0.17416954040527344, -0.16356658935546875, -0.15296363830566406, -0.14236068725585938, -0.1317577362060547, -0.12115478515625, -0.11055183410644531, -0.09994888305664062, -0.08934593200683594, -0.07874298095703125, -0.06814002990722656, -0.057537078857421875, -0.04693412780761719, -0.0363311767578125, -0.025728225708007812, -0.015125274658203125, -0.0045223236083984375, 0.00608062744140625, 0.016683578491210938, 0.027286529541015625, 0.03788948059082031, 0.048492431640625, 0.05909538269042969, 0.06969833374023438, 0.08030128479003906, 0.09090423583984375, 0.10150718688964844, 0.11211013793945312, 0.12271308898925781, 0.1333160400390625, 0.1439189910888672, 0.15452194213867188, 0.16512489318847656, 0.17572784423828125, 0.18633079528808594, 0.19693374633789062, 0.2075366973876953, 0.2181396484375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 6.0, 2.0, 9.0, 8.0, 8.0, 11.0, 17.0, 25.0, 44.0, 63.0, 118.0, 194.0, 429.0, 841.0, 2644.0, 12042.0, 234595.0, 3897887.0, 36954.0, 5580.0, 1548.0, 623.0, 282.0, 139.0, 73.0, 49.0, 30.0, 20.0, 14.0, 6.0, 11.0, 5.0, 3.0, 4.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.79296875, -0.7716751098632812, -0.7503814697265625, -0.7290878295898438, -0.707794189453125, -0.6865005493164062, -0.6652069091796875, -0.6439132690429688, -0.62261962890625, -0.6013259887695312, -0.5800323486328125, -0.5587387084960938, -0.537445068359375, -0.5161514282226562, -0.4948577880859375, -0.47356414794921875, -0.4522705078125, -0.43097686767578125, -0.4096832275390625, -0.38838958740234375, -0.367095947265625, -0.34580230712890625, -0.3245086669921875, -0.30321502685546875, -0.28192138671875, -0.26062774658203125, -0.2393341064453125, -0.21804046630859375, -0.196746826171875, -0.17545318603515625, -0.1541595458984375, -0.13286590576171875, -0.111572265625, -0.09027862548828125, -0.0689849853515625, -0.04769134521484375, -0.026397705078125, -0.00510406494140625, 0.0161895751953125, 0.03748321533203125, 0.05877685546875, 0.08007049560546875, 0.1013641357421875, 0.12265777587890625, 0.143951416015625, 0.16524505615234375, 0.1865386962890625, 0.20783233642578125, 0.2291259765625, 0.25041961669921875, 0.2717132568359375, 0.29300689697265625, 0.314300537109375, 0.33559417724609375, 0.3568878173828125, 0.37818145751953125, 0.39947509765625, 0.42076873779296875, 0.4420623779296875, 0.46335601806640625, 0.484649658203125, 0.5059432983398438, 0.5272369384765625, 0.5485305786132812, 0.56982421875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 7.0, 6.0, 13.0, 20.0, 30.0, 53.0, 152.0, 472.0, 2149.0, 775.0, 188.0, 66.0, 54.0, 28.0, 16.0, 15.0, 8.0, 5.0, 6.0, 8.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.326171875, -0.3164710998535156, -0.30677032470703125, -0.2970695495605469, -0.2873687744140625, -0.2776679992675781, -0.26796722412109375, -0.2582664489746094, -0.248565673828125, -0.23886489868164062, -0.22916412353515625, -0.21946334838867188, -0.2097625732421875, -0.20006179809570312, -0.19036102294921875, -0.18066024780273438, -0.17095947265625, -0.16125869750976562, -0.15155792236328125, -0.14185714721679688, -0.1321563720703125, -0.12245559692382812, -0.11275482177734375, -0.10305404663085938, -0.093353271484375, -0.08365249633789062, -0.07395172119140625, -0.06425094604492188, -0.0545501708984375, -0.044849395751953125, -0.03514862060546875, -0.025447845458984375, -0.0157470703125, -0.006046295166015625, 0.00365447998046875, 0.013355255126953125, 0.0230560302734375, 0.032756805419921875, 0.04245758056640625, 0.052158355712890625, 0.061859130859375, 0.07155990600585938, 0.08126068115234375, 0.09096145629882812, 0.1006622314453125, 0.11036300659179688, 0.12006378173828125, 0.12976455688476562, 0.13946533203125, 0.14916610717773438, 0.15886688232421875, 0.16856765747070312, 0.1782684326171875, 0.18796920776367188, 0.19766998291015625, 0.20737075805664062, 0.217071533203125, 0.22677230834960938, 0.23647308349609375, 0.24617385864257812, 0.2558746337890625, 0.2655754089355469, 0.27527618408203125, 0.2849769592285156, 0.294677734375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 6.0, 18.0, 39.0, 159.0, 342.0, 288.0, 100.0, 38.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.9761909246444702, -0.9265843629837036, -0.876977801322937, -0.8273712396621704, -0.7777646780014038, -0.7281581163406372, -0.6785514950752258, -0.6289449334144592, -0.5793383717536926, -0.529731810092926, -0.4801252484321594, -0.43051865696907043, -0.38091209530830383, -0.33130553364753723, -0.28169894218444824, -0.23209238052368164, -0.18248581886291504, -0.13287925720214844, -0.08327268064022064, -0.03366610407829285, 0.015940457582473755, 0.06554701924324036, 0.11515361070632935, 0.16476017236709595, 0.21436673402786255, 0.26397329568862915, 0.31357985734939575, 0.36318644881248474, 0.41279301047325134, 0.46239957213401794, 0.5120061635971069, 0.5616127252578735, 0.6112191677093506, 0.6608257293701172, 0.7104322910308838, 0.7600388526916504, 0.809645414352417, 0.8592519760131836, 0.908858597278595, 0.9584651589393616, 1.0080716609954834, 1.05767822265625, 1.1072847843170166, 1.1568913459777832, 1.2064979076385498, 1.2561044692993164, 1.305711030960083, 1.3553175926208496, 1.4049242734909058, 1.4545308351516724, 1.504137396812439, 1.5537439584732056, 1.6033505201339722, 1.6529570817947388, 1.702563762664795, 1.7521703243255615, 1.8017768859863281, 1.8513834476470947, 1.9009900093078613, 1.950596570968628, 2.0002031326293945, 2.049809694290161, 2.0994162559509277, 2.1490228176116943, 2.198629379272461]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 10.0, 9.0, 11.0, 15.0, 22.0, 13.0, 27.0, 40.0, 27.0, 43.0, 63.0, 47.0, 66.0, 58.0, 64.0, 68.0, 50.0, 53.0, 51.0, 55.0, 36.0, 36.0, 23.0, 37.0, 17.0, 14.0, 16.0, 11.0, 2.0, 8.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7315791249275208, -0.7047148942947388, -0.6778506636619568, -0.6509864330291748, -0.6241222023963928, -0.5972579717636108, -0.5703937411308289, -0.5435295104980469, -0.5166652798652649, -0.4898010492324829, -0.4629368185997009, -0.43607258796691895, -0.40920835733413696, -0.382344126701355, -0.355479896068573, -0.328615665435791, -0.30175140500068665, -0.27488717436790466, -0.24802294373512268, -0.2211587131023407, -0.19429448246955872, -0.16743023693561554, -0.14056600630283356, -0.11370177567005157, -0.08683754503726959, -0.05997331440448761, -0.03310908004641533, -0.006244845688343048, 0.020619384944438934, 0.047483623027801514, 0.0743478536605835, 0.10121208429336548, 0.12807631492614746, 0.15494054555892944, 0.18180477619171143, 0.2086690068244934, 0.2355332374572754, 0.2623974680900574, 0.28926169872283936, 0.31612592935562134, 0.3429901599884033, 0.3698543906211853, 0.3967186212539673, 0.42358285188674927, 0.45044708251953125, 0.47731131315231323, 0.5041755437850952, 0.5310397744178772, 0.5579040050506592, 0.5847682356834412, 0.6116324663162231, 0.6384966969490051, 0.6653609275817871, 0.6922251582145691, 0.7190893888473511, 0.7459536194801331, 0.7728179097175598, 0.7996821403503418, 0.8265463709831238, 0.8534106016159058, 0.8802748322486877, 0.9071390628814697, 0.9340032935142517, 0.9608675241470337, 0.9877317547798157]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 7.0, 5.0, 16.0, 10.0, 19.0, 38.0, 32.0, 65.0, 78.0, 141.0, 240.0, 412.0, 792.0, 1950.0, 5996.0, 38178.0, 722841.0, 254040.0, 17081.0, 3753.0, 1338.0, 596.0, 362.0, 201.0, 106.0, 69.0, 46.0, 36.0, 38.0, 13.0, 8.0, 8.0, 4.0, 7.0, 5.0, 4.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8193359375, -0.7918548583984375, -0.764373779296875, -0.7368927001953125, -0.70941162109375, -0.6819305419921875, -0.654449462890625, -0.6269683837890625, -0.5994873046875, -0.5720062255859375, -0.544525146484375, -0.5170440673828125, -0.48956298828125, -0.4620819091796875, -0.434600830078125, -0.4071197509765625, -0.379638671875, -0.3521575927734375, -0.324676513671875, -0.2971954345703125, -0.26971435546875, -0.2422332763671875, -0.214752197265625, -0.1872711181640625, -0.1597900390625, -0.1323089599609375, -0.104827880859375, -0.0773468017578125, -0.04986572265625, -0.0223846435546875, 0.005096435546875, 0.0325775146484375, 0.06005859375, 0.0875396728515625, 0.115020751953125, 0.1425018310546875, 0.16998291015625, 0.1974639892578125, 0.224945068359375, 0.2524261474609375, 0.2799072265625, 0.3073883056640625, 0.334869384765625, 0.3623504638671875, 0.38983154296875, 0.4173126220703125, 0.444793701171875, 0.4722747802734375, 0.499755859375, 0.5272369384765625, 0.554718017578125, 0.5821990966796875, 0.60968017578125, 0.6371612548828125, 0.664642333984375, 0.6921234130859375, 0.7196044921875, 0.7470855712890625, 0.774566650390625, 0.8020477294921875, 0.82952880859375, 0.8570098876953125, 0.884490966796875, 0.9119720458984375, 0.939453125]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 16.0, 21.0, 41.0, 75.0, 118.0, 160.0, 180.0, 151.0, 109.0, 65.0, 32.0, 13.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.439697265625, -0.4295330047607422, -0.4193687438964844, -0.40920448303222656, -0.39904022216796875, -0.38887596130371094, -0.3787117004394531, -0.3685474395751953, -0.3583831787109375, -0.3482189178466797, -0.3380546569824219, -0.32789039611816406, -0.31772613525390625, -0.30756187438964844, -0.2973976135253906, -0.2872333526611328, -0.277069091796875, -0.2669048309326172, -0.2567405700683594, -0.24657630920410156, -0.23641204833984375, -0.22624778747558594, -0.21608352661132812, -0.2059192657470703, -0.1957550048828125, -0.1855907440185547, -0.17542648315429688, -0.16526222229003906, -0.15509796142578125, -0.14493370056152344, -0.13476943969726562, -0.12460517883300781, -0.11444091796875, -0.10427665710449219, -0.09411239624023438, -0.08394813537597656, -0.07378387451171875, -0.06361961364746094, -0.053455352783203125, -0.04329109191894531, -0.0331268310546875, -0.022962570190429688, -0.012798309326171875, -0.0026340484619140625, 0.00753021240234375, 0.017694473266601562, 0.027858734130859375, 0.03802299499511719, 0.048187255859375, 0.05835151672363281, 0.06851577758789062, 0.07868003845214844, 0.08884429931640625, 0.09900856018066406, 0.10917282104492188, 0.11933708190917969, 0.1295013427734375, 0.1396656036376953, 0.14982986450195312, 0.15999412536621094, 0.17015838623046875, 0.18032264709472656, 0.19048690795898438, 0.2006511688232422, 0.2108154296875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 2.0, 6.0, 6.0, 11.0, 8.0, 14.0, 15.0, 31.0, 41.0, 42.0, 61.0, 81.0, 124.0, 196.0, 407.0, 772.0, 1707.0, 4394.0, 14488.0, 68610.0, 480250.0, 401910.0, 56305.0, 12313.0, 3753.0, 1373.0, 664.0, 340.0, 212.0, 110.0, 70.0, 53.0, 37.0, 36.0, 15.0, 13.0, 13.0, 18.0, 8.0, 6.0, 10.0, 5.0, 7.0, 1.0, 6.0, 3.0, 1.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.44189453125, -0.42662811279296875, -0.4113616943359375, -0.39609527587890625, -0.380828857421875, -0.36556243896484375, -0.3502960205078125, -0.33502960205078125, -0.31976318359375, -0.30449676513671875, -0.2892303466796875, -0.27396392822265625, -0.258697509765625, -0.24343109130859375, -0.2281646728515625, -0.21289825439453125, -0.1976318359375, -0.18236541748046875, -0.1670989990234375, -0.15183258056640625, -0.136566162109375, -0.12129974365234375, -0.1060333251953125, -0.09076690673828125, -0.07550048828125, -0.06023406982421875, -0.0449676513671875, -0.02970123291015625, -0.014434814453125, 0.00083160400390625, 0.0160980224609375, 0.03136444091796875, 0.046630859375, 0.06189727783203125, 0.0771636962890625, 0.09243011474609375, 0.107696533203125, 0.12296295166015625, 0.1382293701171875, 0.15349578857421875, 0.16876220703125, 0.18402862548828125, 0.1992950439453125, 0.21456146240234375, 0.229827880859375, 0.24509429931640625, 0.2603607177734375, 0.27562713623046875, 0.2908935546875, 0.30615997314453125, 0.3214263916015625, 0.33669281005859375, 0.351959228515625, 0.36722564697265625, 0.3824920654296875, 0.39775848388671875, 0.41302490234375, 0.42829132080078125, 0.4435577392578125, 0.45882415771484375, 0.474090576171875, 0.48935699462890625, 0.5046234130859375, 0.5198898315429688, 0.53515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 4.0, 8.0, 8.0, 19.0, 13.0, 13.0, 24.0, 24.0, 19.0, 34.0, 27.0, 39.0, 32.0, 27.0, 37.0, 37.0, 54.0, 46.0, 36.0, 46.0, 32.0, 32.0, 31.0, 36.0, 39.0, 32.0, 27.0, 25.0, 29.0, 25.0, 21.0, 18.0, 13.0, 7.0, 14.0, 11.0, 8.0, 4.0, 6.0, 3.0, 5.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.499267578125, -0.4834861755371094, -0.46770477294921875, -0.4519233703613281, -0.4361419677734375, -0.4203605651855469, -0.40457916259765625, -0.3887977600097656, -0.373016357421875, -0.3572349548339844, -0.34145355224609375, -0.3256721496582031, -0.3098907470703125, -0.2941093444824219, -0.27832794189453125, -0.2625465393066406, -0.24676513671875, -0.23098373413085938, -0.21520233154296875, -0.19942092895507812, -0.1836395263671875, -0.16785812377929688, -0.15207672119140625, -0.13629531860351562, -0.120513916015625, -0.10473251342773438, -0.08895111083984375, -0.07316970825195312, -0.0573883056640625, -0.041606903076171875, -0.02582550048828125, -0.010044097900390625, 0.0057373046875, 0.021518707275390625, 0.03730010986328125, 0.053081512451171875, 0.0688629150390625, 0.08464431762695312, 0.10042572021484375, 0.11620712280273438, 0.131988525390625, 0.14776992797851562, 0.16355133056640625, 0.17933273315429688, 0.1951141357421875, 0.21089553833007812, 0.22667694091796875, 0.24245834350585938, 0.25823974609375, 0.2740211486816406, 0.28980255126953125, 0.3055839538574219, 0.3213653564453125, 0.3371467590332031, 0.35292816162109375, 0.3687095642089844, 0.384490966796875, 0.4002723693847656, 0.41605377197265625, 0.4318351745605469, 0.4476165771484375, 0.4633979797363281, 0.47917938232421875, 0.4949607849121094, 0.5107421875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 3.0, 6.0, 7.0, 3.0, 10.0, 22.0, 28.0, 49.0, 94.0, 221.0, 519.0, 1602.0, 7232.0, 119741.0, 892919.0, 21480.0, 3089.0, 880.0, 322.0, 137.0, 74.0, 47.0, 19.0, 16.0, 16.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.337646484375, -0.32525634765625, -0.3128662109375, -0.30047607421875, -0.2880859375, -0.27569580078125, -0.2633056640625, -0.25091552734375, -0.238525390625, -0.22613525390625, -0.2137451171875, -0.20135498046875, -0.18896484375, -0.17657470703125, -0.1641845703125, -0.15179443359375, -0.139404296875, -0.12701416015625, -0.1146240234375, -0.10223388671875, -0.08984375, -0.07745361328125, -0.0650634765625, -0.05267333984375, -0.040283203125, -0.02789306640625, -0.0155029296875, -0.00311279296875, 0.00927734375, 0.02166748046875, 0.0340576171875, 0.04644775390625, 0.058837890625, 0.07122802734375, 0.0836181640625, 0.09600830078125, 0.1083984375, 0.12078857421875, 0.1331787109375, 0.14556884765625, 0.157958984375, 0.17034912109375, 0.1827392578125, 0.19512939453125, 0.20751953125, 0.21990966796875, 0.2322998046875, 0.24468994140625, 0.257080078125, 0.26947021484375, 0.2818603515625, 0.29425048828125, 0.306640625, 0.31903076171875, 0.3314208984375, 0.34381103515625, 0.356201171875, 0.36859130859375, 0.3809814453125, 0.39337158203125, 0.40576171875, 0.41815185546875, 0.4305419921875, 0.44293212890625, 0.455322265625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 7.0, 2.0, 8.0, 15.0, 19.0, 23.0, 26.0, 30.0, 39.0, 49.0, 41.0, 65.0, 79.0, 89.0, 91.0, 81.0, 77.0, 49.0, 42.0, 42.0, 32.0, 23.0, 17.0, 13.0, 13.0, 7.0, 3.0, 9.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.308887481689453e-05, -8.083414286375046e-05, -7.857941091060638e-05, -7.632467895746231e-05, -7.406994700431824e-05, -7.181521505117416e-05, -6.956048309803009e-05, -6.730575114488602e-05, -6.505101919174194e-05, -6.279628723859787e-05, -6.0541555285453796e-05, -5.828682333230972e-05, -5.603209137916565e-05, -5.3777359426021576e-05, -5.15226274728775e-05, -4.926789551973343e-05, -4.7013163566589355e-05, -4.475843161344528e-05, -4.250369966030121e-05, -4.0248967707157135e-05, -3.799423575401306e-05, -3.573950380086899e-05, -3.3484771847724915e-05, -3.123003989458084e-05, -2.8975307941436768e-05, -2.6720575988292694e-05, -2.446584403514862e-05, -2.2211112082004547e-05, -1.9956380128860474e-05, -1.77016481757164e-05, -1.5446916222572327e-05, -1.3192184269428253e-05, -1.093745231628418e-05, -8.682720363140106e-06, -6.427988409996033e-06, -4.173256456851959e-06, -1.9185245037078857e-06, 3.3620744943618774e-07, 2.5909394025802612e-06, 4.845671355724335e-06, 7.100403308868408e-06, 9.355135262012482e-06, 1.1609867215156555e-05, 1.3864599168300629e-05, 1.6119331121444702e-05, 1.8374063074588776e-05, 2.062879502773285e-05, 2.2883526980876923e-05, 2.5138258934020996e-05, 2.739299088716507e-05, 2.9647722840309143e-05, 3.1902454793453217e-05, 3.415718674659729e-05, 3.6411918699741364e-05, 3.866665065288544e-05, 4.092138260602951e-05, 4.3176114559173584e-05, 4.543084651231766e-05, 4.768557846546173e-05, 4.9940310418605804e-05, 5.219504237174988e-05, 5.444977432489395e-05, 5.6704506278038025e-05, 5.89592382311821e-05, 6.121397018432617e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 5.0, 2.0, 3.0, 6.0, 12.0, 23.0, 35.0, 53.0, 108.0, 177.0, 557.0, 1817.0, 10880.0, 360622.0, 654893.0, 15764.0, 2415.0, 669.0, 245.0, 135.0, 60.0, 31.0, 20.0, 10.0, 3.0, 7.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3115234375, -0.3000144958496094, -0.28850555419921875, -0.2769966125488281, -0.2654876708984375, -0.2539787292480469, -0.24246978759765625, -0.23096084594726562, -0.219451904296875, -0.20794296264648438, -0.19643402099609375, -0.18492507934570312, -0.1734161376953125, -0.16190719604492188, -0.15039825439453125, -0.13888931274414062, -0.12738037109375, -0.11587142944335938, -0.10436248779296875, -0.09285354614257812, -0.0813446044921875, -0.06983566284179688, -0.05832672119140625, -0.046817779541015625, -0.035308837890625, -0.023799896240234375, -0.01229095458984375, -0.000782012939453125, 0.0107269287109375, 0.022235870361328125, 0.03374481201171875, 0.045253753662109375, 0.0567626953125, 0.06827163696289062, 0.07978057861328125, 0.09128952026367188, 0.1027984619140625, 0.11430740356445312, 0.12581634521484375, 0.13732528686523438, 0.148834228515625, 0.16034317016601562, 0.17185211181640625, 0.18336105346679688, 0.1948699951171875, 0.20637893676757812, 0.21788787841796875, 0.22939682006835938, 0.24090576171875, 0.2524147033691406, 0.26392364501953125, 0.2754325866699219, 0.2869415283203125, 0.2984504699707031, 0.30995941162109375, 0.3214683532714844, 0.332977294921875, 0.3444862365722656, 0.35599517822265625, 0.3675041198730469, 0.3790130615234375, 0.3905220031738281, 0.40203094482421875, 0.4135398864746094, 0.425048828125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 6.0, 3.0, 6.0, 9.0, 15.0, 17.0, 24.0, 49.0, 55.0, 82.0, 166.0, 178.0, 145.0, 83.0, 57.0, 39.0, 21.0, 18.0, 10.0, 7.0, 3.0, 4.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.350830078125, -0.3402824401855469, -0.32973480224609375, -0.3191871643066406, -0.3086395263671875, -0.2980918884277344, -0.28754425048828125, -0.2769966125488281, -0.266448974609375, -0.2559013366699219, -0.24535369873046875, -0.23480606079101562, -0.2242584228515625, -0.21371078491210938, -0.20316314697265625, -0.19261550903320312, -0.18206787109375, -0.17152023315429688, -0.16097259521484375, -0.15042495727539062, -0.1398773193359375, -0.12932968139648438, -0.11878204345703125, -0.10823440551757812, -0.097686767578125, -0.08713912963867188, -0.07659149169921875, -0.06604385375976562, -0.0554962158203125, -0.044948577880859375, -0.03440093994140625, -0.023853302001953125, -0.0133056640625, -0.002758026123046875, 0.00778961181640625, 0.018337249755859375, 0.0288848876953125, 0.039432525634765625, 0.04998016357421875, 0.060527801513671875, 0.071075439453125, 0.08162307739257812, 0.09217071533203125, 0.10271835327148438, 0.1132659912109375, 0.12381362915039062, 0.13436126708984375, 0.14490890502929688, 0.15545654296875, 0.16600418090820312, 0.17655181884765625, 0.18709945678710938, 0.1976470947265625, 0.20819473266601562, 0.21874237060546875, 0.22929000854492188, 0.239837646484375, 0.2503852844238281, 0.26093292236328125, 0.2714805603027344, 0.2820281982421875, 0.2925758361816406, 0.30312347412109375, 0.3136711120605469, 0.32421875]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 9.0, 16.0, 87.0, 567.0, 291.0, 35.0, 7.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.300676345825195, -17.940441131591797, -17.5802059173584, -17.219968795776367, -16.85973358154297, -16.49949836730957, -16.139263153076172, -15.779026985168457, -15.418790817260742, -15.058555603027344, -14.698319435119629, -14.33808422088623, -13.977848052978516, -13.617612838745117, -13.257377624511719, -12.897141456604004, -12.536906242370605, -12.176671028137207, -11.816434860229492, -11.456199645996094, -11.095963478088379, -10.73572826385498, -10.375492095947266, -10.015256881713867, -9.655021667480469, -9.29478645324707, -8.934550285339355, -8.574315071105957, -8.214078903198242, -7.853843688964844, -7.493607997894287, -7.1333723068237305, -6.773136615753174, -6.412900924682617, -6.0526652336120605, -5.692429542541504, -5.3321943283081055, -4.971958160400391, -4.611722946166992, -4.2514872550964355, -3.891251564025879, -3.5310158729553223, -3.1707801818847656, -2.810544729232788, -2.4503090381622314, -2.090073347091675, -1.7298378944396973, -1.3696022033691406, -1.009366512298584, -0.6491308808326721, -0.28889524936676025, 0.07134032249450684, 0.4315760135650635, 0.7918117046356201, 1.1520471572875977, 1.5122828483581543, 1.872518539428711, 2.2327542304992676, 2.592989921569824, 2.9532253742218018, 3.3134610652923584, 3.673696756362915, 4.033932209014893, 4.394167900085449, 4.754403591156006]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 5.0, 3.0, 6.0, 8.0, 14.0, 17.0, 20.0, 31.0, 22.0, 28.0, 35.0, 35.0, 45.0, 44.0, 41.0, 43.0, 61.0, 62.0, 55.0, 45.0, 53.0, 37.0, 44.0, 34.0, 35.0, 28.0, 19.0, 32.0, 19.0, 11.0, 18.0, 7.0, 14.0, 8.0, 3.0, 5.0, 6.0, 1.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.3008971214294434, -3.185000419616699, -3.069103479385376, -2.953206777572632, -2.8373098373413086, -2.7214131355285645, -2.6055164337158203, -2.489619493484497, -2.373722791671753, -2.257826089859009, -2.1419291496276855, -2.0260324478149414, -1.9101356267929077, -1.794238805770874, -1.6783419847488403, -1.5624451637268066, -1.446548342704773, -1.3306515216827393, -1.2147547006607056, -1.0988578796386719, -0.9829611778259277, -0.867064356803894, -0.7511675357818604, -0.6352707743644714, -0.5193739533424377, -0.40347716212272644, -0.28758037090301514, -0.17168354988098145, -0.05578675866127014, 0.06011003255844116, 0.17600685358047485, 0.29190361499786377, 0.40780043601989746, 0.5236972570419312, 0.6395940184593201, 0.7554908394813538, 0.8713876008987427, 0.9872844219207764, 1.10318124294281, 1.2190780639648438, 1.334974765777588, 1.4508715867996216, 1.5667684078216553, 1.6826651096343994, 1.798561930656433, 1.9144587516784668, 2.030355453491211, 2.146252393722534, 2.2621493339538574, 2.3780460357666016, 2.493942975997925, 2.609839677810669, 2.725736618041992, 2.8416333198547363, 2.9575300216674805, 3.0734269618988037, 3.189323663711548, 3.305220365524292, 3.4211173057556152, 3.5370140075683594, 3.6529109477996826, 3.7688076496124268, 3.88470458984375, 4.000601291656494, 4.116497993469238]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 8.0, 6.0, 6.0, 5.0, 9.0, 10.0, 20.0, 22.0, 48.0, 48.0, 90.0, 126.0, 229.0, 532.0, 1556.0, 7108.0, 85756.0, 4061183.0, 31634.0, 4122.0, 1039.0, 381.0, 174.0, 86.0, 37.0, 23.0, 12.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1650390625, -1.1381607055664062, -1.1112823486328125, -1.0844039916992188, -1.057525634765625, -1.0306472778320312, -1.0037689208984375, -0.9768905639648438, -0.95001220703125, -0.9231338500976562, -0.8962554931640625, -0.8693771362304688, -0.842498779296875, -0.8156204223632812, -0.7887420654296875, -0.7618637084960938, -0.7349853515625, -0.7081069946289062, -0.6812286376953125, -0.6543502807617188, -0.627471923828125, -0.6005935668945312, -0.5737152099609375, -0.5468368530273438, -0.51995849609375, -0.49308013916015625, -0.4662017822265625, -0.43932342529296875, -0.412445068359375, -0.38556671142578125, -0.3586883544921875, -0.33180999755859375, -0.304931640625, -0.27805328369140625, -0.2511749267578125, -0.22429656982421875, -0.197418212890625, -0.17053985595703125, -0.1436614990234375, -0.11678314208984375, -0.08990478515625, -0.06302642822265625, -0.0361480712890625, -0.00926971435546875, 0.017608642578125, 0.04448699951171875, 0.0713653564453125, 0.09824371337890625, 0.1251220703125, 0.15200042724609375, 0.1788787841796875, 0.20575714111328125, 0.232635498046875, 0.25951385498046875, 0.2863922119140625, 0.31327056884765625, 0.34014892578125, 0.36702728271484375, 0.3939056396484375, 0.42078399658203125, 0.447662353515625, 0.47454071044921875, 0.5014190673828125, 0.5282974243164062, 0.55517578125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 8.0, 8.0, 20.0, 22.0, 62.0, 86.0, 127.0, 135.0, 150.0, 135.0, 94.0, 66.0, 44.0, 22.0, 10.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.44287109375, -0.4326190948486328, -0.4223670959472656, -0.41211509704589844, -0.40186309814453125, -0.39161109924316406, -0.3813591003417969, -0.3711071014404297, -0.3608551025390625, -0.3506031036376953, -0.3403511047363281, -0.33009910583496094, -0.31984710693359375, -0.30959510803222656, -0.2993431091308594, -0.2890911102294922, -0.278839111328125, -0.2685871124267578, -0.2583351135253906, -0.24808311462402344, -0.23783111572265625, -0.22757911682128906, -0.21732711791992188, -0.2070751190185547, -0.1968231201171875, -0.1865711212158203, -0.17631912231445312, -0.16606712341308594, -0.15581512451171875, -0.14556312561035156, -0.13531112670898438, -0.1250591278076172, -0.11480712890625, -0.10455513000488281, -0.09430313110351562, -0.08405113220214844, -0.07379913330078125, -0.06354713439941406, -0.053295135498046875, -0.04304313659667969, -0.0327911376953125, -0.022539138793945312, -0.012287139892578125, -0.0020351409912109375, 0.00821685791015625, 0.018468856811523438, 0.028720855712890625, 0.03897285461425781, 0.049224853515625, 0.05947685241699219, 0.06972885131835938, 0.07998085021972656, 0.09023284912109375, 0.10048484802246094, 0.11073684692382812, 0.12098884582519531, 0.1312408447265625, 0.1414928436279297, 0.15174484252929688, 0.16199684143066406, 0.17224884033203125, 0.18250083923339844, 0.19275283813476562, 0.2030048370361328, 0.2132568359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 13.0, 13.0, 23.0, 49.0, 50.0, 95.0, 172.0, 341.0, 1213.0, 8291.0, 3182287.0, 992718.0, 7116.0, 1139.0, 347.0, 155.0, 96.0, 58.0, 49.0, 26.0, 15.0, 10.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.85986328125, -0.8311691284179688, -0.8024749755859375, -0.7737808227539062, -0.745086669921875, -0.7163925170898438, -0.6876983642578125, -0.6590042114257812, -0.63031005859375, -0.6016159057617188, -0.5729217529296875, -0.5442276000976562, -0.515533447265625, -0.48683929443359375, -0.4581451416015625, -0.42945098876953125, -0.4007568359375, -0.37206268310546875, -0.3433685302734375, -0.31467437744140625, -0.285980224609375, -0.25728607177734375, -0.2285919189453125, -0.19989776611328125, -0.17120361328125, -0.14250946044921875, -0.1138153076171875, -0.08512115478515625, -0.056427001953125, -0.02773284912109375, 0.0009613037109375, 0.02965545654296875, 0.058349609375, 0.08704376220703125, 0.1157379150390625, 0.14443206787109375, 0.173126220703125, 0.20182037353515625, 0.2305145263671875, 0.25920867919921875, 0.28790283203125, 0.31659698486328125, 0.3452911376953125, 0.37398529052734375, 0.402679443359375, 0.43137359619140625, 0.4600677490234375, 0.48876190185546875, 0.5174560546875, 0.5461502075195312, 0.5748443603515625, 0.6035385131835938, 0.632232666015625, 0.6609268188476562, 0.6896209716796875, 0.7183151245117188, 0.74700927734375, 0.7757034301757812, 0.8043975830078125, 0.8330917358398438, 0.861785888671875, 0.8904800415039062, 0.9191741943359375, 0.9478683471679688, 0.9765625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 10.0, 26.0, 62.0, 168.0, 1703.0, 1846.0, 159.0, 46.0, 21.0, 8.0, 9.0, 10.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3564453125, -0.34494781494140625, -0.3334503173828125, -0.32195281982421875, -0.310455322265625, -0.29895782470703125, -0.2874603271484375, -0.27596282958984375, -0.26446533203125, -0.25296783447265625, -0.2414703369140625, -0.22997283935546875, -0.218475341796875, -0.20697784423828125, -0.1954803466796875, -0.18398284912109375, -0.1724853515625, -0.16098785400390625, -0.1494903564453125, -0.13799285888671875, -0.126495361328125, -0.11499786376953125, -0.1035003662109375, -0.09200286865234375, -0.08050537109375, -0.06900787353515625, -0.0575103759765625, -0.04601287841796875, -0.034515380859375, -0.02301788330078125, -0.0115203857421875, -2.288818359375e-05, 0.011474609375, 0.02297210693359375, 0.0344696044921875, 0.04596710205078125, 0.057464599609375, 0.06896209716796875, 0.0804595947265625, 0.09195709228515625, 0.10345458984375, 0.11495208740234375, 0.1264495849609375, 0.13794708251953125, 0.149444580078125, 0.16094207763671875, 0.1724395751953125, 0.18393707275390625, 0.1954345703125, 0.20693206787109375, 0.2184295654296875, 0.22992706298828125, 0.241424560546875, 0.25292205810546875, 0.2644195556640625, 0.27591705322265625, 0.28741455078125, 0.29891204833984375, 0.3104095458984375, 0.32190704345703125, 0.333404541015625, 0.34490203857421875, 0.3563995361328125, 0.36789703369140625, 0.37939453125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 13.0, 30.0, 69.0, 220.0, 329.0, 211.0, 93.0, 26.0, 11.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5919851064682007, -0.5536344051361084, -0.5152837038040161, -0.47693297266960144, -0.43858227133750916, -0.40023157000541687, -0.3618808388710022, -0.3235301375389099, -0.2851794362068176, -0.24682873487472534, -0.20847801864147186, -0.17012730240821838, -0.1317766010761261, -0.09342589974403381, -0.055075183510780334, -0.016724467277526855, 0.02162623405456543, 0.05997694283723831, 0.0983276516199112, 0.13667836785316467, 0.17502906918525696, 0.21337977051734924, 0.2517305016517639, 0.2900812029838562, 0.3284319043159485, 0.36678260564804077, 0.40513330698013306, 0.44348403811454773, 0.48183473944664, 0.5201854705810547, 0.558536171913147, 0.5968868732452393, 0.6352376937866211, 0.6735883951187134, 0.7119390964508057, 0.750289797782898, 0.7886404991149902, 0.8269912004470825, 0.8653419613838196, 0.9036926627159119, 0.9420433640480042, 0.9803940653800964, 1.0187448263168335, 1.0570955276489258, 1.095446228981018, 1.1337969303131104, 1.1721476316452026, 1.210498332977295, 1.2488490343093872, 1.2871997356414795, 1.3255504369735718, 1.363901138305664, 1.4022518396377563, 1.4406025409698486, 1.478953242301941, 1.5173039436340332, 1.555654764175415, 1.5940054655075073, 1.6323561668395996, 1.670706868171692, 1.7090575695037842, 1.7474082708358765, 1.7857589721679688, 1.8241097927093506, 1.8624603748321533]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 9.0, 8.0, 10.0, 13.0, 12.0, 17.0, 31.0, 33.0, 24.0, 29.0, 30.0, 48.0, 49.0, 48.0, 55.0, 53.0, 56.0, 52.0, 56.0, 39.0, 39.0, 47.0, 36.0, 37.0, 25.0, 31.0, 21.0, 21.0, 12.0, 15.0, 11.0, 9.0, 7.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.5508478879928589, -0.5347390174865723, -0.5186301469802856, -0.5025213360786438, -0.4864124655723572, -0.47030359506607056, -0.45419472455978394, -0.4380858540534973, -0.4219770133495331, -0.40586814284324646, -0.3897593021392822, -0.3736504316329956, -0.357541561126709, -0.34143272042274475, -0.32532384991645813, -0.3092150092124939, -0.2931061387062073, -0.27699726819992065, -0.2608884274959564, -0.2447795569896698, -0.22867070138454437, -0.21256184577941895, -0.19645297527313232, -0.1803441196680069, -0.16423526406288147, -0.14812640845775604, -0.13201755285263062, -0.115908682346344, -0.09979982674121857, -0.08369097113609314, -0.06758210808038712, -0.05147324502468109, -0.03536444902420044, -0.019255589693784714, -0.003146730363368988, 0.012962128967046738, 0.029070988297462463, 0.04517984390258789, 0.061288706958293915, 0.07739757001399994, 0.09350642561912537, 0.1096152812242508, 0.12572413682937622, 0.14183300733566284, 0.15794186294078827, 0.1740507185459137, 0.19015958905220032, 0.20626844465732574, 0.22237730026245117, 0.2384861558675766, 0.254595011472702, 0.27070388197898865, 0.2868127226829529, 0.3029215931892395, 0.3190304636955261, 0.33513933420181274, 0.351248174905777, 0.3673570454120636, 0.38346588611602783, 0.39957475662231445, 0.4156836271286011, 0.4317924678325653, 0.44790133833885193, 0.46401017904281616, 0.4801190495491028]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 7.0, 10.0, 14.0, 19.0, 24.0, 28.0, 44.0, 64.0, 80.0, 133.0, 221.0, 378.0, 637.0, 1379.0, 3561.0, 13057.0, 85896.0, 713149.0, 197725.0, 22982.0, 5151.0, 1924.0, 837.0, 468.0, 256.0, 147.0, 111.0, 55.0, 45.0, 30.0, 24.0, 17.0, 10.0, 19.0, 8.0, 9.0, 8.0, 3.0, 8.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.6181640625, -0.5966033935546875, -0.575042724609375, -0.5534820556640625, -0.53192138671875, -0.5103607177734375, -0.488800048828125, -0.4672393798828125, -0.4456787109375, -0.4241180419921875, -0.402557373046875, -0.3809967041015625, -0.35943603515625, -0.3378753662109375, -0.316314697265625, -0.2947540283203125, -0.273193359375, -0.2516326904296875, -0.230072021484375, -0.2085113525390625, -0.18695068359375, -0.1653900146484375, -0.143829345703125, -0.1222686767578125, -0.1007080078125, -0.0791473388671875, -0.057586669921875, -0.0360260009765625, -0.01446533203125, 0.0070953369140625, 0.028656005859375, 0.0502166748046875, 0.07177734375, 0.0933380126953125, 0.114898681640625, 0.1364593505859375, 0.15802001953125, 0.1795806884765625, 0.201141357421875, 0.2227020263671875, 0.2442626953125, 0.2658233642578125, 0.287384033203125, 0.3089447021484375, 0.33050537109375, 0.3520660400390625, 0.373626708984375, 0.3951873779296875, 0.416748046875, 0.4383087158203125, 0.459869384765625, 0.4814300537109375, 0.50299072265625, 0.5245513916015625, 0.546112060546875, 0.5676727294921875, 0.5892333984375, 0.6107940673828125, 0.632354736328125, 0.6539154052734375, 0.67547607421875, 0.6970367431640625, 0.718597412109375, 0.7401580810546875, 0.76171875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 9.0, 8.0, 17.0, 29.0, 53.0, 91.0, 121.0, 142.0, 162.0, 121.0, 91.0, 75.0, 44.0, 16.0, 12.0, 5.0, 1.0, 4.0, 0.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.43896484375, -0.4287891387939453, -0.4186134338378906, -0.40843772888183594, -0.39826202392578125, -0.38808631896972656, -0.3779106140136719, -0.3677349090576172, -0.3575592041015625, -0.3473834991455078, -0.3372077941894531, -0.32703208923339844, -0.31685638427734375, -0.30668067932128906, -0.2965049743652344, -0.2863292694091797, -0.276153564453125, -0.2659778594970703, -0.2558021545410156, -0.24562644958496094, -0.23545074462890625, -0.22527503967285156, -0.21509933471679688, -0.2049236297607422, -0.1947479248046875, -0.1845722198486328, -0.17439651489257812, -0.16422080993652344, -0.15404510498046875, -0.14386940002441406, -0.13369369506835938, -0.12351799011230469, -0.11334228515625, -0.10316658020019531, -0.09299087524414062, -0.08281517028808594, -0.07263946533203125, -0.06246376037597656, -0.052288055419921875, -0.04211235046386719, -0.0319366455078125, -0.021760940551757812, -0.011585235595703125, -0.0014095306396484375, 0.00876617431640625, 0.018941879272460938, 0.029117584228515625, 0.03929328918457031, 0.049468994140625, 0.05964469909667969, 0.06982040405273438, 0.07999610900878906, 0.09017181396484375, 0.10034751892089844, 0.11052322387695312, 0.12069892883300781, 0.1308746337890625, 0.1410503387451172, 0.15122604370117188, 0.16140174865722656, 0.17157745361328125, 0.18175315856933594, 0.19192886352539062, 0.2021045684814453, 0.2122802734375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 8.0, 12.0, 13.0, 14.0, 20.0, 35.0, 46.0, 67.0, 77.0, 158.0, 240.0, 627.0, 1622.0, 5380.0, 22451.0, 123334.0, 622244.0, 224585.0, 35806.0, 7890.0, 2211.0, 833.0, 326.0, 180.0, 110.0, 73.0, 38.0, 38.0, 31.0, 13.0, 16.0, 12.0, 7.0, 10.0, 4.0, 5.0, 7.0, 4.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.485595703125, -0.4697532653808594, -0.45391082763671875, -0.4380683898925781, -0.4222259521484375, -0.4063835144042969, -0.39054107666015625, -0.3746986389160156, -0.358856201171875, -0.3430137634277344, -0.32717132568359375, -0.3113288879394531, -0.2954864501953125, -0.2796440124511719, -0.26380157470703125, -0.24795913696289062, -0.23211669921875, -0.21627426147460938, -0.20043182373046875, -0.18458938598632812, -0.1687469482421875, -0.15290451049804688, -0.13706207275390625, -0.12121963500976562, -0.105377197265625, -0.08953475952148438, -0.07369232177734375, -0.057849884033203125, -0.0420074462890625, -0.026165008544921875, -0.01032257080078125, 0.005519866943359375, 0.0213623046875, 0.037204742431640625, 0.05304718017578125, 0.06888961791992188, 0.0847320556640625, 0.10057449340820312, 0.11641693115234375, 0.13225936889648438, 0.148101806640625, 0.16394424438476562, 0.17978668212890625, 0.19562911987304688, 0.2114715576171875, 0.22731399536132812, 0.24315643310546875, 0.2589988708496094, 0.27484130859375, 0.2906837463378906, 0.30652618408203125, 0.3223686218261719, 0.3382110595703125, 0.3540534973144531, 0.36989593505859375, 0.3857383728027344, 0.401580810546875, 0.4174232482910156, 0.43326568603515625, 0.4491081237792969, 0.4649505615234375, 0.4807929992675781, 0.49663543701171875, 0.5124778747558594, 0.5283203125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 2.0, 2.0, 8.0, 8.0, 7.0, 7.0, 16.0, 17.0, 19.0, 17.0, 18.0, 20.0, 24.0, 32.0, 29.0, 41.0, 38.0, 51.0, 36.0, 33.0, 57.0, 57.0, 50.0, 41.0, 41.0, 42.0, 45.0, 30.0, 29.0, 39.0, 14.0, 28.0, 19.0, 22.0, 14.0, 9.0, 10.0, 6.0, 5.0, 4.0, 6.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.61279296875, -0.5940399169921875, -0.575286865234375, -0.5565338134765625, -0.53778076171875, -0.5190277099609375, -0.500274658203125, -0.4815216064453125, -0.4627685546875, -0.4440155029296875, -0.425262451171875, -0.4065093994140625, -0.38775634765625, -0.3690032958984375, -0.350250244140625, -0.3314971923828125, -0.312744140625, -0.2939910888671875, -0.275238037109375, -0.2564849853515625, -0.23773193359375, -0.2189788818359375, -0.200225830078125, -0.1814727783203125, -0.1627197265625, -0.1439666748046875, -0.125213623046875, -0.1064605712890625, -0.08770751953125, -0.0689544677734375, -0.050201416015625, -0.0314483642578125, -0.0126953125, 0.0060577392578125, 0.024810791015625, 0.0435638427734375, 0.06231689453125, 0.0810699462890625, 0.099822998046875, 0.1185760498046875, 0.1373291015625, 0.1560821533203125, 0.174835205078125, 0.1935882568359375, 0.21234130859375, 0.2310943603515625, 0.249847412109375, 0.2686004638671875, 0.287353515625, 0.3061065673828125, 0.324859619140625, 0.3436126708984375, 0.36236572265625, 0.3811187744140625, 0.399871826171875, 0.4186248779296875, 0.4373779296875, 0.4561309814453125, 0.474884033203125, 0.4936370849609375, 0.51239013671875, 0.5311431884765625, 0.549896240234375, 0.5686492919921875, 0.58740234375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 7.0, 4.0, 14.0, 24.0, 43.0, 92.0, 199.0, 651.0, 3552.0, 274035.0, 762380.0, 6264.0, 836.0, 239.0, 83.0, 52.0, 24.0, 21.0, 14.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.6083984375, -0.5942840576171875, -0.580169677734375, -0.5660552978515625, -0.55194091796875, -0.5378265380859375, -0.523712158203125, -0.5095977783203125, -0.4954833984375, -0.4813690185546875, -0.467254638671875, -0.4531402587890625, -0.43902587890625, -0.4249114990234375, -0.410797119140625, -0.3966827392578125, -0.382568359375, -0.3684539794921875, -0.354339599609375, -0.3402252197265625, -0.32611083984375, -0.3119964599609375, -0.297882080078125, -0.2837677001953125, -0.2696533203125, -0.2555389404296875, -0.241424560546875, -0.2273101806640625, -0.21319580078125, -0.1990814208984375, -0.184967041015625, -0.1708526611328125, -0.15673828125, -0.1426239013671875, -0.128509521484375, -0.1143951416015625, -0.10028076171875, -0.0861663818359375, -0.072052001953125, -0.0579376220703125, -0.0438232421875, -0.0297088623046875, -0.015594482421875, -0.0014801025390625, 0.01263427734375, 0.0267486572265625, 0.040863037109375, 0.0549774169921875, 0.069091796875, 0.0832061767578125, 0.097320556640625, 0.1114349365234375, 0.12554931640625, 0.1396636962890625, 0.153778076171875, 0.1678924560546875, 0.1820068359375, 0.1961212158203125, 0.210235595703125, 0.2243499755859375, 0.23846435546875, 0.2525787353515625, 0.266693115234375, 0.2808074951171875, 0.294921875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 14.0, 6.0, 16.0, 11.0, 19.0, 13.0, 30.0, 45.0, 45.0, 74.0, 130.0, 159.0, 125.0, 94.0, 54.0, 50.0, 28.0, 24.0, 20.0, 17.0, 10.0, 11.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011873245239257812, -0.00011471286416053772, -0.00011069327592849731, -0.00010667368769645691, -0.0001026540994644165, -9.86345112323761e-05, -9.46149230003357e-05, -9.059533476829529e-05, -8.657574653625488e-05, -8.255615830421448e-05, -7.853657007217407e-05, -7.451698184013367e-05, -7.049739360809326e-05, -6.647780537605286e-05, -6.245821714401245e-05, -5.8438628911972046e-05, -5.441904067993164e-05, -5.0399452447891235e-05, -4.637986421585083e-05, -4.2360275983810425e-05, -3.834068775177002e-05, -3.4321099519729614e-05, -3.030151128768921e-05, -2.6281923055648804e-05, -2.22623348236084e-05, -1.8242746591567993e-05, -1.4223158359527588e-05, -1.0203570127487183e-05, -6.183981895446777e-06, -2.164393663406372e-06, 1.8551945686340332e-06, 5.8747828006744385e-06, 9.894371032714844e-06, 1.3913959264755249e-05, 1.7933547496795654e-05, 2.195313572883606e-05, 2.5972723960876465e-05, 2.999231219291687e-05, 3.4011900424957275e-05, 3.803148865699768e-05, 4.2051076889038086e-05, 4.607066512107849e-05, 5.0090253353118896e-05, 5.41098415851593e-05, 5.812942981719971e-05, 6.214901804924011e-05, 6.616860628128052e-05, 7.018819451332092e-05, 7.420778274536133e-05, 7.822737097740173e-05, 8.224695920944214e-05, 8.626654744148254e-05, 9.028613567352295e-05, 9.430572390556335e-05, 9.832531213760376e-05, 0.00010234490036964417, 0.00010636448860168457, 0.00011038407683372498, 0.00011440366506576538, 0.00011842325329780579, 0.0001224428415298462, 0.0001264624297618866, 0.000130482017993927, 0.0001345016062259674, 0.0001385211944580078]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 11.0, 8.0, 14.0, 21.0, 31.0, 50.0, 85.0, 160.0, 308.0, 701.0, 1682.0, 4857.0, 19537.0, 174539.0, 740900.0, 86712.0, 12749.0, 3648.0, 1332.0, 570.0, 279.0, 159.0, 66.0, 46.0, 41.0, 11.0, 7.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.229248046875, -0.2229442596435547, -0.21664047241210938, -0.21033668518066406, -0.20403289794921875, -0.19772911071777344, -0.19142532348632812, -0.1851215362548828, -0.1788177490234375, -0.1725139617919922, -0.16621017456054688, -0.15990638732910156, -0.15360260009765625, -0.14729881286621094, -0.14099502563476562, -0.1346912384033203, -0.128387451171875, -0.12208366394042969, -0.11577987670898438, -0.10947608947753906, -0.10317230224609375, -0.09686851501464844, -0.09056472778320312, -0.08426094055175781, -0.0779571533203125, -0.07165336608886719, -0.06534957885742188, -0.05904579162597656, -0.05274200439453125, -0.04643821716308594, -0.040134429931640625, -0.03383064270019531, -0.02752685546875, -0.021223068237304688, -0.014919281005859375, -0.008615493774414062, -0.00231170654296875, 0.0039920806884765625, 0.010295867919921875, 0.016599655151367188, 0.0229034423828125, 0.029207229614257812, 0.035511016845703125, 0.04181480407714844, 0.04811859130859375, 0.05442237854003906, 0.060726165771484375, 0.06702995300292969, 0.073333740234375, 0.07963752746582031, 0.08594131469726562, 0.09224510192871094, 0.09854888916015625, 0.10485267639160156, 0.11115646362304688, 0.11746025085449219, 0.1237640380859375, 0.1300678253173828, 0.13637161254882812, 0.14267539978027344, 0.14897918701171875, 0.15528297424316406, 0.16158676147460938, 0.1678905487060547, 0.1741943359375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 2.0, 4.0, 6.0, 6.0, 6.0, 7.0, 8.0, 10.0, 11.0, 18.0, 34.0, 32.0, 33.0, 54.0, 84.0, 98.0, 140.0, 117.0, 88.0, 64.0, 45.0, 34.0, 26.0, 16.0, 7.0, 12.0, 8.0, 9.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24560546875, -0.23865509033203125, -0.2317047119140625, -0.22475433349609375, -0.217803955078125, -0.21085357666015625, -0.2039031982421875, -0.19695281982421875, -0.19000244140625, -0.18305206298828125, -0.1761016845703125, -0.16915130615234375, -0.162200927734375, -0.15525054931640625, -0.1483001708984375, -0.14134979248046875, -0.1343994140625, -0.12744903564453125, -0.1204986572265625, -0.11354827880859375, -0.106597900390625, -0.09964752197265625, -0.0926971435546875, -0.08574676513671875, -0.07879638671875, -0.07184600830078125, -0.0648956298828125, -0.05794525146484375, -0.050994873046875, -0.04404449462890625, -0.0370941162109375, -0.03014373779296875, -0.023193359375, -0.01624298095703125, -0.0092926025390625, -0.00234222412109375, 0.004608154296875, 0.01155853271484375, 0.0185089111328125, 0.02545928955078125, 0.03240966796875, 0.03936004638671875, 0.0463104248046875, 0.05326080322265625, 0.060211181640625, 0.06716156005859375, 0.0741119384765625, 0.08106231689453125, 0.0880126953125, 0.09496307373046875, 0.1019134521484375, 0.10886383056640625, 0.115814208984375, 0.12276458740234375, 0.1297149658203125, 0.13666534423828125, 0.14361572265625, 0.15056610107421875, 0.1575164794921875, 0.16446685791015625, 0.171417236328125, 0.17836761474609375, 0.1853179931640625, 0.19226837158203125, 0.19921875]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 16.0, 91.0, 629.0, 238.0, 25.0, 8.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.62953758239746, -16.200651168823242, -15.771766662597656, -15.342881202697754, -14.913995742797852, -14.48511028289795, -14.056224822998047, -13.627338409423828, -13.198453903198242, -12.76956844329834, -12.340682983398438, -11.911797523498535, -11.482912063598633, -11.05402660369873, -10.625141143798828, -10.19625473022461, -9.767369270324707, -9.338483810424805, -8.909598350524902, -8.480712890625, -8.051827430725098, -7.622941970825195, -7.194056034088135, -6.765170574188232, -6.33628511428833, -5.907399654388428, -5.478514194488525, -5.049628257751465, -4.6207427978515625, -4.19185733795166, -3.762971878051758, -3.3340864181518555, -2.905200958251953, -2.476315498352051, -2.0474300384521484, -1.618544340133667, -1.1896588802337646, -0.7607734203338623, -0.33188772201538086, 0.09699773788452148, 0.5258831977844238, 0.954768717288971, 1.383654236793518, 1.81253981590271, 2.2414252758026123, 2.6703107357025146, 3.099196434020996, 3.5280818939208984, 3.956967353820801, 4.385852813720703, 4.8147382736206055, 5.243623733520508, 5.67250919342041, 6.1013946533203125, 6.530280590057373, 6.959166049957275, 7.388051509857178, 7.81693696975708, 8.24582290649414, 8.674708366394043, 9.103593826293945, 9.532479286193848, 9.96136474609375, 10.390250205993652, 10.819135665893555]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 5.0, 8.0, 8.0, 13.0, 14.0, 24.0, 22.0, 17.0, 31.0, 30.0, 40.0, 34.0, 43.0, 31.0, 33.0, 43.0, 42.0, 54.0, 49.0, 46.0, 45.0, 40.0, 39.0, 41.0, 28.0, 37.0, 26.0, 19.0, 20.0, 16.0, 19.0, 15.0, 16.0, 9.0, 7.0, 11.0, 9.0, 4.0, 1.0, 1.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-3.628267765045166, -3.510695219039917, -3.393122911453247, -3.275550365447998, -3.157977819442749, -3.040405511856079, -2.92283296585083, -2.80526065826416, -2.687688112258911, -2.570115566253662, -2.452543258666992, -2.334970712661743, -2.217398166656494, -2.099825859069824, -1.9822533130645752, -1.8646808862686157, -1.7471083402633667, -1.6295359134674072, -1.5119633674621582, -1.3943909406661987, -1.2768185138702393, -1.1592459678649902, -1.0416735410690308, -0.9241011142730713, -0.806528627872467, -0.6889561414718628, -0.5713837146759033, -0.4538112282752991, -0.3362387716770172, -0.21866631507873535, -0.1010938286781311, 0.01647859811782837, 0.13405108451843262, 0.2516235411167145, 0.36919599771499634, 0.4867684841156006, 0.6043409109115601, 0.7219133973121643, 0.8394858837127686, 0.957058310508728, 1.0746307373046875, 1.192203164100647, 1.309775710105896, 1.4273481369018555, 1.544920563697815, 1.6624929904937744, 1.7800655364990234, 1.897637963294983, 2.0152106285095215, 2.1327831745147705, 2.2503554821014404, 2.3679280281066895, 2.4855005741119385, 2.6030728816986084, 2.7206454277038574, 2.8382177352905273, 2.9557902812957764, 3.0733628273010254, 3.1909351348876953, 3.3085076808929443, 3.4260802268981934, 3.5436525344848633, 3.6612250804901123, 3.7787976264953613, 3.8963699340820312]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 10.0, 10.0, 5.0, 16.0, 13.0, 16.0, 26.0, 66.0, 87.0, 173.0, 372.0, 961.0, 3308.0, 21744.0, 4039167.0, 118907.0, 6860.0, 1559.0, 522.0, 226.0, 93.0, 65.0, 24.0, 20.0, 11.0, 5.0, 5.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2353515625, -1.2042617797851562, -1.1731719970703125, -1.1420822143554688, -1.110992431640625, -1.0799026489257812, -1.0488128662109375, -1.0177230834960938, -0.98663330078125, -0.9555435180664062, -0.9244537353515625, -0.8933639526367188, -0.862274169921875, -0.8311843872070312, -0.8000946044921875, -0.7690048217773438, -0.7379150390625, -0.7068252563476562, -0.6757354736328125, -0.6446456909179688, -0.613555908203125, -0.5824661254882812, -0.5513763427734375, -0.5202865600585938, -0.48919677734375, -0.45810699462890625, -0.4270172119140625, -0.39592742919921875, -0.364837646484375, -0.33374786376953125, -0.3026580810546875, -0.27156829833984375, -0.240478515625, -0.20938873291015625, -0.1782989501953125, -0.14720916748046875, -0.116119384765625, -0.08502960205078125, -0.0539398193359375, -0.02285003662109375, 0.00823974609375, 0.03932952880859375, 0.0704193115234375, 0.10150909423828125, 0.132598876953125, 0.16368865966796875, 0.1947784423828125, 0.22586822509765625, 0.2569580078125, 0.28804779052734375, 0.3191375732421875, 0.35022735595703125, 0.381317138671875, 0.41240692138671875, 0.4434967041015625, 0.47458648681640625, 0.50567626953125, 0.5367660522460938, 0.5678558349609375, 0.5989456176757812, 0.630035400390625, 0.6611251831054688, 0.6922149658203125, 0.7233047485351562, 0.75439453125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 18.0, 23.0, 33.0, 88.0, 91.0, 107.0, 146.0, 136.0, 113.0, 76.0, 68.0, 34.0, 22.0, 16.0, 10.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.44091796875, -0.4303779602050781, -0.41983795166015625, -0.4092979431152344, -0.3987579345703125, -0.3882179260253906, -0.37767791748046875, -0.3671379089355469, -0.356597900390625, -0.3460578918457031, -0.33551788330078125, -0.3249778747558594, -0.3144378662109375, -0.3038978576660156, -0.29335784912109375, -0.2828178405761719, -0.27227783203125, -0.2617378234863281, -0.25119781494140625, -0.24065780639648438, -0.2301177978515625, -0.21957778930664062, -0.20903778076171875, -0.19849777221679688, -0.187957763671875, -0.17741775512695312, -0.16687774658203125, -0.15633773803710938, -0.1457977294921875, -0.13525772094726562, -0.12471771240234375, -0.11417770385742188, -0.1036376953125, -0.09309768676757812, -0.08255767822265625, -0.07201766967773438, -0.0614776611328125, -0.050937652587890625, -0.04039764404296875, -0.029857635498046875, -0.019317626953125, -0.008777618408203125, 0.00176239013671875, 0.012302398681640625, 0.0228424072265625, 0.033382415771484375, 0.04392242431640625, 0.054462432861328125, 0.06500244140625, 0.07554244995117188, 0.08608245849609375, 0.09662246704101562, 0.1071624755859375, 0.11770248413085938, 0.12824249267578125, 0.13878250122070312, 0.149322509765625, 0.15986251831054688, 0.17040252685546875, 0.18094253540039062, 0.1914825439453125, 0.20202255249023438, 0.21256256103515625, 0.22310256958007812, 0.233642578125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 10.0, 10.0, 13.0, 36.0, 53.0, 78.0, 151.0, 349.0, 853.0, 3041.0, 18248.0, 1226087.0, 2918267.0, 21811.0, 3532.0, 993.0, 379.0, 170.0, 70.0, 50.0, 29.0, 20.0, 13.0, 4.0, 2.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55224609375, -0.5325469970703125, -0.512847900390625, -0.4931488037109375, -0.47344970703125, -0.4537506103515625, -0.434051513671875, -0.4143524169921875, -0.3946533203125, -0.3749542236328125, -0.355255126953125, -0.3355560302734375, -0.31585693359375, -0.2961578369140625, -0.276458740234375, -0.2567596435546875, -0.237060546875, -0.2173614501953125, -0.197662353515625, -0.1779632568359375, -0.15826416015625, -0.1385650634765625, -0.118865966796875, -0.0991668701171875, -0.0794677734375, -0.0597686767578125, -0.040069580078125, -0.0203704833984375, -0.00067138671875, 0.0190277099609375, 0.038726806640625, 0.0584259033203125, 0.078125, 0.0978240966796875, 0.117523193359375, 0.1372222900390625, 0.15692138671875, 0.1766204833984375, 0.196319580078125, 0.2160186767578125, 0.2357177734375, 0.2554168701171875, 0.275115966796875, 0.2948150634765625, 0.31451416015625, 0.3342132568359375, 0.353912353515625, 0.3736114501953125, 0.393310546875, 0.4130096435546875, 0.432708740234375, 0.4524078369140625, 0.47210693359375, 0.4918060302734375, 0.511505126953125, 0.5312042236328125, 0.5509033203125, 0.5706024169921875, 0.590301513671875, 0.6100006103515625, 0.62969970703125, 0.6493988037109375, 0.669097900390625, 0.6887969970703125, 0.70849609375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 10.0, 10.0, 14.0, 28.0, 47.0, 97.0, 333.0, 2204.0, 965.0, 173.0, 71.0, 30.0, 27.0, 19.0, 12.0, 10.0, 9.0, 1.0, 3.0, 5.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.355224609375, -0.3465156555175781, -0.33780670166015625, -0.3290977478027344, -0.3203887939453125, -0.3116798400878906, -0.30297088623046875, -0.2942619323730469, -0.285552978515625, -0.2768440246582031, -0.26813507080078125, -0.2594261169433594, -0.2507171630859375, -0.24200820922851562, -0.23329925537109375, -0.22459030151367188, -0.21588134765625, -0.20717239379882812, -0.19846343994140625, -0.18975448608398438, -0.1810455322265625, -0.17233657836914062, -0.16362762451171875, -0.15491867065429688, -0.146209716796875, -0.13750076293945312, -0.12879180908203125, -0.12008285522460938, -0.1113739013671875, -0.10266494750976562, -0.09395599365234375, -0.08524703979492188, -0.0765380859375, -0.06782913208007812, -0.05912017822265625, -0.050411224365234375, -0.0417022705078125, -0.032993316650390625, -0.02428436279296875, -0.015575408935546875, -0.006866455078125, 0.001842498779296875, 0.01055145263671875, 0.019260406494140625, 0.0279693603515625, 0.036678314208984375, 0.04538726806640625, 0.054096221923828125, 0.06280517578125, 0.07151412963867188, 0.08022308349609375, 0.08893203735351562, 0.0976409912109375, 0.10634994506835938, 0.11505889892578125, 0.12376785278320312, 0.132476806640625, 0.14118576049804688, 0.14989471435546875, 0.15860366821289062, 0.1673126220703125, 0.17602157592773438, 0.18473052978515625, 0.19343948364257812, 0.2021484375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 14.0, 181.0, 740.0, 71.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3326778411865234, -1.1888482570648193, -1.0450186729431152, -0.9011891484260559, -0.7573595643043518, -0.6135299801826477, -0.4697004556655884, -0.3258708715438843, -0.18204128742218018, -0.03821171820163727, 0.10561785101890564, 0.24944740533828735, 0.39327698945999146, 0.5371065735816956, 0.6809360980987549, 0.824765682220459, 0.9685952663421631, 1.1124248504638672, 1.2562544345855713, 1.4000840187072754, 1.5439136028289795, 1.6877431869506836, 1.8315726518630981, 1.9754022359848022, 2.119231700897217, 2.263061285018921, 2.406890869140625, 2.550720453262329, 2.694550037384033, 2.8383796215057373, 2.9822092056274414, 3.1260385513305664, 3.2698683738708496, 3.4136979579925537, 3.557527542114258, 3.701357126235962, 3.845186710357666, 3.98901629447937, 4.132845878601074, 4.276675224304199, 4.420505046844482, 4.564334392547607, 4.708164215087891, 4.851993560791016, 4.995823383331299, 5.139652729034424, 5.283482551574707, 5.427311897277832, 5.571141242980957, 5.714970588684082, 5.858800411224365, 6.00262975692749, 6.146459579467773, 6.290288925170898, 6.434118747711182, 6.577948093414307, 6.72177791595459, 6.865607261657715, 7.009437084197998, 7.153266429901123, 7.297096252441406, 7.440925598144531, 7.5847554206848145, 7.7285847663879395, 7.872414588928223]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 8.0, 6.0, 5.0, 7.0, 11.0, 15.0, 18.0, 16.0, 22.0, 27.0, 25.0, 26.0, 23.0, 34.0, 39.0, 42.0, 30.0, 45.0, 40.0, 53.0, 48.0, 37.0, 43.0, 50.0, 37.0, 38.0, 33.0, 31.0, 34.0, 21.0, 17.0, 24.0, 12.0, 13.0, 12.0, 5.0, 9.0, 11.0, 6.0, 6.0, 3.0, 5.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.5325351357460022, -0.5153860449790955, -0.4982369542121887, -0.4810878336429596, -0.46393874287605286, -0.4467896521091461, -0.429640531539917, -0.41249144077301025, -0.3953423500061035, -0.3781932592391968, -0.36104416847229004, -0.3438950479030609, -0.3267459571361542, -0.30959686636924744, -0.2924477458000183, -0.2752986550331116, -0.25814956426620483, -0.2410004734992981, -0.22385136783123016, -0.20670226216316223, -0.1895531713962555, -0.17240408062934875, -0.15525497496128082, -0.1381058692932129, -0.12095677852630615, -0.10380768030881882, -0.08665858209133148, -0.06950948387384415, -0.05236038565635681, -0.035211287438869476, -0.01806218922138214, -0.0009130910038948059, 0.016236066818237305, 0.03338516503572464, 0.050534263253211975, 0.06768336147069931, 0.08483245968818665, 0.10198155790567398, 0.11913065612316132, 0.13627976179122925, 0.153428852558136, 0.17057794332504272, 0.18772704899311066, 0.2048761546611786, 0.22202524542808533, 0.23917433619499207, 0.2563234567642212, 0.27347254753112793, 0.29062163829803467, 0.3077707290649414, 0.32491981983184814, 0.34206894040107727, 0.359218031167984, 0.37636712193489075, 0.3935162425041199, 0.4106653332710266, 0.42781442403793335, 0.4449635148048401, 0.4621126055717468, 0.47926172614097595, 0.4964108169078827, 0.5135599374771118, 0.5307090282440186, 0.5478581190109253, 0.565007209777832]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 1.0, 4.0, 7.0, 8.0, 7.0, 9.0, 17.0, 19.0, 30.0, 55.0, 71.0, 132.0, 237.0, 546.0, 1332.0, 4437.0, 22834.0, 449134.0, 537478.0, 24790.0, 4776.0, 1405.0, 535.0, 281.0, 165.0, 87.0, 55.0, 37.0, 18.0, 15.0, 10.0, 6.0, 6.0, 4.0, 6.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7685546875, -0.7401123046875, -0.711669921875, -0.6832275390625, -0.65478515625, -0.6263427734375, -0.597900390625, -0.5694580078125, -0.541015625, -0.5125732421875, -0.484130859375, -0.4556884765625, -0.42724609375, -0.3988037109375, -0.370361328125, -0.3419189453125, -0.3134765625, -0.2850341796875, -0.256591796875, -0.2281494140625, -0.19970703125, -0.1712646484375, -0.142822265625, -0.1143798828125, -0.0859375, -0.0574951171875, -0.029052734375, -0.0006103515625, 0.02783203125, 0.0562744140625, 0.084716796875, 0.1131591796875, 0.1416015625, 0.1700439453125, 0.198486328125, 0.2269287109375, 0.25537109375, 0.2838134765625, 0.312255859375, 0.3406982421875, 0.369140625, 0.3975830078125, 0.426025390625, 0.4544677734375, 0.48291015625, 0.5113525390625, 0.539794921875, 0.5682373046875, 0.5966796875, 0.6251220703125, 0.653564453125, 0.6820068359375, 0.71044921875, 0.7388916015625, 0.767333984375, 0.7957763671875, 0.82421875, 0.8526611328125, 0.881103515625, 0.9095458984375, 0.93798828125, 0.9664306640625, 0.994873046875, 1.0233154296875, 1.0517578125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 10.0, 11.0, 13.0, 30.0, 44.0, 84.0, 93.0, 130.0, 143.0, 131.0, 102.0, 82.0, 55.0, 27.0, 22.0, 12.0, 8.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.43505859375, -0.42459869384765625, -0.4141387939453125, -0.40367889404296875, -0.393218994140625, -0.38275909423828125, -0.3722991943359375, -0.36183929443359375, -0.35137939453125, -0.34091949462890625, -0.3304595947265625, -0.31999969482421875, -0.309539794921875, -0.29907989501953125, -0.2886199951171875, -0.27816009521484375, -0.2677001953125, -0.25724029541015625, -0.2467803955078125, -0.23632049560546875, -0.225860595703125, -0.21540069580078125, -0.2049407958984375, -0.19448089599609375, -0.18402099609375, -0.17356109619140625, -0.1631011962890625, -0.15264129638671875, -0.142181396484375, -0.13172149658203125, -0.1212615966796875, -0.11080169677734375, -0.100341796875, -0.08988189697265625, -0.0794219970703125, -0.06896209716796875, -0.058502197265625, -0.04804229736328125, -0.0375823974609375, -0.02712249755859375, -0.01666259765625, -0.00620269775390625, 0.0042572021484375, 0.01471710205078125, 0.025177001953125, 0.03563690185546875, 0.0460968017578125, 0.05655670166015625, 0.0670166015625, 0.07747650146484375, 0.0879364013671875, 0.09839630126953125, 0.108856201171875, 0.11931610107421875, 0.1297760009765625, 0.14023590087890625, 0.15069580078125, 0.16115570068359375, 0.1716156005859375, 0.18207550048828125, 0.192535400390625, 0.20299530029296875, 0.2134552001953125, 0.22391510009765625, 0.234375]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 6.0, 8.0, 9.0, 13.0, 19.0, 22.0, 30.0, 38.0, 55.0, 61.0, 92.0, 148.0, 194.0, 324.0, 713.0, 1952.0, 6157.0, 24752.0, 144556.0, 710353.0, 127146.0, 22546.0, 5748.0, 1876.0, 683.0, 327.0, 189.0, 131.0, 93.0, 71.0, 43.0, 49.0, 33.0, 27.0, 17.0, 19.0, 9.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.484130859375, -0.4687461853027344, -0.45336151123046875, -0.4379768371582031, -0.4225921630859375, -0.4072074890136719, -0.39182281494140625, -0.3764381408691406, -0.361053466796875, -0.3456687927246094, -0.33028411865234375, -0.3148994445800781, -0.2995147705078125, -0.2841300964355469, -0.26874542236328125, -0.2533607482910156, -0.23797607421875, -0.22259140014648438, -0.20720672607421875, -0.19182205200195312, -0.1764373779296875, -0.16105270385742188, -0.14566802978515625, -0.13028335571289062, -0.114898681640625, -0.09951400756835938, -0.08412933349609375, -0.06874465942382812, -0.0533599853515625, -0.037975311279296875, -0.02259063720703125, -0.007205963134765625, 0.0081787109375, 0.023563385009765625, 0.03894805908203125, 0.054332733154296875, 0.0697174072265625, 0.08510208129882812, 0.10048675537109375, 0.11587142944335938, 0.131256103515625, 0.14664077758789062, 0.16202545166015625, 0.17741012573242188, 0.1927947998046875, 0.20817947387695312, 0.22356414794921875, 0.23894882202148438, 0.25433349609375, 0.2697181701660156, 0.28510284423828125, 0.3004875183105469, 0.3158721923828125, 0.3312568664550781, 0.34664154052734375, 0.3620262145996094, 0.377410888671875, 0.3927955627441406, 0.40818023681640625, 0.4235649108886719, 0.4389495849609375, 0.4543342590332031, 0.46971893310546875, 0.4851036071777344, 0.50048828125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 0.0, 5.0, 1.0, 7.0, 7.0, 9.0, 9.0, 4.0, 6.0, 13.0, 12.0, 21.0, 24.0, 29.0, 22.0, 22.0, 27.0, 32.0, 25.0, 33.0, 40.0, 49.0, 36.0, 44.0, 39.0, 33.0, 37.0, 39.0, 34.0, 34.0, 31.0, 32.0, 23.0, 29.0, 31.0, 24.0, 15.0, 21.0, 20.0, 10.0, 15.0, 12.0, 8.0, 10.0, 9.0, 3.0, 10.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51611328125, -0.49988555908203125, -0.4836578369140625, -0.46743011474609375, -0.451202392578125, -0.43497467041015625, -0.4187469482421875, -0.40251922607421875, -0.38629150390625, -0.37006378173828125, -0.3538360595703125, -0.33760833740234375, -0.321380615234375, -0.30515289306640625, -0.2889251708984375, -0.27269744873046875, -0.2564697265625, -0.24024200439453125, -0.2240142822265625, -0.20778656005859375, -0.191558837890625, -0.17533111572265625, -0.1591033935546875, -0.14287567138671875, -0.12664794921875, -0.11042022705078125, -0.0941925048828125, -0.07796478271484375, -0.061737060546875, -0.04550933837890625, -0.0292816162109375, -0.01305389404296875, 0.003173828125, 0.01940155029296875, 0.0356292724609375, 0.05185699462890625, 0.068084716796875, 0.08431243896484375, 0.1005401611328125, 0.11676788330078125, 0.13299560546875, 0.14922332763671875, 0.1654510498046875, 0.18167877197265625, 0.197906494140625, 0.21413421630859375, 0.2303619384765625, 0.24658966064453125, 0.2628173828125, 0.27904510498046875, 0.2952728271484375, 0.31150054931640625, 0.327728271484375, 0.34395599365234375, 0.3601837158203125, 0.37641143798828125, 0.39263916015625, 0.40886688232421875, 0.4250946044921875, 0.44132232666015625, 0.457550048828125, 0.47377777099609375, 0.4900054931640625, 0.5062332153320312, 0.5224609375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 11.0, 34.0, 93.0, 302.0, 2304.0, 1037569.0, 7629.0, 408.0, 142.0, 42.0, 13.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95166015625, -0.9195327758789062, -0.8874053955078125, -0.8552780151367188, -0.823150634765625, -0.7910232543945312, -0.7588958740234375, -0.7267684936523438, -0.69464111328125, -0.6625137329101562, -0.6303863525390625, -0.5982589721679688, -0.566131591796875, -0.5340042114257812, -0.5018768310546875, -0.46974945068359375, -0.4376220703125, -0.40549468994140625, -0.3733673095703125, -0.34123992919921875, -0.309112548828125, -0.27698516845703125, -0.2448577880859375, -0.21273040771484375, -0.18060302734375, -0.14847564697265625, -0.1163482666015625, -0.08422088623046875, -0.052093505859375, -0.01996612548828125, 0.0121612548828125, 0.04428863525390625, 0.076416015625, 0.10854339599609375, 0.1406707763671875, 0.17279815673828125, 0.204925537109375, 0.23705291748046875, 0.2691802978515625, 0.30130767822265625, 0.33343505859375, 0.36556243896484375, 0.3976898193359375, 0.42981719970703125, 0.461944580078125, 0.49407196044921875, 0.5261993408203125, 0.5583267211914062, 0.5904541015625, 0.6225814819335938, 0.6547088623046875, 0.6868362426757812, 0.718963623046875, 0.7510910034179688, 0.7832183837890625, 0.8153457641601562, 0.84747314453125, 0.8796005249023438, 0.9117279052734375, 0.9438552856445312, 0.975982666015625, 1.0081100463867188, 1.0402374267578125, 1.0723648071289062, 1.1044921875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 3.0, 8.0, 12.0, 16.0, 34.0, 36.0, 55.0, 102.0, 155.0, 182.0, 135.0, 92.0, 65.0, 32.0, 26.0, 13.0, 14.0, 4.0, 10.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.669759750366211e-05, -6.285030394792557e-05, -5.9003010392189026e-05, -5.5155716836452484e-05, -5.130842328071594e-05, -4.74611297249794e-05, -4.361383616924286e-05, -3.976654261350632e-05, -3.5919249057769775e-05, -3.2071955502033234e-05, -2.8224661946296692e-05, -2.437736839056015e-05, -2.053007483482361e-05, -1.6682781279087067e-05, -1.2835487723350525e-05, -8.988194167613983e-06, -5.140900611877441e-06, -1.2936070561408997e-06, 2.553686499595642e-06, 6.400980055332184e-06, 1.0248273611068726e-05, 1.4095567166805267e-05, 1.794286072254181e-05, 2.179015427827835e-05, 2.5637447834014893e-05, 2.9484741389751434e-05, 3.3332034945487976e-05, 3.717932850122452e-05, 4.102662205696106e-05, 4.48739156126976e-05, 4.872120916843414e-05, 5.2568502724170685e-05, 5.6415796279907227e-05, 6.026308983564377e-05, 6.411038339138031e-05, 6.795767694711685e-05, 7.18049705028534e-05, 7.565226405858994e-05, 7.949955761432648e-05, 8.334685117006302e-05, 8.719414472579956e-05, 9.10414382815361e-05, 9.488873183727264e-05, 9.873602539300919e-05, 0.00010258331894874573, 0.00010643061250448227, 0.00011027790606021881, 0.00011412519961595535, 0.0001179724931716919, 0.00012181978672742844, 0.00012566708028316498, 0.00012951437383890152, 0.00013336166739463806, 0.0001372089609503746, 0.00014105625450611115, 0.0001449035480618477, 0.00014875084161758423, 0.00015259813517332077, 0.0001564454287290573, 0.00016029272228479385, 0.0001641400158405304, 0.00016798730939626694, 0.00017183460295200348, 0.00017568189650774002, 0.00017952919006347656]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 6.0, 6.0, 16.0, 31.0, 77.0, 132.0, 317.0, 2208.0, 1029439.0, 15505.0, 467.0, 186.0, 88.0, 41.0, 22.0, 11.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.359375, -1.3282623291015625, -1.297149658203125, -1.2660369873046875, -1.23492431640625, -1.2038116455078125, -1.172698974609375, -1.1415863037109375, -1.1104736328125, -1.0793609619140625, -1.048248291015625, -1.0171356201171875, -0.98602294921875, -0.9549102783203125, -0.923797607421875, -0.8926849365234375, -0.861572265625, -0.8304595947265625, -0.799346923828125, -0.7682342529296875, -0.73712158203125, -0.7060089111328125, -0.674896240234375, -0.6437835693359375, -0.6126708984375, -0.5815582275390625, -0.550445556640625, -0.5193328857421875, -0.48822021484375, -0.4571075439453125, -0.425994873046875, -0.3948822021484375, -0.36376953125, -0.3326568603515625, -0.301544189453125, -0.2704315185546875, -0.23931884765625, -0.2082061767578125, -0.177093505859375, -0.1459808349609375, -0.1148681640625, -0.0837554931640625, -0.052642822265625, -0.0215301513671875, 0.00958251953125, 0.0406951904296875, 0.071807861328125, 0.1029205322265625, 0.134033203125, 0.1651458740234375, 0.196258544921875, 0.2273712158203125, 0.25848388671875, 0.2895965576171875, 0.320709228515625, 0.3518218994140625, 0.3829345703125, 0.4140472412109375, 0.445159912109375, 0.4762725830078125, 0.50738525390625, 0.5384979248046875, 0.569610595703125, 0.6007232666015625, 0.6318359375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 30.0, 96.0, 360.0, 385.0, 90.0, 25.0, 13.0, 4.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0751953125, -1.0502243041992188, -1.0252532958984375, -1.0002822875976562, -0.975311279296875, -0.9503402709960938, -0.9253692626953125, -0.9003982543945312, -0.87542724609375, -0.8504562377929688, -0.8254852294921875, -0.8005142211914062, -0.775543212890625, -0.7505722045898438, -0.7256011962890625, -0.7006301879882812, -0.6756591796875, -0.6506881713867188, -0.6257171630859375, -0.6007461547851562, -0.575775146484375, -0.5508041381835938, -0.5258331298828125, -0.5008621215820312, -0.47589111328125, -0.45092010498046875, -0.4259490966796875, -0.40097808837890625, -0.376007080078125, -0.35103607177734375, -0.3260650634765625, -0.30109405517578125, -0.276123046875, -0.25115203857421875, -0.2261810302734375, -0.20121002197265625, -0.176239013671875, -0.15126800537109375, -0.1262969970703125, -0.10132598876953125, -0.07635498046875, -0.05138397216796875, -0.0264129638671875, -0.00144195556640625, 0.023529052734375, 0.04850006103515625, 0.0734710693359375, 0.09844207763671875, 0.1234130859375, 0.14838409423828125, 0.1733551025390625, 0.19832611083984375, 0.223297119140625, 0.24826812744140625, 0.2732391357421875, 0.29821014404296875, 0.32318115234375, 0.34815216064453125, 0.3731231689453125, 0.39809417724609375, 0.423065185546875, 0.44803619384765625, 0.4730072021484375, 0.49797821044921875, 0.52294921875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 12.0, 310.0, 635.0, 48.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-29.883636474609375, -29.351224899291992, -28.81881332397461, -28.286401748657227, -27.753990173339844, -27.22157859802246, -26.689167022705078, -26.156755447387695, -25.624343872070312, -25.09193229675293, -24.559520721435547, -24.027109146118164, -23.49469757080078, -22.9622859954834, -22.429874420166016, -21.897462844848633, -21.36505126953125, -20.832639694213867, -20.300228118896484, -19.7678165435791, -19.23540496826172, -18.702993392944336, -18.170581817626953, -17.63817024230957, -17.105756759643555, -16.573345184326172, -16.04093360900879, -15.508522033691406, -14.976110458374023, -14.44369888305664, -13.911287307739258, -13.378875732421875, -12.846465110778809, -12.314053535461426, -11.781641960144043, -11.24923038482666, -10.716818809509277, -10.184407234191895, -9.651994705200195, -9.119583129882812, -8.58717155456543, -8.054759979248047, -7.522348403930664, -6.989936828613281, -6.457525253295898, -5.925113677978516, -5.392701625823975, -4.860290050506592, -4.327878952026367, -3.7954673767089844, -3.2630558013916016, -2.7306439876556396, -2.198232412338257, -1.665820837020874, -1.133409023284912, -0.6009974479675293, -0.06858587265014648, 0.4638257622718811, 0.9962373971939087, 1.528649091720581, 2.061060667037964, 2.5934722423553467, 3.1258840560913086, 3.6582956314086914, 4.190707206726074]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 5.0, 6.0, 9.0, 10.0, 11.0, 15.0, 16.0, 15.0, 24.0, 14.0, 27.0, 25.0, 28.0, 35.0, 47.0, 36.0, 48.0, 43.0, 37.0, 54.0, 42.0, 49.0, 33.0, 51.0, 47.0, 34.0, 27.0, 28.0, 23.0, 20.0, 18.0, 20.0, 21.0, 13.0, 10.0, 13.0, 6.0, 8.0, 3.0, 6.0, 6.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.8852200508117676, -2.792926788330078, -2.7006335258483887, -2.608340263366699, -2.5160470008850098, -2.4237537384033203, -2.331460475921631, -2.2391674518585205, -2.146874189376831, -2.0545809268951416, -1.9622876644134521, -1.8699944019317627, -1.7777012586593628, -1.6854079961776733, -1.5931147336959839, -1.500821590423584, -1.408528208732605, -1.3162349462509155, -1.223941683769226, -1.1316485404968262, -1.0393552780151367, -0.9470620155334473, -0.8547687530517578, -0.7624755501747131, -0.6701822876930237, -0.5778890252113342, -0.48559582233428955, -0.3933025598526001, -0.30100932717323303, -0.20871609449386597, -0.11642283201217651, -0.024129629135131836, 0.06816363334655762, 0.16045686602592468, 0.25275009870529175, 0.3450433611869812, 0.43733659386634827, 0.5296298265457153, 0.6219230890274048, 0.7142162919044495, 0.8065095543861389, 0.8988028168678284, 0.991096019744873, 1.0833892822265625, 1.175682544708252, 1.2679758071899414, 1.3602690696716309, 1.4525622129440308, 1.5448554754257202, 1.6371487379074097, 1.7294420003890991, 1.821735143661499, 1.9140284061431885, 2.006321668624878, 2.0986149311065674, 2.190908193588257, 2.2832014560699463, 2.3754947185516357, 2.467787981033325, 2.5600812435150146, 2.652374505996704, 2.7446675300598145, 2.836960792541504, 2.9292540550231934, 3.021547317504883]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 4.0, 5.0, 1.0, 6.0, 15.0, 11.0, 11.0, 11.0, 23.0, 30.0, 49.0, 77.0, 149.0, 292.0, 589.0, 1480.0, 4360.0, 18409.0, 2645010.0, 1499277.0, 18015.0, 4037.0, 1337.0, 533.0, 252.0, 114.0, 60.0, 35.0, 42.0, 19.0, 11.0, 11.0, 4.0, 2.0, 3.0, 2.0], "bins": [-1.0927734375, -1.06951904296875, -1.0462646484375, -1.02301025390625, -0.999755859375, -0.97650146484375, -0.9532470703125, -0.92999267578125, -0.90673828125, -0.88348388671875, -0.8602294921875, -0.83697509765625, -0.813720703125, -0.79046630859375, -0.7672119140625, -0.74395751953125, -0.720703125, -0.69744873046875, -0.6741943359375, -0.65093994140625, -0.627685546875, -0.60443115234375, -0.5811767578125, -0.55792236328125, -0.53466796875, -0.51141357421875, -0.4881591796875, -0.46490478515625, -0.441650390625, -0.41839599609375, -0.3951416015625, -0.37188720703125, -0.3486328125, -0.32537841796875, -0.3021240234375, -0.27886962890625, -0.255615234375, -0.23236083984375, -0.2091064453125, -0.18585205078125, -0.16259765625, -0.13934326171875, -0.1160888671875, -0.09283447265625, -0.069580078125, -0.04632568359375, -0.0230712890625, 0.00018310546875, 0.0234375, 0.04669189453125, 0.0699462890625, 0.09320068359375, 0.116455078125, 0.13970947265625, 0.1629638671875, 0.18621826171875, 0.20947265625, 0.23272705078125, 0.2559814453125, 0.27923583984375, 0.302490234375, 0.32574462890625, 0.3489990234375, 0.37225341796875, 0.3955078125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 10.0, 15.0, 13.0, 13.0, 45.0, 53.0, 76.0, 104.0, 130.0, 116.0, 124.0, 99.0, 71.0, 53.0, 34.0, 20.0, 11.0, 10.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.43212890625, -0.42168426513671875, -0.4112396240234375, -0.40079498291015625, -0.390350341796875, -0.37990570068359375, -0.3694610595703125, -0.35901641845703125, -0.34857177734375, -0.33812713623046875, -0.3276824951171875, -0.31723785400390625, -0.306793212890625, -0.29634857177734375, -0.2859039306640625, -0.27545928955078125, -0.2650146484375, -0.25457000732421875, -0.2441253662109375, -0.23368072509765625, -0.223236083984375, -0.21279144287109375, -0.2023468017578125, -0.19190216064453125, -0.18145751953125, -0.17101287841796875, -0.1605682373046875, -0.15012359619140625, -0.139678955078125, -0.12923431396484375, -0.1187896728515625, -0.10834503173828125, -0.097900390625, -0.08745574951171875, -0.0770111083984375, -0.06656646728515625, -0.056121826171875, -0.04567718505859375, -0.0352325439453125, -0.02478790283203125, -0.01434326171875, -0.00389862060546875, 0.0065460205078125, 0.01699066162109375, 0.027435302734375, 0.03787994384765625, 0.0483245849609375, 0.05876922607421875, 0.0692138671875, 0.07965850830078125, 0.0901031494140625, 0.10054779052734375, 0.110992431640625, 0.12143707275390625, 0.1318817138671875, 0.14232635498046875, 0.15277099609375, 0.16321563720703125, 0.1736602783203125, 0.18410491943359375, 0.194549560546875, 0.20499420166015625, 0.2154388427734375, 0.22588348388671875, 0.236328125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 12.0, 27.0, 48.0, 198.0, 731.0, 4256.0, 126310.0, 4049718.0, 11129.0, 1425.0, 294.0, 83.0, 34.0, 12.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.900390625, -0.86602783203125, -0.8316650390625, -0.79730224609375, -0.762939453125, -0.72857666015625, -0.6942138671875, -0.65985107421875, -0.62548828125, -0.59112548828125, -0.5567626953125, -0.52239990234375, -0.488037109375, -0.45367431640625, -0.4193115234375, -0.38494873046875, -0.3505859375, -0.31622314453125, -0.2818603515625, -0.24749755859375, -0.213134765625, -0.17877197265625, -0.1444091796875, -0.11004638671875, -0.07568359375, -0.04132080078125, -0.0069580078125, 0.02740478515625, 0.061767578125, 0.09613037109375, 0.1304931640625, 0.16485595703125, 0.19921875, 0.23358154296875, 0.2679443359375, 0.30230712890625, 0.336669921875, 0.37103271484375, 0.4053955078125, 0.43975830078125, 0.47412109375, 0.50848388671875, 0.5428466796875, 0.57720947265625, 0.611572265625, 0.64593505859375, 0.6802978515625, 0.71466064453125, 0.7490234375, 0.78338623046875, 0.8177490234375, 0.85211181640625, 0.886474609375, 0.92083740234375, 0.9552001953125, 0.98956298828125, 1.02392578125, 1.05828857421875, 1.0926513671875, 1.12701416015625, 1.161376953125, 1.19573974609375, 1.2301025390625, 1.26446533203125, 1.298828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 4.0, 0.0, 6.0, 7.0, 6.0, 8.0, 16.0, 21.0, 43.0, 55.0, 155.0, 574.0, 2537.0, 401.0, 110.0, 37.0, 39.0, 15.0, 11.0, 3.0, 12.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1865234375, -0.179718017578125, -0.17291259765625, -0.166107177734375, -0.1593017578125, -0.152496337890625, -0.14569091796875, -0.138885498046875, -0.132080078125, -0.125274658203125, -0.11846923828125, -0.111663818359375, -0.1048583984375, -0.098052978515625, -0.09124755859375, -0.084442138671875, -0.07763671875, -0.070831298828125, -0.06402587890625, -0.057220458984375, -0.0504150390625, -0.043609619140625, -0.03680419921875, -0.029998779296875, -0.023193359375, -0.016387939453125, -0.00958251953125, -0.002777099609375, 0.0040283203125, 0.010833740234375, 0.01763916015625, 0.024444580078125, 0.03125, 0.038055419921875, 0.04486083984375, 0.051666259765625, 0.0584716796875, 0.065277099609375, 0.07208251953125, 0.078887939453125, 0.085693359375, 0.092498779296875, 0.09930419921875, 0.106109619140625, 0.1129150390625, 0.119720458984375, 0.12652587890625, 0.133331298828125, 0.14013671875, 0.146942138671875, 0.15374755859375, 0.160552978515625, 0.1673583984375, 0.174163818359375, 0.18096923828125, 0.187774658203125, 0.194580078125, 0.201385498046875, 0.20819091796875, 0.214996337890625, 0.2218017578125, 0.228607177734375, 0.23541259765625, 0.242218017578125, 0.2490234375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 6.0, 12.0, 48.0, 210.0, 487.0, 193.0, 43.0, 11.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.1846022605895996, -3.1204991340637207, -3.0563957691192627, -2.9922924041748047, -2.928189277648926, -2.864086151123047, -2.799982786178589, -2.735879421234131, -2.671776294708252, -2.607673168182373, -2.543569803237915, -2.479466438293457, -2.415363311767578, -2.351260185241699, -2.287156820297241, -2.223053455352783, -2.1589503288269043, -2.0948472023010254, -2.0307438373565674, -1.966640591621399, -1.9025373458862305, -1.838434100151062, -1.7743308544158936, -1.710227608680725, -1.6461243629455566, -1.5820211172103882, -1.5179178714752197, -1.4538146257400513, -1.3897113800048828, -1.3256081342697144, -1.261504888534546, -1.1974016427993774, -1.133298635482788, -1.0691953897476196, -1.0050921440124512, -0.9409888982772827, -0.8768856525421143, -0.8127824068069458, -0.7486791610717773, -0.6845759153366089, -0.6204726696014404, -0.556369423866272, -0.4922661781311035, -0.42816293239593506, -0.3640596866607666, -0.29995644092559814, -0.2358531951904297, -0.17174994945526123, -0.10764670372009277, -0.043543457984924316, 0.02055978775024414, 0.0846630334854126, 0.14876627922058105, 0.2128695249557495, 0.27697277069091797, 0.3410760164260864, 0.4051792621612549, 0.46928250789642334, 0.5333857536315918, 0.5974889993667603, 0.6615922451019287, 0.7256954908370972, 0.7897987365722656, 0.8539019823074341, 0.9180052280426025]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 5.0, 8.0, 6.0, 9.0, 12.0, 15.0, 9.0, 12.0, 15.0, 18.0, 16.0, 29.0, 21.0, 41.0, 31.0, 45.0, 45.0, 39.0, 43.0, 47.0, 55.0, 40.0, 51.0, 36.0, 40.0, 44.0, 35.0, 38.0, 29.0, 31.0, 22.0, 23.0, 22.0, 15.0, 12.0, 4.0, 13.0, 5.0, 6.0, 6.0, 4.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.4691504240036011, -0.45378774404525757, -0.43842506408691406, -0.42306238412857056, -0.40769970417022705, -0.39233702421188354, -0.37697431445121765, -0.36161163449287415, -0.34624895453453064, -0.33088627457618713, -0.31552359461784363, -0.3001609146595001, -0.28479820489883423, -0.2694355249404907, -0.2540728449821472, -0.2387101650238037, -0.2233474850654602, -0.2079848051071167, -0.1926221251487732, -0.1772594302892685, -0.161896750330925, -0.14653407037258148, -0.13117137551307678, -0.11580869555473328, -0.10044601559638977, -0.08508333563804626, -0.06972064822912216, -0.05435796454548836, -0.03899528086185455, -0.023632600903511047, -0.008269913494586945, 0.007092773914337158, 0.022455453872680664, 0.03781813755631447, 0.05318082123994827, 0.06854350864887238, 0.08390618860721588, 0.09926886856555939, 0.11463155597448349, 0.1299942433834076, 0.1453569233417511, 0.1607196033000946, 0.1760822832584381, 0.1914449781179428, 0.20680765807628632, 0.22217033803462982, 0.23753303289413452, 0.252895712852478, 0.26825839281082153, 0.28362107276916504, 0.29898375272750854, 0.31434643268585205, 0.32970911264419556, 0.34507179260253906, 0.36043450236320496, 0.37579718232154846, 0.39115986227989197, 0.4065225422382355, 0.421885222196579, 0.4372479021549225, 0.4526106119155884, 0.4679732918739319, 0.4833359718322754, 0.4986986517906189, 0.5140613317489624]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 6.0, 11.0, 18.0, 21.0, 26.0, 62.0, 98.0, 197.0, 348.0, 874.0, 2835.0, 16749.0, 303524.0, 688076.0, 29531.0, 4142.0, 1118.0, 459.0, 194.0, 96.0, 58.0, 34.0, 29.0, 15.0, 8.0, 9.0, 7.0, 3.0, 1.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.2470703125, -1.2159881591796875, -1.184906005859375, -1.1538238525390625, -1.12274169921875, -1.0916595458984375, -1.060577392578125, -1.0294952392578125, -0.9984130859375, -0.9673309326171875, -0.936248779296875, -0.9051666259765625, -0.87408447265625, -0.8430023193359375, -0.811920166015625, -0.7808380126953125, -0.749755859375, -0.7186737060546875, -0.687591552734375, -0.6565093994140625, -0.62542724609375, -0.5943450927734375, -0.563262939453125, -0.5321807861328125, -0.5010986328125, -0.4700164794921875, -0.438934326171875, -0.4078521728515625, -0.37677001953125, -0.3456878662109375, -0.314605712890625, -0.2835235595703125, -0.25244140625, -0.2213592529296875, -0.190277099609375, -0.1591949462890625, -0.12811279296875, -0.0970306396484375, -0.065948486328125, -0.0348663330078125, -0.0037841796875, 0.0272979736328125, 0.058380126953125, 0.0894622802734375, 0.12054443359375, 0.1516265869140625, 0.182708740234375, 0.2137908935546875, 0.244873046875, 0.2759552001953125, 0.307037353515625, 0.3381195068359375, 0.36920166015625, 0.4002838134765625, 0.431365966796875, 0.4624481201171875, 0.4935302734375, 0.5246124267578125, 0.555694580078125, 0.5867767333984375, 0.61785888671875, 0.6489410400390625, 0.680023193359375, 0.7111053466796875, 0.7421875]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 15.0, 11.0, 25.0, 49.0, 59.0, 87.0, 97.0, 129.0, 114.0, 126.0, 93.0, 67.0, 51.0, 21.0, 19.0, 15.0, 7.0, 4.0, 2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.42236328125, -0.4120903015136719, -0.40181732177734375, -0.3915443420410156, -0.3812713623046875, -0.3709983825683594, -0.36072540283203125, -0.3504524230957031, -0.340179443359375, -0.3299064636230469, -0.31963348388671875, -0.3093605041503906, -0.2990875244140625, -0.2888145446777344, -0.27854156494140625, -0.2682685852050781, -0.25799560546875, -0.24772262573242188, -0.23744964599609375, -0.22717666625976562, -0.2169036865234375, -0.20663070678710938, -0.19635772705078125, -0.18608474731445312, -0.175811767578125, -0.16553878784179688, -0.15526580810546875, -0.14499282836914062, -0.1347198486328125, -0.12444686889648438, -0.11417388916015625, -0.10390090942382812, -0.0936279296875, -0.08335494995117188, -0.07308197021484375, -0.06280899047851562, -0.0525360107421875, -0.042263031005859375, -0.03199005126953125, -0.021717071533203125, -0.011444091796875, -0.001171112060546875, 0.00910186767578125, 0.019374847412109375, 0.0296478271484375, 0.039920806884765625, 0.05019378662109375, 0.060466766357421875, 0.07073974609375, 0.08101272583007812, 0.09128570556640625, 0.10155868530273438, 0.1118316650390625, 0.12210464477539062, 0.13237762451171875, 0.14265060424804688, 0.152923583984375, 0.16319656372070312, 0.17346954345703125, 0.18374252319335938, 0.1940155029296875, 0.20428848266601562, 0.21456146240234375, 0.22483444213867188, 0.235107421875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 5.0, 6.0, 12.0, 13.0, 22.0, 20.0, 35.0, 42.0, 48.0, 80.0, 115.0, 231.0, 480.0, 1580.0, 6086.0, 26054.0, 187470.0, 716650.0, 88214.0, 15670.0, 3785.0, 1052.0, 331.0, 156.0, 114.0, 66.0, 59.0, 45.0, 35.0, 18.0, 14.0, 16.0, 14.0, 3.0, 6.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.6038818359375, -0.585205078125, -0.5665283203125, -0.5478515625, -0.5291748046875, -0.510498046875, -0.4918212890625, -0.47314453125, -0.4544677734375, -0.435791015625, -0.4171142578125, -0.3984375, -0.3797607421875, -0.361083984375, -0.3424072265625, -0.32373046875, -0.3050537109375, -0.286376953125, -0.2677001953125, -0.2490234375, -0.2303466796875, -0.211669921875, -0.1929931640625, -0.17431640625, -0.1556396484375, -0.136962890625, -0.1182861328125, -0.099609375, -0.0809326171875, -0.062255859375, -0.0435791015625, -0.02490234375, -0.0062255859375, 0.012451171875, 0.0311279296875, 0.0498046875, 0.0684814453125, 0.087158203125, 0.1058349609375, 0.12451171875, 0.1431884765625, 0.161865234375, 0.1805419921875, 0.19921875, 0.2178955078125, 0.236572265625, 0.2552490234375, 0.27392578125, 0.2926025390625, 0.311279296875, 0.3299560546875, 0.3486328125, 0.3673095703125, 0.385986328125, 0.4046630859375, 0.42333984375, 0.4420166015625, 0.460693359375, 0.4793701171875, 0.498046875, 0.5167236328125, 0.535400390625, 0.5540771484375, 0.57275390625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 2.0, 6.0, 12.0, 15.0, 11.0, 10.0, 20.0, 14.0, 26.0, 20.0, 23.0, 31.0, 21.0, 31.0, 42.0, 26.0, 30.0, 52.0, 34.0, 44.0, 33.0, 60.0, 46.0, 51.0, 29.0, 36.0, 31.0, 23.0, 18.0, 26.0, 24.0, 22.0, 15.0, 26.0, 17.0, 14.0, 7.0, 13.0, 9.0, 8.0, 6.0, 3.0, 5.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.63232421875, -0.6148796081542969, -0.5974349975585938, -0.5799903869628906, -0.5625457763671875, -0.5451011657714844, -0.5276565551757812, -0.5102119445800781, -0.492767333984375, -0.4753227233886719, -0.45787811279296875, -0.4404335021972656, -0.4229888916015625, -0.4055442810058594, -0.38809967041015625, -0.3706550598144531, -0.35321044921875, -0.3357658386230469, -0.31832122802734375, -0.3008766174316406, -0.2834320068359375, -0.2659873962402344, -0.24854278564453125, -0.23109817504882812, -0.213653564453125, -0.19620895385742188, -0.17876434326171875, -0.16131973266601562, -0.1438751220703125, -0.12643051147460938, -0.10898590087890625, -0.09154129028320312, -0.0740966796875, -0.056652069091796875, -0.03920745849609375, -0.021762847900390625, -0.0043182373046875, 0.013126373291015625, 0.03057098388671875, 0.048015594482421875, 0.065460205078125, 0.08290481567382812, 0.10034942626953125, 0.11779403686523438, 0.1352386474609375, 0.15268325805664062, 0.17012786865234375, 0.18757247924804688, 0.20501708984375, 0.22246170043945312, 0.23990631103515625, 0.2573509216308594, 0.2747955322265625, 0.2922401428222656, 0.30968475341796875, 0.3271293640136719, 0.344573974609375, 0.3620185852050781, 0.37946319580078125, 0.3969078063964844, 0.4143524169921875, 0.4317970275878906, 0.44924163818359375, 0.4666862487792969, 0.484130859375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 4.0, 7.0, 6.0, 12.0, 17.0, 32.0, 33.0, 60.0, 78.0, 111.0, 228.0, 544.0, 1225.0, 4771.0, 47036.0, 916545.0, 69658.0, 5555.0, 1434.0, 545.0, 261.0, 126.0, 74.0, 58.0, 40.0, 26.0, 22.0, 16.0, 13.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.243408203125, -0.23424148559570312, -0.22507476806640625, -0.21590805053710938, -0.2067413330078125, -0.19757461547851562, -0.18840789794921875, -0.17924118041992188, -0.170074462890625, -0.16090774536132812, -0.15174102783203125, -0.14257431030273438, -0.1334075927734375, -0.12424087524414062, -0.11507415771484375, -0.10590744018554688, -0.09674072265625, -0.08757400512695312, -0.07840728759765625, -0.06924057006835938, -0.0600738525390625, -0.050907135009765625, -0.04174041748046875, -0.032573699951171875, -0.023406982421875, -0.014240264892578125, -0.00507354736328125, 0.004093170166015625, 0.0132598876953125, 0.022426605224609375, 0.03159332275390625, 0.040760040283203125, 0.0499267578125, 0.059093475341796875, 0.06826019287109375, 0.07742691040039062, 0.0865936279296875, 0.09576034545898438, 0.10492706298828125, 0.11409378051757812, 0.123260498046875, 0.13242721557617188, 0.14159393310546875, 0.15076065063476562, 0.1599273681640625, 0.16909408569335938, 0.17826080322265625, 0.18742752075195312, 0.19659423828125, 0.20576095581054688, 0.21492767333984375, 0.22409439086914062, 0.2332611083984375, 0.24242782592773438, 0.25159454345703125, 0.2607612609863281, 0.269927978515625, 0.2790946960449219, 0.28826141357421875, 0.2974281311035156, 0.3065948486328125, 0.3157615661621094, 0.32492828369140625, 0.3340950012207031, 0.34326171875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 14.0, 20.0, 17.0, 14.0, 24.0, 41.0, 56.0, 106.0, 111.0, 147.0, 123.0, 82.0, 66.0, 44.0, 28.0, 26.0, 12.0, 14.0, 6.0, 10.0, 10.0, 7.0, 5.0, 5.0, 2.0, 0.0, 1.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00010544061660766602, -0.0001016249880194664, -9.780935943126678e-05, -9.399373084306717e-05, -9.017810225486755e-05, -8.636247366666794e-05, -8.254684507846832e-05, -7.873121649026871e-05, -7.491558790206909e-05, -7.109995931386948e-05, -6.728433072566986e-05, -6.346870213747025e-05, -5.965307354927063e-05, -5.5837444961071014e-05, -5.20218163728714e-05, -4.8206187784671783e-05, -4.439055919647217e-05, -4.057493060827255e-05, -3.675930202007294e-05, -3.294367343187332e-05, -2.9128044843673706e-05, -2.531241625547409e-05, -2.1496787667274475e-05, -1.768115907907486e-05, -1.3865530490875244e-05, -1.0049901902675629e-05, -6.234273314476013e-06, -2.4186447262763977e-06, 1.3969838619232178e-06, 5.212612450122833e-06, 9.028241038322449e-06, 1.2843869626522064e-05, 1.665949821472168e-05, 2.0475126802921295e-05, 2.429075539112091e-05, 2.8106383979320526e-05, 3.192201256752014e-05, 3.573764115571976e-05, 3.955326974391937e-05, 4.336889833211899e-05, 4.7184526920318604e-05, 5.100015550851822e-05, 5.4815784096717834e-05, 5.863141268491745e-05, 6.244704127311707e-05, 6.626266986131668e-05, 7.00782984495163e-05, 7.389392703771591e-05, 7.770955562591553e-05, 8.152518421411514e-05, 8.534081280231476e-05, 8.915644139051437e-05, 9.297206997871399e-05, 9.67876985669136e-05, 0.00010060332715511322, 0.00010441895574331284, 0.00010823458433151245, 0.00011205021291971207, 0.00011586584150791168, 0.0001196814700961113, 0.0001234970986843109, 0.00012731272727251053, 0.00013112835586071014, 0.00013494398444890976, 0.00013875961303710938]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 3.0, 1.0, 5.0, 3.0, 7.0, 1.0, 9.0, 11.0, 14.0, 27.0, 57.0, 103.0, 238.0, 739.0, 3330.0, 42312.0, 942258.0, 54417.0, 3674.0, 804.0, 272.0, 118.0, 56.0, 39.0, 21.0, 13.0, 6.0, 4.0, 5.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.42919921875, -0.4188652038574219, -0.40853118896484375, -0.3981971740722656, -0.3878631591796875, -0.3775291442871094, -0.36719512939453125, -0.3568611145019531, -0.346527099609375, -0.3361930847167969, -0.32585906982421875, -0.3155250549316406, -0.3051910400390625, -0.2948570251464844, -0.28452301025390625, -0.2741889953613281, -0.26385498046875, -0.2535209655761719, -0.24318695068359375, -0.23285293579101562, -0.2225189208984375, -0.21218490600585938, -0.20185089111328125, -0.19151687622070312, -0.181182861328125, -0.17084884643554688, -0.16051483154296875, -0.15018081665039062, -0.1398468017578125, -0.12951278686523438, -0.11917877197265625, -0.10884475708007812, -0.0985107421875, -0.08817672729492188, -0.07784271240234375, -0.06750869750976562, -0.0571746826171875, -0.046840667724609375, -0.03650665283203125, -0.026172637939453125, -0.015838623046875, -0.005504608154296875, 0.00482940673828125, 0.015163421630859375, 0.0254974365234375, 0.035831451416015625, 0.04616546630859375, 0.056499481201171875, 0.06683349609375, 0.07716751098632812, 0.08750152587890625, 0.09783554077148438, 0.1081695556640625, 0.11850357055664062, 0.12883758544921875, 0.13917160034179688, 0.149505615234375, 0.15983963012695312, 0.17017364501953125, 0.18050765991210938, 0.1908416748046875, 0.20117568969726562, 0.21150970458984375, 0.22184371948242188, 0.232177734375]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 2.0, 4.0, 4.0, 7.0, 13.0, 37.0, 38.0, 55.0, 99.0, 172.0, 168.0, 148.0, 90.0, 51.0, 48.0, 19.0, 13.0, 16.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.380126953125, -0.3711585998535156, -0.36219024658203125, -0.3532218933105469, -0.3442535400390625, -0.3352851867675781, -0.32631683349609375, -0.3173484802246094, -0.308380126953125, -0.2994117736816406, -0.29044342041015625, -0.2814750671386719, -0.2725067138671875, -0.2635383605957031, -0.25457000732421875, -0.24560165405273438, -0.23663330078125, -0.22766494750976562, -0.21869659423828125, -0.20972824096679688, -0.2007598876953125, -0.19179153442382812, -0.18282318115234375, -0.17385482788085938, -0.164886474609375, -0.15591812133789062, -0.14694976806640625, -0.13798141479492188, -0.1290130615234375, -0.12004470825195312, -0.11107635498046875, -0.10210800170898438, -0.0931396484375, -0.08417129516601562, -0.07520294189453125, -0.06623458862304688, -0.0572662353515625, -0.048297882080078125, -0.03932952880859375, -0.030361175537109375, -0.021392822265625, -0.012424468994140625, -0.00345611572265625, 0.005512237548828125, 0.0144805908203125, 0.023448944091796875, 0.03241729736328125, 0.041385650634765625, 0.05035400390625, 0.059322357177734375, 0.06829071044921875, 0.07725906372070312, 0.0862274169921875, 0.09519577026367188, 0.10416412353515625, 0.11313247680664062, 0.122100830078125, 0.13106918334960938, 0.14003753662109375, 0.14900588989257812, 0.1579742431640625, 0.16694259643554688, 0.17591094970703125, 0.18487930297851562, 0.19384765625]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 22.0, 216.0, 654.0, 110.0, 10.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.414237976074219, -14.990077018737793, -14.565916061401367, -14.141755104064941, -13.717594146728516, -13.293434143066406, -12.86927318572998, -12.445112228393555, -12.020951271057129, -11.596790313720703, -11.172629356384277, -10.748468399047852, -10.324308395385742, -9.900146484375, -9.47598648071289, -9.051825523376465, -8.627664566040039, -8.203503608703613, -7.7793426513671875, -7.35518217086792, -6.931021213531494, -6.506860256195068, -6.082699775695801, -5.658538818359375, -5.234377861022949, -4.810216903686523, -4.386055946350098, -3.96189546585083, -3.5377345085144043, -3.1135735511779785, -2.689412832260132, -2.265252113342285, -1.8410911560058594, -1.4169303178787231, -0.9927694797515869, -0.5686086416244507, -0.14444780349731445, 0.27971315383911133, 0.703873872756958, 1.1280345916748047, 1.5521955490112305, 1.9763563871383667, 2.400517225265503, 2.8246779441833496, 3.2488389015197754, 3.672999858856201, 4.097160339355469, 4.5213212966918945, 4.94548225402832, 5.369643211364746, 5.793804168701172, 6.2179646492004395, 6.642125606536865, 7.066286563873291, 7.490447044372559, 7.914608001708984, 8.33876895904541, 8.762929916381836, 9.187090873718262, 9.611251831054688, 10.035411834716797, 10.459573745727539, 10.883733749389648, 11.307894706726074, 11.7320556640625]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 5.0, 4.0, 3.0, 5.0, 2.0, 6.0, 6.0, 11.0, 15.0, 9.0, 24.0, 25.0, 30.0, 28.0, 39.0, 20.0, 38.0, 46.0, 40.0, 40.0, 44.0, 55.0, 37.0, 51.0, 56.0, 44.0, 50.0, 39.0, 30.0, 38.0, 22.0, 23.0, 19.0, 18.0, 17.0, 14.0, 15.0, 10.0, 9.0, 2.0, 6.0, 6.0, 2.0, 2.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8697915077209473, -2.7741777896881104, -2.6785643100738525, -2.5829505920410156, -2.487337112426758, -2.391723394393921, -2.296109676361084, -2.200496196746826, -2.1048827171325684, -2.0092689990997314, -1.9136555194854736, -1.8180418014526367, -1.722428321838379, -1.626814603805542, -1.5312010049819946, -1.4355874061584473, -1.3399736881256104, -1.244360089302063, -1.1487464904785156, -1.0531327724456787, -0.9575192332267761, -0.8619056344032288, -0.7662919759750366, -0.6706783771514893, -0.5750647783279419, -0.47945117950439453, -0.3838375508785248, -0.28822392225265503, -0.19261032342910767, -0.0969967246055603, -0.001383066177368164, 0.0942305326461792, 0.18984436988830566, 0.285457968711853, 0.3810715973377228, 0.47668522596359253, 0.5722988247871399, 0.6679124236106873, 0.7635260820388794, 0.8591396808624268, 0.9547532796859741, 1.0503668785095215, 1.1459804773330688, 1.2415940761566162, 1.3372077941894531, 1.432821273803711, 1.5284349918365479, 1.6240485906600952, 1.7196621894836426, 1.81527578830719, 1.9108893871307373, 2.006503105163574, 2.102116584777832, 2.197730302810669, 2.293344020843506, 2.3889575004577637, 2.4845709800720215, 2.5801846981048584, 2.675798177719116, 2.771411895751953, 2.867025375366211, 2.962639093399048, 3.0582528114318848, 3.1538662910461426, 3.2494800090789795]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 1.0, 8.0, 3.0, 8.0, 8.0, 22.0, 20.0, 41.0, 52.0, 78.0, 146.0, 263.0, 551.0, 1472.0, 4589.0, 23625.0, 3930624.0, 215241.0, 12632.0, 2954.0, 1037.0, 419.0, 191.0, 104.0, 67.0, 48.0, 27.0, 15.0, 9.0, 4.0, 4.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-1.787109375, -1.745391845703125, -1.70367431640625, -1.661956787109375, -1.6202392578125, -1.578521728515625, -1.53680419921875, -1.495086669921875, -1.453369140625, -1.411651611328125, -1.36993408203125, -1.328216552734375, -1.2864990234375, -1.244781494140625, -1.20306396484375, -1.161346435546875, -1.11962890625, -1.077911376953125, -1.03619384765625, -0.994476318359375, -0.9527587890625, -0.911041259765625, -0.86932373046875, -0.827606201171875, -0.785888671875, -0.744171142578125, -0.70245361328125, -0.660736083984375, -0.6190185546875, -0.577301025390625, -0.53558349609375, -0.493865966796875, -0.4521484375, -0.410430908203125, -0.36871337890625, -0.326995849609375, -0.2852783203125, -0.243560791015625, -0.20184326171875, -0.160125732421875, -0.118408203125, -0.076690673828125, -0.03497314453125, 0.006744384765625, 0.0484619140625, 0.090179443359375, 0.13189697265625, 0.173614501953125, 0.21533203125, 0.257049560546875, 0.29876708984375, 0.340484619140625, 0.3822021484375, 0.423919677734375, 0.46563720703125, 0.507354736328125, 0.549072265625, 0.590789794921875, 0.63250732421875, 0.674224853515625, 0.7159423828125, 0.757659912109375, 0.79937744140625, 0.841094970703125, 0.8828125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 8.0, 13.0, 15.0, 34.0, 41.0, 67.0, 70.0, 106.0, 108.0, 97.0, 124.0, 105.0, 66.0, 53.0, 35.0, 24.0, 13.0, 9.0, 5.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.42919921875, -0.418792724609375, -0.40838623046875, -0.397979736328125, -0.3875732421875, -0.377166748046875, -0.36676025390625, -0.356353759765625, -0.345947265625, -0.335540771484375, -0.32513427734375, -0.314727783203125, -0.3043212890625, -0.293914794921875, -0.28350830078125, -0.273101806640625, -0.2626953125, -0.252288818359375, -0.24188232421875, -0.231475830078125, -0.2210693359375, -0.210662841796875, -0.20025634765625, -0.189849853515625, -0.179443359375, -0.169036865234375, -0.15863037109375, -0.148223876953125, -0.1378173828125, -0.127410888671875, -0.11700439453125, -0.106597900390625, -0.09619140625, -0.085784912109375, -0.07537841796875, -0.064971923828125, -0.0545654296875, -0.044158935546875, -0.03375244140625, -0.023345947265625, -0.012939453125, -0.002532958984375, 0.00787353515625, 0.018280029296875, 0.0286865234375, 0.039093017578125, 0.04949951171875, 0.059906005859375, 0.0703125, 0.080718994140625, 0.09112548828125, 0.101531982421875, 0.1119384765625, 0.122344970703125, 0.13275146484375, 0.143157958984375, 0.153564453125, 0.163970947265625, 0.17437744140625, 0.184783935546875, 0.1951904296875, 0.205596923828125, 0.21600341796875, 0.226409912109375, 0.23681640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 2.0, 11.0, 35.0, 82.0, 216.0, 633.0, 2475.0, 14354.0, 474853.0, 3677331.0, 19945.0, 3147.0, 810.0, 226.0, 88.0, 38.0, 17.0, 8.0, 5.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0869140625, -1.049530029296875, -1.01214599609375, -0.974761962890625, -0.9373779296875, -0.899993896484375, -0.86260986328125, -0.825225830078125, -0.787841796875, -0.750457763671875, -0.71307373046875, -0.675689697265625, -0.6383056640625, -0.600921630859375, -0.56353759765625, -0.526153564453125, -0.48876953125, -0.451385498046875, -0.41400146484375, -0.376617431640625, -0.3392333984375, -0.301849365234375, -0.26446533203125, -0.227081298828125, -0.189697265625, -0.152313232421875, -0.11492919921875, -0.077545166015625, -0.0401611328125, -0.002777099609375, 0.03460693359375, 0.071990966796875, 0.109375, 0.146759033203125, 0.18414306640625, 0.221527099609375, 0.2589111328125, 0.296295166015625, 0.33367919921875, 0.371063232421875, 0.408447265625, 0.445831298828125, 0.48321533203125, 0.520599365234375, 0.5579833984375, 0.595367431640625, 0.63275146484375, 0.670135498046875, 0.70751953125, 0.744903564453125, 0.78228759765625, 0.819671630859375, 0.8570556640625, 0.894439697265625, 0.93182373046875, 0.969207763671875, 1.006591796875, 1.043975830078125, 1.08135986328125, 1.118743896484375, 1.1561279296875, 1.193511962890625, 1.23089599609375, 1.268280029296875, 1.3056640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 8.0, 8.0, 15.0, 23.0, 24.0, 43.0, 55.0, 121.0, 592.0, 2682.0, 245.0, 95.0, 42.0, 20.0, 19.0, 10.0, 13.0, 14.0, 12.0, 3.0, 2.0, 3.0, 6.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257080078125, -0.24766159057617188, -0.23824310302734375, -0.22882461547851562, -0.2194061279296875, -0.20998764038085938, -0.20056915283203125, -0.19115066528320312, -0.181732177734375, -0.17231369018554688, -0.16289520263671875, -0.15347671508789062, -0.1440582275390625, -0.13463973999023438, -0.12522125244140625, -0.11580276489257812, -0.10638427734375, -0.09696578979492188, -0.08754730224609375, -0.07812881469726562, -0.0687103271484375, -0.059291839599609375, -0.04987335205078125, -0.040454864501953125, -0.031036376953125, -0.021617889404296875, -0.01219940185546875, -0.002780914306640625, 0.0066375732421875, 0.016056060791015625, 0.02547454833984375, 0.034893035888671875, 0.0443115234375, 0.053730010986328125, 0.06314849853515625, 0.07256698608398438, 0.0819854736328125, 0.09140396118164062, 0.10082244873046875, 0.11024093627929688, 0.119659423828125, 0.12907791137695312, 0.13849639892578125, 0.14791488647460938, 0.1573333740234375, 0.16675186157226562, 0.17617034912109375, 0.18558883666992188, 0.19500732421875, 0.20442581176757812, 0.21384429931640625, 0.22326278686523438, 0.2326812744140625, 0.24209976196289062, 0.25151824951171875, 0.2609367370605469, 0.270355224609375, 0.2797737121582031, 0.28919219970703125, 0.2986106872558594, 0.3080291748046875, 0.3174476623535156, 0.32686614990234375, 0.3362846374511719, 0.345703125]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 6.0, 19.0, 63.0, 167.0, 359.0, 252.0, 91.0, 23.0, 15.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.3674895763397217, -2.299513339996338, -2.231537342071533, -2.1635611057281494, -2.0955848693847656, -2.027608871459961, -1.9596326351165771, -1.891656517982483, -1.8236804008483887, -1.7557042837142944, -1.6877281665802002, -1.6197519302368164, -1.5517758131027222, -1.483799695968628, -1.4158234596252441, -1.34784734249115, -1.2798712253570557, -1.2118951082229614, -1.1439189910888672, -1.0759427547454834, -1.0079666376113892, -0.9399905204772949, -0.8720143437385559, -0.8040381669998169, -0.7360620498657227, -0.6680859327316284, -0.6001097559928894, -0.5321335792541504, -0.46415746212005615, -0.3961813151836395, -0.3282051682472229, -0.2602290213108063, -0.19225311279296875, -0.12427696585655212, -0.0563008189201355, 0.011675328016281128, 0.07965147495269775, 0.14762762188911438, 0.215603768825531, 0.28357991576194763, 0.35155606269836426, 0.4195322096347809, 0.4875083565711975, 0.5554845333099365, 0.6234606504440308, 0.691436767578125, 0.759412944316864, 0.827389121055603, 0.8953652381896973, 0.9633413553237915, 1.0313174724578857, 1.0992937088012695, 1.1672698259353638, 1.235245943069458, 1.3032221794128418, 1.371198296546936, 1.4391744136810303, 1.5071505308151245, 1.5751266479492188, 1.6431028842926025, 1.7110790014266968, 1.779055118560791, 1.8470313549041748, 1.915007472038269, 1.9829835891723633]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 10.0, 10.0, 13.0, 27.0, 18.0, 33.0, 33.0, 37.0, 54.0, 54.0, 60.0, 67.0, 54.0, 74.0, 66.0, 51.0, 52.0, 49.0, 47.0, 34.0, 34.0, 33.0, 21.0, 24.0, 19.0, 13.0, 6.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-1.1910669803619385, -1.159200668334961, -1.1273342370986938, -1.0954679250717163, -1.0636016130447388, -1.0317351818084717, -0.9998688697814941, -0.9680024981498718, -0.9361361265182495, -0.9042697548866272, -0.8724034428596497, -0.8405370712280273, -0.808670699596405, -0.7768043279647827, -0.7449380159378052, -0.7130716443061829, -0.6812053322792053, -0.649338960647583, -0.6174726486206055, -0.5856062769889832, -0.5537399053573608, -0.5218735933303833, -0.490007221698761, -0.45814085006713867, -0.42627450823783875, -0.3944081664085388, -0.3625417947769165, -0.3306754529476166, -0.29880911111831665, -0.26694273948669434, -0.2350763976573944, -0.2032100409269333, -0.17134368419647217, -0.13947732746601105, -0.10761097818613052, -0.07574462890625, -0.04387827217578888, -0.012011915445327759, 0.019854426383972168, 0.05172078311443329, 0.08358713984489441, 0.11545349657535553, 0.14731985330581665, 0.17918619513511658, 0.2110525518655777, 0.24291890859603882, 0.27478525042533875, 0.30665159225463867, 0.338517963886261, 0.3703843057155609, 0.4022506773471832, 0.43411701917648315, 0.46598339080810547, 0.4978497326374054, 0.5297160744667053, 0.5615824460983276, 0.5934487581253052, 0.6253151297569275, 0.657181441783905, 0.6890478134155273, 0.7209141850471497, 0.752780556678772, 0.7846468687057495, 0.8165132403373718, 0.8483796119689941]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 6.0, 4.0, 6.0, 3.0, 14.0, 18.0, 31.0, 41.0, 56.0, 93.0, 133.0, 239.0, 478.0, 1059.0, 2536.0, 7946.0, 40339.0, 491008.0, 454309.0, 37895.0, 7825.0, 2520.0, 956.0, 423.0, 227.0, 131.0, 79.0, 46.0, 38.0, 19.0, 16.0, 21.0, 8.0, 4.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.8232421875, -0.7938232421875, -0.764404296875, -0.7349853515625, -0.70556640625, -0.6761474609375, -0.646728515625, -0.6173095703125, -0.587890625, -0.5584716796875, -0.529052734375, -0.4996337890625, -0.47021484375, -0.4407958984375, -0.411376953125, -0.3819580078125, -0.3525390625, -0.3231201171875, -0.293701171875, -0.2642822265625, -0.23486328125, -0.2054443359375, -0.176025390625, -0.1466064453125, -0.1171875, -0.0877685546875, -0.058349609375, -0.0289306640625, 0.00048828125, 0.0299072265625, 0.059326171875, 0.0887451171875, 0.1181640625, 0.1475830078125, 0.177001953125, 0.2064208984375, 0.23583984375, 0.2652587890625, 0.294677734375, 0.3240966796875, 0.353515625, 0.3829345703125, 0.412353515625, 0.4417724609375, 0.47119140625, 0.5006103515625, 0.530029296875, 0.5594482421875, 0.5888671875, 0.6182861328125, 0.647705078125, 0.6771240234375, 0.70654296875, 0.7359619140625, 0.765380859375, 0.7947998046875, 0.82421875, 0.8536376953125, 0.883056640625, 0.9124755859375, 0.94189453125, 0.9713134765625, 1.000732421875, 1.0301513671875, 1.0595703125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 14.0, 13.0, 28.0, 44.0, 56.0, 75.0, 88.0, 102.0, 114.0, 108.0, 104.0, 92.0, 52.0, 41.0, 28.0, 8.0, 11.0, 11.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4267578125, -0.41623497009277344, -0.4057121276855469, -0.3951892852783203, -0.38466644287109375, -0.3741436004638672, -0.3636207580566406, -0.35309791564941406, -0.3425750732421875, -0.33205223083496094, -0.3215293884277344, -0.3110065460205078, -0.30048370361328125, -0.2899608612060547, -0.2794380187988281, -0.26891517639160156, -0.258392333984375, -0.24786949157714844, -0.23734664916992188, -0.2268238067626953, -0.21630096435546875, -0.2057781219482422, -0.19525527954101562, -0.18473243713378906, -0.1742095947265625, -0.16368675231933594, -0.15316390991210938, -0.1426410675048828, -0.13211822509765625, -0.12159538269042969, -0.11107254028320312, -0.10054969787597656, -0.09002685546875, -0.07950401306152344, -0.06898117065429688, -0.05845832824707031, -0.04793548583984375, -0.03741264343261719, -0.026889801025390625, -0.016366958618164062, -0.0058441162109375, 0.0046787261962890625, 0.015201568603515625, 0.025724411010742188, 0.03624725341796875, 0.04677009582519531, 0.057292938232421875, 0.06781578063964844, 0.078338623046875, 0.08886146545410156, 0.09938430786132812, 0.10990715026855469, 0.12042999267578125, 0.1309528350830078, 0.14147567749023438, 0.15199851989746094, 0.1625213623046875, 0.17304420471191406, 0.18356704711914062, 0.1940898895263672, 0.20461273193359375, 0.2151355743408203, 0.22565841674804688, 0.23618125915527344, 0.2467041015625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 8.0, 12.0, 18.0, 42.0, 89.0, 156.0, 389.0, 927.0, 2986.0, 12898.0, 121112.0, 796906.0, 97569.0, 11228.0, 2660.0, 905.0, 338.0, 131.0, 82.0, 39.0, 19.0, 13.0, 8.0, 4.0, 5.0, 0.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0361328125, -1.0060653686523438, -0.9759979248046875, -0.9459304809570312, -0.915863037109375, -0.8857955932617188, -0.8557281494140625, -0.8256607055664062, -0.79559326171875, -0.7655258178710938, -0.7354583740234375, -0.7053909301757812, -0.675323486328125, -0.6452560424804688, -0.6151885986328125, -0.5851211547851562, -0.5550537109375, -0.5249862670898438, -0.4949188232421875, -0.46485137939453125, -0.434783935546875, -0.40471649169921875, -0.3746490478515625, -0.34458160400390625, -0.31451416015625, -0.28444671630859375, -0.2543792724609375, -0.22431182861328125, -0.194244384765625, -0.16417694091796875, -0.1341094970703125, -0.10404205322265625, -0.073974609375, -0.04390716552734375, -0.0138397216796875, 0.01622772216796875, 0.046295166015625, 0.07636260986328125, 0.1064300537109375, 0.13649749755859375, 0.16656494140625, 0.19663238525390625, 0.2266998291015625, 0.25676727294921875, 0.286834716796875, 0.31690216064453125, 0.3469696044921875, 0.37703704833984375, 0.4071044921875, 0.43717193603515625, 0.4672393798828125, 0.49730682373046875, 0.527374267578125, 0.5574417114257812, 0.5875091552734375, 0.6175765991210938, 0.64764404296875, 0.6777114868164062, 0.7077789306640625, 0.7378463745117188, 0.767913818359375, 0.7979812622070312, 0.8280487060546875, 0.8581161499023438, 0.88818359375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 3.0, 2.0, 4.0, 3.0, 5.0, 11.0, 7.0, 15.0, 26.0, 38.0, 38.0, 49.0, 59.0, 59.0, 59.0, 65.0, 72.0, 82.0, 71.0, 74.0, 52.0, 42.0, 50.0, 29.0, 21.0, 22.0, 13.0, 14.0, 6.0, 5.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2060546875, -1.167816162109375, -1.12957763671875, -1.091339111328125, -1.0531005859375, -1.014862060546875, -0.97662353515625, -0.938385009765625, -0.900146484375, -0.861907958984375, -0.82366943359375, -0.785430908203125, -0.7471923828125, -0.708953857421875, -0.67071533203125, -0.632476806640625, -0.59423828125, -0.555999755859375, -0.51776123046875, -0.479522705078125, -0.4412841796875, -0.403045654296875, -0.36480712890625, -0.326568603515625, -0.288330078125, -0.250091552734375, -0.21185302734375, -0.173614501953125, -0.1353759765625, -0.097137451171875, -0.05889892578125, -0.020660400390625, 0.017578125, 0.055816650390625, 0.09405517578125, 0.132293701171875, 0.1705322265625, 0.208770751953125, 0.24700927734375, 0.285247802734375, 0.323486328125, 0.361724853515625, 0.39996337890625, 0.438201904296875, 0.4764404296875, 0.514678955078125, 0.55291748046875, 0.591156005859375, 0.62939453125, 0.667633056640625, 0.70587158203125, 0.744110107421875, 0.7823486328125, 0.820587158203125, 0.85882568359375, 0.897064208984375, 0.935302734375, 0.973541259765625, 1.01177978515625, 1.050018310546875, 1.0882568359375, 1.126495361328125, 1.16473388671875, 1.202972412109375, 1.2412109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 6.0, 15.0, 22.0, 33.0, 81.0, 142.0, 350.0, 1023.0, 4030.0, 40122.0, 961179.0, 36099.0, 3818.0, 955.0, 367.0, 154.0, 64.0, 40.0, 16.0, 13.0, 6.0, 7.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.779296875, -0.7585067749023438, -0.7377166748046875, -0.7169265747070312, -0.696136474609375, -0.6753463745117188, -0.6545562744140625, -0.6337661743164062, -0.61297607421875, -0.5921859741210938, -0.5713958740234375, -0.5506057739257812, -0.529815673828125, -0.5090255737304688, -0.4882354736328125, -0.46744537353515625, -0.4466552734375, -0.42586517333984375, -0.4050750732421875, -0.38428497314453125, -0.363494873046875, -0.34270477294921875, -0.3219146728515625, -0.30112457275390625, -0.28033447265625, -0.25954437255859375, -0.2387542724609375, -0.21796417236328125, -0.197174072265625, -0.17638397216796875, -0.1555938720703125, -0.13480377197265625, -0.114013671875, -0.09322357177734375, -0.0724334716796875, -0.05164337158203125, -0.030853271484375, -0.01006317138671875, 0.0107269287109375, 0.03151702880859375, 0.05230712890625, 0.07309722900390625, 0.0938873291015625, 0.11467742919921875, 0.135467529296875, 0.15625762939453125, 0.1770477294921875, 0.19783782958984375, 0.2186279296875, 0.23941802978515625, 0.2602081298828125, 0.28099822998046875, 0.301788330078125, 0.32257843017578125, 0.3433685302734375, 0.36415863037109375, 0.38494873046875, 0.40573883056640625, 0.4265289306640625, 0.44731903076171875, 0.468109130859375, 0.48889923095703125, 0.5096893310546875, 0.5304794311523438, 0.55126953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 5.0, 9.0, 14.0, 29.0, 45.0, 42.0, 53.0, 64.0, 100.0, 162.0, 148.0, 94.0, 62.0, 57.0, 36.0, 25.0, 18.0, 11.0, 14.0, 6.0, 2.0, 5.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00013005733489990234, -0.0001261197030544281, -0.00012218207120895386, -0.00011824443936347961, -0.00011430680751800537, -0.00011036917567253113, -0.00010643154382705688, -0.00010249391198158264, -9.85562801361084e-05, -9.461864829063416e-05, -9.068101644515991e-05, -8.674338459968567e-05, -8.280575275421143e-05, -7.886812090873718e-05, -7.493048906326294e-05, -7.09928572177887e-05, -6.705522537231445e-05, -6.311759352684021e-05, -5.917996168136597e-05, -5.5242329835891724e-05, -5.130469799041748e-05, -4.736706614494324e-05, -4.3429434299468994e-05, -3.949180245399475e-05, -3.555417060852051e-05, -3.1616538763046265e-05, -2.767890691757202e-05, -2.374127507209778e-05, -1.9803643226623535e-05, -1.5866011381149292e-05, -1.1928379535675049e-05, -7.990747690200806e-06, -4.0531158447265625e-06, -1.1548399925231934e-07, 3.822147846221924e-06, 7.759779691696167e-06, 1.169741153717041e-05, 1.5635043382644653e-05, 1.9572675228118896e-05, 2.351030707359314e-05, 2.7447938919067383e-05, 3.1385570764541626e-05, 3.532320261001587e-05, 3.926083445549011e-05, 4.3198466300964355e-05, 4.71360981464386e-05, 5.107372999191284e-05, 5.5011361837387085e-05, 5.894899368286133e-05, 6.288662552833557e-05, 6.682425737380981e-05, 7.076188921928406e-05, 7.46995210647583e-05, 7.863715291023254e-05, 8.257478475570679e-05, 8.651241660118103e-05, 9.045004844665527e-05, 9.438768029212952e-05, 9.832531213760376e-05, 0.000102262943983078, 0.00010620057582855225, 0.00011013820767402649, 0.00011407583951950073, 0.00011801347136497498, 0.00012195110321044922]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 5.0, 0.0, 2.0, 7.0, 9.0, 10.0, 7.0, 21.0, 29.0, 48.0, 75.0, 82.0, 150.0, 294.0, 657.0, 1940.0, 10478.0, 245469.0, 764099.0, 20550.0, 2895.0, 848.0, 330.0, 204.0, 111.0, 76.0, 51.0, 37.0, 26.0, 13.0, 13.0, 5.0, 6.0, 6.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38330078125, -0.36742401123046875, -0.3515472412109375, -0.33567047119140625, -0.319793701171875, -0.30391693115234375, -0.2880401611328125, -0.27216339111328125, -0.25628662109375, -0.24040985107421875, -0.2245330810546875, -0.20865631103515625, -0.192779541015625, -0.17690277099609375, -0.1610260009765625, -0.14514923095703125, -0.1292724609375, -0.11339569091796875, -0.0975189208984375, -0.08164215087890625, -0.065765380859375, -0.04988861083984375, -0.0340118408203125, -0.01813507080078125, -0.00225830078125, 0.01361846923828125, 0.0294952392578125, 0.04537200927734375, 0.061248779296875, 0.07712554931640625, 0.0930023193359375, 0.10887908935546875, 0.124755859375, 0.14063262939453125, 0.1565093994140625, 0.17238616943359375, 0.188262939453125, 0.20413970947265625, 0.2200164794921875, 0.23589324951171875, 0.25177001953125, 0.26764678955078125, 0.2835235595703125, 0.29940032958984375, 0.315277099609375, 0.33115386962890625, 0.3470306396484375, 0.36290740966796875, 0.3787841796875, 0.39466094970703125, 0.4105377197265625, 0.42641448974609375, 0.442291259765625, 0.45816802978515625, 0.4740447998046875, 0.48992156982421875, 0.50579833984375, 0.5216751098632812, 0.5375518798828125, 0.5534286499023438, 0.569305419921875, 0.5851821899414062, 0.6010589599609375, 0.6169357299804688, 0.6328125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 7.0, 7.0, 11.0, 24.0, 50.0, 125.0, 345.0, 235.0, 106.0, 45.0, 24.0, 18.0, 7.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.859375, -0.8285675048828125, -0.797760009765625, -0.7669525146484375, -0.73614501953125, -0.7053375244140625, -0.674530029296875, -0.6437225341796875, -0.6129150390625, -0.5821075439453125, -0.551300048828125, -0.5204925537109375, -0.48968505859375, -0.4588775634765625, -0.428070068359375, -0.3972625732421875, -0.366455078125, -0.3356475830078125, -0.304840087890625, -0.2740325927734375, -0.24322509765625, -0.2124176025390625, -0.181610107421875, -0.1508026123046875, -0.1199951171875, -0.0891876220703125, -0.058380126953125, -0.0275726318359375, 0.00323486328125, 0.0340423583984375, 0.064849853515625, 0.0956573486328125, 0.12646484375, 0.1572723388671875, 0.188079833984375, 0.2188873291015625, 0.24969482421875, 0.2805023193359375, 0.311309814453125, 0.3421173095703125, 0.3729248046875, 0.4037322998046875, 0.434539794921875, 0.4653472900390625, 0.49615478515625, 0.5269622802734375, 0.557769775390625, 0.5885772705078125, 0.619384765625, 0.6501922607421875, 0.680999755859375, 0.7118072509765625, 0.74261474609375, 0.7734222412109375, 0.804229736328125, 0.8350372314453125, 0.8658447265625, 0.8966522216796875, 0.927459716796875, 0.9582672119140625, 0.98907470703125, 1.0198822021484375, 1.050689697265625, 1.0814971923828125, 1.1123046875]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 13.0, 118.0, 651.0, 214.0, 16.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-46.49867248535156, -45.67909622192383, -44.85951614379883, -44.039939880371094, -43.22036361694336, -42.400787353515625, -41.581207275390625, -40.76163101196289, -39.942054748535156, -39.12247848510742, -38.30289840698242, -37.48332214355469, -36.66374588012695, -35.84416961669922, -35.02458953857422, -34.205013275146484, -33.38543701171875, -32.565860748291016, -31.74628257751465, -30.92670440673828, -30.107128143310547, -29.28754997253418, -28.467971801757812, -27.648395538330078, -26.828815460205078, -26.00923728942871, -25.189661026000977, -24.37008285522461, -23.550506591796875, -22.730928421020508, -21.91135025024414, -21.091773986816406, -20.272197723388672, -19.452619552612305, -18.63304328918457, -17.813465118408203, -16.99388885498047, -16.1743106842041, -15.35473346710205, -14.53515625, -13.715579986572266, -12.896002769470215, -12.076425552368164, -11.256847381591797, -10.437271118164062, -9.617692947387695, -8.798115730285645, -7.978538513183594, -7.158961296081543, -6.339384078979492, -5.519806861877441, -4.700229167938232, -3.8806519508361816, -3.061074733734131, -2.241497039794922, -1.421919822692871, -0.6023426055908203, 0.21723473072052002, 1.0368120670318604, 1.8563895225524902, 2.675966739654541, 3.495543956756592, 4.315121650695801, 5.134698867797852, 5.954276084899902]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 2.0, 3.0, 7.0, 7.0, 12.0, 11.0, 15.0, 16.0, 27.0, 21.0, 30.0, 26.0, 42.0, 44.0, 45.0, 55.0, 50.0, 67.0, 48.0, 57.0, 47.0, 65.0, 47.0, 45.0, 41.0, 28.0, 29.0, 29.0, 20.0, 12.0, 15.0, 14.0, 7.0, 4.0, 2.0, 5.0, 5.0, 2.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.473816871643066, -5.273499488830566, -5.073182582855225, -4.872865676879883, -4.672548294067383, -4.472230911254883, -4.271914005279541, -4.071597099304199, -3.871279716491699, -3.6709625720977783, -3.4706454277038574, -3.2703282833099365, -3.0700111389160156, -2.8696939945220947, -2.669376850128174, -2.469059705734253, -2.268742561340332, -2.068425416946411, -1.8681082725524902, -1.6677911281585693, -1.4674739837646484, -1.2671568393707275, -1.0668396949768066, -0.8665225505828857, -0.6662054061889648, -0.46588826179504395, -0.26557111740112305, -0.06525397300720215, 0.13506317138671875, 0.33538031578063965, 0.5356974601745605, 0.7360146045684814, 0.9363317489624023, 1.1366488933563232, 1.3369660377502441, 1.537283182144165, 1.737600326538086, 1.9379174709320068, 2.1382346153259277, 2.3385517597198486, 2.5388689041137695, 2.7391860485076904, 2.9395031929016113, 3.1398203372955322, 3.340137481689453, 3.540454626083374, 3.740771770477295, 3.941088914871216, 4.141406059265137, 4.341723442077637, 4.5420403480529785, 4.74235725402832, 4.94267463684082, 5.14299201965332, 5.343308925628662, 5.543625831604004, 5.743943214416504, 5.944260597229004, 6.144577503204346, 6.3448944091796875, 6.5452117919921875, 6.7455291748046875, 6.945846080780029, 7.146162986755371, 7.346480369567871]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 3.0, 4.0, 4.0, 12.0, 18.0, 14.0, 18.0, 35.0, 50.0, 81.0, 122.0, 284.0, 626.0, 1441.0, 3664.0, 12548.0, 153872.0, 3978621.0, 32294.0, 6490.0, 2215.0, 966.0, 405.0, 203.0, 121.0, 67.0, 41.0, 22.0, 16.0, 10.0, 6.0, 2.0, 0.0, 0.0, 3.0, 4.0, 0.0, 0.0, 2.0], "bins": [-1.66015625, -1.6208648681640625, -1.581573486328125, -1.5422821044921875, -1.50299072265625, -1.4636993408203125, -1.424407958984375, -1.3851165771484375, -1.3458251953125, -1.3065338134765625, -1.267242431640625, -1.2279510498046875, -1.18865966796875, -1.1493682861328125, -1.110076904296875, -1.0707855224609375, -1.031494140625, -0.9922027587890625, -0.952911376953125, -0.9136199951171875, -0.87432861328125, -0.8350372314453125, -0.795745849609375, -0.7564544677734375, -0.7171630859375, -0.6778717041015625, -0.638580322265625, -0.5992889404296875, -0.55999755859375, -0.5207061767578125, -0.481414794921875, -0.4421234130859375, -0.40283203125, -0.3635406494140625, -0.324249267578125, -0.2849578857421875, -0.24566650390625, -0.2063751220703125, -0.167083740234375, -0.1277923583984375, -0.0885009765625, -0.0492095947265625, -0.009918212890625, 0.0293731689453125, 0.06866455078125, 0.1079559326171875, 0.147247314453125, 0.1865386962890625, 0.225830078125, 0.2651214599609375, 0.304412841796875, 0.3437042236328125, 0.38299560546875, 0.4222869873046875, 0.461578369140625, 0.5008697509765625, 0.5401611328125, 0.5794525146484375, 0.618743896484375, 0.6580352783203125, 0.69732666015625, 0.7366180419921875, 0.775909423828125, 0.8152008056640625, 0.8544921875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 17.0, 23.0, 31.0, 30.0, 45.0, 61.0, 61.0, 91.0, 88.0, 87.0, 84.0, 77.0, 73.0, 64.0, 52.0, 29.0, 25.0, 18.0, 11.0, 9.0, 5.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.43798828125, -0.42717742919921875, -0.4163665771484375, -0.40555572509765625, -0.394744873046875, -0.38393402099609375, -0.3731231689453125, -0.36231231689453125, -0.35150146484375, -0.34069061279296875, -0.3298797607421875, -0.31906890869140625, -0.308258056640625, -0.29744720458984375, -0.2866363525390625, -0.27582550048828125, -0.2650146484375, -0.25420379638671875, -0.2433929443359375, -0.23258209228515625, -0.221771240234375, -0.21096038818359375, -0.2001495361328125, -0.18933868408203125, -0.17852783203125, -0.16771697998046875, -0.1569061279296875, -0.14609527587890625, -0.135284423828125, -0.12447357177734375, -0.1136627197265625, -0.10285186767578125, -0.092041015625, -0.08123016357421875, -0.0704193115234375, -0.05960845947265625, -0.048797607421875, -0.03798675537109375, -0.0271759033203125, -0.01636505126953125, -0.00555419921875, 0.00525665283203125, 0.0160675048828125, 0.02687835693359375, 0.037689208984375, 0.04850006103515625, 0.0593109130859375, 0.07012176513671875, 0.0809326171875, 0.09174346923828125, 0.1025543212890625, 0.11336517333984375, 0.124176025390625, 0.13498687744140625, 0.1457977294921875, 0.15660858154296875, 0.16741943359375, 0.17823028564453125, 0.1890411376953125, 0.19985198974609375, 0.210662841796875, 0.22147369384765625, 0.2322845458984375, 0.24309539794921875, 0.25390625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 6.0, 9.0, 19.0, 20.0, 55.0, 94.0, 177.0, 301.0, 614.0, 1309.0, 3906.0, 22702.0, 3844786.0, 302997.0, 12557.0, 2611.0, 1054.0, 468.0, 263.0, 148.0, 86.0, 47.0, 29.0, 10.0, 9.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8359375, -0.7958526611328125, -0.755767822265625, -0.7156829833984375, -0.67559814453125, -0.6355133056640625, -0.595428466796875, -0.5553436279296875, -0.5152587890625, -0.4751739501953125, -0.435089111328125, -0.3950042724609375, -0.35491943359375, -0.3148345947265625, -0.274749755859375, -0.2346649169921875, -0.194580078125, -0.1544952392578125, -0.114410400390625, -0.0743255615234375, -0.03424072265625, 0.0058441162109375, 0.045928955078125, 0.0860137939453125, 0.1260986328125, 0.1661834716796875, 0.206268310546875, 0.2463531494140625, 0.28643798828125, 0.3265228271484375, 0.366607666015625, 0.4066925048828125, 0.44677734375, 0.4868621826171875, 0.526947021484375, 0.5670318603515625, 0.60711669921875, 0.6472015380859375, 0.687286376953125, 0.7273712158203125, 0.7674560546875, 0.8075408935546875, 0.847625732421875, 0.8877105712890625, 0.92779541015625, 0.9678802490234375, 1.007965087890625, 1.0480499267578125, 1.088134765625, 1.1282196044921875, 1.168304443359375, 1.2083892822265625, 1.24847412109375, 1.2885589599609375, 1.328643798828125, 1.3687286376953125, 1.4088134765625, 1.4488983154296875, 1.488983154296875, 1.5290679931640625, 1.56915283203125, 1.6092376708984375, 1.649322509765625, 1.6894073486328125, 1.7294921875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 5.0, 12.0, 9.0, 12.0, 25.0, 33.0, 56.0, 116.0, 565.0, 2773.0, 262.0, 78.0, 42.0, 30.0, 16.0, 11.0, 10.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.372802734375, -0.3560752868652344, -0.33934783935546875, -0.3226203918457031, -0.3058929443359375, -0.2891654968261719, -0.27243804931640625, -0.2557106018066406, -0.238983154296875, -0.22225570678710938, -0.20552825927734375, -0.18880081176757812, -0.1720733642578125, -0.15534591674804688, -0.13861846923828125, -0.12189102172851562, -0.10516357421875, -0.08843612670898438, -0.07170867919921875, -0.054981231689453125, -0.0382537841796875, -0.021526336669921875, -0.00479888916015625, 0.011928558349609375, 0.028656005859375, 0.045383453369140625, 0.06211090087890625, 0.07883834838867188, 0.0955657958984375, 0.11229324340820312, 0.12902069091796875, 0.14574813842773438, 0.1624755859375, 0.17920303344726562, 0.19593048095703125, 0.21265792846679688, 0.2293853759765625, 0.24611282348632812, 0.26284027099609375, 0.2795677185058594, 0.296295166015625, 0.3130226135253906, 0.32975006103515625, 0.3464775085449219, 0.3632049560546875, 0.3799324035644531, 0.39665985107421875, 0.4133872985839844, 0.43011474609375, 0.4468421936035156, 0.46356964111328125, 0.4802970886230469, 0.4970245361328125, 0.5137519836425781, 0.5304794311523438, 0.5472068786621094, 0.563934326171875, 0.5806617736816406, 0.5973892211914062, 0.6141166687011719, 0.6308441162109375, 0.6475715637207031, 0.6642990112304688, 0.6810264587402344, 0.69775390625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 4.0, 7.0, 17.0, 39.0, 104.0, 211.0, 306.0, 181.0, 91.0, 29.0, 13.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2857009172439575, -1.1956744194030762, -1.1056480407714844, -1.0156216621398926, -0.9255951642990112, -0.8355687260627747, -0.7455422878265381, -0.6555158495903015, -0.5654894113540649, -0.47546297311782837, -0.3854365348815918, -0.2954100966453552, -0.20538365840911865, -0.11535722017288208, -0.025330781936645508, 0.06469565629959106, 0.15472209453582764, 0.2447485327720642, 0.3347749710083008, 0.42480140924453735, 0.5148278474807739, 0.6048542857170105, 0.6948807239532471, 0.7849071621894836, 0.8749336004257202, 0.9649600386619568, 1.0549864768981934, 1.1450128555297852, 1.2350393533706665, 1.3250658512115479, 1.4150922298431396, 1.5051186084747314, 1.5951452255249023, 1.6851716041564941, 1.7751981019973755, 1.8652245998382568, 1.9552509784698486, 2.0452773571014404, 2.1353039741516113, 2.225330352783203, 2.315356731414795, 2.4053831100463867, 2.4954094886779785, 2.5854361057281494, 2.675462484359741, 2.765488862991333, 2.855515480041504, 2.9455418586730957, 3.0355682373046875, 3.1255946159362793, 3.215620994567871, 3.305647611618042, 3.395673990249634, 3.4857003688812256, 3.5757269859313965, 3.6657533645629883, 3.75577974319458, 3.845806121826172, 3.9358325004577637, 4.0258588790893555, 4.1158857345581055, 4.205912113189697, 4.295938491821289, 4.385964870452881, 4.475991249084473]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 4.0, 1.0, 5.0, 6.0, 8.0, 3.0, 8.0, 7.0, 11.0, 20.0, 18.0, 19.0, 32.0, 33.0, 31.0, 44.0, 30.0, 56.0, 47.0, 52.0, 60.0, 51.0, 45.0, 45.0, 44.0, 46.0, 39.0, 46.0, 24.0, 32.0, 29.0, 22.0, 10.0, 13.0, 25.0, 13.0, 10.0, 13.0, 6.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-1.5787252187728882, -1.5397706031799316, -1.5008161067962646, -1.461861491203308, -1.4229069948196411, -1.3839523792266846, -1.3449978828430176, -1.306043267250061, -1.2670886516571045, -1.228134036064148, -1.189179539680481, -1.1502249240875244, -1.1112704277038574, -1.0723158121109009, -1.0333613157272339, -0.9944067001342773, -0.9554522037506104, -0.9164976477622986, -0.8775430917739868, -0.838588535785675, -0.7996339797973633, -0.7606793642044067, -0.721724808216095, -0.6827702522277832, -0.6438156962394714, -0.6048611402511597, -0.5659065842628479, -0.5269520282745361, -0.487997442483902, -0.4490428864955902, -0.41008830070495605, -0.3711337447166443, -0.3321792483329773, -0.2932246923446655, -0.25427013635635376, -0.2153155505657196, -0.17636099457740784, -0.13740643858909607, -0.09845186769962311, -0.059497296810150146, -0.02054274082183838, 0.018411822617053986, 0.05736638605594635, 0.09632094949483871, 0.13527551293373108, 0.17423006892204285, 0.2131846398115158, 0.25213921070098877, 0.29109376668930054, 0.3300483226776123, 0.3690028786659241, 0.4079574644565582, 0.44691202044487, 0.48586657643318176, 0.5248211622238159, 0.5637757182121277, 0.6027302742004395, 0.6416848301887512, 0.680639386177063, 0.7195939421653748, 0.7585484981536865, 0.7975031137466431, 0.8364576697349548, 0.8754122257232666, 0.9143667817115784]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 11.0, 4.0, 15.0, 8.0, 18.0, 19.0, 37.0, 62.0, 103.0, 191.0, 328.0, 716.0, 1589.0, 3759.0, 12311.0, 70744.0, 676067.0, 244144.0, 27304.0, 6528.0, 2455.0, 1059.0, 485.0, 236.0, 138.0, 80.0, 53.0, 30.0, 16.0, 16.0, 9.0, 2.0, 6.0, 1.0, 5.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8935546875, -0.861358642578125, -0.82916259765625, -0.796966552734375, -0.7647705078125, -0.732574462890625, -0.70037841796875, -0.668182373046875, -0.635986328125, -0.603790283203125, -0.57159423828125, -0.539398193359375, -0.5072021484375, -0.475006103515625, -0.44281005859375, -0.410614013671875, -0.37841796875, -0.346221923828125, -0.31402587890625, -0.281829833984375, -0.2496337890625, -0.217437744140625, -0.18524169921875, -0.153045654296875, -0.120849609375, -0.088653564453125, -0.05645751953125, -0.024261474609375, 0.0079345703125, 0.040130615234375, 0.07232666015625, 0.104522705078125, 0.13671875, 0.168914794921875, 0.20111083984375, 0.233306884765625, 0.2655029296875, 0.297698974609375, 0.32989501953125, 0.362091064453125, 0.394287109375, 0.426483154296875, 0.45867919921875, 0.490875244140625, 0.5230712890625, 0.555267333984375, 0.58746337890625, 0.619659423828125, 0.65185546875, 0.684051513671875, 0.71624755859375, 0.748443603515625, 0.7806396484375, 0.812835693359375, 0.84503173828125, 0.877227783203125, 0.909423828125, 0.941619873046875, 0.97381591796875, 1.006011962890625, 1.0382080078125, 1.070404052734375, 1.10260009765625, 1.134796142578125, 1.1669921875]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 8.0, 10.0, 11.0, 31.0, 30.0, 35.0, 43.0, 64.0, 68.0, 81.0, 93.0, 100.0, 77.0, 82.0, 64.0, 50.0, 52.0, 29.0, 24.0, 20.0, 15.0, 3.0, 3.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.43115234375, -0.4204597473144531, -0.40976715087890625, -0.3990745544433594, -0.3883819580078125, -0.3776893615722656, -0.36699676513671875, -0.3563041687011719, -0.345611572265625, -0.3349189758300781, -0.32422637939453125, -0.3135337829589844, -0.3028411865234375, -0.2921485900878906, -0.28145599365234375, -0.2707633972167969, -0.26007080078125, -0.24937820434570312, -0.23868560791015625, -0.22799301147460938, -0.2173004150390625, -0.20660781860351562, -0.19591522216796875, -0.18522262573242188, -0.174530029296875, -0.16383743286132812, -0.15314483642578125, -0.14245223999023438, -0.1317596435546875, -0.12106704711914062, -0.11037445068359375, -0.09968185424804688, -0.0889892578125, -0.07829666137695312, -0.06760406494140625, -0.056911468505859375, -0.0462188720703125, -0.035526275634765625, -0.02483367919921875, -0.014141082763671875, -0.003448486328125, 0.007244110107421875, 0.01793670654296875, 0.028629302978515625, 0.0393218994140625, 0.050014495849609375, 0.06070709228515625, 0.07139968872070312, 0.08209228515625, 0.09278488159179688, 0.10347747802734375, 0.11417007446289062, 0.1248626708984375, 0.13555526733398438, 0.14624786376953125, 0.15694046020507812, 0.167633056640625, 0.17832565307617188, 0.18901824951171875, 0.19971084594726562, 0.2104034423828125, 0.22109603881835938, 0.23178863525390625, 0.24248123168945312, 0.253173828125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 8.0, 8.0, 5.0, 17.0, 14.0, 30.0, 33.0, 77.0, 137.0, 212.0, 420.0, 960.0, 2697.0, 9668.0, 63565.0, 769097.0, 176405.0, 18279.0, 4269.0, 1344.0, 590.0, 282.0, 154.0, 97.0, 70.0, 32.0, 23.0, 16.0, 12.0, 8.0, 8.0, 5.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.16796875, -1.129913330078125, -1.09185791015625, -1.053802490234375, -1.0157470703125, -0.977691650390625, -0.93963623046875, -0.901580810546875, -0.863525390625, -0.825469970703125, -0.78741455078125, -0.749359130859375, -0.7113037109375, -0.673248291015625, -0.63519287109375, -0.597137451171875, -0.55908203125, -0.521026611328125, -0.48297119140625, -0.444915771484375, -0.4068603515625, -0.368804931640625, -0.33074951171875, -0.292694091796875, -0.254638671875, -0.216583251953125, -0.17852783203125, -0.140472412109375, -0.1024169921875, -0.064361572265625, -0.02630615234375, 0.011749267578125, 0.0498046875, 0.087860107421875, 0.12591552734375, 0.163970947265625, 0.2020263671875, 0.240081787109375, 0.27813720703125, 0.316192626953125, 0.354248046875, 0.392303466796875, 0.43035888671875, 0.468414306640625, 0.5064697265625, 0.544525146484375, 0.58258056640625, 0.620635986328125, 0.65869140625, 0.696746826171875, 0.73480224609375, 0.772857666015625, 0.8109130859375, 0.848968505859375, 0.88702392578125, 0.925079345703125, 0.963134765625, 1.001190185546875, 1.03924560546875, 1.077301025390625, 1.1153564453125, 1.153411865234375, 1.19146728515625, 1.229522705078125, 1.267578125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 8.0, 8.0, 8.0, 13.0, 16.0, 23.0, 31.0, 19.0, 50.0, 37.0, 64.0, 56.0, 68.0, 58.0, 70.0, 69.0, 60.0, 51.0, 62.0, 38.0, 36.0, 32.0, 23.0, 19.0, 12.0, 19.0, 13.0, 6.0, 9.0, 7.0, 3.0, 5.0, 0.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.349609375, -1.298492431640625, -1.24737548828125, -1.196258544921875, -1.1451416015625, -1.094024658203125, -1.04290771484375, -0.991790771484375, -0.940673828125, -0.889556884765625, -0.83843994140625, -0.787322998046875, -0.7362060546875, -0.685089111328125, -0.63397216796875, -0.582855224609375, -0.53173828125, -0.480621337890625, -0.42950439453125, -0.378387451171875, -0.3272705078125, -0.276153564453125, -0.22503662109375, -0.173919677734375, -0.122802734375, -0.071685791015625, -0.02056884765625, 0.030548095703125, 0.0816650390625, 0.132781982421875, 0.18389892578125, 0.235015869140625, 0.2861328125, 0.337249755859375, 0.38836669921875, 0.439483642578125, 0.4906005859375, 0.541717529296875, 0.59283447265625, 0.643951416015625, 0.695068359375, 0.746185302734375, 0.79730224609375, 0.848419189453125, 0.8995361328125, 0.950653076171875, 1.00177001953125, 1.052886962890625, 1.10400390625, 1.155120849609375, 1.20623779296875, 1.257354736328125, 1.3084716796875, 1.359588623046875, 1.41070556640625, 1.461822509765625, 1.512939453125, 1.564056396484375, 1.61517333984375, 1.666290283203125, 1.7174072265625, 1.768524169921875, 1.81964111328125, 1.870758056640625, 1.921875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 7.0, 11.0, 15.0, 12.0, 29.0, 45.0, 69.0, 100.0, 159.0, 304.0, 617.0, 1398.0, 3674.0, 16521.0, 950333.0, 64960.0, 6433.0, 2029.0, 854.0, 417.0, 205.0, 133.0, 78.0, 55.0, 32.0, 19.0, 23.0, 7.0, 9.0, 9.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6787109375, -1.63299560546875, -1.5872802734375, -1.54156494140625, -1.495849609375, -1.45013427734375, -1.4044189453125, -1.35870361328125, -1.31298828125, -1.26727294921875, -1.2215576171875, -1.17584228515625, -1.130126953125, -1.08441162109375, -1.0386962890625, -0.99298095703125, -0.947265625, -0.90155029296875, -0.8558349609375, -0.81011962890625, -0.764404296875, -0.71868896484375, -0.6729736328125, -0.62725830078125, -0.58154296875, -0.53582763671875, -0.4901123046875, -0.44439697265625, -0.398681640625, -0.35296630859375, -0.3072509765625, -0.26153564453125, -0.2158203125, -0.17010498046875, -0.1243896484375, -0.07867431640625, -0.032958984375, 0.01275634765625, 0.0584716796875, 0.10418701171875, 0.14990234375, 0.19561767578125, 0.2413330078125, 0.28704833984375, 0.332763671875, 0.37847900390625, 0.4241943359375, 0.46990966796875, 0.515625, 0.56134033203125, 0.6070556640625, 0.65277099609375, 0.698486328125, 0.74420166015625, 0.7899169921875, 0.83563232421875, 0.88134765625, 0.92706298828125, 0.9727783203125, 1.01849365234375, 1.064208984375, 1.10992431640625, 1.1556396484375, 1.20135498046875, 1.2470703125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 11.0, 15.0, 21.0, 55.0, 56.0, 60.0, 106.0, 136.0, 120.0, 101.0, 89.0, 62.0, 42.0, 41.0, 23.0, 20.0, 10.0, 8.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00011873245239257812, -0.00011389702558517456, -0.000109061598777771, -0.00010422617197036743, -9.939074516296387e-05, -9.45553183555603e-05, -8.971989154815674e-05, -8.488446474075317e-05, -8.004903793334961e-05, -7.521361112594604e-05, -7.037818431854248e-05, -6.554275751113892e-05, -6.070733070373535e-05, -5.587190389633179e-05, -5.103647708892822e-05, -4.620105028152466e-05, -4.1365623474121094e-05, -3.653019666671753e-05, -3.1694769859313965e-05, -2.68593430519104e-05, -2.2023916244506836e-05, -1.718848943710327e-05, -1.2353062629699707e-05, -7.517635822296143e-06, -2.682209014892578e-06, 2.1532177925109863e-06, 6.988644599914551e-06, 1.1824071407318115e-05, 1.665949821472168e-05, 2.1494925022125244e-05, 2.633035182952881e-05, 3.116577863693237e-05, 3.600120544433594e-05, 4.08366322517395e-05, 4.5672059059143066e-05, 5.050748586654663e-05, 5.5342912673950195e-05, 6.017833948135376e-05, 6.501376628875732e-05, 6.984919309616089e-05, 7.468461990356445e-05, 7.952004671096802e-05, 8.435547351837158e-05, 8.919090032577515e-05, 9.402632713317871e-05, 9.886175394058228e-05, 0.00010369718074798584, 0.0001085326075553894, 0.00011336803436279297, 0.00011820346117019653, 0.0001230388879776001, 0.00012787431478500366, 0.00013270974159240723, 0.0001375451683998108, 0.00014238059520721436, 0.00014721602201461792, 0.00015205144882202148, 0.00015688687562942505, 0.0001617223024368286, 0.00016655772924423218, 0.00017139315605163574, 0.0001762285828590393, 0.00018106400966644287, 0.00018589943647384644, 0.00019073486328125]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 10.0, 13.0, 19.0, 38.0, 55.0, 117.0, 212.0, 507.0, 1928.0, 13361.0, 970367.0, 56809.0, 3719.0, 770.0, 298.0, 150.0, 88.0, 42.0, 24.0, 12.0, 5.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6298828125, -1.582916259765625, -1.53594970703125, -1.488983154296875, -1.4420166015625, -1.395050048828125, -1.34808349609375, -1.301116943359375, -1.254150390625, -1.207183837890625, -1.16021728515625, -1.113250732421875, -1.0662841796875, -1.019317626953125, -0.97235107421875, -0.925384521484375, -0.87841796875, -0.831451416015625, -0.78448486328125, -0.737518310546875, -0.6905517578125, -0.643585205078125, -0.59661865234375, -0.549652099609375, -0.502685546875, -0.455718994140625, -0.40875244140625, -0.361785888671875, -0.3148193359375, -0.267852783203125, -0.22088623046875, -0.173919677734375, -0.126953125, -0.079986572265625, -0.03302001953125, 0.013946533203125, 0.0609130859375, 0.107879638671875, 0.15484619140625, 0.201812744140625, 0.248779296875, 0.295745849609375, 0.34271240234375, 0.389678955078125, 0.4366455078125, 0.483612060546875, 0.53057861328125, 0.577545166015625, 0.62451171875, 0.671478271484375, 0.71844482421875, 0.765411376953125, 0.8123779296875, 0.859344482421875, 0.90631103515625, 0.953277587890625, 1.000244140625, 1.047210693359375, 1.09417724609375, 1.141143798828125, 1.1881103515625, 1.235076904296875, 1.28204345703125, 1.329010009765625, 1.3759765625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 5.0, 8.0, 12.0, 26.0, 56.0, 132.0, 467.0, 185.0, 53.0, 19.0, 14.0, 5.0, 8.0, 5.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.287109375, -2.2210235595703125, -2.154937744140625, -2.0888519287109375, -2.02276611328125, -1.9566802978515625, -1.890594482421875, -1.8245086669921875, -1.7584228515625, -1.6923370361328125, -1.626251220703125, -1.5601654052734375, -1.49407958984375, -1.4279937744140625, -1.361907958984375, -1.2958221435546875, -1.229736328125, -1.1636505126953125, -1.097564697265625, -1.0314788818359375, -0.96539306640625, -0.8993072509765625, -0.833221435546875, -0.7671356201171875, -0.7010498046875, -0.6349639892578125, -0.568878173828125, -0.5027923583984375, -0.43670654296875, -0.3706207275390625, -0.304534912109375, -0.2384490966796875, -0.17236328125, -0.1062774658203125, -0.040191650390625, 0.0258941650390625, 0.09197998046875, 0.1580657958984375, 0.224151611328125, 0.2902374267578125, 0.3563232421875, 0.4224090576171875, 0.488494873046875, 0.5545806884765625, 0.62066650390625, 0.6867523193359375, 0.752838134765625, 0.8189239501953125, 0.885009765625, 0.9510955810546875, 1.017181396484375, 1.0832672119140625, 1.14935302734375, 1.2154388427734375, 1.281524658203125, 1.3476104736328125, 1.4136962890625, 1.4797821044921875, 1.545867919921875, 1.6119537353515625, 1.67803955078125, 1.7441253662109375, 1.810211181640625, 1.8762969970703125, 1.9423828125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 5.0, 12.0, 90.0, 496.0, 372.0, 37.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.260047912597656, -39.19731903076172, -38.13459014892578, -37.07185745239258, -36.00912857055664, -34.9463996887207, -33.8836669921875, -32.82093811035156, -31.758209228515625, -30.695480346679688, -29.632749557495117, -28.570018768310547, -27.50728988647461, -26.444561004638672, -25.3818302154541, -24.31909942626953, -23.256370544433594, -22.193641662597656, -21.130910873413086, -20.068180084228516, -19.005451202392578, -17.94272232055664, -16.87999153137207, -15.817261695861816, -14.754531860351562, -13.691802024841309, -12.629072189331055, -11.5663423538208, -10.503612518310547, -9.440882682800293, -8.378152847290039, -7.315423011779785, -6.252689361572266, -5.189959526062012, -4.127229690551758, -3.064499855041504, -2.00177001953125, -0.9390401840209961, 0.12368965148925781, 1.1864194869995117, 2.2491493225097656, 3.3118791580200195, 4.374608993530273, 5.437338829040527, 6.500068664550781, 7.562798500061035, 8.625528335571289, 9.688258171081543, 10.750988006591797, 11.81371784210205, 12.876447677612305, 13.939177513122559, 15.001907348632812, 16.06463623046875, 17.12736701965332, 18.19009780883789, 19.252826690673828, 20.315555572509766, 21.378286361694336, 22.441017150878906, 23.503746032714844, 24.56647491455078, 25.62920570373535, 26.691936492919922, 27.75466537475586]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 5.0, 7.0, 13.0, 20.0, 16.0, 18.0, 32.0, 31.0, 31.0, 40.0, 42.0, 49.0, 45.0, 53.0, 52.0, 51.0, 58.0, 48.0, 47.0, 36.0, 38.0, 33.0, 35.0, 31.0, 32.0, 20.0, 17.0, 13.0, 17.0, 16.0, 8.0, 13.0, 5.0, 9.0, 2.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-8.110275268554688, -7.8624725341796875, -7.6146697998046875, -7.3668670654296875, -7.119063854217529, -6.871261119842529, -6.623458385467529, -6.375655651092529, -6.127852439880371, -5.880049705505371, -5.632246971130371, -5.384444236755371, -5.136641025543213, -4.888838291168213, -4.641035556793213, -4.393232822418213, -4.145430088043213, -3.897627353668213, -3.649824380874634, -3.402021646499634, -3.1542186737060547, -2.9064159393310547, -2.6586132049560547, -2.4108104705810547, -2.1630074977874756, -1.915204644203186, -1.6674017906188965, -1.4195990562438965, -1.171796202659607, -0.9239933490753174, -0.6761906147003174, -0.42838776111602783, -0.18058538436889648, 0.06721743941307068, 0.31502026319503784, 0.5628230571746826, 0.8106259107589722, 1.0584287643432617, 1.3062314987182617, 1.5540343523025513, 1.8018372058868408, 2.049639940261841, 2.29744291305542, 2.54524564743042, 2.79304838180542, 3.040851354598999, 3.288654088973999, 3.536457061767578, 3.784259796142578, 4.032062530517578, 4.279865264892578, 4.527667999267578, 4.775471210479736, 5.023273944854736, 5.271076679229736, 5.518879413604736, 5.7666826248168945, 6.0144853591918945, 6.2622880935668945, 6.5100908279418945, 6.757894039154053, 7.005696773529053, 7.253499507904053, 7.501302242279053, 7.749104976654053]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 7.0, 6.0, 7.0, 5.0, 6.0, 20.0, 10.0, 18.0, 20.0, 37.0, 48.0, 79.0, 94.0, 150.0, 238.0, 476.0, 931.0, 2397.0, 8331.0, 75155.0, 4067414.0, 29846.0, 5377.0, 1757.0, 746.0, 422.0, 216.0, 139.0, 92.0, 67.0, 42.0, 36.0, 22.0, 15.0, 13.0, 15.0, 9.0, 7.0, 6.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3701171875, -1.3302154541015625, -1.290313720703125, -1.2504119873046875, -1.21051025390625, -1.1706085205078125, -1.130706787109375, -1.0908050537109375, -1.0509033203125, -1.0110015869140625, -0.971099853515625, -0.9311981201171875, -0.89129638671875, -0.8513946533203125, -0.811492919921875, -0.7715911865234375, -0.731689453125, -0.6917877197265625, -0.651885986328125, -0.6119842529296875, -0.57208251953125, -0.5321807861328125, -0.492279052734375, -0.4523773193359375, -0.4124755859375, -0.3725738525390625, -0.332672119140625, -0.2927703857421875, -0.25286865234375, -0.2129669189453125, -0.173065185546875, -0.1331634521484375, -0.09326171875, -0.0533599853515625, -0.013458251953125, 0.0264434814453125, 0.06634521484375, 0.1062469482421875, 0.146148681640625, 0.1860504150390625, 0.2259521484375, 0.2658538818359375, 0.305755615234375, 0.3456573486328125, 0.38555908203125, 0.4254608154296875, 0.465362548828125, 0.5052642822265625, 0.545166015625, 0.5850677490234375, 0.624969482421875, 0.6648712158203125, 0.70477294921875, 0.7446746826171875, 0.784576416015625, 0.8244781494140625, 0.8643798828125, 0.9042816162109375, 0.944183349609375, 0.9840850830078125, 1.02398681640625, 1.0638885498046875, 1.103790283203125, 1.1436920166015625, 1.18359375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 7.0, 14.0, 13.0, 21.0, 39.0, 43.0, 67.0, 71.0, 83.0, 86.0, 67.0, 77.0, 71.0, 63.0, 69.0, 48.0, 45.0, 30.0, 17.0, 11.0, 12.0, 8.0, 14.0, 4.0, 5.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.413818359375, -0.4015388488769531, -0.38925933837890625, -0.3769798278808594, -0.3647003173828125, -0.3524208068847656, -0.34014129638671875, -0.3278617858886719, -0.315582275390625, -0.3033027648925781, -0.29102325439453125, -0.2787437438964844, -0.2664642333984375, -0.2541847229003906, -0.24190521240234375, -0.22962570190429688, -0.21734619140625, -0.20506668090820312, -0.19278717041015625, -0.18050765991210938, -0.1682281494140625, -0.15594863891601562, -0.14366912841796875, -0.13138961791992188, -0.119110107421875, -0.10683059692382812, -0.09455108642578125, -0.08227157592773438, -0.0699920654296875, -0.057712554931640625, -0.04543304443359375, -0.033153533935546875, -0.0208740234375, -0.008594512939453125, 0.00368499755859375, 0.015964508056640625, 0.0282440185546875, 0.040523529052734375, 0.05280303955078125, 0.06508255004882812, 0.077362060546875, 0.08964157104492188, 0.10192108154296875, 0.11420059204101562, 0.1264801025390625, 0.13875961303710938, 0.15103912353515625, 0.16331863403320312, 0.17559814453125, 0.18787765502929688, 0.20015716552734375, 0.21243667602539062, 0.2247161865234375, 0.23699569702148438, 0.24927520751953125, 0.2615547180175781, 0.273834228515625, 0.2861137390136719, 0.29839324951171875, 0.3106727600097656, 0.3229522705078125, 0.3352317810058594, 0.34751129150390625, 0.3597908020019531, 0.3720703125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 15.0, 17.0, 13.0, 21.0, 26.0, 52.0, 70.0, 120.0, 170.0, 265.0, 444.0, 811.0, 1595.0, 3406.0, 8321.0, 44207.0, 4043424.0, 72916.0, 10379.0, 3830.0, 1819.0, 970.0, 532.0, 367.0, 146.0, 116.0, 65.0, 45.0, 44.0, 28.0, 23.0, 13.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8740234375, -0.839874267578125, -0.80572509765625, -0.771575927734375, -0.7374267578125, -0.703277587890625, -0.66912841796875, -0.634979248046875, -0.600830078125, -0.566680908203125, -0.53253173828125, -0.498382568359375, -0.4642333984375, -0.430084228515625, -0.39593505859375, -0.361785888671875, -0.32763671875, -0.293487548828125, -0.25933837890625, -0.225189208984375, -0.1910400390625, -0.156890869140625, -0.12274169921875, -0.088592529296875, -0.054443359375, -0.020294189453125, 0.01385498046875, 0.048004150390625, 0.0821533203125, 0.116302490234375, 0.15045166015625, 0.184600830078125, 0.21875, 0.252899169921875, 0.28704833984375, 0.321197509765625, 0.3553466796875, 0.389495849609375, 0.42364501953125, 0.457794189453125, 0.491943359375, 0.526092529296875, 0.56024169921875, 0.594390869140625, 0.6285400390625, 0.662689208984375, 0.69683837890625, 0.730987548828125, 0.76513671875, 0.799285888671875, 0.83343505859375, 0.867584228515625, 0.9017333984375, 0.935882568359375, 0.97003173828125, 1.004180908203125, 1.038330078125, 1.072479248046875, 1.10662841796875, 1.140777587890625, 1.1749267578125, 1.209075927734375, 1.24322509765625, 1.277374267578125, 1.3115234375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 1.0, 4.0, 4.0, 9.0, 12.0, 22.0, 42.0, 123.0, 3426.0, 318.0, 44.0, 27.0, 14.0, 7.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.265869140625, -0.2566413879394531, -0.24741363525390625, -0.23818588256835938, -0.2289581298828125, -0.21973037719726562, -0.21050262451171875, -0.20127487182617188, -0.192047119140625, -0.18281936645507812, -0.17359161376953125, -0.16436386108398438, -0.1551361083984375, -0.14590835571289062, -0.13668060302734375, -0.12745285034179688, -0.11822509765625, -0.10899734497070312, -0.09976959228515625, -0.09054183959960938, -0.0813140869140625, -0.07208633422851562, -0.06285858154296875, -0.053630828857421875, -0.044403076171875, -0.035175323486328125, -0.02594757080078125, -0.016719818115234375, -0.0074920654296875, 0.001735687255859375, 0.01096343994140625, 0.020191192626953125, 0.0294189453125, 0.038646697998046875, 0.04787445068359375, 0.057102203369140625, 0.0663299560546875, 0.07555770874023438, 0.08478546142578125, 0.09401321411132812, 0.103240966796875, 0.11246871948242188, 0.12169647216796875, 0.13092422485351562, 0.1401519775390625, 0.14937973022460938, 0.15860748291015625, 0.16783523559570312, 0.17706298828125, 0.18629074096679688, 0.19551849365234375, 0.20474624633789062, 0.2139739990234375, 0.22320175170898438, 0.23242950439453125, 0.24165725708007812, 0.250885009765625, 0.2601127624511719, 0.26934051513671875, 0.2785682678222656, 0.2877960205078125, 0.2970237731933594, 0.30625152587890625, 0.3154792785644531, 0.32470703125]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 11.0, 93.0, 386.0, 430.0, 74.0, 9.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9047476649284363, -0.8055824041366577, -0.7064172029495239, -0.6072519421577454, -0.5080866813659668, -0.408921480178833, -0.30975621938705444, -0.21059101819992065, -0.11142575740814209, -0.012260518968105316, 0.08690471947193146, 0.18606996536254883, 0.285235196352005, 0.3844004273414612, 0.48356568813323975, 0.5827308893203735, 0.6818961501121521, 0.7810614109039307, 0.8802266120910645, 0.979391872882843, 1.0785571336746216, 1.1777223348617554, 1.2768876552581787, 1.3760528564453125, 1.4752180576324463, 1.57438325881958, 1.6735485792160034, 1.7727137804031372, 1.871878981590271, 1.9710443019866943, 2.070209503173828, 2.169374704360962, 2.268540143966675, 2.3677053451538086, 2.4668705463409424, 2.566035747528076, 2.665201187133789, 2.764366388320923, 2.8635315895080566, 2.9626967906951904, 3.061861991882324, 3.161027193069458, 3.260192394256592, 3.3593578338623047, 3.4585230350494385, 3.5576882362365723, 3.656853437423706, 3.75601863861084, 3.8551840782165527, 3.9543492794036865, 4.05351448059082, 4.152679920196533, 4.251844882965088, 4.351010322570801, 4.4501752853393555, 4.549340724945068, 4.648505687713623, 4.747671127319336, 4.846836090087891, 4.9460015296936035, 5.045166492462158, 5.144331932067871, 5.243496894836426, 5.342662334442139, 5.441827774047852]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 5.0, 4.0, 8.0, 5.0, 8.0, 13.0, 19.0, 21.0, 23.0, 18.0, 28.0, 24.0, 39.0, 39.0, 48.0, 41.0, 42.0, 57.0, 45.0, 56.0, 50.0, 32.0, 46.0, 45.0, 41.0, 36.0, 42.0, 36.0, 33.0, 23.0, 18.0, 20.0, 7.0, 12.0, 6.0, 4.0, 6.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7838696241378784, -0.7628446817398071, -0.7418197393417358, -0.7207947373390198, -0.6997697949409485, -0.6787448525428772, -0.6577199101448059, -0.6366949081420898, -0.6156699657440186, -0.5946450233459473, -0.573620080947876, -0.5525950789451599, -0.5315701365470886, -0.5105451941490173, -0.48952025175094604, -0.46849527955055237, -0.4474703371524811, -0.4264453947544098, -0.4054204225540161, -0.3843954801559448, -0.36337050795555115, -0.34234556555747986, -0.3213205933570862, -0.3002956509590149, -0.2792707085609436, -0.2582457661628723, -0.23722079396247864, -0.21619585156440735, -0.19517087936401367, -0.17414593696594238, -0.1531209796667099, -0.13209602236747742, -0.11107105016708374, -0.09004609286785126, -0.06902113556861877, -0.04799618571996689, -0.026971228420734406, -0.005946271121501923, 0.015078678727149963, 0.036103636026382446, 0.05712859332561493, 0.07815355062484741, 0.0991785079240799, 0.12020345777273178, 0.14122840762138367, 0.16225337982177734, 0.18327832221984863, 0.20430327951908112, 0.2253282368183136, 0.24635319411754608, 0.26737815141677856, 0.28840309381484985, 0.30942806601524353, 0.3304530084133148, 0.3514779806137085, 0.3725029230117798, 0.3935278654098511, 0.41455280780792236, 0.43557778000831604, 0.45660272240638733, 0.477627694606781, 0.4986526370048523, 0.5196775794029236, 0.5407025814056396, 0.5617275238037109]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 9.0, 1.0, 3.0, 6.0, 8.0, 13.0, 22.0, 45.0, 65.0, 96.0, 197.0, 407.0, 980.0, 2568.0, 8232.0, 34936.0, 194800.0, 573313.0, 186868.0, 33568.0, 8062.0, 2539.0, 924.0, 434.0, 180.0, 106.0, 70.0, 36.0, 22.0, 13.0, 14.0, 8.0, 7.0, 4.0, 2.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.8804473876953125, -0.854156494140625, -0.8278656005859375, -0.80157470703125, -0.7752838134765625, -0.748992919921875, -0.7227020263671875, -0.6964111328125, -0.6701202392578125, -0.643829345703125, -0.6175384521484375, -0.59124755859375, -0.5649566650390625, -0.538665771484375, -0.5123748779296875, -0.486083984375, -0.4597930908203125, -0.433502197265625, -0.4072113037109375, -0.38092041015625, -0.3546295166015625, -0.328338623046875, -0.3020477294921875, -0.2757568359375, -0.2494659423828125, -0.223175048828125, -0.1968841552734375, -0.17059326171875, -0.1443023681640625, -0.118011474609375, -0.0917205810546875, -0.0654296875, -0.0391387939453125, -0.012847900390625, 0.0134429931640625, 0.03973388671875, 0.0660247802734375, 0.092315673828125, 0.1186065673828125, 0.1448974609375, 0.1711883544921875, 0.197479248046875, 0.2237701416015625, 0.25006103515625, 0.2763519287109375, 0.302642822265625, 0.3289337158203125, 0.355224609375, 0.3815155029296875, 0.407806396484375, 0.4340972900390625, 0.46038818359375, 0.4866790771484375, 0.512969970703125, 0.5392608642578125, 0.5655517578125, 0.5918426513671875, 0.618133544921875, 0.6444244384765625, 0.67071533203125, 0.6970062255859375, 0.723297119140625, 0.7495880126953125, 0.77587890625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 7.0, 6.0, 11.0, 10.0, 17.0, 20.0, 32.0, 37.0, 68.0, 64.0, 89.0, 68.0, 64.0, 70.0, 54.0, 71.0, 61.0, 55.0, 51.0, 37.0, 28.0, 19.0, 15.0, 8.0, 14.0, 9.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.421630859375, -0.4092979431152344, -0.39696502685546875, -0.3846321105957031, -0.3722991943359375, -0.3599662780761719, -0.34763336181640625, -0.3353004455566406, -0.322967529296875, -0.3106346130371094, -0.29830169677734375, -0.2859687805175781, -0.2736358642578125, -0.2613029479980469, -0.24897003173828125, -0.23663711547851562, -0.22430419921875, -0.21197128295898438, -0.19963836669921875, -0.18730545043945312, -0.1749725341796875, -0.16263961791992188, -0.15030670166015625, -0.13797378540039062, -0.125640869140625, -0.11330795288085938, -0.10097503662109375, -0.08864212036132812, -0.0763092041015625, -0.06397628784179688, -0.05164337158203125, -0.039310455322265625, -0.0269775390625, -0.014644622802734375, -0.00231170654296875, 0.010021209716796875, 0.0223541259765625, 0.034687042236328125, 0.04701995849609375, 0.059352874755859375, 0.071685791015625, 0.08401870727539062, 0.09635162353515625, 0.10868453979492188, 0.1210174560546875, 0.13335037231445312, 0.14568328857421875, 0.15801620483398438, 0.17034912109375, 0.18268203735351562, 0.19501495361328125, 0.20734786987304688, 0.2196807861328125, 0.23201370239257812, 0.24434661865234375, 0.2566795349121094, 0.269012451171875, 0.2813453674316406, 0.29367828369140625, 0.3060111999511719, 0.3183441162109375, 0.3306770324707031, 0.34300994873046875, 0.3553428649902344, 0.36767578125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 9.0, 10.0, 4.0, 10.0, 18.0, 22.0, 30.0, 37.0, 59.0, 89.0, 156.0, 276.0, 645.0, 1809.0, 6791.0, 42988.0, 531785.0, 420019.0, 35186.0, 5734.0, 1557.0, 587.0, 294.0, 144.0, 83.0, 67.0, 44.0, 17.0, 16.0, 20.0, 10.0, 7.0, 13.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.353515625, -1.31243896484375, -1.2713623046875, -1.23028564453125, -1.189208984375, -1.14813232421875, -1.1070556640625, -1.06597900390625, -1.02490234375, -0.98382568359375, -0.9427490234375, -0.90167236328125, -0.860595703125, -0.81951904296875, -0.7784423828125, -0.73736572265625, -0.6962890625, -0.65521240234375, -0.6141357421875, -0.57305908203125, -0.531982421875, -0.49090576171875, -0.4498291015625, -0.40875244140625, -0.36767578125, -0.32659912109375, -0.2855224609375, -0.24444580078125, -0.203369140625, -0.16229248046875, -0.1212158203125, -0.08013916015625, -0.0390625, 0.00201416015625, 0.0430908203125, 0.08416748046875, 0.125244140625, 0.16632080078125, 0.2073974609375, 0.24847412109375, 0.28955078125, 0.33062744140625, 0.3717041015625, 0.41278076171875, 0.453857421875, 0.49493408203125, 0.5360107421875, 0.57708740234375, 0.6181640625, 0.65924072265625, 0.7003173828125, 0.74139404296875, 0.782470703125, 0.82354736328125, 0.8646240234375, 0.90570068359375, 0.94677734375, 0.98785400390625, 1.0289306640625, 1.07000732421875, 1.111083984375, 1.15216064453125, 1.1932373046875, 1.23431396484375, 1.275390625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 8.0, 14.0, 12.0, 15.0, 21.0, 15.0, 25.0, 31.0, 36.0, 43.0, 36.0, 48.0, 51.0, 48.0, 63.0, 47.0, 52.0, 52.0, 42.0, 29.0, 44.0, 34.0, 32.0, 28.0, 22.0, 24.0, 26.0, 16.0, 17.0, 13.0, 12.0, 5.0, 1.0, 7.0, 4.0, 5.0, 7.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.6728515625, -1.619049072265625, -1.56524658203125, -1.511444091796875, -1.4576416015625, -1.403839111328125, -1.35003662109375, -1.296234130859375, -1.242431640625, -1.188629150390625, -1.13482666015625, -1.081024169921875, -1.0272216796875, -0.973419189453125, -0.91961669921875, -0.865814208984375, -0.81201171875, -0.758209228515625, -0.70440673828125, -0.650604248046875, -0.5968017578125, -0.542999267578125, -0.48919677734375, -0.435394287109375, -0.381591796875, -0.327789306640625, -0.27398681640625, -0.220184326171875, -0.1663818359375, -0.112579345703125, -0.05877685546875, -0.004974365234375, 0.048828125, 0.102630615234375, 0.15643310546875, 0.210235595703125, 0.2640380859375, 0.317840576171875, 0.37164306640625, 0.425445556640625, 0.479248046875, 0.533050537109375, 0.58685302734375, 0.640655517578125, 0.6944580078125, 0.748260498046875, 0.80206298828125, 0.855865478515625, 0.90966796875, 0.963470458984375, 1.01727294921875, 1.071075439453125, 1.1248779296875, 1.178680419921875, 1.23248291015625, 1.286285400390625, 1.340087890625, 1.393890380859375, 1.44769287109375, 1.501495361328125, 1.5552978515625, 1.609100341796875, 1.66290283203125, 1.716705322265625, 1.7705078125]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 4.0, 13.0, 12.0, 30.0, 27.0, 68.0, 91.0, 186.0, 386.0, 1215.0, 4875.0, 90074.0, 938593.0, 9875.0, 1959.0, 588.0, 233.0, 125.0, 78.0, 47.0, 22.0, 16.0, 12.0, 5.0, 5.0, 4.0, 6.0, 0.0, 4.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.615234375, -2.5449066162109375, -2.474578857421875, -2.4042510986328125, -2.33392333984375, -2.2635955810546875, -2.193267822265625, -2.1229400634765625, -2.0526123046875, -1.9822845458984375, -1.911956787109375, -1.8416290283203125, -1.77130126953125, -1.7009735107421875, -1.630645751953125, -1.5603179931640625, -1.489990234375, -1.4196624755859375, -1.349334716796875, -1.2790069580078125, -1.20867919921875, -1.1383514404296875, -1.068023681640625, -0.9976959228515625, -0.9273681640625, -0.8570404052734375, -0.786712646484375, -0.7163848876953125, -0.64605712890625, -0.5757293701171875, -0.505401611328125, -0.4350738525390625, -0.36474609375, -0.2944183349609375, -0.224090576171875, -0.1537628173828125, -0.08343505859375, -0.0131072998046875, 0.057220458984375, 0.1275482177734375, 0.1978759765625, 0.2682037353515625, 0.338531494140625, 0.4088592529296875, 0.47918701171875, 0.5495147705078125, 0.619842529296875, 0.6901702880859375, 0.760498046875, 0.8308258056640625, 0.901153564453125, 0.9714813232421875, 1.04180908203125, 1.1121368408203125, 1.182464599609375, 1.2527923583984375, 1.3231201171875, 1.3934478759765625, 1.463775634765625, 1.5341033935546875, 1.60443115234375, 1.6747589111328125, 1.745086669921875, 1.8154144287109375, 1.8857421875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 6.0, 8.0, 9.0, 10.0, 21.0, 25.0, 21.0, 43.0, 52.0, 70.0, 67.0, 69.0, 92.0, 83.0, 82.0, 74.0, 45.0, 46.0, 38.0, 31.0, 28.0, 19.0, 14.0, 11.0, 8.0, 3.0, 6.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.759166717529297e-05, -6.507895886898041e-05, -6.256625056266785e-05, -6.0053542256355286e-05, -5.7540833950042725e-05, -5.5028125643730164e-05, -5.25154173374176e-05, -5.000270903110504e-05, -4.749000072479248e-05, -4.497729241847992e-05, -4.246458411216736e-05, -3.99518758058548e-05, -3.7439167499542236e-05, -3.4926459193229675e-05, -3.2413750886917114e-05, -2.9901042580604553e-05, -2.7388334274291992e-05, -2.487562596797943e-05, -2.236291766166687e-05, -1.985020935535431e-05, -1.7337501049041748e-05, -1.4824792742729187e-05, -1.2312084436416626e-05, -9.799376130104065e-06, -7.286667823791504e-06, -4.773959517478943e-06, -2.261251211166382e-06, 2.514570951461792e-07, 2.7641654014587402e-06, 5.276873707771301e-06, 7.789582014083862e-06, 1.0302290320396423e-05, 1.2814998626708984e-05, 1.5327706933021545e-05, 1.7840415239334106e-05, 2.0353123545646667e-05, 2.286583185195923e-05, 2.537854015827179e-05, 2.789124846458435e-05, 3.040395677089691e-05, 3.291666507720947e-05, 3.5429373383522034e-05, 3.7942081689834595e-05, 4.0454789996147156e-05, 4.296749830245972e-05, 4.548020660877228e-05, 4.799291491508484e-05, 5.05056232213974e-05, 5.301833152770996e-05, 5.553103983402252e-05, 5.804374814033508e-05, 6.0556456446647644e-05, 6.30691647529602e-05, 6.558187305927277e-05, 6.809458136558533e-05, 7.060728967189789e-05, 7.311999797821045e-05, 7.563270628452301e-05, 7.814541459083557e-05, 8.065812289714813e-05, 8.31708312034607e-05, 8.568353950977325e-05, 8.819624781608582e-05, 9.070895612239838e-05, 9.322166442871094e-05]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 5.0, 12.0, 10.0, 14.0, 27.0, 51.0, 66.0, 178.0, 402.0, 1161.0, 5473.0, 802625.0, 232684.0, 4225.0, 973.0, 328.0, 140.0, 79.0, 32.0, 24.0, 23.0, 13.0, 4.0, 6.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.837890625, -2.7630767822265625, -2.688262939453125, -2.6134490966796875, -2.53863525390625, -2.4638214111328125, -2.389007568359375, -2.3141937255859375, -2.2393798828125, -2.1645660400390625, -2.089752197265625, -2.0149383544921875, -1.94012451171875, -1.8653106689453125, -1.790496826171875, -1.7156829833984375, -1.640869140625, -1.5660552978515625, -1.491241455078125, -1.4164276123046875, -1.34161376953125, -1.2667999267578125, -1.191986083984375, -1.1171722412109375, -1.0423583984375, -0.9675445556640625, -0.892730712890625, -0.8179168701171875, -0.74310302734375, -0.6682891845703125, -0.593475341796875, -0.5186614990234375, -0.44384765625, -0.3690338134765625, -0.294219970703125, -0.2194061279296875, -0.14459228515625, -0.0697784423828125, 0.005035400390625, 0.0798492431640625, 0.1546630859375, 0.2294769287109375, 0.304290771484375, 0.3791046142578125, 0.45391845703125, 0.5287322998046875, 0.603546142578125, 0.6783599853515625, 0.753173828125, 0.8279876708984375, 0.902801513671875, 0.9776153564453125, 1.05242919921875, 1.1272430419921875, 1.202056884765625, 1.2768707275390625, 1.3516845703125, 1.4264984130859375, 1.501312255859375, 1.5761260986328125, 1.65093994140625, 1.7257537841796875, 1.800567626953125, 1.8753814697265625, 1.9501953125]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 7.0, 2.0, 6.0, 6.0, 7.0, 15.0, 14.0, 50.0, 232.0, 434.0, 156.0, 34.0, 17.0, 9.0, 7.0, 5.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7705078125, -1.6876678466796875, -1.604827880859375, -1.5219879150390625, -1.43914794921875, -1.3563079833984375, -1.273468017578125, -1.1906280517578125, -1.1077880859375, -1.0249481201171875, -0.942108154296875, -0.8592681884765625, -0.77642822265625, -0.6935882568359375, -0.610748291015625, -0.5279083251953125, -0.445068359375, -0.3622283935546875, -0.279388427734375, -0.1965484619140625, -0.11370849609375, -0.0308685302734375, 0.051971435546875, 0.1348114013671875, 0.2176513671875, 0.3004913330078125, 0.383331298828125, 0.4661712646484375, 0.54901123046875, 0.6318511962890625, 0.714691162109375, 0.7975311279296875, 0.88037109375, 0.9632110595703125, 1.046051025390625, 1.1288909912109375, 1.21173095703125, 1.2945709228515625, 1.377410888671875, 1.4602508544921875, 1.5430908203125, 1.6259307861328125, 1.708770751953125, 1.7916107177734375, 1.87445068359375, 1.9572906494140625, 2.040130615234375, 2.1229705810546875, 2.205810546875, 2.2886505126953125, 2.371490478515625, 2.4543304443359375, 2.53717041015625, 2.6200103759765625, 2.702850341796875, 2.7856903076171875, 2.8685302734375, 2.9513702392578125, 3.034210205078125, 3.1170501708984375, 3.19989013671875, 3.2827301025390625, 3.365570068359375, 3.4484100341796875, 3.53125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 13.0, 35.0, 131.0, 288.0, 321.0, 161.0, 53.0, 7.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.952669143676758, -19.160310745239258, -18.367950439453125, -17.575592041015625, -16.783233642578125, -15.990874290466309, -15.198514938354492, -14.406156539916992, -13.613797187805176, -12.82143783569336, -12.02907943725586, -11.236720085144043, -10.444360733032227, -9.652002334594727, -8.85964298248291, -8.067283630371094, -7.274925231933594, -6.4825663566589355, -5.690207481384277, -4.897848129272461, -4.105489253997803, -3.3131303787231445, -2.520771026611328, -1.72841215133667, -0.9360532760620117, -0.14369428157806396, 0.6486647129058838, 1.441023826599121, 2.2333827018737793, 3.0257415771484375, 3.818100929260254, 4.610459804534912, 5.4028167724609375, 6.195175647735596, 6.987534523010254, 7.77989387512207, 8.57225227355957, 9.364611625671387, 10.156970977783203, 10.949329376220703, 11.74168872833252, 12.534048080444336, 13.326406478881836, 14.118765830993652, 14.911125183105469, 15.703483581542969, 16.49584197998047, 17.2882022857666, 18.0805606842041, 18.8729190826416, 19.665279388427734, 20.457637786865234, 21.249996185302734, 22.042354583740234, 22.834714889526367, 23.627073287963867, 24.41943359375, 25.2117919921875, 26.004152297973633, 26.796510696411133, 27.588869094848633, 28.381229400634766, 29.173587799072266, 29.965946197509766, 30.758304595947266]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 13.0, 14.0, 10.0, 18.0, 23.0, 24.0, 30.0, 31.0, 49.0, 54.0, 58.0, 53.0, 71.0, 52.0, 52.0, 58.0, 56.0, 31.0, 50.0, 45.0, 31.0, 32.0, 21.0, 16.0, 27.0, 22.0, 12.0, 7.0, 9.0, 6.0, 6.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.075013160705566, -11.707974433898926, -11.340935707092285, -10.973896980285645, -10.606857299804688, -10.239818572998047, -9.872779846191406, -9.505741119384766, -9.138702392578125, -8.771663665771484, -8.404624938964844, -8.037586212158203, -7.670547008514404, -7.303508281707764, -6.936469078063965, -6.569430351257324, -6.202391624450684, -5.835352897644043, -5.468314170837402, -5.1012749671936035, -4.734236240386963, -4.367197513580322, -4.000158309936523, -3.633119583129883, -3.266080856323242, -2.8990421295166016, -2.532003164291382, -2.164964199066162, -1.7979254722595215, -1.4308866262435913, -1.0638477802276611, -0.6968088150024414, -0.3297691345214844, 0.0372697114944458, 0.404308557510376, 0.7713474035263062, 1.1383862495422363, 1.5054250955581665, 1.8724639415740967, 2.2395029067993164, 2.606541633605957, 2.9735803604125977, 3.3406193256378174, 3.707658290863037, 4.074697017669678, 4.441735744476318, 4.808774948120117, 5.175813674926758, 5.542852401733398, 5.909891128540039, 6.27692985534668, 6.6439690589904785, 7.011007785797119, 7.37804651260376, 7.745085716247559, 8.1121244430542, 8.47916316986084, 8.84620189666748, 9.213240623474121, 9.580279350280762, 9.947319030761719, 10.31435775756836, 10.681396484375, 11.04843521118164, 11.415473937988281]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 10.0, 6.0, 16.0, 23.0, 31.0, 50.0, 75.0, 156.0, 252.0, 401.0, 771.0, 1687.0, 4418.0, 17867.0, 342093.0, 3791933.0, 24741.0, 5546.0, 2014.0, 961.0, 455.0, 293.0, 178.0, 102.0, 71.0, 48.0, 18.0, 19.0, 12.0, 12.0, 7.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3759765625, -1.336761474609375, -1.29754638671875, -1.258331298828125, -1.2191162109375, -1.179901123046875, -1.14068603515625, -1.101470947265625, -1.062255859375, -1.023040771484375, -0.98382568359375, -0.944610595703125, -0.9053955078125, -0.866180419921875, -0.82696533203125, -0.787750244140625, -0.74853515625, -0.709320068359375, -0.67010498046875, -0.630889892578125, -0.5916748046875, -0.552459716796875, -0.51324462890625, -0.474029541015625, -0.434814453125, -0.395599365234375, -0.35638427734375, -0.317169189453125, -0.2779541015625, -0.238739013671875, -0.19952392578125, -0.160308837890625, -0.12109375, -0.081878662109375, -0.04266357421875, -0.003448486328125, 0.0357666015625, 0.074981689453125, 0.11419677734375, 0.153411865234375, 0.192626953125, 0.231842041015625, 0.27105712890625, 0.310272216796875, 0.3494873046875, 0.388702392578125, 0.42791748046875, 0.467132568359375, 0.50634765625, 0.545562744140625, 0.58477783203125, 0.623992919921875, 0.6632080078125, 0.702423095703125, 0.74163818359375, 0.780853271484375, 0.820068359375, 0.859283447265625, 0.89849853515625, 0.937713623046875, 0.9769287109375, 1.016143798828125, 1.05535888671875, 1.094573974609375, 1.1337890625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 10.0, 11.0, 9.0, 14.0, 21.0, 37.0, 45.0, 54.0, 81.0, 79.0, 88.0, 85.0, 83.0, 83.0, 73.0, 56.0, 49.0, 35.0, 29.0, 21.0, 16.0, 9.0, 5.0, 2.0, 1.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.505859375, -0.48883056640625, -0.4718017578125, -0.45477294921875, -0.437744140625, -0.42071533203125, -0.4036865234375, -0.38665771484375, -0.36962890625, -0.35260009765625, -0.3355712890625, -0.31854248046875, -0.301513671875, -0.28448486328125, -0.2674560546875, -0.25042724609375, -0.2333984375, -0.21636962890625, -0.1993408203125, -0.18231201171875, -0.165283203125, -0.14825439453125, -0.1312255859375, -0.11419677734375, -0.09716796875, -0.08013916015625, -0.0631103515625, -0.04608154296875, -0.029052734375, -0.01202392578125, 0.0050048828125, 0.02203369140625, 0.0390625, 0.05609130859375, 0.0731201171875, 0.09014892578125, 0.107177734375, 0.12420654296875, 0.1412353515625, 0.15826416015625, 0.17529296875, 0.19232177734375, 0.2093505859375, 0.22637939453125, 0.243408203125, 0.26043701171875, 0.2774658203125, 0.29449462890625, 0.3115234375, 0.32855224609375, 0.3455810546875, 0.36260986328125, 0.379638671875, 0.39666748046875, 0.4136962890625, 0.43072509765625, 0.44775390625, 0.46478271484375, 0.4818115234375, 0.49884033203125, 0.515869140625, 0.53289794921875, 0.5499267578125, 0.56695556640625, 0.583984375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 9.0, 11.0, 12.0, 21.0, 15.0, 26.0, 28.0, 49.0, 87.0, 124.0, 170.0, 250.0, 345.0, 583.0, 945.0, 1541.0, 2763.0, 5376.0, 12731.0, 39861.0, 302609.0, 3712368.0, 78541.0, 19637.0, 7505.0, 3548.0, 1956.0, 1127.0, 724.0, 405.0, 284.0, 191.0, 108.0, 85.0, 72.0, 52.0, 29.0, 17.0, 19.0, 15.0, 11.0, 10.0, 8.0, 2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.77685546875, -0.7527389526367188, -0.7286224365234375, -0.7045059204101562, -0.680389404296875, -0.6562728881835938, -0.6321563720703125, -0.6080398559570312, -0.58392333984375, -0.5598068237304688, -0.5356903076171875, -0.5115737915039062, -0.487457275390625, -0.46334075927734375, -0.4392242431640625, -0.41510772705078125, -0.3909912109375, -0.36687469482421875, -0.3427581787109375, -0.31864166259765625, -0.294525146484375, -0.27040863037109375, -0.2462921142578125, -0.22217559814453125, -0.19805908203125, -0.17394256591796875, -0.1498260498046875, -0.12570953369140625, -0.101593017578125, -0.07747650146484375, -0.0533599853515625, -0.02924346923828125, -0.005126953125, 0.01898956298828125, 0.0431060791015625, 0.06722259521484375, 0.091339111328125, 0.11545562744140625, 0.1395721435546875, 0.16368865966796875, 0.18780517578125, 0.21192169189453125, 0.2360382080078125, 0.26015472412109375, 0.284271240234375, 0.30838775634765625, 0.3325042724609375, 0.35662078857421875, 0.3807373046875, 0.40485382080078125, 0.4289703369140625, 0.45308685302734375, 0.477203369140625, 0.5013198852539062, 0.5254364013671875, 0.5495529174804688, 0.57366943359375, 0.5977859497070312, 0.6219024658203125, 0.6460189819335938, 0.670135498046875, 0.6942520141601562, 0.7183685302734375, 0.7424850463867188, 0.7666015625]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 2.0, 6.0, 14.0, 27.0, 36.0, 42.0, 75.0, 205.0, 2986.0, 422.0, 124.0, 50.0, 19.0, 13.0, 8.0, 8.0, 6.0, 7.0, 2.0, 5.0, 6.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.345947265625, -0.33725738525390625, -0.3285675048828125, -0.31987762451171875, -0.311187744140625, -0.30249786376953125, -0.2938079833984375, -0.28511810302734375, -0.27642822265625, -0.26773834228515625, -0.2590484619140625, -0.25035858154296875, -0.241668701171875, -0.23297882080078125, -0.2242889404296875, -0.21559906005859375, -0.2069091796875, -0.19821929931640625, -0.1895294189453125, -0.18083953857421875, -0.172149658203125, -0.16345977783203125, -0.1547698974609375, -0.14608001708984375, -0.13739013671875, -0.12870025634765625, -0.1200103759765625, -0.11132049560546875, -0.102630615234375, -0.09394073486328125, -0.0852508544921875, -0.07656097412109375, -0.06787109375, -0.05918121337890625, -0.0504913330078125, -0.04180145263671875, -0.033111572265625, -0.02442169189453125, -0.0157318115234375, -0.00704193115234375, 0.00164794921875, 0.01033782958984375, 0.0190277099609375, 0.02771759033203125, 0.036407470703125, 0.04509735107421875, 0.0537872314453125, 0.06247711181640625, 0.0711669921875, 0.07985687255859375, 0.0885467529296875, 0.09723663330078125, 0.105926513671875, 0.11461639404296875, 0.1233062744140625, 0.13199615478515625, 0.14068603515625, 0.14937591552734375, 0.1580657958984375, 0.16675567626953125, 0.175445556640625, 0.18413543701171875, 0.1928253173828125, 0.20151519775390625, 0.210205078125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 31.0, 115.0, 335.0, 368.0, 136.0, 20.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.01705801486969, -0.9083320498466492, -0.7996061444282532, -0.6908801794052124, -0.5821542739868164, -0.47342830896377563, -0.36470234394073486, -0.25597643852233887, -0.1472504734992981, -0.038524530827999115, 0.07020141184329987, 0.17892736196517944, 0.2876532971858978, 0.3963792324066162, 0.505105197429657, 0.613831102848053, 0.7225570678710938, 0.8312830328941345, 0.9400089383125305, 1.0487349033355713, 1.1574608087539673, 1.2661867141723633, 1.3749127388000488, 1.4836386442184448, 1.5923645496368408, 1.7010904550552368, 1.8098164796829224, 1.9185423851013184, 2.027268409729004, 2.1359941959381104, 2.244720220565796, 2.3534460067749023, 2.462172269821167, 2.5708982944488525, 2.679624080657959, 2.7883501052856445, 2.89707612991333, 3.0058019161224365, 3.114527940750122, 3.2232537269592285, 3.331979751586914, 3.4407057762145996, 3.549431562423706, 3.6581575870513916, 3.766883611679077, 3.8756093978881836, 3.984335422515869, 4.093061447143555, 4.20178747177124, 4.310513496398926, 4.419239521026611, 4.527965545654297, 4.636691093444824, 4.74541711807251, 4.854143142700195, 4.962869167327881, 5.071594715118408, 5.180320739746094, 5.289046764373779, 5.397772789001465, 5.506498336791992, 5.615224361419678, 5.723950386047363, 5.832676410675049, 5.941402435302734]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 9.0, 6.0, 10.0, 15.0, 20.0, 18.0, 30.0, 19.0, 35.0, 41.0, 24.0, 37.0, 44.0, 50.0, 49.0, 41.0, 46.0, 45.0, 40.0, 52.0, 45.0, 42.0, 32.0, 48.0, 29.0, 28.0, 23.0, 24.0, 24.0, 19.0, 17.0, 11.0, 8.0, 7.0, 7.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.8331725001335144, -0.8096960186958313, -0.7862194776535034, -0.7627429962158203, -0.7392664551734924, -0.7157899737358093, -0.6923134326934814, -0.6688369512557983, -0.6453604102134705, -0.6218839287757874, -0.5984073877334595, -0.5749309062957764, -0.5514543652534485, -0.5279778838157654, -0.5045013427734375, -0.4810248613357544, -0.4575483500957489, -0.4340718388557434, -0.4105953276157379, -0.3871188163757324, -0.36364230513572693, -0.34016579389572144, -0.31668931245803833, -0.29321277141571045, -0.26973628997802734, -0.24625977873802185, -0.22278326749801636, -0.19930675625801086, -0.17583024501800537, -0.15235373377799988, -0.12887723743915558, -0.10540072619915009, -0.0819242000579834, -0.058447688817977905, -0.03497118130326271, -0.011494673788547516, 0.011981837451457977, 0.03545834869146347, 0.05893485248088837, 0.08241136372089386, 0.10588787496089935, 0.12936438620090485, 0.15284089744091034, 0.17631739377975464, 0.19979390501976013, 0.22327041625976562, 0.24674692749977112, 0.2702234387397766, 0.2936999499797821, 0.3171764612197876, 0.3406529724597931, 0.3641294836997986, 0.3876059949398041, 0.41108250617980957, 0.4345589876174927, 0.45803552865982056, 0.48151201009750366, 0.5049884915351868, 0.5284650325775146, 0.5519415140151978, 0.5754180550575256, 0.5988945364952087, 0.6223710775375366, 0.6458475589752197, 0.6693241000175476]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 10.0, 3.0, 6.0, 12.0, 22.0, 38.0, 37.0, 48.0, 92.0, 156.0, 286.0, 563.0, 1300.0, 3426.0, 11466.0, 55955.0, 357714.0, 502522.0, 90191.0, 16869.0, 4697.0, 1671.0, 710.0, 305.0, 172.0, 118.0, 49.0, 42.0, 33.0, 12.0, 11.0, 5.0, 7.0, 4.0, 4.0, 5.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.3154296875, -1.283447265625, -1.25146484375, -1.219482421875, -1.1875, -1.155517578125, -1.12353515625, -1.091552734375, -1.0595703125, -1.027587890625, -0.99560546875, -0.963623046875, -0.931640625, -0.899658203125, -0.86767578125, -0.835693359375, -0.8037109375, -0.771728515625, -0.73974609375, -0.707763671875, -0.67578125, -0.643798828125, -0.61181640625, -0.579833984375, -0.5478515625, -0.515869140625, -0.48388671875, -0.451904296875, -0.419921875, -0.387939453125, -0.35595703125, -0.323974609375, -0.2919921875, -0.260009765625, -0.22802734375, -0.196044921875, -0.1640625, -0.132080078125, -0.10009765625, -0.068115234375, -0.0361328125, -0.004150390625, 0.02783203125, 0.059814453125, 0.091796875, 0.123779296875, 0.15576171875, 0.187744140625, 0.2197265625, 0.251708984375, 0.28369140625, 0.315673828125, 0.34765625, 0.379638671875, 0.41162109375, 0.443603515625, 0.4755859375, 0.507568359375, 0.53955078125, 0.571533203125, 0.603515625, 0.635498046875, 0.66748046875, 0.699462890625, 0.7314453125]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 5.0, 7.0, 9.0, 8.0, 19.0, 13.0, 33.0, 34.0, 54.0, 69.0, 75.0, 83.0, 77.0, 75.0, 87.0, 65.0, 55.0, 62.0, 46.0, 31.0, 27.0, 25.0, 18.0, 10.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4921875, -0.47595977783203125, -0.4597320556640625, -0.44350433349609375, -0.427276611328125, -0.41104888916015625, -0.3948211669921875, -0.37859344482421875, -0.36236572265625, -0.34613800048828125, -0.3299102783203125, -0.31368255615234375, -0.297454833984375, -0.28122711181640625, -0.2649993896484375, -0.24877166748046875, -0.2325439453125, -0.21631622314453125, -0.2000885009765625, -0.18386077880859375, -0.167633056640625, -0.15140533447265625, -0.1351776123046875, -0.11894989013671875, -0.10272216796875, -0.08649444580078125, -0.0702667236328125, -0.05403900146484375, -0.037811279296875, -0.02158355712890625, -0.0053558349609375, 0.01087188720703125, 0.027099609375, 0.04332733154296875, 0.0595550537109375, 0.07578277587890625, 0.092010498046875, 0.10823822021484375, 0.1244659423828125, 0.14069366455078125, 0.15692138671875, 0.17314910888671875, 0.1893768310546875, 0.20560455322265625, 0.221832275390625, 0.23805999755859375, 0.2542877197265625, 0.27051544189453125, 0.2867431640625, 0.30297088623046875, 0.3191986083984375, 0.33542633056640625, 0.351654052734375, 0.36788177490234375, 0.3841094970703125, 0.40033721923828125, 0.41656494140625, 0.43279266357421875, 0.4490203857421875, 0.46524810791015625, 0.481475830078125, 0.49770355224609375, 0.5139312744140625, 0.5301589965820312, 0.54638671875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 4.0, 9.0, 7.0, 10.0, 18.0, 13.0, 24.0, 38.0, 46.0, 94.0, 152.0, 237.0, 461.0, 1009.0, 3496.0, 26122.0, 569163.0, 422451.0, 20317.0, 2984.0, 926.0, 371.0, 215.0, 125.0, 93.0, 46.0, 26.0, 24.0, 14.0, 17.0, 9.0, 6.0, 9.0, 6.0, 4.0, 4.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8115234375, -1.7581634521484375, -1.704803466796875, -1.6514434814453125, -1.59808349609375, -1.5447235107421875, -1.491363525390625, -1.4380035400390625, -1.3846435546875, -1.3312835693359375, -1.277923583984375, -1.2245635986328125, -1.17120361328125, -1.1178436279296875, -1.064483642578125, -1.0111236572265625, -0.957763671875, -0.9044036865234375, -0.851043701171875, -0.7976837158203125, -0.74432373046875, -0.6909637451171875, -0.637603759765625, -0.5842437744140625, -0.5308837890625, -0.4775238037109375, -0.424163818359375, -0.3708038330078125, -0.31744384765625, -0.2640838623046875, -0.210723876953125, -0.1573638916015625, -0.10400390625, -0.0506439208984375, 0.002716064453125, 0.0560760498046875, 0.10943603515625, 0.1627960205078125, 0.216156005859375, 0.2695159912109375, 0.3228759765625, 0.3762359619140625, 0.429595947265625, 0.4829559326171875, 0.53631591796875, 0.5896759033203125, 0.643035888671875, 0.6963958740234375, 0.749755859375, 0.8031158447265625, 0.856475830078125, 0.9098358154296875, 0.96319580078125, 1.0165557861328125, 1.069915771484375, 1.1232757568359375, 1.1766357421875, 1.2299957275390625, 1.283355712890625, 1.3367156982421875, 1.39007568359375, 1.4434356689453125, 1.496795654296875, 1.5501556396484375, 1.603515625]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 4.0, 5.0, 3.0, 8.0, 9.0, 17.0, 23.0, 15.0, 17.0, 28.0, 30.0, 27.0, 53.0, 41.0, 44.0, 56.0, 44.0, 56.0, 42.0, 38.0, 59.0, 55.0, 45.0, 49.0, 40.0, 40.0, 32.0, 22.0, 23.0, 17.0, 14.0, 15.0, 9.0, 5.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.837890625, -1.7791748046875, -1.720458984375, -1.6617431640625, -1.60302734375, -1.5443115234375, -1.485595703125, -1.4268798828125, -1.3681640625, -1.3094482421875, -1.250732421875, -1.1920166015625, -1.13330078125, -1.0745849609375, -1.015869140625, -0.9571533203125, -0.8984375, -0.8397216796875, -0.781005859375, -0.7222900390625, -0.66357421875, -0.6048583984375, -0.546142578125, -0.4874267578125, -0.4287109375, -0.3699951171875, -0.311279296875, -0.2525634765625, -0.19384765625, -0.1351318359375, -0.076416015625, -0.0177001953125, 0.041015625, 0.0997314453125, 0.158447265625, 0.2171630859375, 0.27587890625, 0.3345947265625, 0.393310546875, 0.4520263671875, 0.5107421875, 0.5694580078125, 0.628173828125, 0.6868896484375, 0.74560546875, 0.8043212890625, 0.863037109375, 0.9217529296875, 0.98046875, 1.0391845703125, 1.097900390625, 1.1566162109375, 1.21533203125, 1.2740478515625, 1.332763671875, 1.3914794921875, 1.4501953125, 1.5089111328125, 1.567626953125, 1.6263427734375, 1.68505859375, 1.7437744140625, 1.802490234375, 1.8612060546875, 1.919921875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 13.0, 24.0, 28.0, 78.0, 159.0, 432.0, 1933.0, 37273.0, 997819.0, 9198.0, 1051.0, 299.0, 130.0, 53.0, 25.0, 18.0, 12.0, 5.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.599609375, -2.519195556640625, -2.43878173828125, -2.358367919921875, -2.2779541015625, -2.197540283203125, -2.11712646484375, -2.036712646484375, -1.956298828125, -1.875885009765625, -1.79547119140625, -1.715057373046875, -1.6346435546875, -1.554229736328125, -1.47381591796875, -1.393402099609375, -1.31298828125, -1.232574462890625, -1.15216064453125, -1.071746826171875, -0.9913330078125, -0.910919189453125, -0.83050537109375, -0.750091552734375, -0.669677734375, -0.589263916015625, -0.50885009765625, -0.428436279296875, -0.3480224609375, -0.267608642578125, -0.18719482421875, -0.106781005859375, -0.0263671875, 0.054046630859375, 0.13446044921875, 0.214874267578125, 0.2952880859375, 0.375701904296875, 0.45611572265625, 0.536529541015625, 0.616943359375, 0.697357177734375, 0.77777099609375, 0.858184814453125, 0.9385986328125, 1.019012451171875, 1.09942626953125, 1.179840087890625, 1.26025390625, 1.340667724609375, 1.42108154296875, 1.501495361328125, 1.5819091796875, 1.662322998046875, 1.74273681640625, 1.823150634765625, 1.903564453125, 1.983978271484375, 2.06439208984375, 2.144805908203125, 2.2252197265625, 2.305633544921875, 2.38604736328125, 2.466461181640625, 2.546875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 7.0, 13.0, 14.0, 23.0, 45.0, 46.0, 94.0, 124.0, 110.0, 152.0, 121.0, 93.0, 65.0, 40.0, 20.0, 17.0, 6.0, 6.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.846687316894531e-05, -9.468942880630493e-05, -9.091198444366455e-05, -8.713454008102417e-05, -8.335709571838379e-05, -7.957965135574341e-05, -7.580220699310303e-05, -7.202476263046265e-05, -6.824731826782227e-05, -6.446987390518188e-05, -6.0692429542541504e-05, -5.691498517990112e-05, -5.313754081726074e-05, -4.936009645462036e-05, -4.558265209197998e-05, -4.18052077293396e-05, -3.802776336669922e-05, -3.425031900405884e-05, -3.0472874641418457e-05, -2.6695430278778076e-05, -2.2917985916137695e-05, -1.9140541553497314e-05, -1.5363097190856934e-05, -1.1585652828216553e-05, -7.808208465576172e-06, -4.030764102935791e-06, -2.5331974029541016e-07, 3.5241246223449707e-06, 7.3015689849853516e-06, 1.1079013347625732e-05, 1.4856457710266113e-05, 1.8633902072906494e-05, 2.2411346435546875e-05, 2.6188790798187256e-05, 2.9966235160827637e-05, 3.374367952346802e-05, 3.75211238861084e-05, 4.129856824874878e-05, 4.507601261138916e-05, 4.885345697402954e-05, 5.263090133666992e-05, 5.64083456993103e-05, 6.0185790061950684e-05, 6.396323442459106e-05, 6.774067878723145e-05, 7.151812314987183e-05, 7.529556751251221e-05, 7.907301187515259e-05, 8.285045623779297e-05, 8.662790060043335e-05, 9.040534496307373e-05, 9.418278932571411e-05, 9.796023368835449e-05, 0.00010173767805099487, 0.00010551512241363525, 0.00010929256677627563, 0.00011307001113891602, 0.0001168474555015564, 0.00012062489986419678, 0.00012440234422683716, 0.00012817978858947754, 0.00013195723295211792, 0.0001357346773147583, 0.00013951212167739868, 0.00014328956604003906]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 0.0, 4.0, 4.0, 5.0, 11.0, 15.0, 22.0, 55.0, 86.0, 165.0, 356.0, 1276.0, 6676.0, 507332.0, 523814.0, 6632.0, 1281.0, 415.0, 190.0, 102.0, 40.0, 15.0, 14.0, 21.0, 7.0, 7.0, 7.0, 1.0, 1.0, 6.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4453125, -2.389739990234375, -2.33416748046875, -2.278594970703125, -2.2230224609375, -2.167449951171875, -2.11187744140625, -2.056304931640625, -2.000732421875, -1.945159912109375, -1.88958740234375, -1.834014892578125, -1.7784423828125, -1.722869873046875, -1.66729736328125, -1.611724853515625, -1.55615234375, -1.500579833984375, -1.44500732421875, -1.389434814453125, -1.3338623046875, -1.278289794921875, -1.22271728515625, -1.167144775390625, -1.111572265625, -1.055999755859375, -1.00042724609375, -0.944854736328125, -0.8892822265625, -0.833709716796875, -0.77813720703125, -0.722564697265625, -0.6669921875, -0.611419677734375, -0.55584716796875, -0.500274658203125, -0.4447021484375, -0.389129638671875, -0.33355712890625, -0.277984619140625, -0.222412109375, -0.166839599609375, -0.11126708984375, -0.055694580078125, -0.0001220703125, 0.055450439453125, 0.11102294921875, 0.166595458984375, 0.22216796875, 0.277740478515625, 0.33331298828125, 0.388885498046875, 0.4444580078125, 0.500030517578125, 0.55560302734375, 0.611175537109375, 0.666748046875, 0.722320556640625, 0.77789306640625, 0.833465576171875, 0.8890380859375, 0.944610595703125, 1.00018310546875, 1.055755615234375, 1.111328125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 4.0, 10.0, 22.0, 22.0, 47.0, 41.0, 91.0, 134.0, 133.0, 149.0, 112.0, 84.0, 45.0, 26.0, 26.0, 22.0, 14.0, 4.0, 4.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.734375, -0.705047607421875, -0.67572021484375, -0.646392822265625, -0.6170654296875, -0.587738037109375, -0.55841064453125, -0.529083251953125, -0.499755859375, -0.470428466796875, -0.44110107421875, -0.411773681640625, -0.3824462890625, -0.353118896484375, -0.32379150390625, -0.294464111328125, -0.26513671875, -0.235809326171875, -0.20648193359375, -0.177154541015625, -0.1478271484375, -0.118499755859375, -0.08917236328125, -0.059844970703125, -0.030517578125, -0.001190185546875, 0.02813720703125, 0.057464599609375, 0.0867919921875, 0.116119384765625, 0.14544677734375, 0.174774169921875, 0.2041015625, 0.233428955078125, 0.26275634765625, 0.292083740234375, 0.3214111328125, 0.350738525390625, 0.38006591796875, 0.409393310546875, 0.438720703125, 0.468048095703125, 0.49737548828125, 0.526702880859375, 0.5560302734375, 0.585357666015625, 0.61468505859375, 0.644012451171875, 0.67333984375, 0.702667236328125, 0.73199462890625, 0.761322021484375, 0.7906494140625, 0.819976806640625, 0.84930419921875, 0.878631591796875, 0.907958984375, 0.937286376953125, 0.96661376953125, 0.995941162109375, 1.0252685546875, 1.054595947265625, 1.08392333984375, 1.113250732421875, 1.142578125]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 14.0, 108.0, 344.0, 376.0, 120.0, 29.0, 9.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-47.40241241455078, -46.4531364440918, -45.50386428833008, -44.554588317871094, -43.605316162109375, -42.65604019165039, -41.706764221191406, -40.75749206542969, -39.8082160949707, -38.85894012451172, -37.90966796875, -36.960391998291016, -36.0111198425293, -35.06184387207031, -34.112571716308594, -33.16329574584961, -32.214019775390625, -31.264745712280273, -30.315471649169922, -29.366195678710938, -28.416921615600586, -27.467647552490234, -26.518373489379883, -25.56909942626953, -24.619827270507812, -23.67055320739746, -22.72127914428711, -21.772003173828125, -20.822729110717773, -19.873455047607422, -18.92418098449707, -17.97490692138672, -17.025630950927734, -16.076356887817383, -15.127081871032715, -14.177807807922363, -13.228532791137695, -12.279258728027344, -11.329984664916992, -10.38071060180664, -9.431435585021973, -8.482161521911621, -7.532886505126953, -6.583612442016602, -5.634337902069092, -4.685063362121582, -3.7357892990112305, -2.7865147590637207, -1.837240219116211, -0.8879657983779907, 0.06130862236022949, 1.0105829238891602, 1.95985746383667, 2.9091320037841797, 3.8584060668945312, 4.807680606842041, 5.756955146789551, 6.7062296867370605, 7.65550422668457, 8.604778289794922, 9.554052352905273, 10.503327369689941, 11.452601432800293, 12.401876449584961, 13.351150512695312]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 10.0, 11.0, 10.0, 18.0, 21.0, 19.0, 22.0, 32.0, 40.0, 34.0, 54.0, 42.0, 55.0, 71.0, 63.0, 52.0, 52.0, 62.0, 44.0, 40.0, 40.0, 32.0, 36.0, 34.0, 26.0, 17.0, 15.0, 10.0, 8.0, 8.0, 7.0, 5.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.956792831420898, -6.676063060760498, -6.395333290100098, -6.1146039962768555, -5.833874225616455, -5.553144454956055, -5.272414684295654, -4.991684913635254, -4.710955619812012, -4.430225849151611, -4.149496078491211, -3.8687665462493896, -3.5880370140075684, -3.307307243347168, -3.0265774726867676, -2.745847702026367, -2.465117931365967, -2.1843881607055664, -1.9036586284637451, -1.6229288578033447, -1.3421992063522339, -1.061469554901123, -0.7807397842407227, -0.5000101327896118, -0.21928048133850098, 0.06144919991493225, 0.3421788811683655, 0.6229085922241211, 0.9036382436752319, 1.1843678951263428, 1.4650976657867432, 1.745827317237854, 2.026556968688965, 2.3072867393493652, 2.5880162715911865, 2.868746042251587, 3.149475574493408, 3.4302053451538086, 3.710935115814209, 3.9916648864746094, 4.272394180297852, 4.553123950958252, 4.833853721618652, 5.1145830154418945, 5.395312786102295, 5.676042556762695, 5.956772327423096, 6.237502098083496, 6.5182318687438965, 6.798961639404297, 7.079691410064697, 7.360421180725098, 7.64115047454834, 7.92188024520874, 8.20261001586914, 8.483339309692383, 8.764069557189941, 9.044798851013184, 9.325529098510742, 9.606258392333984, 9.886988639831543, 10.167717933654785, 10.448448181152344, 10.729177474975586, 11.009906768798828]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 5.0, 6.0, 9.0, 19.0, 45.0, 67.0, 134.0, 258.0, 717.0, 3635.0, 121295.0, 4060281.0, 6075.0, 1019.0, 358.0, 125.0, 92.0, 55.0, 29.0, 16.0, 10.0, 8.0, 7.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.724609375, -3.629364013671875, -3.53411865234375, -3.438873291015625, -3.3436279296875, -3.248382568359375, -3.15313720703125, -3.057891845703125, -2.962646484375, -2.867401123046875, -2.77215576171875, -2.676910400390625, -2.5816650390625, -2.486419677734375, -2.39117431640625, -2.295928955078125, -2.20068359375, -2.105438232421875, -2.01019287109375, -1.914947509765625, -1.8197021484375, -1.724456787109375, -1.62921142578125, -1.533966064453125, -1.438720703125, -1.343475341796875, -1.24822998046875, -1.152984619140625, -1.0577392578125, -0.962493896484375, -0.86724853515625, -0.772003173828125, -0.6767578125, -0.581512451171875, -0.48626708984375, -0.391021728515625, -0.2957763671875, -0.200531005859375, -0.10528564453125, -0.010040283203125, 0.085205078125, 0.180450439453125, 0.27569580078125, 0.370941162109375, 0.4661865234375, 0.561431884765625, 0.65667724609375, 0.751922607421875, 0.84716796875, 0.942413330078125, 1.03765869140625, 1.132904052734375, 1.2281494140625, 1.323394775390625, 1.41864013671875, 1.513885498046875, 1.609130859375, 1.704376220703125, 1.79962158203125, 1.894866943359375, 1.9901123046875, 2.085357666015625, 2.18060302734375, 2.275848388671875, 2.37109375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 8.0, 6.0, 17.0, 21.0, 28.0, 29.0, 56.0, 59.0, 93.0, 82.0, 84.0, 101.0, 85.0, 70.0, 60.0, 51.0, 42.0, 34.0, 14.0, 20.0, 20.0, 9.0, 3.0, 4.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.4090843200683594, -0.39067840576171875, -0.3722724914550781, -0.3538665771484375, -0.3354606628417969, -0.31705474853515625, -0.2986488342285156, -0.280242919921875, -0.2618370056152344, -0.24343109130859375, -0.22502517700195312, -0.2066192626953125, -0.18821334838867188, -0.16980743408203125, -0.15140151977539062, -0.13299560546875, -0.11458969116210938, -0.09618377685546875, -0.07777786254882812, -0.0593719482421875, -0.040966033935546875, -0.02256011962890625, -0.004154205322265625, 0.014251708984375, 0.032657623291015625, 0.05106353759765625, 0.06946945190429688, 0.0878753662109375, 0.10628128051757812, 0.12468719482421875, 0.14309310913085938, 0.1614990234375, 0.17990493774414062, 0.19831085205078125, 0.21671676635742188, 0.2351226806640625, 0.2535285949707031, 0.27193450927734375, 0.2903404235839844, 0.308746337890625, 0.3271522521972656, 0.34555816650390625, 0.3639640808105469, 0.3823699951171875, 0.4007759094238281, 0.41918182373046875, 0.4375877380371094, 0.45599365234375, 0.4743995666503906, 0.49280548095703125, 0.5112113952636719, 0.5296173095703125, 0.5480232238769531, 0.5664291381835938, 0.5848350524902344, 0.603240966796875, 0.6216468811035156, 0.6400527954101562, 0.6584587097167969, 0.6768646240234375, 0.6952705383300781, 0.7136764526367188, 0.7320823669433594, 0.75048828125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 8.0, 14.0, 12.0, 14.0, 24.0, 38.0, 60.0, 69.0, 93.0, 127.0, 189.0, 248.0, 383.0, 615.0, 820.0, 1445.0, 2585.0, 5238.0, 14015.0, 74482.0, 3986723.0, 80242.0, 14768.0, 5432.0, 2628.0, 1390.0, 819.0, 517.0, 367.0, 241.0, 179.0, 134.0, 112.0, 75.0, 46.0, 32.0, 34.0, 19.0, 18.0, 13.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9736328125, -0.9417266845703125, -0.909820556640625, -0.8779144287109375, -0.84600830078125, -0.8141021728515625, -0.782196044921875, -0.7502899169921875, -0.7183837890625, -0.6864776611328125, -0.654571533203125, -0.6226654052734375, -0.59075927734375, -0.5588531494140625, -0.526947021484375, -0.4950408935546875, -0.463134765625, -0.4312286376953125, -0.399322509765625, -0.3674163818359375, -0.33551025390625, -0.3036041259765625, -0.271697998046875, -0.2397918701171875, -0.2078857421875, -0.1759796142578125, -0.144073486328125, -0.1121673583984375, -0.08026123046875, -0.0483551025390625, -0.016448974609375, 0.0154571533203125, 0.04736328125, 0.0792694091796875, 0.111175537109375, 0.1430816650390625, 0.17498779296875, 0.2068939208984375, 0.238800048828125, 0.2707061767578125, 0.3026123046875, 0.3345184326171875, 0.366424560546875, 0.3983306884765625, 0.43023681640625, 0.4621429443359375, 0.494049072265625, 0.5259552001953125, 0.557861328125, 0.5897674560546875, 0.621673583984375, 0.6535797119140625, 0.68548583984375, 0.7173919677734375, 0.749298095703125, 0.7812042236328125, 0.8131103515625, 0.8450164794921875, 0.876922607421875, 0.9088287353515625, 0.94073486328125, 0.9726409912109375, 1.004547119140625, 1.0364532470703125, 1.068359375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 5.0, 4.0, 3.0, 6.0, 4.0, 12.0, 20.0, 37.0, 60.0, 184.0, 3427.0, 172.0, 60.0, 29.0, 23.0, 6.0, 7.0, 4.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.298583984375, -0.2887916564941406, -0.27899932861328125, -0.2692070007324219, -0.2594146728515625, -0.24962234497070312, -0.23983001708984375, -0.23003768920898438, -0.220245361328125, -0.21045303344726562, -0.20066070556640625, -0.19086837768554688, -0.1810760498046875, -0.17128372192382812, -0.16149139404296875, -0.15169906616210938, -0.14190673828125, -0.13211441040039062, -0.12232208251953125, -0.11252975463867188, -0.1027374267578125, -0.09294509887695312, -0.08315277099609375, -0.07336044311523438, -0.063568115234375, -0.053775787353515625, -0.04398345947265625, -0.034191131591796875, -0.0243988037109375, -0.014606475830078125, -0.00481414794921875, 0.004978179931640625, 0.0147705078125, 0.024562835693359375, 0.03435516357421875, 0.044147491455078125, 0.0539398193359375, 0.06373214721679688, 0.07352447509765625, 0.08331680297851562, 0.093109130859375, 0.10290145874023438, 0.11269378662109375, 0.12248611450195312, 0.1322784423828125, 0.14207077026367188, 0.15186309814453125, 0.16165542602539062, 0.17144775390625, 0.18124008178710938, 0.19103240966796875, 0.20082473754882812, 0.2106170654296875, 0.22040939331054688, 0.23020172119140625, 0.23999404907226562, 0.249786376953125, 0.2595787048339844, 0.26937103271484375, 0.2791633605957031, 0.2889556884765625, 0.2987480163574219, 0.30854034423828125, 0.3183326721191406, 0.328125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 4.0, 3.0, 17.0, 8.0, 22.0, 32.0, 40.0, 49.0, 77.0, 106.0, 119.0, 126.0, 106.0, 81.0, 55.0, 47.0, 33.0, 28.0, 11.0, 11.0, 6.0, 5.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.132209300994873, -1.1035312414169312, -1.0748530626296997, -1.0461750030517578, -1.017496943473816, -0.9888188242912292, -0.9601407051086426, -0.9314626455307007, -0.902784526348114, -0.8741064071655273, -0.8454283475875854, -0.8167502284049988, -0.7880721092224121, -0.7593940496444702, -0.7307159304618835, -0.7020378112792969, -0.673359751701355, -0.6446816325187683, -0.6160035729408264, -0.5873254537582397, -0.5586473345756531, -0.5299692749977112, -0.5012911558151245, -0.47261306643486023, -0.44393491744995117, -0.4152568280696869, -0.3865787088871002, -0.35790061950683594, -0.32922253012657166, -0.3005444407463074, -0.2718663215637207, -0.24318823218345642, -0.21451014280319214, -0.18583203852176666, -0.15715394914150238, -0.1284758448600769, -0.09979774802923203, -0.07111965119838715, -0.04244154691696167, -0.013763457536697388, 0.014914646744728088, 0.04359274357557297, 0.07227084040641785, 0.10094894468784332, 0.1296270489692688, 0.15830513834953308, 0.18698324263095856, 0.21566133201122284, 0.24433943629264832, 0.2730175256729126, 0.30169564485549927, 0.33037373423576355, 0.35905182361602783, 0.3877299427986145, 0.4164080321788788, 0.44508612155914307, 0.47376424074172974, 0.5024423599243164, 0.5311204195022583, 0.559798538684845, 0.5884766578674316, 0.6171547174453735, 0.6458328366279602, 0.6745109558105469, 0.7031890153884888]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 2.0, 6.0, 3.0, 6.0, 9.0, 9.0, 13.0, 23.0, 22.0, 21.0, 26.0, 32.0, 25.0, 49.0, 41.0, 51.0, 48.0, 40.0, 71.0, 53.0, 45.0, 50.0, 42.0, 44.0, 32.0, 35.0, 47.0, 32.0, 27.0, 24.0, 19.0, 18.0, 13.0, 9.0, 7.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.8347029685974121, -0.8139520287513733, -0.7932010293006897, -0.7724500894546509, -0.7516990900039673, -0.7309481501579285, -0.7101972103118896, -0.689446210861206, -0.6686952710151672, -0.6479443311691284, -0.6271933317184448, -0.606442391872406, -0.5856914520263672, -0.5649404525756836, -0.5441895127296448, -0.523438572883606, -0.5026875734329224, -0.48193660378456116, -0.46118563413619995, -0.44043469429016113, -0.4196837246417999, -0.3989327549934387, -0.3781818151473999, -0.3574308454990387, -0.3366798758506775, -0.3159289062023163, -0.2951779365539551, -0.27442699670791626, -0.25367602705955505, -0.23292505741119385, -0.21217410266399384, -0.19142314791679382, -0.17067217826843262, -0.1499212086200714, -0.1291702538728714, -0.10841929167509079, -0.08766832947731018, -0.06691736727952957, -0.04616640508174896, -0.02541545033454895, -0.004664480686187744, 0.016086481511592865, 0.036837443709373474, 0.05758840590715408, 0.07833936810493469, 0.0990903303027153, 0.11984129250049591, 0.14059224724769592, 0.16134321689605713, 0.18209418654441833, 0.20284514129161835, 0.22359609603881836, 0.24434706568717957, 0.26509803533554077, 0.2858489751815796, 0.3065999448299408, 0.327350914478302, 0.3481018841266632, 0.3688528537750244, 0.38960379362106323, 0.41035476326942444, 0.43110573291778564, 0.45185667276382446, 0.47260764241218567, 0.4933586120605469]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 16.0, 14.0, 27.0, 31.0, 81.0, 136.0, 297.0, 634.0, 1946.0, 7948.0, 51294.0, 438976.0, 477965.0, 57143.0, 8615.0, 2097.0, 722.0, 287.0, 133.0, 77.0, 47.0, 15.0, 23.0, 13.0, 3.0, 3.0, 1.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.65234375, -0.6180572509765625, -0.583770751953125, -0.5494842529296875, -0.51519775390625, -0.4809112548828125, -0.446624755859375, -0.4123382568359375, -0.3780517578125, -0.3437652587890625, -0.309478759765625, -0.2751922607421875, -0.24090576171875, -0.2066192626953125, -0.172332763671875, -0.1380462646484375, -0.103759765625, -0.0694732666015625, -0.035186767578125, -0.0009002685546875, 0.03338623046875, 0.0676727294921875, 0.101959228515625, 0.1362457275390625, 0.1705322265625, 0.2048187255859375, 0.239105224609375, 0.2733917236328125, 0.30767822265625, 0.3419647216796875, 0.376251220703125, 0.4105377197265625, 0.44482421875, 0.4791107177734375, 0.513397216796875, 0.5476837158203125, 0.58197021484375, 0.6162567138671875, 0.650543212890625, 0.6848297119140625, 0.7191162109375, 0.7534027099609375, 0.787689208984375, 0.8219757080078125, 0.85626220703125, 0.8905487060546875, 0.924835205078125, 0.9591217041015625, 0.993408203125, 1.0276947021484375, 1.061981201171875, 1.0962677001953125, 1.13055419921875, 1.1648406982421875, 1.199127197265625, 1.2334136962890625, 1.2677001953125, 1.3019866943359375, 1.336273193359375, 1.3705596923828125, 1.40484619140625, 1.4391326904296875, 1.473419189453125, 1.5077056884765625, 1.5419921875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 5.0, 15.0, 8.0, 21.0, 19.0, 28.0, 34.0, 52.0, 73.0, 74.0, 82.0, 74.0, 108.0, 66.0, 60.0, 60.0, 60.0, 35.0, 32.0, 31.0, 18.0, 23.0, 7.0, 11.0, 3.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.418212890625, -0.4010047912597656, -0.38379669189453125, -0.3665885925292969, -0.3493804931640625, -0.3321723937988281, -0.31496429443359375, -0.2977561950683594, -0.280548095703125, -0.2633399963378906, -0.24613189697265625, -0.22892379760742188, -0.2117156982421875, -0.19450759887695312, -0.17729949951171875, -0.16009140014648438, -0.14288330078125, -0.12567520141601562, -0.10846710205078125, -0.09125900268554688, -0.0740509033203125, -0.056842803955078125, -0.03963470458984375, -0.022426605224609375, -0.005218505859375, 0.011989593505859375, 0.02919769287109375, 0.046405792236328125, 0.0636138916015625, 0.08082199096679688, 0.09803009033203125, 0.11523818969726562, 0.1324462890625, 0.14965438842773438, 0.16686248779296875, 0.18407058715820312, 0.2012786865234375, 0.21848678588867188, 0.23569488525390625, 0.2529029846191406, 0.270111083984375, 0.2873191833496094, 0.30452728271484375, 0.3217353820800781, 0.3389434814453125, 0.3561515808105469, 0.37335968017578125, 0.3905677795410156, 0.40777587890625, 0.4249839782714844, 0.44219207763671875, 0.4594001770019531, 0.4766082763671875, 0.4938163757324219, 0.5110244750976562, 0.5282325744628906, 0.545440673828125, 0.5626487731933594, 0.5798568725585938, 0.5970649719238281, 0.6142730712890625, 0.6314811706542969, 0.6486892700195312, 0.6658973693847656, 0.68310546875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 3.0, 0.0, 4.0, 8.0, 3.0, 9.0, 14.0, 16.0, 17.0, 21.0, 30.0, 43.0, 57.0, 65.0, 98.0, 138.0, 220.0, 277.0, 487.0, 876.0, 2006.0, 6839.0, 52287.0, 643901.0, 309290.0, 24078.0, 4184.0, 1509.0, 757.0, 394.0, 286.0, 172.0, 119.0, 80.0, 58.0, 46.0, 39.0, 21.0, 20.0, 14.0, 18.0, 13.0, 10.0, 4.0, 6.0, 8.0, 3.0, 4.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-1.1953125, -1.1609954833984375, -1.126678466796875, -1.0923614501953125, -1.05804443359375, -1.0237274169921875, -0.989410400390625, -0.9550933837890625, -0.9207763671875, -0.8864593505859375, -0.852142333984375, -0.8178253173828125, -0.78350830078125, -0.7491912841796875, -0.714874267578125, -0.6805572509765625, -0.646240234375, -0.6119232177734375, -0.577606201171875, -0.5432891845703125, -0.50897216796875, -0.4746551513671875, -0.440338134765625, -0.4060211181640625, -0.3717041015625, -0.3373870849609375, -0.303070068359375, -0.2687530517578125, -0.23443603515625, -0.2001190185546875, -0.165802001953125, -0.1314849853515625, -0.09716796875, -0.0628509521484375, -0.028533935546875, 0.0057830810546875, 0.04010009765625, 0.0744171142578125, 0.108734130859375, 0.1430511474609375, 0.1773681640625, 0.2116851806640625, 0.246002197265625, 0.2803192138671875, 0.31463623046875, 0.3489532470703125, 0.383270263671875, 0.4175872802734375, 0.451904296875, 0.4862213134765625, 0.520538330078125, 0.5548553466796875, 0.58917236328125, 0.6234893798828125, 0.657806396484375, 0.6921234130859375, 0.7264404296875, 0.7607574462890625, 0.795074462890625, 0.8293914794921875, 0.86370849609375, 0.8980255126953125, 0.932342529296875, 0.9666595458984375, 1.0009765625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 10.0, 8.0, 12.0, 15.0, 12.0, 15.0, 14.0, 22.0, 31.0, 28.0, 34.0, 30.0, 40.0, 48.0, 50.0, 46.0, 48.0, 51.0, 55.0, 46.0, 45.0, 43.0, 42.0, 43.0, 25.0, 32.0, 21.0, 28.0, 16.0, 12.0, 16.0, 14.0, 12.0, 9.0, 6.0, 3.0, 7.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.24609375, -1.1991424560546875, -1.152191162109375, -1.1052398681640625, -1.05828857421875, -1.0113372802734375, -0.964385986328125, -0.9174346923828125, -0.8704833984375, -0.8235321044921875, -0.776580810546875, -0.7296295166015625, -0.68267822265625, -0.6357269287109375, -0.588775634765625, -0.5418243408203125, -0.494873046875, -0.4479217529296875, -0.400970458984375, -0.3540191650390625, -0.30706787109375, -0.2601165771484375, -0.213165283203125, -0.1662139892578125, -0.1192626953125, -0.0723114013671875, -0.025360107421875, 0.0215911865234375, 0.06854248046875, 0.1154937744140625, 0.162445068359375, 0.2093963623046875, 0.25634765625, 0.3032989501953125, 0.350250244140625, 0.3972015380859375, 0.44415283203125, 0.4911041259765625, 0.538055419921875, 0.5850067138671875, 0.6319580078125, 0.6789093017578125, 0.725860595703125, 0.7728118896484375, 0.81976318359375, 0.8667144775390625, 0.913665771484375, 0.9606170654296875, 1.007568359375, 1.0545196533203125, 1.101470947265625, 1.1484222412109375, 1.19537353515625, 1.2423248291015625, 1.289276123046875, 1.3362274169921875, 1.3831787109375, 1.4301300048828125, 1.477081298828125, 1.5240325927734375, 1.57098388671875, 1.6179351806640625, 1.664886474609375, 1.7118377685546875, 1.7587890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 9.0, 6.0, 13.0, 15.0, 28.0, 40.0, 77.0, 144.0, 278.0, 645.0, 2403.0, 23593.0, 886282.0, 127702.0, 5410.0, 1154.0, 379.0, 169.0, 84.0, 52.0, 20.0, 12.0, 13.0, 12.0, 7.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.29296875, -1.2586898803710938, -1.2244110107421875, -1.1901321411132812, -1.155853271484375, -1.1215744018554688, -1.0872955322265625, -1.0530166625976562, -1.01873779296875, -0.9844589233398438, -0.9501800537109375, -0.9159011840820312, -0.881622314453125, -0.8473434448242188, -0.8130645751953125, -0.7787857055664062, -0.7445068359375, -0.7102279663085938, -0.6759490966796875, -0.6416702270507812, -0.607391357421875, -0.5731124877929688, -0.5388336181640625, -0.5045547485351562, -0.47027587890625, -0.43599700927734375, -0.4017181396484375, -0.36743927001953125, -0.333160400390625, -0.29888153076171875, -0.2646026611328125, -0.23032379150390625, -0.196044921875, -0.16176605224609375, -0.1274871826171875, -0.09320831298828125, -0.058929443359375, -0.02465057373046875, 0.0096282958984375, 0.04390716552734375, 0.07818603515625, 0.11246490478515625, 0.1467437744140625, 0.18102264404296875, 0.215301513671875, 0.24958038330078125, 0.2838592529296875, 0.31813812255859375, 0.3524169921875, 0.38669586181640625, 0.4209747314453125, 0.45525360107421875, 0.489532470703125, 0.5238113403320312, 0.5580902099609375, 0.5923690795898438, 0.62664794921875, 0.6609268188476562, 0.6952056884765625, 0.7294845581054688, 0.763763427734375, 0.7980422973632812, 0.8323211669921875, 0.8666000366210938, 0.90087890625]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 8.0, 19.0, 29.0, 41.0, 64.0, 77.0, 101.0, 125.0, 143.0, 109.0, 86.0, 60.0, 56.0, 23.0, 18.0, 13.0, 14.0, 4.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00010877847671508789, -0.00010568927973508835, -0.0001026000827550888, -9.951088577508926e-05, -9.642168879508972e-05, -9.333249181509018e-05, -9.024329483509064e-05, -8.71540978550911e-05, -8.406490087509155e-05, -8.097570389509201e-05, -7.788650691509247e-05, -7.479730993509293e-05, -7.170811295509338e-05, -6.861891597509384e-05, -6.55297189950943e-05, -6.244052201509476e-05, -5.9351325035095215e-05, -5.626212805509567e-05, -5.317293107509613e-05, -5.008373409509659e-05, -4.6994537115097046e-05, -4.3905340135097504e-05, -4.081614315509796e-05, -3.772694617509842e-05, -3.463774919509888e-05, -3.1548552215099335e-05, -2.8459355235099792e-05, -2.537015825510025e-05, -2.2280961275100708e-05, -1.9191764295101166e-05, -1.6102567315101624e-05, -1.3013370335102081e-05, -9.924173355102539e-06, -6.834976375102997e-06, -3.7457793951034546e-06, -6.565824151039124e-07, 2.43261456489563e-06, 5.521811544895172e-06, 8.611008524894714e-06, 1.1700205504894257e-05, 1.4789402484893799e-05, 1.787859946489334e-05, 2.0967796444892883e-05, 2.4056993424892426e-05, 2.7146190404891968e-05, 3.023538738489151e-05, 3.332458436489105e-05, 3.6413781344890594e-05, 3.950297832489014e-05, 4.259217530488968e-05, 4.568137228488922e-05, 4.8770569264888763e-05, 5.1859766244888306e-05, 5.494896322488785e-05, 5.803816020488739e-05, 6.112735718488693e-05, 6.421655416488647e-05, 6.730575114488602e-05, 7.039494812488556e-05, 7.34841451048851e-05, 7.657334208488464e-05, 7.966253906488419e-05, 8.275173604488373e-05, 8.584093302488327e-05, 8.893013000488281e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 7.0, 6.0, 10.0, 20.0, 32.0, 58.0, 115.0, 197.0, 561.0, 1710.0, 9228.0, 339190.0, 680873.0, 13304.0, 2049.0, 628.0, 252.0, 132.0, 80.0, 31.0, 14.0, 20.0, 13.0, 4.0, 5.0, 4.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2236328125, -1.1897201538085938, -1.1558074951171875, -1.1218948364257812, -1.087982177734375, -1.0540695190429688, -1.0201568603515625, -0.9862442016601562, -0.95233154296875, -0.9184188842773438, -0.8845062255859375, -0.8505935668945312, -0.816680908203125, -0.7827682495117188, -0.7488555908203125, -0.7149429321289062, -0.6810302734375, -0.6471176147460938, -0.6132049560546875, -0.5792922973632812, -0.545379638671875, -0.5114669799804688, -0.4775543212890625, -0.44364166259765625, -0.40972900390625, -0.37581634521484375, -0.3419036865234375, -0.30799102783203125, -0.274078369140625, -0.24016571044921875, -0.2062530517578125, -0.17234039306640625, -0.138427734375, -0.10451507568359375, -0.0706024169921875, -0.03668975830078125, -0.002777099609375, 0.03113555908203125, 0.0650482177734375, 0.09896087646484375, 0.13287353515625, 0.16678619384765625, 0.2006988525390625, 0.23461151123046875, 0.268524169921875, 0.30243682861328125, 0.3363494873046875, 0.37026214599609375, 0.4041748046875, 0.43808746337890625, 0.4720001220703125, 0.5059127807617188, 0.539825439453125, 0.5737380981445312, 0.6076507568359375, 0.6415634155273438, 0.67547607421875, 0.7093887329101562, 0.7433013916015625, 0.7772140502929688, 0.811126708984375, 0.8450393676757812, 0.8789520263671875, 0.9128646850585938, 0.94677734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 5.0, 14.0, 13.0, 19.0, 28.0, 56.0, 64.0, 100.0, 95.0, 115.0, 98.0, 91.0, 92.0, 55.0, 49.0, 33.0, 21.0, 14.0, 6.0, 5.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.6669921875, -0.6483917236328125, -0.629791259765625, -0.6111907958984375, -0.59259033203125, -0.5739898681640625, -0.555389404296875, -0.5367889404296875, -0.5181884765625, -0.4995880126953125, -0.480987548828125, -0.4623870849609375, -0.44378662109375, -0.4251861572265625, -0.406585693359375, -0.3879852294921875, -0.369384765625, -0.3507843017578125, -0.332183837890625, -0.3135833740234375, -0.29498291015625, -0.2763824462890625, -0.257781982421875, -0.2391815185546875, -0.2205810546875, -0.2019805908203125, -0.183380126953125, -0.1647796630859375, -0.14617919921875, -0.1275787353515625, -0.108978271484375, -0.0903778076171875, -0.07177734375, -0.0531768798828125, -0.034576416015625, -0.0159759521484375, 0.00262451171875, 0.0212249755859375, 0.039825439453125, 0.0584259033203125, 0.0770263671875, 0.0956268310546875, 0.114227294921875, 0.1328277587890625, 0.15142822265625, 0.1700286865234375, 0.188629150390625, 0.2072296142578125, 0.225830078125, 0.2444305419921875, 0.263031005859375, 0.2816314697265625, 0.30023193359375, 0.3188323974609375, 0.337432861328125, 0.3560333251953125, 0.3746337890625, 0.3932342529296875, 0.411834716796875, 0.4304351806640625, 0.44903564453125, 0.4676361083984375, 0.486236572265625, 0.5048370361328125, 0.5234375]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 16.0, 69.0, 254.0, 386.0, 210.0, 60.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.07623291015625, -32.43429946899414, -31.792367935180664, -31.150436401367188, -30.50850486755371, -29.8665714263916, -29.224639892578125, -28.582706451416016, -27.94077491760254, -27.298843383789062, -26.656909942626953, -26.014978408813477, -25.373046875, -24.73111343383789, -24.089181900024414, -23.447250366210938, -22.805316925048828, -22.16338539123535, -21.521451950073242, -20.879520416259766, -20.23758888244629, -19.59565544128418, -18.953723907470703, -18.311790466308594, -17.66986083984375, -17.027929306030273, -16.385995864868164, -15.744064331054688, -15.102131843566895, -14.460199356079102, -13.818267822265625, -13.176335334777832, -12.534403800964355, -11.892471313476562, -11.250539779663086, -10.608607292175293, -9.9666748046875, -9.324743270874023, -8.68281078338623, -8.040878295898438, -7.398946285247803, -6.757014274597168, -6.115081787109375, -5.47314977645874, -4.8312177658081055, -4.1892852783203125, -3.5473532676696777, -2.9054207801818848, -2.26348876953125, -1.6215565204620361, -0.9796243906021118, -0.3376922607421875, 0.30423998832702637, 0.9461722373962402, 1.588104248046875, 2.230036735534668, 2.8719687461853027, 3.5139009952545166, 4.1558332443237305, 4.797765254974365, 5.439697265625, 6.081629753112793, 6.723561763763428, 7.365494251251221, 8.007426261901855]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 4.0, 8.0, 6.0, 9.0, 8.0, 17.0, 9.0, 16.0, 31.0, 24.0, 30.0, 33.0, 38.0, 40.0, 52.0, 70.0, 49.0, 65.0, 60.0, 71.0, 54.0, 52.0, 46.0, 36.0, 29.0, 26.0, 27.0, 17.0, 21.0, 13.0, 13.0, 11.0, 6.0, 7.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-8.877392768859863, -8.642253875732422, -8.407115936279297, -8.171977043151855, -7.936838626861572, -7.701700210571289, -7.466561317443848, -7.2314229011535645, -6.996284484863281, -6.761146068572998, -6.526007175445557, -6.290868759155273, -6.05573034286499, -5.820591926574707, -5.585453033447266, -5.350314617156982, -5.115175724029541, -4.880037307739258, -4.644898414611816, -4.409759998321533, -4.17462158203125, -3.9394829273223877, -3.7043442726135254, -3.469205856323242, -3.23406720161438, -2.9989285469055176, -2.7637901306152344, -2.528651475906372, -2.2935128211975098, -2.0583744049072266, -1.8232357501983643, -1.5880972146987915, -1.3529586791992188, -1.117820143699646, -0.8826815485954285, -0.6475429534912109, -0.4124044179916382, -0.17726588249206543, 0.057872772216796875, 0.29301130771636963, 0.5281498432159424, 0.7632883787155151, 0.9984269738197327, 1.2335655689239502, 1.468704104423523, 1.7038426399230957, 1.938981294631958, 2.1741199493408203, 2.4092583656311035, 2.644397020339966, 2.879535436630249, 3.1146740913391113, 3.3498125076293945, 3.584951162338257, 3.820089817047119, 4.055228233337402, 4.290367126464844, 4.525505542755127, 4.760644435882568, 4.995782852172852, 5.230921268463135, 5.466059684753418, 5.701198577880859, 5.936336994171143, 6.171475410461426]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 5.0, 12.0, 18.0, 21.0, 31.0, 45.0, 57.0, 77.0, 120.0, 240.0, 419.0, 795.0, 1796.0, 4819.0, 19238.0, 282889.0, 3839688.0, 32593.0, 6830.0, 2385.0, 1003.0, 477.0, 269.0, 159.0, 85.0, 61.0, 46.0, 37.0, 19.0, 22.0, 9.0, 9.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.1220703125, -1.087158203125, -1.05224609375, -1.017333984375, -0.982421875, -0.947509765625, -0.91259765625, -0.877685546875, -0.8427734375, -0.807861328125, -0.77294921875, -0.738037109375, -0.703125, -0.668212890625, -0.63330078125, -0.598388671875, -0.5634765625, -0.528564453125, -0.49365234375, -0.458740234375, -0.423828125, -0.388916015625, -0.35400390625, -0.319091796875, -0.2841796875, -0.249267578125, -0.21435546875, -0.179443359375, -0.14453125, -0.109619140625, -0.07470703125, -0.039794921875, -0.0048828125, 0.030029296875, 0.06494140625, 0.099853515625, 0.134765625, 0.169677734375, 0.20458984375, 0.239501953125, 0.2744140625, 0.309326171875, 0.34423828125, 0.379150390625, 0.4140625, 0.448974609375, 0.48388671875, 0.518798828125, 0.5537109375, 0.588623046875, 0.62353515625, 0.658447265625, 0.693359375, 0.728271484375, 0.76318359375, 0.798095703125, 0.8330078125, 0.867919921875, 0.90283203125, 0.937744140625, 0.97265625, 1.007568359375, 1.04248046875, 1.077392578125, 1.1123046875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 6.0, 9.0, 15.0, 16.0, 24.0, 22.0, 26.0, 38.0, 43.0, 52.0, 56.0, 55.0, 60.0, 44.0, 78.0, 66.0, 54.0, 46.0, 42.0, 44.0, 31.0, 40.0, 20.0, 26.0, 16.0, 7.0, 18.0, 9.0, 4.0, 9.0, 4.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4248046875, -0.4130439758300781, -0.40128326416015625, -0.3895225524902344, -0.3777618408203125, -0.3660011291503906, -0.35424041748046875, -0.3424797058105469, -0.330718994140625, -0.3189582824707031, -0.30719757080078125, -0.2954368591308594, -0.2836761474609375, -0.2719154357910156, -0.26015472412109375, -0.24839401245117188, -0.23663330078125, -0.22487258911132812, -0.21311187744140625, -0.20135116577148438, -0.1895904541015625, -0.17782974243164062, -0.16606903076171875, -0.15430831909179688, -0.142547607421875, -0.13078689575195312, -0.11902618408203125, -0.10726547241210938, -0.0955047607421875, -0.08374404907226562, -0.07198333740234375, -0.060222625732421875, -0.0484619140625, -0.036701202392578125, -0.02494049072265625, -0.013179779052734375, -0.0014190673828125, 0.010341644287109375, 0.02210235595703125, 0.033863067626953125, 0.045623779296875, 0.057384490966796875, 0.06914520263671875, 0.08090591430664062, 0.0926666259765625, 0.10442733764648438, 0.11618804931640625, 0.12794876098632812, 0.13970947265625, 0.15147018432617188, 0.16323089599609375, 0.17499160766601562, 0.1867523193359375, 0.19851303100585938, 0.21027374267578125, 0.22203445434570312, 0.233795166015625, 0.24555587768554688, 0.25731658935546875, 0.2690773010253906, 0.2808380126953125, 0.2925987243652344, 0.30435943603515625, 0.3161201477050781, 0.327880859375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 1.0, 3.0, 14.0, 12.0, 13.0, 25.0, 27.0, 30.0, 35.0, 69.0, 99.0, 154.0, 213.0, 350.0, 628.0, 1376.0, 3610.0, 10659.0, 43274.0, 845681.0, 3219674.0, 49757.0, 11553.0, 3825.0, 1458.0, 652.0, 351.0, 242.0, 137.0, 88.0, 65.0, 55.0, 33.0, 24.0, 29.0, 22.0, 11.0, 10.0, 10.0, 6.0, 2.0, 3.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6943359375, -0.6704254150390625, -0.646514892578125, -0.6226043701171875, -0.59869384765625, -0.5747833251953125, -0.550872802734375, -0.5269622802734375, -0.5030517578125, -0.4791412353515625, -0.455230712890625, -0.4313201904296875, -0.40740966796875, -0.3834991455078125, -0.359588623046875, -0.3356781005859375, -0.311767578125, -0.2878570556640625, -0.263946533203125, -0.2400360107421875, -0.21612548828125, -0.1922149658203125, -0.168304443359375, -0.1443939208984375, -0.1204833984375, -0.0965728759765625, -0.072662353515625, -0.0487518310546875, -0.02484130859375, -0.0009307861328125, 0.022979736328125, 0.0468902587890625, 0.07080078125, 0.0947113037109375, 0.118621826171875, 0.1425323486328125, 0.16644287109375, 0.1903533935546875, 0.214263916015625, 0.2381744384765625, 0.2620849609375, 0.2859954833984375, 0.309906005859375, 0.3338165283203125, 0.35772705078125, 0.3816375732421875, 0.405548095703125, 0.4294586181640625, 0.453369140625, 0.4772796630859375, 0.501190185546875, 0.5251007080078125, 0.54901123046875, 0.5729217529296875, 0.596832275390625, 0.6207427978515625, 0.6446533203125, 0.6685638427734375, 0.692474365234375, 0.7163848876953125, 0.74029541015625, 0.7642059326171875, 0.788116455078125, 0.8120269775390625, 0.8359375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 4.0, 9.0, 7.0, 17.0, 16.0, 37.0, 66.0, 178.0, 743.0, 2651.0, 191.0, 73.0, 46.0, 12.0, 10.0, 3.0, 6.0, 4.0, 2.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25537109375, -0.2395172119140625, -0.223663330078125, -0.2078094482421875, -0.19195556640625, -0.1761016845703125, -0.160247802734375, -0.1443939208984375, -0.1285400390625, -0.1126861572265625, -0.096832275390625, -0.0809783935546875, -0.06512451171875, -0.0492706298828125, -0.033416748046875, -0.0175628662109375, -0.001708984375, 0.0141448974609375, 0.029998779296875, 0.0458526611328125, 0.06170654296875, 0.0775604248046875, 0.093414306640625, 0.1092681884765625, 0.1251220703125, 0.1409759521484375, 0.156829833984375, 0.1726837158203125, 0.18853759765625, 0.2043914794921875, 0.220245361328125, 0.2360992431640625, 0.251953125, 0.2678070068359375, 0.283660888671875, 0.2995147705078125, 0.31536865234375, 0.3312225341796875, 0.347076416015625, 0.3629302978515625, 0.3787841796875, 0.3946380615234375, 0.410491943359375, 0.4263458251953125, 0.44219970703125, 0.4580535888671875, 0.473907470703125, 0.4897613525390625, 0.505615234375, 0.5214691162109375, 0.537322998046875, 0.5531768798828125, 0.56903076171875, 0.5848846435546875, 0.600738525390625, 0.6165924072265625, 0.6324462890625, 0.6483001708984375, 0.664154052734375, 0.6800079345703125, 0.69586181640625, 0.7117156982421875, 0.727569580078125, 0.7434234619140625, 0.75927734375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 7.0, 10.0, 30.0, 41.0, 59.0, 96.0, 158.0, 190.0, 148.0, 90.0, 76.0, 45.0, 18.0, 10.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6267790794372559, -1.569570541381836, -1.512362003326416, -1.455153465270996, -1.3979449272155762, -1.3407363891601562, -1.2835278511047363, -1.2263193130493164, -1.1691107749938965, -1.1119022369384766, -1.0546936988830566, -0.9974851608276367, -0.9402766227722168, -0.8830680847167969, -0.825859546661377, -0.768651008605957, -0.7114425301551819, -0.654233992099762, -0.597025454044342, -0.5398169159889221, -0.4826083779335022, -0.42539986968040466, -0.36819133162498474, -0.3109827935695648, -0.2537742555141449, -0.19656571745872498, -0.13935717940330505, -0.08214865624904633, -0.024940118193626404, 0.032268404960632324, 0.08947694301605225, 0.14668548107147217, 0.2038940191268921, 0.261102557182312, 0.31831109523773193, 0.37551963329315186, 0.4327281713485718, 0.4899366796016693, 0.5471452474594116, 0.6043537855148315, 0.6615623235702515, 0.7187708616256714, 0.7759793996810913, 0.8331879377365112, 0.8903964757919312, 0.9476050138473511, 1.004813551902771, 1.062022089958191, 1.1192305088043213, 1.1764390468597412, 1.2336475849151611, 1.290856122970581, 1.348064661026001, 1.405273199081421, 1.4624817371368408, 1.5196902751922607, 1.5768988132476807, 1.6341073513031006, 1.6913158893585205, 1.7485244274139404, 1.8057329654693604, 1.8629415035247803, 1.9201500415802002, 1.9773585796356201, 2.03456711769104]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 12.0, 5.0, 13.0, 26.0, 22.0, 33.0, 35.0, 44.0, 44.0, 57.0, 51.0, 52.0, 65.0, 49.0, 62.0, 68.0, 66.0, 51.0, 52.0, 31.0, 33.0, 22.0, 19.0, 27.0, 15.0, 13.0, 8.0, 9.0, 5.0, 3.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.322529911994934, -1.2774688005447388, -1.2324076890945435, -1.1873466968536377, -1.1422855854034424, -1.097224473953247, -1.0521633625030518, -1.0071022510528564, -0.9620412588119507, -0.9169801473617554, -0.8719190955162048, -0.8268579840660095, -0.781796932220459, -0.7367358207702637, -0.6916747093200684, -0.6466136574745178, -0.6015525460243225, -0.5564914345741272, -0.5114303827285767, -0.46636927127838135, -0.4213082194328308, -0.3762471079826355, -0.3311860263347626, -0.28612494468688965, -0.24106386303901672, -0.1960027813911438, -0.15094169974327087, -0.10588060319423676, -0.06081952154636383, -0.015758439898490906, 0.029302656650543213, 0.07436373829841614, 0.11942481994628906, 0.164485901594162, 0.2095469832420349, 0.2546080946922302, 0.29966914653778076, 0.3447302579879761, 0.389791339635849, 0.4348524212837219, 0.47991350293159485, 0.5249745845794678, 0.5700356960296631, 0.6150967478752136, 0.6601578593254089, 0.7052189111709595, 0.7502800226211548, 0.7953411340713501, 0.8404021859169006, 0.885463297367096, 0.9305243492126465, 0.9755854606628418, 1.020646572113037, 1.0657075643539429, 1.1107686758041382, 1.1558297872543335, 1.2008908987045288, 1.2459520101547241, 1.2910131216049194, 1.3360741138458252, 1.3811352252960205, 1.4261963367462158, 1.4712574481964111, 1.5163185596466064, 1.5613795518875122]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 9.0, 4.0, 9.0, 14.0, 26.0, 36.0, 74.0, 129.0, 288.0, 775.0, 2280.0, 8726.0, 46445.0, 326665.0, 548438.0, 94109.0, 15184.0, 3515.0, 1078.0, 389.0, 154.0, 90.0, 36.0, 33.0, 14.0, 14.0, 5.0, 5.0, 5.0, 2.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91064453125, -0.881439208984375, -0.85223388671875, -0.823028564453125, -0.7938232421875, -0.764617919921875, -0.73541259765625, -0.706207275390625, -0.677001953125, -0.647796630859375, -0.61859130859375, -0.589385986328125, -0.5601806640625, -0.530975341796875, -0.50177001953125, -0.472564697265625, -0.443359375, -0.414154052734375, -0.38494873046875, -0.355743408203125, -0.3265380859375, -0.297332763671875, -0.26812744140625, -0.238922119140625, -0.209716796875, -0.180511474609375, -0.15130615234375, -0.122100830078125, -0.0928955078125, -0.063690185546875, -0.03448486328125, -0.005279541015625, 0.02392578125, 0.053131103515625, 0.08233642578125, 0.111541748046875, 0.1407470703125, 0.169952392578125, 0.19915771484375, 0.228363037109375, 0.257568359375, 0.286773681640625, 0.31597900390625, 0.345184326171875, 0.3743896484375, 0.403594970703125, 0.43280029296875, 0.462005615234375, 0.4912109375, 0.520416259765625, 0.54962158203125, 0.578826904296875, 0.6080322265625, 0.637237548828125, 0.66644287109375, 0.695648193359375, 0.724853515625, 0.754058837890625, 0.78326416015625, 0.812469482421875, 0.8416748046875, 0.870880126953125, 0.90008544921875, 0.929290771484375, 0.95849609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 7.0, 9.0, 12.0, 9.0, 18.0, 26.0, 28.0, 29.0, 35.0, 30.0, 45.0, 51.0, 58.0, 56.0, 61.0, 59.0, 57.0, 47.0, 46.0, 36.0, 43.0, 39.0, 29.0, 35.0, 28.0, 16.0, 22.0, 11.0, 13.0, 13.0, 4.0, 3.0, 6.0, 5.0, 9.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.41650390625, -0.40511322021484375, -0.3937225341796875, -0.38233184814453125, -0.370941162109375, -0.35955047607421875, -0.3481597900390625, -0.33676910400390625, -0.32537841796875, -0.31398773193359375, -0.3025970458984375, -0.29120635986328125, -0.279815673828125, -0.26842498779296875, -0.2570343017578125, -0.24564361572265625, -0.2342529296875, -0.22286224365234375, -0.2114715576171875, -0.20008087158203125, -0.188690185546875, -0.17729949951171875, -0.1659088134765625, -0.15451812744140625, -0.14312744140625, -0.13173675537109375, -0.1203460693359375, -0.10895538330078125, -0.097564697265625, -0.08617401123046875, -0.0747833251953125, -0.06339263916015625, -0.052001953125, -0.04061126708984375, -0.0292205810546875, -0.01782989501953125, -0.006439208984375, 0.00495147705078125, 0.0163421630859375, 0.02773284912109375, 0.03912353515625, 0.05051422119140625, 0.0619049072265625, 0.07329559326171875, 0.084686279296875, 0.09607696533203125, 0.1074676513671875, 0.11885833740234375, 0.1302490234375, 0.14163970947265625, 0.1530303955078125, 0.16442108154296875, 0.175811767578125, 0.18720245361328125, 0.1985931396484375, 0.20998382568359375, 0.22137451171875, 0.23276519775390625, 0.2441558837890625, 0.25554656982421875, 0.266937255859375, 0.27832794189453125, 0.2897186279296875, 0.30110931396484375, 0.3125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 7.0, 19.0, 16.0, 22.0, 28.0, 47.0, 66.0, 105.0, 161.0, 306.0, 564.0, 1481.0, 5766.0, 83151.0, 880885.0, 68000.0, 5185.0, 1350.0, 597.0, 288.0, 168.0, 107.0, 82.0, 48.0, 31.0, 14.0, 19.0, 9.0, 10.0, 2.0, 1.0, 1.0, 5.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7880859375, -1.7390594482421875, -1.690032958984375, -1.6410064697265625, -1.59197998046875, -1.5429534912109375, -1.493927001953125, -1.4449005126953125, -1.3958740234375, -1.3468475341796875, -1.297821044921875, -1.2487945556640625, -1.19976806640625, -1.1507415771484375, -1.101715087890625, -1.0526885986328125, -1.003662109375, -0.9546356201171875, -0.905609130859375, -0.8565826416015625, -0.80755615234375, -0.7585296630859375, -0.709503173828125, -0.6604766845703125, -0.6114501953125, -0.5624237060546875, -0.513397216796875, -0.4643707275390625, -0.41534423828125, -0.3663177490234375, -0.317291259765625, -0.2682647705078125, -0.21923828125, -0.1702117919921875, -0.121185302734375, -0.0721588134765625, -0.02313232421875, 0.0258941650390625, 0.074920654296875, 0.1239471435546875, 0.1729736328125, 0.2220001220703125, 0.271026611328125, 0.3200531005859375, 0.36907958984375, 0.4181060791015625, 0.467132568359375, 0.5161590576171875, 0.565185546875, 0.6142120361328125, 0.663238525390625, 0.7122650146484375, 0.76129150390625, 0.8103179931640625, 0.859344482421875, 0.9083709716796875, 0.9573974609375, 1.0064239501953125, 1.055450439453125, 1.1044769287109375, 1.15350341796875, 1.2025299072265625, 1.251556396484375, 1.3005828857421875, 1.349609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 6.0, 7.0, 10.0, 15.0, 10.0, 8.0, 26.0, 18.0, 21.0, 24.0, 45.0, 40.0, 50.0, 63.0, 57.0, 57.0, 69.0, 60.0, 62.0, 51.0, 47.0, 49.0, 39.0, 24.0, 30.0, 20.0, 24.0, 21.0, 13.0, 13.0, 8.0, 4.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.09765625, -2.0431365966796875, -1.988616943359375, -1.9340972900390625, -1.87957763671875, -1.8250579833984375, -1.770538330078125, -1.7160186767578125, -1.6614990234375, -1.6069793701171875, -1.552459716796875, -1.4979400634765625, -1.44342041015625, -1.3889007568359375, -1.334381103515625, -1.2798614501953125, -1.225341796875, -1.1708221435546875, -1.116302490234375, -1.0617828369140625, -1.00726318359375, -0.9527435302734375, -0.898223876953125, -0.8437042236328125, -0.7891845703125, -0.7346649169921875, -0.680145263671875, -0.6256256103515625, -0.57110595703125, -0.5165863037109375, -0.462066650390625, -0.4075469970703125, -0.35302734375, -0.2985076904296875, -0.243988037109375, -0.1894683837890625, -0.13494873046875, -0.0804290771484375, -0.025909423828125, 0.0286102294921875, 0.0831298828125, 0.1376495361328125, 0.192169189453125, 0.2466888427734375, 0.30120849609375, 0.3557281494140625, 0.410247802734375, 0.4647674560546875, 0.519287109375, 0.5738067626953125, 0.628326416015625, 0.6828460693359375, 0.73736572265625, 0.7918853759765625, 0.846405029296875, 0.9009246826171875, 0.9554443359375, 1.0099639892578125, 1.064483642578125, 1.1190032958984375, 1.17352294921875, 1.2280426025390625, 1.282562255859375, 1.3370819091796875, 1.3916015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 5.0, 13.0, 8.0, 15.0, 31.0, 38.0, 46.0, 120.0, 228.0, 535.0, 1663.0, 9503.0, 269139.0, 743583.0, 19787.0, 2543.0, 714.0, 273.0, 134.0, 79.0, 33.0, 19.0, 11.0, 13.0, 6.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52783203125, -0.5090789794921875, -0.490325927734375, -0.4715728759765625, -0.45281982421875, -0.4340667724609375, -0.415313720703125, -0.3965606689453125, -0.3778076171875, -0.3590545654296875, -0.340301513671875, -0.3215484619140625, -0.30279541015625, -0.2840423583984375, -0.265289306640625, -0.2465362548828125, -0.227783203125, -0.2090301513671875, -0.190277099609375, -0.1715240478515625, -0.15277099609375, -0.1340179443359375, -0.115264892578125, -0.0965118408203125, -0.0777587890625, -0.0590057373046875, -0.040252685546875, -0.0214996337890625, -0.00274658203125, 0.0160064697265625, 0.034759521484375, 0.0535125732421875, 0.072265625, 0.0910186767578125, 0.109771728515625, 0.1285247802734375, 0.14727783203125, 0.1660308837890625, 0.184783935546875, 0.2035369873046875, 0.2222900390625, 0.2410430908203125, 0.259796142578125, 0.2785491943359375, 0.29730224609375, 0.3160552978515625, 0.334808349609375, 0.3535614013671875, 0.372314453125, 0.3910675048828125, 0.409820556640625, 0.4285736083984375, 0.44732666015625, 0.4660797119140625, 0.484832763671875, 0.5035858154296875, 0.5223388671875, 0.5410919189453125, 0.559844970703125, 0.5785980224609375, 0.59735107421875, 0.6161041259765625, 0.634857177734375, 0.6536102294921875, 0.67236328125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 7.0, 5.0, 16.0, 12.0, 20.0, 16.0, 26.0, 27.0, 38.0, 44.0, 56.0, 90.0, 113.0, 101.0, 86.0, 62.0, 47.0, 49.0, 28.0, 25.0, 31.0, 16.0, 11.0, 14.0, 15.0, 7.0, 3.0, 5.0, 8.0, 6.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.7206878662109375e-05, -4.526600241661072e-05, -4.332512617111206e-05, -4.13842499256134e-05, -3.9443373680114746e-05, -3.750249743461609e-05, -3.556162118911743e-05, -3.3620744943618774e-05, -3.167986869812012e-05, -2.973899245262146e-05, -2.7798116207122803e-05, -2.5857239961624146e-05, -2.3916363716125488e-05, -2.197548747062683e-05, -2.0034611225128174e-05, -1.8093734979629517e-05, -1.615285873413086e-05, -1.4211982488632202e-05, -1.2271106243133545e-05, -1.0330229997634888e-05, -8.38935375213623e-06, -6.448477506637573e-06, -4.507601261138916e-06, -2.566725015640259e-06, -6.258487701416016e-07, 1.3150274753570557e-06, 3.255903720855713e-06, 5.19677996635437e-06, 7.137656211853027e-06, 9.078532457351685e-06, 1.1019408702850342e-05, 1.2960284948348999e-05, 1.4901161193847656e-05, 1.6842037439346313e-05, 1.878291368484497e-05, 2.0723789930343628e-05, 2.2664666175842285e-05, 2.4605542421340942e-05, 2.65464186668396e-05, 2.8487294912338257e-05, 3.0428171157836914e-05, 3.236904740333557e-05, 3.430992364883423e-05, 3.6250799894332886e-05, 3.819167613983154e-05, 4.01325523853302e-05, 4.207342863082886e-05, 4.4014304876327515e-05, 4.595518112182617e-05, 4.789605736732483e-05, 4.9836933612823486e-05, 5.1777809858322144e-05, 5.37186861038208e-05, 5.565956234931946e-05, 5.7600438594818115e-05, 5.954131484031677e-05, 6.148219108581543e-05, 6.342306733131409e-05, 6.536394357681274e-05, 6.73048198223114e-05, 6.924569606781006e-05, 7.118657231330872e-05, 7.312744855880737e-05, 7.506832480430603e-05, 7.700920104980469e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 4.0, 4.0, 2.0, 6.0, 9.0, 13.0, 14.0, 20.0, 34.0, 53.0, 76.0, 148.0, 249.0, 569.0, 1518.0, 6934.0, 122046.0, 869582.0, 41052.0, 4079.0, 1097.0, 468.0, 240.0, 131.0, 89.0, 44.0, 24.0, 15.0, 10.0, 5.0, 7.0, 4.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53125, -0.5143051147460938, -0.4973602294921875, -0.48041534423828125, -0.463470458984375, -0.44652557373046875, -0.4295806884765625, -0.41263580322265625, -0.39569091796875, -0.37874603271484375, -0.3618011474609375, -0.34485626220703125, -0.327911376953125, -0.31096649169921875, -0.2940216064453125, -0.27707672119140625, -0.2601318359375, -0.24318695068359375, -0.2262420654296875, -0.20929718017578125, -0.192352294921875, -0.17540740966796875, -0.1584625244140625, -0.14151763916015625, -0.12457275390625, -0.10762786865234375, -0.0906829833984375, -0.07373809814453125, -0.056793212890625, -0.03984832763671875, -0.0229034423828125, -0.00595855712890625, 0.010986328125, 0.02793121337890625, 0.0448760986328125, 0.06182098388671875, 0.078765869140625, 0.09571075439453125, 0.1126556396484375, 0.12960052490234375, 0.14654541015625, 0.16349029541015625, 0.1804351806640625, 0.19738006591796875, 0.214324951171875, 0.23126983642578125, 0.2482147216796875, 0.26515960693359375, 0.2821044921875, 0.29904937744140625, 0.3159942626953125, 0.33293914794921875, 0.349884033203125, 0.36682891845703125, 0.3837738037109375, 0.40071868896484375, 0.41766357421875, 0.43460845947265625, 0.4515533447265625, 0.46849822998046875, 0.485443115234375, 0.5023880004882812, 0.5193328857421875, 0.5362777709960938, 0.55322265625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 15.0, 18.0, 31.0, 41.0, 75.0, 90.0, 117.0, 130.0, 135.0, 100.0, 65.0, 63.0, 35.0, 22.0, 17.0, 13.0, 3.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.681640625, -0.664398193359375, -0.64715576171875, -0.629913330078125, -0.6126708984375, -0.595428466796875, -0.57818603515625, -0.560943603515625, -0.543701171875, -0.526458740234375, -0.50921630859375, -0.491973876953125, -0.4747314453125, -0.457489013671875, -0.44024658203125, -0.423004150390625, -0.40576171875, -0.388519287109375, -0.37127685546875, -0.354034423828125, -0.3367919921875, -0.319549560546875, -0.30230712890625, -0.285064697265625, -0.267822265625, -0.250579833984375, -0.23333740234375, -0.216094970703125, -0.1988525390625, -0.181610107421875, -0.16436767578125, -0.147125244140625, -0.1298828125, -0.112640380859375, -0.09539794921875, -0.078155517578125, -0.0609130859375, -0.043670654296875, -0.02642822265625, -0.009185791015625, 0.008056640625, 0.025299072265625, 0.04254150390625, 0.059783935546875, 0.0770263671875, 0.094268798828125, 0.11151123046875, 0.128753662109375, 0.14599609375, 0.163238525390625, 0.18048095703125, 0.197723388671875, 0.2149658203125, 0.232208251953125, 0.24945068359375, 0.266693115234375, 0.283935546875, 0.301177978515625, 0.31842041015625, 0.335662841796875, 0.3529052734375, 0.370147705078125, 0.38739013671875, 0.404632568359375, 0.421875]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 3.0, 8.0, 18.0, 24.0, 61.0, 96.0, 146.0, 174.0, 176.0, 129.0, 87.0, 40.0, 18.0, 5.0, 8.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.523820877075195, -10.287788391113281, -10.051756858825684, -9.81572437286377, -9.579692840576172, -9.343660354614258, -9.10762882232666, -8.871596336364746, -8.635564804077148, -8.399532318115234, -8.163500785827637, -7.927468776702881, -7.691436767578125, -7.455404758453369, -7.219372749328613, -6.983340263366699, -6.747308254241943, -6.5112762451171875, -6.275244235992432, -6.039212226867676, -5.80318021774292, -5.567148208618164, -5.33111572265625, -5.095084190368652, -4.859051704406738, -4.623019695281982, -4.386987686157227, -4.150955677032471, -3.914923667907715, -3.678891658782959, -3.442859411239624, -3.206827402114868, -2.970795154571533, -2.7347631454467773, -2.4987311363220215, -2.2626991271972656, -2.0266671180725098, -1.7906349897384644, -1.554602861404419, -1.318570852279663, -1.0825388431549072, -0.8465068340301514, -0.6104747653007507, -0.3744426965713501, -0.13841068744659424, 0.09762132167816162, 0.33365345001220703, 0.5696854591369629, 0.8057174682617188, 1.0417494773864746, 1.2777814865112305, 1.5138136148452759, 1.7498456239700317, 1.9858776330947876, 2.221909761428833, 2.457941770553589, 2.6939737796783447, 2.9300057888031006, 3.1660377979278564, 3.4020700454711914, 3.6381020545959473, 3.874134063720703, 4.110166072845459, 4.346198081970215, 4.582230091094971]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 6.0, 4.0, 6.0, 7.0, 6.0, 6.0, 17.0, 16.0, 9.0, 15.0, 29.0, 20.0, 33.0, 35.0, 26.0, 41.0, 44.0, 53.0, 59.0, 51.0, 46.0, 39.0, 40.0, 51.0, 42.0, 39.0, 36.0, 31.0, 28.0, 22.0, 30.0, 21.0, 15.0, 16.0, 12.0, 8.0, 13.0, 9.0, 8.0, 5.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.311617374420166, -7.106485366821289, -6.901353359222412, -6.696221351623535, -6.491089344024658, -6.285957336425781, -6.080825328826904, -5.875693321228027, -5.67056131362915, -5.465429306030273, -5.2602972984313965, -5.0551652908325195, -4.850033283233643, -4.644901275634766, -4.439769268035889, -4.234637260437012, -4.029505729675293, -3.824373722076416, -3.619241714477539, -3.414109706878662, -3.208977699279785, -3.003845691680908, -2.7987136840820312, -2.5935816764831543, -2.3884496688842773, -2.1833176612854004, -1.9781856536865234, -1.7730536460876465, -1.5679216384887695, -1.3627897500991821, -1.1576577425003052, -0.9525257349014282, -0.7473936080932617, -0.5422616004943848, -0.3371296226978302, -0.13199764490127563, 0.07313436269760132, 0.2782663106918335, 0.48339831829071045, 0.6885303258895874, 0.8936623334884644, 1.0987943410873413, 1.3039263486862183, 1.5090582370758057, 1.7141902446746826, 1.9193222522735596, 2.1244542598724365, 2.3295862674713135, 2.5347182750701904, 2.7398502826690674, 2.9449822902679443, 3.1501142978668213, 3.3552463054656982, 3.560378074645996, 3.765510082244873, 3.97064208984375, 4.175774097442627, 4.380906105041504, 4.586038112640381, 4.791170120239258, 4.996302127838135, 5.201434135437012, 5.406566143035889, 5.611698150634766, 5.816830158233643]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 6.0, 7.0, 15.0, 10.0, 16.0, 32.0, 51.0, 68.0, 107.0, 168.0, 345.0, 758.0, 1840.0, 5469.0, 23315.0, 194374.0, 3598815.0, 327494.0, 30499.0, 6955.0, 2188.0, 865.0, 386.0, 199.0, 120.0, 55.0, 39.0, 24.0, 24.0, 11.0, 4.0, 6.0, 6.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64697265625, -0.6243362426757812, -0.6016998291015625, -0.5790634155273438, -0.556427001953125, -0.5337905883789062, -0.5111541748046875, -0.48851776123046875, -0.46588134765625, -0.44324493408203125, -0.4206085205078125, -0.39797210693359375, -0.375335693359375, -0.35269927978515625, -0.3300628662109375, -0.30742645263671875, -0.2847900390625, -0.26215362548828125, -0.2395172119140625, -0.21688079833984375, -0.194244384765625, -0.17160797119140625, -0.1489715576171875, -0.12633514404296875, -0.10369873046875, -0.08106231689453125, -0.0584259033203125, -0.03578948974609375, -0.013153076171875, 0.00948333740234375, 0.0321197509765625, 0.05475616455078125, 0.077392578125, 0.10002899169921875, 0.1226654052734375, 0.14530181884765625, 0.167938232421875, 0.19057464599609375, 0.2132110595703125, 0.23584747314453125, 0.25848388671875, 0.28112030029296875, 0.3037567138671875, 0.32639312744140625, 0.349029541015625, 0.37166595458984375, 0.3943023681640625, 0.41693878173828125, 0.4395751953125, 0.46221160888671875, 0.4848480224609375, 0.5074844360351562, 0.530120849609375, 0.5527572631835938, 0.5753936767578125, 0.5980300903320312, 0.62066650390625, 0.6433029174804688, 0.6659393310546875, 0.6885757446289062, 0.711212158203125, 0.7338485717773438, 0.7564849853515625, 0.7791213989257812, 0.8017578125]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 3.0, 4.0, 2.0, 4.0, 5.0, 6.0, 8.0, 10.0, 10.0, 20.0, 35.0, 23.0, 37.0, 26.0, 49.0, 48.0, 49.0, 59.0, 57.0, 61.0, 54.0, 49.0, 53.0, 52.0, 49.0, 37.0, 37.0, 33.0, 15.0, 22.0, 15.0, 17.0, 21.0, 9.0, 13.0, 11.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.420654296875, -0.40985870361328125, -0.3990631103515625, -0.38826751708984375, -0.377471923828125, -0.36667633056640625, -0.3558807373046875, -0.34508514404296875, -0.33428955078125, -0.32349395751953125, -0.3126983642578125, -0.30190277099609375, -0.291107177734375, -0.28031158447265625, -0.2695159912109375, -0.25872039794921875, -0.2479248046875, -0.23712921142578125, -0.2263336181640625, -0.21553802490234375, -0.204742431640625, -0.19394683837890625, -0.1831512451171875, -0.17235565185546875, -0.16156005859375, -0.15076446533203125, -0.1399688720703125, -0.12917327880859375, -0.118377685546875, -0.10758209228515625, -0.0967864990234375, -0.08599090576171875, -0.0751953125, -0.06439971923828125, -0.0536041259765625, -0.04280853271484375, -0.032012939453125, -0.02121734619140625, -0.0104217529296875, 0.00037384033203125, 0.01116943359375, 0.02196502685546875, 0.0327606201171875, 0.04355621337890625, 0.054351806640625, 0.06514739990234375, 0.0759429931640625, 0.08673858642578125, 0.0975341796875, 0.10832977294921875, 0.1191253662109375, 0.12992095947265625, 0.140716552734375, 0.15151214599609375, 0.1623077392578125, 0.17310333251953125, 0.18389892578125, 0.19469451904296875, 0.2054901123046875, 0.21628570556640625, 0.227081298828125, 0.23787689208984375, 0.2486724853515625, 0.25946807861328125, 0.270263671875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 6.0, 8.0, 11.0, 19.0, 26.0, 52.0, 88.0, 187.0, 444.0, 1275.0, 6548.0, 93327.0, 3982582.0, 101671.0, 6301.0, 1054.0, 369.0, 143.0, 59.0, 40.0, 22.0, 18.0, 7.0, 8.0, 6.0, 5.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0615234375, -1.021484375, -0.9814453125, -0.94140625, -0.9013671875, -0.861328125, -0.8212890625, -0.78125, -0.7412109375, -0.701171875, -0.6611328125, -0.62109375, -0.5810546875, -0.541015625, -0.5009765625, -0.4609375, -0.4208984375, -0.380859375, -0.3408203125, -0.30078125, -0.2607421875, -0.220703125, -0.1806640625, -0.140625, -0.1005859375, -0.060546875, -0.0205078125, 0.01953125, 0.0595703125, 0.099609375, 0.1396484375, 0.1796875, 0.2197265625, 0.259765625, 0.2998046875, 0.33984375, 0.3798828125, 0.419921875, 0.4599609375, 0.5, 0.5400390625, 0.580078125, 0.6201171875, 0.66015625, 0.7001953125, 0.740234375, 0.7802734375, 0.8203125, 0.8603515625, 0.900390625, 0.9404296875, 0.98046875, 1.0205078125, 1.060546875, 1.1005859375, 1.140625, 1.1806640625, 1.220703125, 1.2607421875, 1.30078125, 1.3408203125, 1.380859375, 1.4208984375, 1.4609375, 1.5009765625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 8.0, 4.0, 3.0, 6.0, 10.0, 8.0, 16.0, 18.0, 29.0, 40.0, 102.0, 245.0, 816.0, 1584.0, 713.0, 238.0, 111.0, 43.0, 36.0, 19.0, 9.0, 5.0, 9.0, 6.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4873046875, -1.4505538940429688, -1.4138031005859375, -1.3770523071289062, -1.340301513671875, -1.3035507202148438, -1.2667999267578125, -1.2300491333007812, -1.19329833984375, -1.1565475463867188, -1.1197967529296875, -1.0830459594726562, -1.046295166015625, -1.0095443725585938, -0.9727935791015625, -0.9360427856445312, -0.8992919921875, -0.8625411987304688, -0.8257904052734375, -0.7890396118164062, -0.752288818359375, -0.7155380249023438, -0.6787872314453125, -0.6420364379882812, -0.60528564453125, -0.5685348510742188, -0.5317840576171875, -0.49503326416015625, -0.458282470703125, -0.42153167724609375, -0.3847808837890625, -0.34803009033203125, -0.311279296875, -0.27452850341796875, -0.2377777099609375, -0.20102691650390625, -0.164276123046875, -0.12752532958984375, -0.0907745361328125, -0.05402374267578125, -0.01727294921875, 0.01947784423828125, 0.0562286376953125, 0.09297943115234375, 0.129730224609375, 0.16648101806640625, 0.2032318115234375, 0.23998260498046875, 0.2767333984375, 0.31348419189453125, 0.3502349853515625, 0.38698577880859375, 0.423736572265625, 0.46048736572265625, 0.4972381591796875, 0.5339889526367188, 0.57073974609375, 0.6074905395507812, 0.6442413330078125, 0.6809921264648438, 0.717742919921875, 0.7544937133789062, 0.7912445068359375, 0.8279953002929688, 0.86474609375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 17.0, 53.0, 187.0, 339.0, 256.0, 88.0, 25.0, 12.0, 8.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.358696937561035, -6.035796642303467, -5.712896347045898, -5.389995574951172, -5.0670952796936035, -4.744194984436035, -4.421294212341309, -4.09839391708374, -3.775493621826172, -3.4525933265686035, -3.129692792892456, -2.8067922592163086, -2.4838919639587402, -2.160991668701172, -1.8380911350250244, -1.515190601348877, -1.1922903060913086, -0.8693898916244507, -0.5464894771575928, -0.22358906269073486, 0.09931135177612305, 0.42221176624298096, 0.7451121807098389, 1.0680127143859863, 1.3909130096435547, 1.7138134241104126, 2.0367138385772705, 2.359614372253418, 2.6825146675109863, 3.0054149627685547, 3.328315496444702, 3.6512160301208496, 3.9741172790527344, 4.297017574310303, 4.619917869567871, 4.942818641662598, 5.265718936920166, 5.588619232177734, 5.911520004272461, 6.234420299530029, 6.557320594787598, 6.880220890045166, 7.203121185302734, 7.526021957397461, 7.848922252655029, 8.171822547912598, 8.494723320007324, 8.817623138427734, 9.140523910522461, 9.463424682617188, 9.786324501037598, 10.109225273132324, 10.432125091552734, 10.755025863647461, 11.077926635742188, 11.400827407836914, 11.723727226257324, 12.04662799835205, 12.369527816772461, 12.692428588867188, 13.015329360961914, 13.338229179382324, 13.66112995147705, 13.984029769897461, 14.306930541992188]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 4.0, 5.0, 7.0, 11.0, 11.0, 13.0, 18.0, 31.0, 40.0, 30.0, 56.0, 49.0, 56.0, 68.0, 75.0, 56.0, 62.0, 68.0, 60.0, 54.0, 44.0, 36.0, 27.0, 39.0, 29.0, 20.0, 11.0, 10.0, 3.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1486897468566895, -5.9911980628967285, -5.833705902099609, -5.676214218139648, -5.518722057342529, -5.361230373382568, -5.203738212585449, -5.046246528625488, -4.888754844665527, -4.731263160705566, -4.573770999908447, -4.416279315948486, -4.258787155151367, -4.101295471191406, -3.943803548812866, -3.786311626434326, -3.628819465637207, -3.471327543258667, -3.313835620880127, -3.156343698501587, -2.998851776123047, -2.841360092163086, -2.683868169784546, -2.526376247406006, -2.368884325027466, -2.211392402648926, -2.0539004802703857, -1.8964086771011353, -1.7389167547225952, -1.5814248323440552, -1.4239330291748047, -1.2664411067962646, -1.1089489459991455, -0.9514570236206055, -0.7939651608467102, -0.6364732980728149, -0.4789813756942749, -0.32148945331573486, -0.1639975905418396, -0.006505727767944336, 0.1509861946105957, 0.30847808718681335, 0.465969979763031, 0.6234618425369263, 0.7809537649154663, 0.9384456872940063, 1.0959374904632568, 1.2534294128417969, 1.410921335220337, 1.568413257598877, 1.725905179977417, 1.8833969831466675, 2.040888786315918, 2.198380947113037, 2.355872631072998, 2.513364553451538, 2.670856475830078, 2.828348398208618, 2.985840320587158, 3.1433322429656982, 3.3008241653442383, 3.458315849304199, 3.6158077716827393, 3.7732996940612793, 3.9307916164398193]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 7.0, 6.0, 4.0, 16.0, 22.0, 39.0, 57.0, 67.0, 97.0, 176.0, 292.0, 469.0, 783.0, 1362.0, 2514.0, 4712.0, 9566.0, 21567.0, 52314.0, 135726.0, 323136.0, 293887.0, 118351.0, 45946.0, 19224.0, 8643.0, 4208.0, 2261.0, 1201.0, 712.0, 433.0, 271.0, 181.0, 98.0, 73.0, 50.0, 30.0, 24.0, 16.0, 10.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.447265625, -0.4351539611816406, -0.42304229736328125, -0.4109306335449219, -0.3988189697265625, -0.3867073059082031, -0.37459564208984375, -0.3624839782714844, -0.350372314453125, -0.3382606506347656, -0.32614898681640625, -0.3140373229980469, -0.3019256591796875, -0.2898139953613281, -0.27770233154296875, -0.2655906677246094, -0.25347900390625, -0.24136734008789062, -0.22925567626953125, -0.21714401245117188, -0.2050323486328125, -0.19292068481445312, -0.18080902099609375, -0.16869735717773438, -0.156585693359375, -0.14447402954101562, -0.13236236572265625, -0.12025070190429688, -0.1081390380859375, -0.09602737426757812, -0.08391571044921875, -0.07180404663085938, -0.0596923828125, -0.047580718994140625, -0.03546905517578125, -0.023357391357421875, -0.0112457275390625, 0.000865936279296875, 0.01297760009765625, 0.025089263916015625, 0.037200927734375, 0.049312591552734375, 0.06142425537109375, 0.07353591918945312, 0.0856475830078125, 0.09775924682617188, 0.10987091064453125, 0.12198257446289062, 0.13409423828125, 0.14620590209960938, 0.15831756591796875, 0.17042922973632812, 0.1825408935546875, 0.19465255737304688, 0.20676422119140625, 0.21887588500976562, 0.230987548828125, 0.24309921264648438, 0.25521087646484375, 0.2673225402832031, 0.2794342041015625, 0.2915458679199219, 0.30365753173828125, 0.3157691955566406, 0.327880859375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 2.0, 2.0, 1.0, 6.0, 6.0, 10.0, 13.0, 14.0, 29.0, 23.0, 40.0, 35.0, 37.0, 60.0, 44.0, 68.0, 50.0, 47.0, 58.0, 58.0, 52.0, 48.0, 50.0, 39.0, 39.0, 30.0, 28.0, 27.0, 14.0, 21.0, 5.0, 12.0, 9.0, 10.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.41845703125, -0.408050537109375, -0.39764404296875, -0.387237548828125, -0.3768310546875, -0.366424560546875, -0.35601806640625, -0.345611572265625, -0.335205078125, -0.324798583984375, -0.31439208984375, -0.303985595703125, -0.2935791015625, -0.283172607421875, -0.27276611328125, -0.262359619140625, -0.251953125, -0.241546630859375, -0.23114013671875, -0.220733642578125, -0.2103271484375, -0.199920654296875, -0.18951416015625, -0.179107666015625, -0.168701171875, -0.158294677734375, -0.14788818359375, -0.137481689453125, -0.1270751953125, -0.116668701171875, -0.10626220703125, -0.095855712890625, -0.08544921875, -0.075042724609375, -0.06463623046875, -0.054229736328125, -0.0438232421875, -0.033416748046875, -0.02301025390625, -0.012603759765625, -0.002197265625, 0.008209228515625, 0.01861572265625, 0.029022216796875, 0.0394287109375, 0.049835205078125, 0.06024169921875, 0.070648193359375, 0.0810546875, 0.091461181640625, 0.10186767578125, 0.112274169921875, 0.1226806640625, 0.133087158203125, 0.14349365234375, 0.153900146484375, 0.164306640625, 0.174713134765625, 0.18511962890625, 0.195526123046875, 0.2059326171875, 0.216339111328125, 0.22674560546875, 0.237152099609375, 0.24755859375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 8.0, 10.0, 14.0, 14.0, 21.0, 27.0, 29.0, 41.0, 63.0, 95.0, 157.0, 198.0, 273.0, 462.0, 779.0, 1412.0, 3629.0, 13516.0, 121449.0, 765750.0, 119842.0, 13580.0, 3616.0, 1427.0, 754.0, 456.0, 294.0, 179.0, 128.0, 89.0, 65.0, 39.0, 24.0, 26.0, 20.0, 20.0, 9.0, 8.0, 6.0, 4.0, 2.0, 5.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79443359375, -0.7675018310546875, -0.740570068359375, -0.7136383056640625, -0.68670654296875, -0.6597747802734375, -0.632843017578125, -0.6059112548828125, -0.5789794921875, -0.5520477294921875, -0.525115966796875, -0.4981842041015625, -0.47125244140625, -0.4443206787109375, -0.417388916015625, -0.3904571533203125, -0.363525390625, -0.3365936279296875, -0.309661865234375, -0.2827301025390625, -0.25579833984375, -0.2288665771484375, -0.201934814453125, -0.1750030517578125, -0.1480712890625, -0.1211395263671875, -0.094207763671875, -0.0672760009765625, -0.04034423828125, -0.0134124755859375, 0.013519287109375, 0.0404510498046875, 0.0673828125, 0.0943145751953125, 0.121246337890625, 0.1481781005859375, 0.17510986328125, 0.2020416259765625, 0.228973388671875, 0.2559051513671875, 0.2828369140625, 0.3097686767578125, 0.336700439453125, 0.3636322021484375, 0.39056396484375, 0.4174957275390625, 0.444427490234375, 0.4713592529296875, 0.498291015625, 0.5252227783203125, 0.552154541015625, 0.5790863037109375, 0.60601806640625, 0.6329498291015625, 0.659881591796875, 0.6868133544921875, 0.7137451171875, 0.7406768798828125, 0.767608642578125, 0.7945404052734375, 0.82147216796875, 0.8484039306640625, 0.875335693359375, 0.9022674560546875, 0.92919921875]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 2.0, 1.0, 4.0, 10.0, 13.0, 14.0, 15.0, 14.0, 16.0, 17.0, 23.0, 29.0, 25.0, 32.0, 32.0, 35.0, 41.0, 42.0, 52.0, 55.0, 47.0, 56.0, 51.0, 58.0, 43.0, 43.0, 37.0, 31.0, 28.0, 28.0, 23.0, 20.0, 15.0, 11.0, 8.0, 5.0, 4.0, 3.0, 9.0, 2.0, 5.0, 1.0, 3.0, 2.0, 5.0], "bins": [-1.6083984375, -1.5679244995117188, -1.5274505615234375, -1.4869766235351562, -1.446502685546875, -1.4060287475585938, -1.3655548095703125, -1.3250808715820312, -1.28460693359375, -1.2441329956054688, -1.2036590576171875, -1.1631851196289062, -1.122711181640625, -1.0822372436523438, -1.0417633056640625, -1.0012893676757812, -0.9608154296875, -0.9203414916992188, -0.8798675537109375, -0.8393936157226562, -0.798919677734375, -0.7584457397460938, -0.7179718017578125, -0.6774978637695312, -0.63702392578125, -0.5965499877929688, -0.5560760498046875, -0.5156021118164062, -0.475128173828125, -0.43465423583984375, -0.3941802978515625, -0.35370635986328125, -0.313232421875, -0.27275848388671875, -0.2322845458984375, -0.19181060791015625, -0.151336669921875, -0.11086273193359375, -0.0703887939453125, -0.02991485595703125, 0.01055908203125, 0.05103302001953125, 0.0915069580078125, 0.13198089599609375, 0.172454833984375, 0.21292877197265625, 0.2534027099609375, 0.29387664794921875, 0.3343505859375, 0.37482452392578125, 0.4152984619140625, 0.45577239990234375, 0.496246337890625, 0.5367202758789062, 0.5771942138671875, 0.6176681518554688, 0.65814208984375, 0.6986160278320312, 0.7390899658203125, 0.7795639038085938, 0.820037841796875, 0.8605117797851562, 0.9009857177734375, 0.9414596557617188, 0.98193359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 5.0, 4.0, 11.0, 22.0, 19.0, 40.0, 80.0, 135.0, 265.0, 609.0, 1823.0, 11572.0, 407758.0, 608902.0, 13979.0, 2083.0, 647.0, 258.0, 132.0, 61.0, 53.0, 28.0, 23.0, 11.0, 7.0, 4.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.49560546875, -0.47963714599609375, -0.4636688232421875, -0.44770050048828125, -0.431732177734375, -0.41576385498046875, -0.3997955322265625, -0.38382720947265625, -0.36785888671875, -0.35189056396484375, -0.3359222412109375, -0.31995391845703125, -0.303985595703125, -0.28801727294921875, -0.2720489501953125, -0.25608062744140625, -0.2401123046875, -0.22414398193359375, -0.2081756591796875, -0.19220733642578125, -0.176239013671875, -0.16027069091796875, -0.1443023681640625, -0.12833404541015625, -0.11236572265625, -0.09639739990234375, -0.0804290771484375, -0.06446075439453125, -0.048492431640625, -0.03252410888671875, -0.0165557861328125, -0.00058746337890625, 0.015380859375, 0.03134918212890625, 0.0473175048828125, 0.06328582763671875, 0.079254150390625, 0.09522247314453125, 0.1111907958984375, 0.12715911865234375, 0.14312744140625, 0.15909576416015625, 0.1750640869140625, 0.19103240966796875, 0.207000732421875, 0.22296905517578125, 0.2389373779296875, 0.25490570068359375, 0.2708740234375, 0.28684234619140625, 0.3028106689453125, 0.31877899169921875, 0.334747314453125, 0.35071563720703125, 0.3666839599609375, 0.38265228271484375, 0.39862060546875, 0.41458892822265625, 0.4305572509765625, 0.44652557373046875, 0.462493896484375, 0.47846221923828125, 0.4944305419921875, 0.5103988647460938, 0.5263671875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 9.0, 10.0, 7.0, 12.0, 11.0, 14.0, 20.0, 27.0, 32.0, 44.0, 62.0, 60.0, 90.0, 80.0, 102.0, 81.0, 69.0, 55.0, 48.0, 26.0, 20.0, 23.0, 15.0, 11.0, 17.0, 10.0, 9.0, 5.0, 7.0, 3.0, 6.0, 0.0, 4.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-4.57763671875e-05, -4.42061573266983e-05, -4.2635947465896606e-05, -4.106573760509491e-05, -3.949552774429321e-05, -3.7925317883491516e-05, -3.635510802268982e-05, -3.478489816188812e-05, -3.3214688301086426e-05, -3.164447844028473e-05, -3.0074268579483032e-05, -2.8504058718681335e-05, -2.693384885787964e-05, -2.5363638997077942e-05, -2.3793429136276245e-05, -2.222321927547455e-05, -2.065300941467285e-05, -1.9082799553871155e-05, -1.7512589693069458e-05, -1.594237983226776e-05, -1.4372169971466064e-05, -1.2801960110664368e-05, -1.1231750249862671e-05, -9.661540389060974e-06, -8.091330528259277e-06, -6.5211206674575806e-06, -4.950910806655884e-06, -3.380700945854187e-06, -1.8104910850524902e-06, -2.4028122425079346e-07, 1.3299286365509033e-06, 2.9001384973526e-06, 4.470348358154297e-06, 6.040558218955994e-06, 7.6107680797576904e-06, 9.180977940559387e-06, 1.0751187801361084e-05, 1.232139766216278e-05, 1.3891607522964478e-05, 1.5461817383766174e-05, 1.703202724456787e-05, 1.8602237105369568e-05, 2.0172446966171265e-05, 2.174265682697296e-05, 2.3312866687774658e-05, 2.4883076548576355e-05, 2.6453286409378052e-05, 2.802349627017975e-05, 2.9593706130981445e-05, 3.116391599178314e-05, 3.273412585258484e-05, 3.4304335713386536e-05, 3.587454557418823e-05, 3.744475543498993e-05, 3.9014965295791626e-05, 4.058517515659332e-05, 4.215538501739502e-05, 4.3725594878196716e-05, 4.529580473899841e-05, 4.686601459980011e-05, 4.843622446060181e-05, 5.0006434321403503e-05, 5.15766441822052e-05, 5.31468540430069e-05, 5.4717063903808594e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 6.0, 5.0, 3.0, 9.0, 9.0, 16.0, 24.0, 44.0, 77.0, 124.0, 194.0, 377.0, 754.0, 1886.0, 6937.0, 73096.0, 865256.0, 88409.0, 7691.0, 1971.0, 746.0, 380.0, 213.0, 111.0, 63.0, 42.0, 37.0, 32.0, 12.0, 14.0, 6.0, 8.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.46826171875, -0.4550819396972656, -0.44190216064453125, -0.4287223815917969, -0.4155426025390625, -0.4023628234863281, -0.38918304443359375, -0.3760032653808594, -0.362823486328125, -0.3496437072753906, -0.33646392822265625, -0.3232841491699219, -0.3101043701171875, -0.2969245910644531, -0.28374481201171875, -0.2705650329589844, -0.25738525390625, -0.24420547485351562, -0.23102569580078125, -0.21784591674804688, -0.2046661376953125, -0.19148635864257812, -0.17830657958984375, -0.16512680053710938, -0.151947021484375, -0.13876724243164062, -0.12558746337890625, -0.11240768432617188, -0.0992279052734375, -0.08604812622070312, -0.07286834716796875, -0.059688568115234375, -0.0465087890625, -0.033329010009765625, -0.02014923095703125, -0.006969451904296875, 0.0062103271484375, 0.019390106201171875, 0.03256988525390625, 0.045749664306640625, 0.058929443359375, 0.07210922241210938, 0.08528900146484375, 0.09846878051757812, 0.1116485595703125, 0.12482833862304688, 0.13800811767578125, 0.15118789672851562, 0.16436767578125, 0.17754745483398438, 0.19072723388671875, 0.20390701293945312, 0.2170867919921875, 0.23026657104492188, 0.24344635009765625, 0.2566261291503906, 0.269805908203125, 0.2829856872558594, 0.29616546630859375, 0.3093452453613281, 0.3225250244140625, 0.3357048034667969, 0.34888458251953125, 0.3620643615722656, 0.375244140625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 1.0, 2.0, 7.0, 2.0, 8.0, 11.0, 17.0, 18.0, 42.0, 45.0, 57.0, 67.0, 94.0, 104.0, 120.0, 94.0, 74.0, 72.0, 46.0, 35.0, 24.0, 21.0, 11.0, 9.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.395263671875, -0.3830146789550781, -0.37076568603515625, -0.3585166931152344, -0.3462677001953125, -0.3340187072753906, -0.32176971435546875, -0.3095207214355469, -0.297271728515625, -0.2850227355957031, -0.27277374267578125, -0.2605247497558594, -0.2482757568359375, -0.23602676391601562, -0.22377777099609375, -0.21152877807617188, -0.19927978515625, -0.18703079223632812, -0.17478179931640625, -0.16253280639648438, -0.1502838134765625, -0.13803482055664062, -0.12578582763671875, -0.11353683471679688, -0.101287841796875, -0.08903884887695312, -0.07678985595703125, -0.06454086303710938, -0.0522918701171875, -0.040042877197265625, -0.02779388427734375, -0.015544891357421875, -0.0032958984375, 0.008953094482421875, 0.02120208740234375, 0.033451080322265625, 0.0457000732421875, 0.057949066162109375, 0.07019805908203125, 0.08244705200195312, 0.094696044921875, 0.10694503784179688, 0.11919403076171875, 0.13144302368164062, 0.1436920166015625, 0.15594100952148438, 0.16819000244140625, 0.18043899536132812, 0.19268798828125, 0.20493698120117188, 0.21718597412109375, 0.22943496704101562, 0.2416839599609375, 0.2539329528808594, 0.26618194580078125, 0.2784309387207031, 0.290679931640625, 0.3029289245605469, 0.31517791748046875, 0.3274269104003906, 0.3396759033203125, 0.3519248962402344, 0.36417388916015625, 0.3764228820800781, 0.388671875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 39.0, 194.0, 478.0, 225.0, 45.0, 10.0, 4.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.693227767944336, -12.213361740112305, -11.73349666595459, -11.253630638122559, -10.773765563964844, -10.293899536132812, -9.814033508300781, -9.33416748046875, -8.854302406311035, -8.374436378479004, -7.894571304321289, -7.414705276489258, -6.934839725494385, -6.454974174499512, -5.9751081466674805, -5.495242595672607, -5.015377044677734, -4.535511493682861, -4.055645942687988, -3.575779914855957, -3.095914363861084, -2.616048812866211, -2.136183023452759, -1.6563172340393066, -1.1764516830444336, -0.696586012840271, -0.2167203426361084, 0.2631453275680542, 0.7430109977722168, 1.2228765487670898, 1.702742338180542, 2.182608127593994, 2.662473678588867, 3.1423392295837402, 3.6222050189971924, 4.1020708084106445, 4.581936359405518, 5.061801910400391, 5.541667938232422, 6.021533489227295, 6.501399040222168, 6.981264591217041, 7.461130142211914, 7.940996170043945, 8.420862197875977, 8.900727272033691, 9.380593299865723, 9.860458374023438, 10.340324401855469, 10.8201904296875, 11.300055503845215, 11.779921531677246, 12.259786605834961, 12.739652633666992, 13.219518661499023, 13.699384689331055, 14.17924976348877, 14.6591157913208, 15.138980865478516, 15.618846893310547, 16.098712921142578, 16.57857894897461, 17.058443069458008, 17.53830909729004, 18.01817512512207]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 6.0, 7.0, 14.0, 12.0, 23.0, 28.0, 21.0, 25.0, 43.0, 51.0, 59.0, 53.0, 59.0, 66.0, 74.0, 61.0, 55.0, 59.0, 50.0, 43.0, 39.0, 31.0, 25.0, 22.0, 19.0, 17.0, 16.0, 4.0, 7.0, 4.0, 6.0, 2.0, 3.0, 2.0, 0.0, 3.0], "bins": [-8.431958198547363, -8.234298706054688, -8.036640167236328, -7.838980674743652, -7.641321659088135, -7.443662643432617, -7.2460036277771, -7.048344612121582, -6.850685119628906, -6.653026103973389, -6.455367088317871, -6.257707595825195, -6.060048580169678, -5.86238956451416, -5.664730548858643, -5.467071533203125, -5.269412517547607, -5.07175350189209, -4.874094486236572, -4.676435470581055, -4.478775978088379, -4.281116962432861, -4.083457946777344, -3.885798931121826, -3.6881396770477295, -3.490480661392212, -3.2928214073181152, -3.0951623916625977, -2.89750337600708, -2.6998441219329834, -2.502185106277466, -2.304525852203369, -2.1068663597106934, -1.9092072248458862, -1.711548089981079, -1.5138890743255615, -1.3162299394607544, -1.1185708045959473, -0.9209117889404297, -0.7232526540756226, -0.5255935192108154, -0.3279344141483307, -0.13027530908584595, 0.0673837661743164, 0.26504290103912354, 0.46270203590393066, 0.6603610515594482, 0.8580201864242554, 1.0556793212890625, 1.2533384561538696, 1.4509975910186768, 1.6486566066741943, 1.8463157415390015, 2.0439748764038086, 2.241633892059326, 2.4392929077148438, 2.6369521617889404, 2.834611177444458, 3.0322704315185547, 3.2299294471740723, 3.42758846282959, 3.6252477169036865, 3.822906732559204, 4.020565986633301, 4.218225002288818]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 8.0, 10.0, 9.0, 20.0, 34.0, 46.0, 76.0, 108.0, 177.0, 276.0, 728.0, 4189072.0, 2850.0, 312.0, 193.0, 126.0, 59.0, 68.0, 35.0, 22.0, 18.0, 12.0, 7.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.36328125, -6.16839599609375, -5.9735107421875, -5.77862548828125, -5.583740234375, -5.38885498046875, -5.1939697265625, -4.99908447265625, -4.80419921875, -4.60931396484375, -4.4144287109375, -4.21954345703125, -4.024658203125, -3.82977294921875, -3.6348876953125, -3.44000244140625, -3.2451171875, -3.05023193359375, -2.8553466796875, -2.66046142578125, -2.465576171875, -2.27069091796875, -2.0758056640625, -1.88092041015625, -1.68603515625, -1.49114990234375, -1.2962646484375, -1.10137939453125, -0.906494140625, -0.71160888671875, -0.5167236328125, -0.32183837890625, -0.126953125, 0.06793212890625, 0.2628173828125, 0.45770263671875, 0.652587890625, 0.84747314453125, 1.0423583984375, 1.23724365234375, 1.43212890625, 1.62701416015625, 1.8218994140625, 2.01678466796875, 2.211669921875, 2.40655517578125, 2.6014404296875, 2.79632568359375, 2.9912109375, 3.18609619140625, 3.3809814453125, 3.57586669921875, 3.770751953125, 3.96563720703125, 4.1605224609375, 4.35540771484375, 4.55029296875, 4.74517822265625, 4.9400634765625, 5.13494873046875, 5.329833984375, 5.52471923828125, 5.7196044921875, 5.91448974609375, 6.109375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 8.0, 5.0, 21.0, 22.0, 38.0, 42.0, 61.0, 69.0, 96.0, 88.0, 92.0, 77.0, 81.0, 75.0, 53.0, 45.0, 41.0, 34.0, 18.0, 16.0, 9.0, 5.0, 5.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.71240234375, -0.697113037109375, -0.68182373046875, -0.666534423828125, -0.6512451171875, -0.635955810546875, -0.62066650390625, -0.605377197265625, -0.590087890625, -0.574798583984375, -0.55950927734375, -0.544219970703125, -0.5289306640625, -0.513641357421875, -0.49835205078125, -0.483062744140625, -0.4677734375, -0.452484130859375, -0.43719482421875, -0.421905517578125, -0.4066162109375, -0.391326904296875, -0.37603759765625, -0.360748291015625, -0.345458984375, -0.330169677734375, -0.31488037109375, -0.299591064453125, -0.2843017578125, -0.269012451171875, -0.25372314453125, -0.238433837890625, -0.22314453125, -0.207855224609375, -0.19256591796875, -0.177276611328125, -0.1619873046875, -0.146697998046875, -0.13140869140625, -0.116119384765625, -0.100830078125, -0.085540771484375, -0.07025146484375, -0.054962158203125, -0.0396728515625, -0.024383544921875, -0.00909423828125, 0.006195068359375, 0.021484375, 0.036773681640625, 0.05206298828125, 0.067352294921875, 0.0826416015625, 0.097930908203125, 0.11322021484375, 0.128509521484375, 0.143798828125, 0.159088134765625, 0.17437744140625, 0.189666748046875, 0.2049560546875, 0.220245361328125, 0.23553466796875, 0.250823974609375, 0.26611328125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 10.0, 23.0, 28.0, 86.0, 151.0, 435.0, 1612.0, 11238.0, 323114.0, 3818347.0, 34868.0, 3458.0, 606.0, 188.0, 57.0, 41.0, 14.0, 4.0, 7.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.79638671875, -0.7635116577148438, -0.7306365966796875, -0.6977615356445312, -0.664886474609375, -0.6320114135742188, -0.5991363525390625, -0.5662612915039062, -0.53338623046875, -0.5005111694335938, -0.4676361083984375, -0.43476104736328125, -0.401885986328125, -0.36901092529296875, -0.3361358642578125, -0.30326080322265625, -0.2703857421875, -0.23751068115234375, -0.2046356201171875, -0.17176055908203125, -0.138885498046875, -0.10601043701171875, -0.0731353759765625, -0.04026031494140625, -0.00738525390625, 0.02548980712890625, 0.0583648681640625, 0.09123992919921875, 0.124114990234375, 0.15699005126953125, 0.1898651123046875, 0.22274017333984375, 0.255615234375, 0.28849029541015625, 0.3213653564453125, 0.35424041748046875, 0.387115478515625, 0.41999053955078125, 0.4528656005859375, 0.48574066162109375, 0.51861572265625, 0.5514907836914062, 0.5843658447265625, 0.6172409057617188, 0.650115966796875, 0.6829910278320312, 0.7158660888671875, 0.7487411499023438, 0.7816162109375, 0.8144912719726562, 0.8473663330078125, 0.8802413940429688, 0.913116455078125, 0.9459915161132812, 0.9788665771484375, 1.0117416381835938, 1.04461669921875, 1.0774917602539062, 1.1103668212890625, 1.1432418823242188, 1.176116943359375, 1.2089920043945312, 1.2418670654296875, 1.2747421264648438, 1.3076171875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 1.0, 6.0, 7.0, 3.0, 9.0, 9.0, 25.0, 34.0, 59.0, 89.0, 251.0, 823.0, 1573.0, 743.0, 227.0, 103.0, 51.0, 15.0, 15.0, 14.0, 5.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.083984375, -1.0584335327148438, -1.0328826904296875, -1.0073318481445312, -0.981781005859375, -0.9562301635742188, -0.9306793212890625, -0.9051284790039062, -0.87957763671875, -0.8540267944335938, -0.8284759521484375, -0.8029251098632812, -0.777374267578125, -0.7518234252929688, -0.7262725830078125, -0.7007217407226562, -0.6751708984375, -0.6496200561523438, -0.6240692138671875, -0.5985183715820312, -0.572967529296875, -0.5474166870117188, -0.5218658447265625, -0.49631500244140625, -0.47076416015625, -0.44521331787109375, -0.4196624755859375, -0.39411163330078125, -0.368560791015625, -0.34300994873046875, -0.3174591064453125, -0.29190826416015625, -0.266357421875, -0.24080657958984375, -0.2152557373046875, -0.18970489501953125, -0.164154052734375, -0.13860321044921875, -0.1130523681640625, -0.08750152587890625, -0.06195068359375, -0.03639984130859375, -0.0108489990234375, 0.01470184326171875, 0.040252685546875, 0.06580352783203125, 0.0913543701171875, 0.11690521240234375, 0.1424560546875, 0.16800689697265625, 0.1935577392578125, 0.21910858154296875, 0.244659423828125, 0.27021026611328125, 0.2957611083984375, 0.32131195068359375, 0.34686279296875, 0.37241363525390625, 0.3979644775390625, 0.42351531982421875, 0.449066162109375, 0.47461700439453125, 0.5001678466796875, 0.5257186889648438, 0.55126953125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 6.0, 9.0, 52.0, 222.0, 424.0, 214.0, 49.0, 14.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.852296829223633, -5.5910797119140625, -5.32986307144165, -5.06864595413208, -4.807429313659668, -4.546212196350098, -4.284995079040527, -4.023777961730957, -3.762561321258545, -3.5013444423675537, -3.2401275634765625, -2.978910446166992, -2.717693567276001, -2.4564766883850098, -2.1952595710754395, -1.9340426921844482, -1.672825813293457, -1.4116089344024658, -1.150391936302185, -0.8891749978065491, -0.6279580593109131, -0.3667411804199219, -0.10552418231964111, 0.15569281578063965, 0.41690969467163086, 0.6781266331672668, 0.9393435716629028, 1.2005605697631836, 1.4617774486541748, 1.722994327545166, 1.9842113256454468, 2.2454283237457275, 2.5066442489624023, 2.7678611278533936, 3.0290780067443848, 3.290295124053955, 3.5515120029449463, 3.8127288818359375, 4.073945999145508, 4.335163116455078, 4.59637975692749, 4.8575968742370605, 5.118813514709473, 5.380030632019043, 5.641247749328613, 5.902464389801025, 6.163681507110596, 6.424898147583008, 6.686115264892578, 6.947332382202148, 7.2085490226745605, 7.469766139984131, 7.730982780456543, 7.992199897766113, 8.253417015075684, 8.514634132385254, 8.775850296020508, 9.037067413330078, 9.298284530639648, 9.559500694274902, 9.820717811584473, 10.081934928894043, 10.343152046203613, 10.604369163513184, 10.865586280822754]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 7.0, 6.0, 4.0, 6.0, 10.0, 10.0, 11.0, 25.0, 33.0, 37.0, 35.0, 49.0, 45.0, 66.0, 59.0, 69.0, 60.0, 80.0, 75.0, 58.0, 38.0, 51.0, 37.0, 34.0, 22.0, 31.0, 14.0, 15.0, 11.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0146944522857666, -2.9176440238952637, -2.8205933570861816, -2.7235429286956787, -2.626492500305176, -2.5294418334960938, -2.432391405105591, -2.335340976715088, -2.238290309906006, -2.141239881515503, -2.044189214706421, -1.947138786315918, -1.8500882387161255, -1.753037691116333, -1.65598726272583, -1.5589367151260376, -1.4618861675262451, -1.3648356199264526, -1.2677850723266602, -1.1707346439361572, -1.0736840963363647, -0.9766335487365723, -0.8795830607414246, -0.7825325727462769, -0.6854820251464844, -0.5884314775466919, -0.4913809895515442, -0.3943304717540741, -0.297279953956604, -0.2002294361591339, -0.10317891836166382, -0.006128430366516113, 0.09092235565185547, 0.18797287344932556, 0.28502339124679565, 0.38207390904426575, 0.47912442684173584, 0.5761749744415283, 0.673225462436676, 0.7702759504318237, 0.8673264980316162, 0.9643770456314087, 1.0614275932312012, 1.158478021621704, 1.2555285692214966, 1.352579116821289, 1.449629545211792, 1.5466800928115845, 1.643730640411377, 1.7407811880111694, 1.837831735610962, 1.9348821640014648, 2.031932830810547, 2.12898325920105, 2.2260336875915527, 2.3230843544006348, 2.4201347827911377, 2.5171852111816406, 2.6142358779907227, 2.7112863063812256, 2.8083367347717285, 2.9053874015808105, 3.0024378299713135, 3.0994882583618164, 3.1965389251708984]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 5.0, 7.0, 5.0, 12.0, 16.0, 23.0, 42.0, 67.0, 98.0, 154.0, 231.0, 312.0, 503.0, 810.0, 1345.0, 2342.0, 4319.0, 8144.0, 16035.0, 33892.0, 77859.0, 188512.0, 342455.0, 210204.0, 86541.0, 37208.0, 17609.0, 8764.0, 4542.0, 2534.0, 1482.0, 914.0, 545.0, 379.0, 215.0, 148.0, 92.0, 60.0, 46.0, 32.0, 21.0, 16.0, 5.0, 3.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.32568359375, -0.31568145751953125, -0.3056793212890625, -0.29567718505859375, -0.285675048828125, -0.27567291259765625, -0.2656707763671875, -0.25566864013671875, -0.24566650390625, -0.23566436767578125, -0.2256622314453125, -0.21566009521484375, -0.205657958984375, -0.19565582275390625, -0.1856536865234375, -0.17565155029296875, -0.1656494140625, -0.15564727783203125, -0.1456451416015625, -0.13564300537109375, -0.125640869140625, -0.11563873291015625, -0.1056365966796875, -0.09563446044921875, -0.08563232421875, -0.07563018798828125, -0.0656280517578125, -0.05562591552734375, -0.045623779296875, -0.03562164306640625, -0.0256195068359375, -0.01561737060546875, -0.005615234375, 0.00438690185546875, 0.0143890380859375, 0.02439117431640625, 0.034393310546875, 0.04439544677734375, 0.0543975830078125, 0.06439971923828125, 0.07440185546875, 0.08440399169921875, 0.0944061279296875, 0.10440826416015625, 0.114410400390625, 0.12441253662109375, 0.1344146728515625, 0.14441680908203125, 0.1544189453125, 0.16442108154296875, 0.1744232177734375, 0.18442535400390625, 0.194427490234375, 0.20442962646484375, 0.2144317626953125, 0.22443389892578125, 0.23443603515625, 0.24443817138671875, 0.2544403076171875, 0.26444244384765625, 0.274444580078125, 0.28444671630859375, 0.2944488525390625, 0.30445098876953125, 0.314453125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 4.0, 4.0, 8.0, 13.0, 22.0, 23.0, 33.0, 37.0, 55.0, 30.0, 58.0, 59.0, 68.0, 72.0, 70.0, 58.0, 52.0, 53.0, 54.0, 35.0, 41.0, 38.0, 34.0, 17.0, 17.0, 15.0, 10.0, 8.0, 6.0, 2.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.423583984375, -0.41251373291015625, -0.4014434814453125, -0.39037322998046875, -0.379302978515625, -0.36823272705078125, -0.3571624755859375, -0.34609222412109375, -0.33502197265625, -0.32395172119140625, -0.3128814697265625, -0.30181121826171875, -0.290740966796875, -0.27967071533203125, -0.2686004638671875, -0.25753021240234375, -0.2464599609375, -0.23538970947265625, -0.2243194580078125, -0.21324920654296875, -0.202178955078125, -0.19110870361328125, -0.1800384521484375, -0.16896820068359375, -0.15789794921875, -0.14682769775390625, -0.1357574462890625, -0.12468719482421875, -0.113616943359375, -0.10254669189453125, -0.0914764404296875, -0.08040618896484375, -0.0693359375, -0.05826568603515625, -0.0471954345703125, -0.03612518310546875, -0.025054931640625, -0.01398468017578125, -0.0029144287109375, 0.00815582275390625, 0.01922607421875, 0.03029632568359375, 0.0413665771484375, 0.05243682861328125, 0.063507080078125, 0.07457733154296875, 0.0856475830078125, 0.09671783447265625, 0.1077880859375, 0.11885833740234375, 0.1299285888671875, 0.14099884033203125, 0.152069091796875, 0.16313934326171875, 0.1742095947265625, 0.18527984619140625, 0.19635009765625, 0.20742034912109375, 0.2184906005859375, 0.22956085205078125, 0.240631103515625, 0.25170135498046875, 0.2627716064453125, 0.27384185791015625, 0.284912109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 7.0, 6.0, 3.0, 14.0, 8.0, 17.0, 30.0, 51.0, 79.0, 139.0, 258.0, 504.0, 1173.0, 3655.0, 21337.0, 274335.0, 690073.0, 47747.0, 6110.0, 1656.0, 644.0, 294.0, 172.0, 85.0, 59.0, 34.0, 25.0, 11.0, 8.0, 11.0, 3.0, 4.0, 7.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.279296875, -1.24896240234375, -1.2186279296875, -1.18829345703125, -1.157958984375, -1.12762451171875, -1.0972900390625, -1.06695556640625, -1.03662109375, -1.00628662109375, -0.9759521484375, -0.94561767578125, -0.915283203125, -0.88494873046875, -0.8546142578125, -0.82427978515625, -0.7939453125, -0.76361083984375, -0.7332763671875, -0.70294189453125, -0.672607421875, -0.64227294921875, -0.6119384765625, -0.58160400390625, -0.55126953125, -0.52093505859375, -0.4906005859375, -0.46026611328125, -0.429931640625, -0.39959716796875, -0.3692626953125, -0.33892822265625, -0.30859375, -0.27825927734375, -0.2479248046875, -0.21759033203125, -0.187255859375, -0.15692138671875, -0.1265869140625, -0.09625244140625, -0.06591796875, -0.03558349609375, -0.0052490234375, 0.02508544921875, 0.055419921875, 0.08575439453125, 0.1160888671875, 0.14642333984375, 0.1767578125, 0.20709228515625, 0.2374267578125, 0.26776123046875, 0.298095703125, 0.32843017578125, 0.3587646484375, 0.38909912109375, 0.41943359375, 0.44976806640625, 0.4801025390625, 0.51043701171875, 0.540771484375, 0.57110595703125, 0.6014404296875, 0.63177490234375, 0.662109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 4.0, 7.0, 3.0, 3.0, 8.0, 5.0, 9.0, 8.0, 4.0, 13.0, 15.0, 22.0, 19.0, 22.0, 28.0, 18.0, 36.0, 41.0, 34.0, 29.0, 35.0, 52.0, 45.0, 43.0, 51.0, 66.0, 53.0, 50.0, 35.0, 30.0, 28.0, 27.0, 26.0, 19.0, 15.0, 11.0, 11.0, 16.0, 15.0, 13.0, 9.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0], "bins": [-1.0302734375, -1.0002975463867188, -0.9703216552734375, -0.9403457641601562, -0.910369873046875, -0.8803939819335938, -0.8504180908203125, -0.8204421997070312, -0.79046630859375, -0.7604904174804688, -0.7305145263671875, -0.7005386352539062, -0.670562744140625, -0.6405868530273438, -0.6106109619140625, -0.5806350708007812, -0.5506591796875, -0.5206832885742188, -0.4907073974609375, -0.46073150634765625, -0.430755615234375, -0.40077972412109375, -0.3708038330078125, -0.34082794189453125, -0.31085205078125, -0.28087615966796875, -0.2509002685546875, -0.22092437744140625, -0.190948486328125, -0.16097259521484375, -0.1309967041015625, -0.10102081298828125, -0.071044921875, -0.04106903076171875, -0.0110931396484375, 0.01888275146484375, 0.048858642578125, 0.07883453369140625, 0.1088104248046875, 0.13878631591796875, 0.16876220703125, 0.19873809814453125, 0.2287139892578125, 0.25868988037109375, 0.288665771484375, 0.31864166259765625, 0.3486175537109375, 0.37859344482421875, 0.4085693359375, 0.43854522705078125, 0.4685211181640625, 0.49849700927734375, 0.528472900390625, 0.5584487915039062, 0.5884246826171875, 0.6184005737304688, 0.64837646484375, 0.6783523559570312, 0.7083282470703125, 0.7383041381835938, 0.768280029296875, 0.7982559204101562, 0.8282318115234375, 0.8582077026367188, 0.88818359375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 5.0, 3.0, 10.0, 6.0, 16.0, 25.0, 36.0, 78.0, 147.0, 324.0, 996.0, 4290.0, 86637.0, 932152.0, 20442.0, 2268.0, 648.0, 210.0, 106.0, 54.0, 31.0, 19.0, 14.0, 7.0, 7.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.5889511108398438, -0.5665740966796875, -0.5441970825195312, -0.521820068359375, -0.49944305419921875, -0.4770660400390625, -0.45468902587890625, -0.43231201171875, -0.40993499755859375, -0.3875579833984375, -0.36518096923828125, -0.342803955078125, -0.32042694091796875, -0.2980499267578125, -0.27567291259765625, -0.2532958984375, -0.23091888427734375, -0.2085418701171875, -0.18616485595703125, -0.163787841796875, -0.14141082763671875, -0.1190338134765625, -0.09665679931640625, -0.07427978515625, -0.05190277099609375, -0.0295257568359375, -0.00714874267578125, 0.015228271484375, 0.03760528564453125, 0.0599822998046875, 0.08235931396484375, 0.104736328125, 0.12711334228515625, 0.1494903564453125, 0.17186737060546875, 0.194244384765625, 0.21662139892578125, 0.2389984130859375, 0.26137542724609375, 0.28375244140625, 0.30612945556640625, 0.3285064697265625, 0.35088348388671875, 0.373260498046875, 0.39563751220703125, 0.4180145263671875, 0.44039154052734375, 0.4627685546875, 0.48514556884765625, 0.5075225830078125, 0.5298995971679688, 0.552276611328125, 0.5746536254882812, 0.5970306396484375, 0.6194076538085938, 0.64178466796875, 0.6641616821289062, 0.6865386962890625, 0.7089157104492188, 0.731292724609375, 0.7536697387695312, 0.7760467529296875, 0.7984237670898438, 0.82080078125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 2.0, 4.0, 9.0, 12.0, 7.0, 13.0, 20.0, 31.0, 25.0, 33.0, 30.0, 59.0, 62.0, 101.0, 80.0, 97.0, 101.0, 63.0, 57.0, 36.0, 29.0, 29.0, 23.0, 19.0, 17.0, 10.0, 8.0, 10.0, 6.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.02467155456543e-05, -4.861690104007721e-05, -4.698708653450012e-05, -4.5357272028923035e-05, -4.372745752334595e-05, -4.209764301776886e-05, -4.046782851219177e-05, -3.8838014006614685e-05, -3.72081995010376e-05, -3.557838499546051e-05, -3.394857048988342e-05, -3.2318755984306335e-05, -3.068894147872925e-05, -2.905912697315216e-05, -2.7429312467575073e-05, -2.5799497961997986e-05, -2.41696834564209e-05, -2.253986895084381e-05, -2.0910054445266724e-05, -1.9280239939689636e-05, -1.765042543411255e-05, -1.602061092853546e-05, -1.4390796422958374e-05, -1.2760981917381287e-05, -1.11311674118042e-05, -9.501352906227112e-06, -7.871538400650024e-06, -6.241723895072937e-06, -4.61190938949585e-06, -2.982094883918762e-06, -1.3522803783416748e-06, 2.775341272354126e-07, 1.9073486328125e-06, 3.5371631383895874e-06, 5.166977643966675e-06, 6.796792149543762e-06, 8.42660665512085e-06, 1.0056421160697937e-05, 1.1686235666275024e-05, 1.3316050171852112e-05, 1.49458646774292e-05, 1.6575679183006287e-05, 1.8205493688583374e-05, 1.983530819416046e-05, 2.146512269973755e-05, 2.3094937205314636e-05, 2.4724751710891724e-05, 2.635456621646881e-05, 2.79843807220459e-05, 2.9614195227622986e-05, 3.124400973320007e-05, 3.287382423877716e-05, 3.450363874435425e-05, 3.6133453249931335e-05, 3.776326775550842e-05, 3.939308226108551e-05, 4.10228967666626e-05, 4.2652711272239685e-05, 4.428252577781677e-05, 4.591234028339386e-05, 4.754215478897095e-05, 4.9171969294548035e-05, 5.080178380012512e-05, 5.243159830570221e-05, 5.40614128112793e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 5.0, 4.0, 10.0, 14.0, 9.0, 13.0, 35.0, 46.0, 56.0, 123.0, 196.0, 355.0, 815.0, 2380.0, 10517.0, 209944.0, 790775.0, 26957.0, 3931.0, 1254.0, 514.0, 232.0, 128.0, 88.0, 55.0, 36.0, 18.0, 9.0, 15.0, 3.0, 6.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.445556640625, -0.4308052062988281, -0.41605377197265625, -0.4013023376464844, -0.3865509033203125, -0.3717994689941406, -0.35704803466796875, -0.3422966003417969, -0.327545166015625, -0.3127937316894531, -0.29804229736328125, -0.2832908630371094, -0.2685394287109375, -0.2537879943847656, -0.23903656005859375, -0.22428512573242188, -0.20953369140625, -0.19478225708007812, -0.18003082275390625, -0.16527938842773438, -0.1505279541015625, -0.13577651977539062, -0.12102508544921875, -0.10627365112304688, -0.091522216796875, -0.07677078247070312, -0.06201934814453125, -0.047267913818359375, -0.0325164794921875, -0.017765045166015625, -0.00301361083984375, 0.011737823486328125, 0.0264892578125, 0.041240692138671875, 0.05599212646484375, 0.07074356079101562, 0.0854949951171875, 0.10024642944335938, 0.11499786376953125, 0.12974929809570312, 0.144500732421875, 0.15925216674804688, 0.17400360107421875, 0.18875503540039062, 0.2035064697265625, 0.21825790405273438, 0.23300933837890625, 0.24776077270507812, 0.26251220703125, 0.2772636413574219, 0.29201507568359375, 0.3067665100097656, 0.3215179443359375, 0.3362693786621094, 0.35102081298828125, 0.3657722473144531, 0.380523681640625, 0.3952751159667969, 0.41002655029296875, 0.4247779846191406, 0.4395294189453125, 0.4542808532714844, 0.46903228759765625, 0.4837837219238281, 0.49853515625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 15.0, 28.0, 81.0, 99.0, 142.0, 194.0, 172.0, 113.0, 67.0, 39.0, 25.0, 10.0, 8.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6474609375, -0.6263427734375, -0.605224609375, -0.5841064453125, -0.56298828125, -0.5418701171875, -0.520751953125, -0.4996337890625, -0.478515625, -0.4573974609375, -0.436279296875, -0.4151611328125, -0.39404296875, -0.3729248046875, -0.351806640625, -0.3306884765625, -0.3095703125, -0.2884521484375, -0.267333984375, -0.2462158203125, -0.22509765625, -0.2039794921875, -0.182861328125, -0.1617431640625, -0.140625, -0.1195068359375, -0.098388671875, -0.0772705078125, -0.05615234375, -0.0350341796875, -0.013916015625, 0.0072021484375, 0.0283203125, 0.0494384765625, 0.070556640625, 0.0916748046875, 0.11279296875, 0.1339111328125, 0.155029296875, 0.1761474609375, 0.197265625, 0.2183837890625, 0.239501953125, 0.2606201171875, 0.28173828125, 0.3028564453125, 0.323974609375, 0.3450927734375, 0.3662109375, 0.3873291015625, 0.408447265625, 0.4295654296875, 0.45068359375, 0.4718017578125, 0.492919921875, 0.5140380859375, 0.53515625, 0.5562744140625, 0.577392578125, 0.5985107421875, 0.61962890625, 0.6407470703125, 0.661865234375, 0.6829833984375, 0.7041015625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 0.0, 10.0, 36.0, 90.0, 239.0, 322.0, 161.0, 77.0, 36.0, 13.0, 7.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-12.114429473876953, -11.83338737487793, -11.55234432220459, -11.271302223205566, -10.990260124206543, -10.709217071533203, -10.42817497253418, -10.147132873535156, -9.866090774536133, -9.58504867553711, -9.30400562286377, -9.022963523864746, -8.741921424865723, -8.460878372192383, -8.17983627319336, -7.898794174194336, -7.617751121520996, -7.3367085456848145, -7.055666446685791, -6.774623870849609, -6.493581771850586, -6.212539196014404, -5.931496620178223, -5.650454521179199, -5.369411945343018, -5.088369369506836, -4.8073272705078125, -4.526284694671631, -4.245242118835449, -3.964200019836426, -3.683157444000244, -3.4021151065826416, -3.121072292327881, -2.8400299549102783, -2.558987617492676, -2.277945041656494, -1.9969027042388916, -1.715860366821289, -1.434817910194397, -1.1537754535675049, -0.8727331161499023, -0.591690719127655, -0.3106483221054077, -0.0296059250831604, 0.2514364719390869, 0.5324788093566895, 0.8135212659835815, 1.0945637226104736, 1.3756060600280762, 1.6566483974456787, 1.9376908540725708, 2.218733310699463, 2.4997756481170654, 2.780817985534668, 3.0618605613708496, 3.342902898788452, 3.6239452362060547, 3.9049875736236572, 4.18602991104126, 4.467072486877441, 4.748114585876465, 5.0291571617126465, 5.310199737548828, 5.591241836547852, 5.872284412384033]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 10.0, 8.0, 6.0, 3.0, 11.0, 19.0, 21.0, 20.0, 24.0, 30.0, 33.0, 41.0, 34.0, 41.0, 45.0, 56.0, 61.0, 51.0, 56.0, 57.0, 58.0, 41.0, 38.0, 39.0, 30.0, 30.0, 23.0, 25.0, 21.0, 18.0, 13.0, 9.0, 9.0, 5.0, 4.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.871244430541992, -4.730114936828613, -4.588985443115234, -4.4478559494018555, -4.306726455688477, -4.165597438812256, -4.024467945098877, -3.883338451385498, -3.742208957672119, -3.6010794639587402, -3.4599499702453613, -3.3188207149505615, -3.1776912212371826, -3.0365617275238037, -2.895432472229004, -2.754302978515625, -2.613173484802246, -2.472043991088867, -2.3309144973754883, -2.1897852420806885, -2.0486557483673096, -1.9075262546539307, -1.7663968801498413, -1.625267505645752, -1.484138011932373, -1.3430085182189941, -1.2018791437149048, -1.0607497692108154, -0.9196202754974365, -0.7784908413887024, -0.6373614072799683, -0.49623197317123413, -0.3551025390625, -0.21397310495376587, -0.07284367084503174, 0.06828576326370239, 0.20941519737243652, 0.35054463148117065, 0.4916740655899048, 0.6328034996986389, 0.773932933807373, 0.9150623679161072, 1.0561918020248413, 1.1973211765289307, 1.3384506702423096, 1.4795801639556885, 1.6207095384597778, 1.7618389129638672, 1.902968406677246, 2.044097900390625, 2.185227394104004, 2.3263566493988037, 2.4674861431121826, 2.6086156368255615, 2.7497448921203613, 2.8908743858337402, 3.032003879547119, 3.173133373260498, 3.314262866973877, 3.4553921222686768, 3.5965216159820557, 3.7376511096954346, 3.8787803649902344, 4.019909858703613, 4.161039352416992]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 9.0, 25.0, 32.0, 62.0, 105.0, 182.0, 503.0, 2057.0, 14205.0, 485173.0, 3620824.0, 64115.0, 5382.0, 969.0, 320.0, 122.0, 64.0, 37.0, 31.0, 20.0, 9.0, 6.0, 7.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.80859375, -0.7849960327148438, -0.7613983154296875, -0.7378005981445312, -0.714202880859375, -0.6906051635742188, -0.6670074462890625, -0.6434097290039062, -0.61981201171875, -0.5962142944335938, -0.5726165771484375, -0.5490188598632812, -0.525421142578125, -0.5018234252929688, -0.4782257080078125, -0.45462799072265625, -0.4310302734375, -0.40743255615234375, -0.3838348388671875, -0.36023712158203125, -0.336639404296875, -0.31304168701171875, -0.2894439697265625, -0.26584625244140625, -0.24224853515625, -0.21865081787109375, -0.1950531005859375, -0.17145538330078125, -0.147857666015625, -0.12425994873046875, -0.1006622314453125, -0.07706451416015625, -0.053466796875, -0.02986907958984375, -0.0062713623046875, 0.01732635498046875, 0.040924072265625, 0.06452178955078125, 0.0881195068359375, 0.11171722412109375, 0.13531494140625, 0.15891265869140625, 0.1825103759765625, 0.20610809326171875, 0.229705810546875, 0.25330352783203125, 0.2769012451171875, 0.30049896240234375, 0.3240966796875, 0.34769439697265625, 0.3712921142578125, 0.39488983154296875, 0.418487548828125, 0.44208526611328125, 0.4656829833984375, 0.48928070068359375, 0.51287841796875, 0.5364761352539062, 0.5600738525390625, 0.5836715698242188, 0.607269287109375, 0.6308670043945312, 0.6544647216796875, 0.6780624389648438, 0.70166015625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 9.0, 7.0, 16.0, 27.0, 33.0, 35.0, 40.0, 39.0, 54.0, 61.0, 67.0, 70.0, 93.0, 59.0, 71.0, 59.0, 47.0, 46.0, 38.0, 31.0, 26.0, 15.0, 17.0, 10.0, 9.0, 9.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.423095703125, -0.4123649597167969, -0.40163421630859375, -0.3909034729003906, -0.3801727294921875, -0.3694419860839844, -0.35871124267578125, -0.3479804992675781, -0.337249755859375, -0.3265190124511719, -0.31578826904296875, -0.3050575256347656, -0.2943267822265625, -0.2835960388183594, -0.27286529541015625, -0.2621345520019531, -0.25140380859375, -0.24067306518554688, -0.22994232177734375, -0.21921157836914062, -0.2084808349609375, -0.19775009155273438, -0.18701934814453125, -0.17628860473632812, -0.165557861328125, -0.15482711791992188, -0.14409637451171875, -0.13336563110351562, -0.1226348876953125, -0.11190414428710938, -0.10117340087890625, -0.09044265747070312, -0.0797119140625, -0.06898117065429688, -0.05825042724609375, -0.047519683837890625, -0.0367889404296875, -0.026058197021484375, -0.01532745361328125, -0.004596710205078125, 0.006134033203125, 0.016864776611328125, 0.02759552001953125, 0.038326263427734375, 0.0490570068359375, 0.059787750244140625, 0.07051849365234375, 0.08124923706054688, 0.09197998046875, 0.10271072387695312, 0.11344146728515625, 0.12417221069335938, 0.1349029541015625, 0.14563369750976562, 0.15636444091796875, 0.16709518432617188, 0.177825927734375, 0.18855667114257812, 0.19928741455078125, 0.21001815795898438, 0.2207489013671875, 0.23147964477539062, 0.24221038818359375, 0.2529411315917969, 0.263671875]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 0.0, 10.0, 10.0, 10.0, 15.0, 30.0, 47.0, 62.0, 145.0, 219.0, 487.0, 1113.0, 3668.0, 15624.0, 119704.0, 3301875.0, 703613.0, 37460.0, 6938.0, 1923.0, 694.0, 291.0, 135.0, 75.0, 41.0, 31.0, 18.0, 13.0, 8.0, 8.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58056640625, -0.56170654296875, -0.5428466796875, -0.52398681640625, -0.505126953125, -0.48626708984375, -0.4674072265625, -0.44854736328125, -0.4296875, -0.41082763671875, -0.3919677734375, -0.37310791015625, -0.354248046875, -0.33538818359375, -0.3165283203125, -0.29766845703125, -0.27880859375, -0.25994873046875, -0.2410888671875, -0.22222900390625, -0.203369140625, -0.18450927734375, -0.1656494140625, -0.14678955078125, -0.1279296875, -0.10906982421875, -0.0902099609375, -0.07135009765625, -0.052490234375, -0.03363037109375, -0.0147705078125, 0.00408935546875, 0.02294921875, 0.04180908203125, 0.0606689453125, 0.07952880859375, 0.098388671875, 0.11724853515625, 0.1361083984375, 0.15496826171875, 0.173828125, 0.19268798828125, 0.2115478515625, 0.23040771484375, 0.249267578125, 0.26812744140625, 0.2869873046875, 0.30584716796875, 0.32470703125, 0.34356689453125, 0.3624267578125, 0.38128662109375, 0.400146484375, 0.41900634765625, 0.4378662109375, 0.45672607421875, 0.4755859375, 0.49444580078125, 0.5133056640625, 0.53216552734375, 0.551025390625, 0.56988525390625, 0.5887451171875, 0.60760498046875, 0.62646484375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 3.0, 10.0, 7.0, 13.0, 6.0, 16.0, 26.0, 37.0, 39.0, 77.0, 97.0, 141.0, 220.0, 423.0, 742.0, 896.0, 563.0, 300.0, 164.0, 98.0, 63.0, 37.0, 17.0, 21.0, 15.0, 12.0, 4.0, 5.0, 2.0, 5.0, 1.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.57275390625, -0.5549697875976562, -0.5371856689453125, -0.5194015502929688, -0.501617431640625, -0.48383331298828125, -0.4660491943359375, -0.44826507568359375, -0.43048095703125, -0.41269683837890625, -0.3949127197265625, -0.37712860107421875, -0.359344482421875, -0.34156036376953125, -0.3237762451171875, -0.30599212646484375, -0.2882080078125, -0.27042388916015625, -0.2526397705078125, -0.23485565185546875, -0.217071533203125, -0.19928741455078125, -0.1815032958984375, -0.16371917724609375, -0.14593505859375, -0.12815093994140625, -0.1103668212890625, -0.09258270263671875, -0.074798583984375, -0.05701446533203125, -0.0392303466796875, -0.02144622802734375, -0.003662109375, 0.01412200927734375, 0.0319061279296875, 0.04969024658203125, 0.067474365234375, 0.08525848388671875, 0.1030426025390625, 0.12082672119140625, 0.13861083984375, 0.15639495849609375, 0.1741790771484375, 0.19196319580078125, 0.209747314453125, 0.22753143310546875, 0.2453155517578125, 0.26309967041015625, 0.2808837890625, 0.29866790771484375, 0.3164520263671875, 0.33423614501953125, 0.352020263671875, 0.36980438232421875, 0.3875885009765625, 0.40537261962890625, 0.42315673828125, 0.44094085693359375, 0.4587249755859375, 0.47650909423828125, 0.494293212890625, 0.5120773315429688, 0.5298614501953125, 0.5476455688476562, 0.5654296875]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 5.0, 6.0, 22.0, 118.0, 349.0, 361.0, 105.0, 19.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.454782485961914, -13.102960586547852, -12.751137733459473, -12.39931583404541, -12.047492980957031, -11.695671081542969, -11.343849182128906, -10.992027282714844, -10.640204429626465, -10.288382530212402, -9.936559677124023, -9.584737777709961, -9.232915878295898, -8.88109302520752, -8.529271125793457, -8.177448272705078, -7.825626373291016, -7.473803997039795, -7.121981620788574, -6.770159721374512, -6.418337345123291, -6.06651496887207, -5.714693069458008, -5.362870693206787, -5.011048316955566, -4.659225940704346, -4.307403564453125, -3.9555816650390625, -3.603759288787842, -3.251936912536621, -2.9001147747039795, -2.548292636871338, -2.196470260620117, -1.844648003578186, -1.4928257465362549, -1.1410034894943237, -0.7891812324523926, -0.4373589754104614, -0.08553671836853027, 0.26628541946411133, 0.618107795715332, 0.9699300527572632, 1.3217523097991943, 1.6735745668411255, 2.0253968238830566, 2.3772192001342773, 2.729041337966919, 3.0808634757995605, 3.4326858520507812, 3.784508228302002, 4.136330604553223, 4.488152503967285, 4.839974880218506, 5.191797256469727, 5.543619155883789, 5.89544153213501, 6.2472639083862305, 6.599086284637451, 6.950908660888672, 7.302730560302734, 7.654552936553955, 8.006375312805176, 8.358197212219238, 8.710020065307617, 9.06184196472168]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 3.0, 3.0, 12.0, 5.0, 11.0, 11.0, 20.0, 25.0, 41.0, 26.0, 37.0, 39.0, 45.0, 58.0, 55.0, 70.0, 65.0, 68.0, 61.0, 58.0, 69.0, 47.0, 46.0, 33.0, 23.0, 20.0, 18.0, 5.0, 9.0, 8.0, 3.0, 3.0, 1.0, 7.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.024430274963379, -3.8982365131378174, -3.7720425128936768, -3.6458487510681152, -3.5196547508239746, -3.393460988998413, -3.2672672271728516, -3.141073226928711, -3.0148792266845703, -2.888685464859009, -2.762491464614868, -2.6362977027893066, -2.510103702545166, -2.3839099407196045, -2.257716178894043, -2.1315221786499023, -2.005328416824341, -1.8791345357894897, -1.7529406547546387, -1.6267468929290771, -1.5005528926849365, -1.374359130859375, -1.248165249824524, -1.1219713687896729, -0.9957774877548218, -0.8695836067199707, -0.7433897256851196, -0.6171959042549133, -0.49100202322006226, -0.3648081421852112, -0.23861432075500488, -0.11242043972015381, 0.013773441314697266, 0.13996730744838715, 0.266161173582077, 0.3923550248146057, 0.5185489058494568, 0.6447427868843079, 0.7709366083145142, 0.8971304893493652, 1.0233243703842163, 1.1495182514190674, 1.2757121324539185, 1.4019060134887695, 1.528099775314331, 1.6542937755584717, 1.7804875373840332, 1.9066814184188843, 2.0328752994537354, 2.159069061279297, 2.2852630615234375, 2.411456823348999, 2.5376508235931396, 2.663844585418701, 2.790038585662842, 2.9162323474884033, 3.042426109313965, 3.1686198711395264, 3.294813871383667, 3.4210076332092285, 3.547201633453369, 3.6733953952789307, 3.799589157104492, 3.925783157348633, 4.051977157592773]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 12.0, 8.0, 10.0, 16.0, 17.0, 26.0, 51.0, 55.0, 101.0, 125.0, 191.0, 268.0, 402.0, 722.0, 1044.0, 1806.0, 3200.0, 5835.0, 10822.0, 21552.0, 43026.0, 85417.0, 166472.0, 264734.0, 211998.0, 113329.0, 57035.0, 28331.0, 14381.0, 7544.0, 3994.0, 2252.0, 1307.0, 854.0, 579.0, 343.0, 187.0, 154.0, 92.0, 73.0, 58.0, 46.0, 23.0, 18.0, 13.0, 12.0, 8.0, 7.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.262451171875, -0.25417327880859375, -0.2458953857421875, -0.23761749267578125, -0.229339599609375, -0.22106170654296875, -0.2127838134765625, -0.20450592041015625, -0.19622802734375, -0.18795013427734375, -0.1796722412109375, -0.17139434814453125, -0.163116455078125, -0.15483856201171875, -0.1465606689453125, -0.13828277587890625, -0.1300048828125, -0.12172698974609375, -0.1134490966796875, -0.10517120361328125, -0.096893310546875, -0.08861541748046875, -0.0803375244140625, -0.07205963134765625, -0.06378173828125, -0.05550384521484375, -0.0472259521484375, -0.03894805908203125, -0.030670166015625, -0.02239227294921875, -0.0141143798828125, -0.00583648681640625, 0.00244140625, 0.01071929931640625, 0.0189971923828125, 0.02727508544921875, 0.035552978515625, 0.04383087158203125, 0.0521087646484375, 0.06038665771484375, 0.06866455078125, 0.07694244384765625, 0.0852203369140625, 0.09349822998046875, 0.101776123046875, 0.11005401611328125, 0.1183319091796875, 0.12660980224609375, 0.1348876953125, 0.14316558837890625, 0.1514434814453125, 0.15972137451171875, 0.167999267578125, 0.17627716064453125, 0.1845550537109375, 0.19283294677734375, 0.20111083984375, 0.20938873291015625, 0.2176666259765625, 0.22594451904296875, 0.234222412109375, 0.24250030517578125, 0.2507781982421875, 0.25905609130859375, 0.267333984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 14.0, 18.0, 31.0, 33.0, 30.0, 44.0, 45.0, 54.0, 65.0, 78.0, 58.0, 78.0, 63.0, 68.0, 72.0, 46.0, 38.0, 38.0, 35.0, 23.0, 14.0, 12.0, 13.0, 5.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.430908203125, -0.4198951721191406, -0.40888214111328125, -0.3978691101074219, -0.3868560791015625, -0.3758430480957031, -0.36483001708984375, -0.3538169860839844, -0.342803955078125, -0.3317909240722656, -0.32077789306640625, -0.3097648620605469, -0.2987518310546875, -0.2877388000488281, -0.27672576904296875, -0.2657127380371094, -0.25469970703125, -0.24368667602539062, -0.23267364501953125, -0.22166061401367188, -0.2106475830078125, -0.19963455200195312, -0.18862152099609375, -0.17760848999023438, -0.166595458984375, -0.15558242797851562, -0.14456939697265625, -0.13355636596679688, -0.1225433349609375, -0.11153030395507812, -0.10051727294921875, -0.08950424194335938, -0.0784912109375, -0.06747817993164062, -0.05646514892578125, -0.045452117919921875, -0.0344390869140625, -0.023426055908203125, -0.01241302490234375, -0.001399993896484375, 0.009613037109375, 0.020626068115234375, 0.03163909912109375, 0.042652130126953125, 0.0536651611328125, 0.06467819213867188, 0.07569122314453125, 0.08670425415039062, 0.09771728515625, 0.10873031616210938, 0.11974334716796875, 0.13075637817382812, 0.1417694091796875, 0.15278244018554688, 0.16379547119140625, 0.17480850219726562, 0.185821533203125, 0.19683456420898438, 0.20784759521484375, 0.21886062622070312, 0.2298736572265625, 0.24088668823242188, 0.25189971923828125, 0.2629127502441406, 0.27392578125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0, 3.0, 2.0, 8.0, 6.0, 10.0, 10.0, 17.0, 34.0, 26.0, 31.0, 68.0, 77.0, 99.0, 156.0, 217.0, 304.0, 482.0, 796.0, 1315.0, 2405.0, 5658.0, 19820.0, 110602.0, 639068.0, 216366.0, 35012.0, 8355.0, 3246.0, 1566.0, 922.0, 563.0, 385.0, 253.0, 196.0, 120.0, 101.0, 58.0, 52.0, 33.0, 34.0, 20.0, 18.0, 10.0, 9.0, 9.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.5673828125, -0.54888916015625, -0.5303955078125, -0.51190185546875, -0.493408203125, -0.47491455078125, -0.4564208984375, -0.43792724609375, -0.41943359375, -0.40093994140625, -0.3824462890625, -0.36395263671875, -0.345458984375, -0.32696533203125, -0.3084716796875, -0.28997802734375, -0.271484375, -0.25299072265625, -0.2344970703125, -0.21600341796875, -0.197509765625, -0.17901611328125, -0.1605224609375, -0.14202880859375, -0.12353515625, -0.10504150390625, -0.0865478515625, -0.06805419921875, -0.049560546875, -0.03106689453125, -0.0125732421875, 0.00592041015625, 0.0244140625, 0.04290771484375, 0.0614013671875, 0.07989501953125, 0.098388671875, 0.11688232421875, 0.1353759765625, 0.15386962890625, 0.17236328125, 0.19085693359375, 0.2093505859375, 0.22784423828125, 0.246337890625, 0.26483154296875, 0.2833251953125, 0.30181884765625, 0.3203125, 0.33880615234375, 0.3572998046875, 0.37579345703125, 0.394287109375, 0.41278076171875, 0.4312744140625, 0.44976806640625, 0.46826171875, 0.48675537109375, 0.5052490234375, 0.52374267578125, 0.542236328125, 0.56072998046875, 0.5792236328125, 0.59771728515625, 0.6162109375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 5.0, 8.0, 7.0, 5.0, 9.0, 11.0, 17.0, 15.0, 27.0, 22.0, 22.0, 28.0, 31.0, 38.0, 30.0, 40.0, 45.0, 64.0, 47.0, 55.0, 46.0, 52.0, 37.0, 34.0, 47.0, 24.0, 41.0, 31.0, 23.0, 24.0, 25.0, 19.0, 10.0, 13.0, 14.0, 6.0, 7.0, 5.0, 7.0, 3.0, 3.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.95751953125, -0.9260482788085938, -0.8945770263671875, -0.8631057739257812, -0.831634521484375, -0.8001632690429688, -0.7686920166015625, -0.7372207641601562, -0.70574951171875, -0.6742782592773438, -0.6428070068359375, -0.6113357543945312, -0.579864501953125, -0.5483932495117188, -0.5169219970703125, -0.48545074462890625, -0.4539794921875, -0.42250823974609375, -0.3910369873046875, -0.35956573486328125, -0.328094482421875, -0.29662322998046875, -0.2651519775390625, -0.23368072509765625, -0.20220947265625, -0.17073822021484375, -0.1392669677734375, -0.10779571533203125, -0.076324462890625, -0.04485321044921875, -0.0133819580078125, 0.01808929443359375, 0.049560546875, 0.08103179931640625, 0.1125030517578125, 0.14397430419921875, 0.175445556640625, 0.20691680908203125, 0.2383880615234375, 0.26985931396484375, 0.30133056640625, 0.33280181884765625, 0.3642730712890625, 0.39574432373046875, 0.427215576171875, 0.45868682861328125, 0.4901580810546875, 0.5216293334960938, 0.5531005859375, 0.5845718383789062, 0.6160430908203125, 0.6475143432617188, 0.678985595703125, 0.7104568481445312, 0.7419281005859375, 0.7733993530273438, 0.80487060546875, 0.8363418579101562, 0.8678131103515625, 0.8992843627929688, 0.930755615234375, 0.9622268676757812, 0.9936981201171875, 1.0251693725585938, 1.056640625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 9.0, 9.0, 19.0, 23.0, 35.0, 58.0, 102.0, 217.0, 647.0, 2198.0, 13396.0, 278468.0, 724573.0, 24284.0, 3076.0, 815.0, 321.0, 139.0, 61.0, 29.0, 28.0, 18.0, 9.0, 8.0, 7.0, 1.0, 1.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.365478515625, -0.3524818420410156, -0.33948516845703125, -0.3264884948730469, -0.3134918212890625, -0.3004951477050781, -0.28749847412109375, -0.2745018005371094, -0.261505126953125, -0.24850845336914062, -0.23551177978515625, -0.22251510620117188, -0.2095184326171875, -0.19652175903320312, -0.18352508544921875, -0.17052841186523438, -0.15753173828125, -0.14453506469726562, -0.13153839111328125, -0.11854171752929688, -0.1055450439453125, -0.09254837036132812, -0.07955169677734375, -0.06655502319335938, -0.053558349609375, -0.040561676025390625, -0.02756500244140625, -0.014568328857421875, -0.0015716552734375, 0.011425018310546875, 0.02442169189453125, 0.037418365478515625, 0.0504150390625, 0.06341171264648438, 0.07640838623046875, 0.08940505981445312, 0.1024017333984375, 0.11539840698242188, 0.12839508056640625, 0.14139175415039062, 0.154388427734375, 0.16738510131835938, 0.18038177490234375, 0.19337844848632812, 0.2063751220703125, 0.21937179565429688, 0.23236846923828125, 0.24536514282226562, 0.25836181640625, 0.2713584899902344, 0.28435516357421875, 0.2973518371582031, 0.3103485107421875, 0.3233451843261719, 0.33634185791015625, 0.3493385314941406, 0.362335205078125, 0.3753318786621094, 0.38832855224609375, 0.4013252258300781, 0.4143218994140625, 0.4273185729980469, 0.44031524658203125, 0.4533119201660156, 0.46630859375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 3.0, 6.0, 3.0, 2.0, 2.0, 8.0, 6.0, 12.0, 10.0, 10.0, 18.0, 28.0, 15.0, 19.0, 18.0, 38.0, 33.0, 41.0, 61.0, 77.0, 75.0, 99.0, 69.0, 51.0, 39.0, 36.0, 45.0, 33.0, 23.0, 18.0, 19.0, 8.0, 10.0, 14.0, 10.0, 6.0, 3.0, 7.0, 5.0, 3.0, 5.0, 5.0, 2.0, 0.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.875659942626953e-05, -4.7326087951660156e-05, -4.589557647705078e-05, -4.4465065002441406e-05, -4.303455352783203e-05, -4.1604042053222656e-05, -4.017353057861328e-05, -3.8743019104003906e-05, -3.731250762939453e-05, -3.5881996154785156e-05, -3.445148468017578e-05, -3.3020973205566406e-05, -3.159046173095703e-05, -3.0159950256347656e-05, -2.872943878173828e-05, -2.7298927307128906e-05, -2.586841583251953e-05, -2.4437904357910156e-05, -2.300739288330078e-05, -2.1576881408691406e-05, -2.014636993408203e-05, -1.8715858459472656e-05, -1.728534698486328e-05, -1.5854835510253906e-05, -1.4424324035644531e-05, -1.2993812561035156e-05, -1.1563301086425781e-05, -1.0132789611816406e-05, -8.702278137207031e-06, -7.271766662597656e-06, -5.841255187988281e-06, -4.410743713378906e-06, -2.9802322387695312e-06, -1.5497207641601562e-06, -1.1920928955078125e-07, 1.3113021850585938e-06, 2.7418136596679688e-06, 4.172325134277344e-06, 5.602836608886719e-06, 7.033348083496094e-06, 8.463859558105469e-06, 9.894371032714844e-06, 1.1324882507324219e-05, 1.2755393981933594e-05, 1.4185905456542969e-05, 1.5616416931152344e-05, 1.704692840576172e-05, 1.8477439880371094e-05, 1.990795135498047e-05, 2.1338462829589844e-05, 2.276897430419922e-05, 2.4199485778808594e-05, 2.562999725341797e-05, 2.7060508728027344e-05, 2.849102020263672e-05, 2.9921531677246094e-05, 3.135204315185547e-05, 3.2782554626464844e-05, 3.421306610107422e-05, 3.5643577575683594e-05, 3.707408905029297e-05, 3.8504600524902344e-05, 3.993511199951172e-05, 4.1365623474121094e-05, 4.279613494873047e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 8.0, 8.0, 8.0, 18.0, 32.0, 43.0, 86.0, 133.0, 303.0, 746.0, 2311.0, 13000.0, 306808.0, 700960.0, 19466.0, 2996.0, 892.0, 340.0, 152.0, 99.0, 50.0, 31.0, 21.0, 16.0, 14.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.472900390625, -0.4597969055175781, -0.44669342041015625, -0.4335899353027344, -0.4204864501953125, -0.4073829650878906, -0.39427947998046875, -0.3811759948730469, -0.368072509765625, -0.3549690246582031, -0.34186553955078125, -0.3287620544433594, -0.3156585693359375, -0.3025550842285156, -0.28945159912109375, -0.2763481140136719, -0.26324462890625, -0.2501411437988281, -0.23703765869140625, -0.22393417358398438, -0.2108306884765625, -0.19772720336914062, -0.18462371826171875, -0.17152023315429688, -0.158416748046875, -0.14531326293945312, -0.13220977783203125, -0.11910629272460938, -0.1060028076171875, -0.09289932250976562, -0.07979583740234375, -0.06669235229492188, -0.0535888671875, -0.040485382080078125, -0.02738189697265625, -0.014278411865234375, -0.0011749267578125, 0.011928558349609375, 0.02503204345703125, 0.038135528564453125, 0.051239013671875, 0.06434249877929688, 0.07744598388671875, 0.09054946899414062, 0.1036529541015625, 0.11675643920898438, 0.12985992431640625, 0.14296340942382812, 0.15606689453125, 0.16917037963867188, 0.18227386474609375, 0.19537734985351562, 0.2084808349609375, 0.22158432006835938, 0.23468780517578125, 0.24779129028320312, 0.260894775390625, 0.2739982604980469, 0.28710174560546875, 0.3002052307128906, 0.3133087158203125, 0.3264122009277344, 0.33951568603515625, 0.3526191711425781, 0.36572265625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 2.0, 7.0, 3.0, 8.0, 13.0, 16.0, 15.0, 21.0, 27.0, 43.0, 65.0, 65.0, 87.0, 87.0, 95.0, 89.0, 80.0, 73.0, 45.0, 45.0, 33.0, 15.0, 14.0, 21.0, 8.0, 8.0, 7.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3955078125, -0.3857231140136719, -0.37593841552734375, -0.3661537170410156, -0.3563690185546875, -0.3465843200683594, -0.33679962158203125, -0.3270149230957031, -0.317230224609375, -0.3074455261230469, -0.29766082763671875, -0.2878761291503906, -0.2780914306640625, -0.2683067321777344, -0.25852203369140625, -0.24873733520507812, -0.23895263671875, -0.22916793823242188, -0.21938323974609375, -0.20959854125976562, -0.1998138427734375, -0.19002914428710938, -0.18024444580078125, -0.17045974731445312, -0.160675048828125, -0.15089035034179688, -0.14110565185546875, -0.13132095336914062, -0.1215362548828125, -0.11175155639648438, -0.10196685791015625, -0.09218215942382812, -0.0823974609375, -0.07261276245117188, -0.06282806396484375, -0.053043365478515625, -0.0432586669921875, -0.033473968505859375, -0.02368927001953125, -0.013904571533203125, -0.004119873046875, 0.005664825439453125, 0.01544952392578125, 0.025234222412109375, 0.0350189208984375, 0.044803619384765625, 0.05458831787109375, 0.06437301635742188, 0.07415771484375, 0.08394241333007812, 0.09372711181640625, 0.10351181030273438, 0.1132965087890625, 0.12308120727539062, 0.13286590576171875, 0.14265060424804688, 0.152435302734375, 0.16222000122070312, 0.17200469970703125, 0.18178939819335938, 0.1915740966796875, 0.20135879516601562, 0.21114349365234375, 0.22092819213867188, 0.230712890625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 11.0, 46.0, 224.0, 540.0, 155.0, 21.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.110833168029785, -12.647407531738281, -12.183981895446777, -11.720556259155273, -11.25713062286377, -10.793704986572266, -10.330278396606445, -9.866853713989258, -9.403427124023438, -8.940001487731934, -8.47657585144043, -8.013150215148926, -7.549724578857422, -7.086298942565918, -6.622872829437256, -6.159447193145752, -5.696022033691406, -5.232596397399902, -4.769170761108398, -4.3057451248168945, -3.8423192501068115, -3.3788936138153076, -2.9154677391052246, -2.4520421028137207, -1.9886164665222168, -1.525190830230713, -1.0617650747299194, -0.598339319229126, -0.13491368293762207, 0.32851195335388184, 0.7919378280639648, 1.2553634643554688, 1.7187881469726562, 2.18221378326416, 2.645639419555664, 3.109065294265747, 3.572490930557251, 4.035916328430176, 4.499342441558838, 4.962768077850342, 5.426193714141846, 5.88961935043335, 6.3530449867248535, 6.816471099853516, 7.2798967361450195, 7.743322372436523, 8.206748008728027, 8.670173645019531, 9.133599281311035, 9.597024917602539, 10.060450553894043, 10.523876190185547, 10.98730182647705, 11.450727462768555, 11.914154052734375, 12.377578735351562, 12.841005325317383, 13.304430961608887, 13.76785659790039, 14.231282234191895, 14.694707870483398, 15.158133506774902, 15.621559143066406, 16.084985733032227, 16.548410415649414]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 5.0, 2.0, 1.0, 5.0, 2.0, 2.0, 5.0, 5.0, 8.0, 10.0, 11.0, 6.0, 15.0, 14.0, 14.0, 27.0, 15.0, 13.0, 21.0, 22.0, 23.0, 30.0, 29.0, 30.0, 43.0, 51.0, 42.0, 62.0, 58.0, 68.0, 35.0, 31.0, 33.0, 34.0, 30.0, 30.0, 20.0, 20.0, 20.0, 17.0, 15.0, 15.0, 12.0, 7.0, 9.0, 11.0, 4.0, 1.0, 3.0, 6.0, 5.0, 5.0, 4.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.617647409439087, -3.504509449005127, -3.391371250152588, -3.278233289718628, -3.165095329284668, -3.051957130432129, -2.938819169998169, -2.825681209564209, -2.71254301071167, -2.59940505027771, -2.486266851425171, -2.373128890991211, -2.259990692138672, -2.146852731704712, -2.033714771270752, -1.9205766916275024, -1.807438611984253, -1.6943005323410034, -1.581162452697754, -1.468024492263794, -1.3548864126205444, -1.241748332977295, -1.128610372543335, -1.0154722929000854, -0.9023342132568359, -0.7891961336135864, -0.6760581135749817, -0.562920093536377, -0.44978201389312744, -0.33664393424987793, -0.2235059142112732, -0.11036789417266846, 0.0027704238891601562, 0.11590847373008728, 0.2290465235710144, 0.34218457341194153, 0.45532262325286865, 0.5684607028961182, 0.6815987229347229, 0.7947367429733276, 0.9078748226165771, 1.0210129022598267, 1.1341509819030762, 1.2472889423370361, 1.3604270219802856, 1.4735651016235352, 1.5867030620574951, 1.6998411417007446, 1.8129792213439941, 1.9261173009872437, 2.039255380630493, 2.152393341064453, 2.265531539916992, 2.378669500350952, 2.491807460784912, 2.604945659637451, 2.718083620071411, 2.831221580505371, 2.94435977935791, 3.05749773979187, 3.17063570022583, 3.283773899078369, 3.396911859512329, 3.510049819946289, 3.623188018798828]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 3.0, 6.0, 10.0, 19.0, 22.0, 35.0, 69.0, 107.0, 177.0, 355.0, 747.0, 1958.0, 5790.0, 21505.0, 157158.0, 2065225.0, 1780267.0, 132014.0, 20227.0, 5417.0, 1747.0, 696.0, 304.0, 173.0, 92.0, 69.0, 33.0, 29.0, 9.0, 8.0, 9.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.378173828125, -0.36794281005859375, -0.3577117919921875, -0.34748077392578125, -0.337249755859375, -0.32701873779296875, -0.3167877197265625, -0.30655670166015625, -0.29632568359375, -0.28609466552734375, -0.2758636474609375, -0.26563262939453125, -0.255401611328125, -0.24517059326171875, -0.2349395751953125, -0.22470855712890625, -0.2144775390625, -0.20424652099609375, -0.1940155029296875, -0.18378448486328125, -0.173553466796875, -0.16332244873046875, -0.1530914306640625, -0.14286041259765625, -0.13262939453125, -0.12239837646484375, -0.1121673583984375, -0.10193634033203125, -0.091705322265625, -0.08147430419921875, -0.0712432861328125, -0.06101226806640625, -0.05078125, -0.04055023193359375, -0.0303192138671875, -0.02008819580078125, -0.009857177734375, 0.00037384033203125, 0.0106048583984375, 0.02083587646484375, 0.03106689453125, 0.04129791259765625, 0.0515289306640625, 0.06175994873046875, 0.071990966796875, 0.08222198486328125, 0.0924530029296875, 0.10268402099609375, 0.1129150390625, 0.12314605712890625, 0.1333770751953125, 0.14360809326171875, 0.153839111328125, 0.16407012939453125, 0.1743011474609375, 0.18453216552734375, 0.19476318359375, 0.20499420166015625, 0.2152252197265625, 0.22545623779296875, 0.235687255859375, 0.24591827392578125, 0.2561492919921875, 0.26638031005859375, 0.276611328125]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 9.0, 8.0, 10.0, 14.0, 12.0, 25.0, 32.0, 43.0, 46.0, 57.0, 60.0, 61.0, 88.0, 72.0, 63.0, 62.0, 64.0, 58.0, 51.0, 35.0, 33.0, 19.0, 23.0, 30.0, 7.0, 7.0, 8.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.432373046875, -0.4214668273925781, -0.41056060791015625, -0.3996543884277344, -0.3887481689453125, -0.3778419494628906, -0.36693572998046875, -0.3560295104980469, -0.345123291015625, -0.3342170715332031, -0.32331085205078125, -0.3124046325683594, -0.3014984130859375, -0.2905921936035156, -0.27968597412109375, -0.2687797546386719, -0.25787353515625, -0.24696731567382812, -0.23606109619140625, -0.22515487670898438, -0.2142486572265625, -0.20334243774414062, -0.19243621826171875, -0.18152999877929688, -0.170623779296875, -0.15971755981445312, -0.14881134033203125, -0.13790512084960938, -0.1269989013671875, -0.11609268188476562, -0.10518646240234375, -0.09428024291992188, -0.0833740234375, -0.07246780395507812, -0.06156158447265625, -0.050655364990234375, -0.0397491455078125, -0.028842926025390625, -0.01793670654296875, -0.007030487060546875, 0.003875732421875, 0.014781951904296875, 0.02568817138671875, 0.036594390869140625, 0.0475006103515625, 0.058406829833984375, 0.06931304931640625, 0.08021926879882812, 0.09112548828125, 0.10203170776367188, 0.11293792724609375, 0.12384414672851562, 0.1347503662109375, 0.14565658569335938, 0.15656280517578125, 0.16746902465820312, 0.178375244140625, 0.18928146362304688, 0.20018768310546875, 0.21109390258789062, 0.2220001220703125, 0.23290634155273438, 0.24381256103515625, 0.2547187805175781, 0.265625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 17.0, 21.0, 32.0, 52.0, 68.0, 132.0, 239.0, 354.0, 920.0, 2435.0, 10985.0, 131155.0, 3793952.0, 234828.0, 14124.0, 2995.0, 1076.0, 413.0, 219.0, 91.0, 57.0, 30.0, 35.0, 13.0, 12.0, 6.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0], "bins": [-0.68505859375, -0.6646652221679688, -0.6442718505859375, -0.6238784790039062, -0.603485107421875, -0.5830917358398438, -0.5626983642578125, -0.5423049926757812, -0.52191162109375, -0.5015182495117188, -0.4811248779296875, -0.46073150634765625, -0.440338134765625, -0.41994476318359375, -0.3995513916015625, -0.37915802001953125, -0.3587646484375, -0.33837127685546875, -0.3179779052734375, -0.29758453369140625, -0.277191162109375, -0.25679779052734375, -0.2364044189453125, -0.21601104736328125, -0.19561767578125, -0.17522430419921875, -0.1548309326171875, -0.13443756103515625, -0.114044189453125, -0.09365081787109375, -0.0732574462890625, -0.05286407470703125, -0.032470703125, -0.01207733154296875, 0.0083160400390625, 0.02870941162109375, 0.049102783203125, 0.06949615478515625, 0.0898895263671875, 0.11028289794921875, 0.13067626953125, 0.15106964111328125, 0.1714630126953125, 0.19185638427734375, 0.212249755859375, 0.23264312744140625, 0.2530364990234375, 0.27342987060546875, 0.2938232421875, 0.31421661376953125, 0.3346099853515625, 0.35500335693359375, 0.375396728515625, 0.39579010009765625, 0.4161834716796875, 0.43657684326171875, 0.45697021484375, 0.47736358642578125, 0.4977569580078125, 0.5181503295898438, 0.538543701171875, 0.5589370727539062, 0.5793304443359375, 0.5997238159179688, 0.6201171875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 4.0, 9.0, 9.0, 15.0, 27.0, 36.0, 39.0, 91.0, 149.0, 357.0, 699.0, 1164.0, 829.0, 319.0, 140.0, 75.0, 37.0, 26.0, 19.0, 11.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.7685546875, -0.7475204467773438, -0.7264862060546875, -0.7054519653320312, -0.684417724609375, -0.6633834838867188, -0.6423492431640625, -0.6213150024414062, -0.60028076171875, -0.5792465209960938, -0.5582122802734375, -0.5371780395507812, -0.516143798828125, -0.49510955810546875, -0.4740753173828125, -0.45304107666015625, -0.4320068359375, -0.41097259521484375, -0.3899383544921875, -0.36890411376953125, -0.347869873046875, -0.32683563232421875, -0.3058013916015625, -0.28476715087890625, -0.26373291015625, -0.24269866943359375, -0.2216644287109375, -0.20063018798828125, -0.179595947265625, -0.15856170654296875, -0.1375274658203125, -0.11649322509765625, -0.095458984375, -0.07442474365234375, -0.0533905029296875, -0.03235626220703125, -0.011322021484375, 0.00971221923828125, 0.0307464599609375, 0.05178070068359375, 0.07281494140625, 0.09384918212890625, 0.1148834228515625, 0.13591766357421875, 0.156951904296875, 0.17798614501953125, 0.1990203857421875, 0.22005462646484375, 0.2410888671875, 0.26212310791015625, 0.2831573486328125, 0.30419158935546875, 0.325225830078125, 0.34626007080078125, 0.3672943115234375, 0.38832855224609375, 0.40936279296875, 0.43039703369140625, 0.4514312744140625, 0.47246551513671875, 0.493499755859375, 0.5145339965820312, 0.5355682373046875, 0.5566024780273438, 0.57763671875]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 9.0, 8.0, 16.0, 32.0, 78.0, 164.0, 253.0, 240.0, 109.0, 44.0, 20.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.740957260131836, -7.561505317687988, -7.382052898406982, -7.202600955963135, -7.023148536682129, -6.843696594238281, -6.664244651794434, -6.484792709350586, -6.30534029006958, -6.125888347625732, -5.946435928344727, -5.766983985900879, -5.587532043457031, -5.408079624176025, -5.228627681732178, -5.049175262451172, -4.869723320007324, -4.690271377563477, -4.510818958282471, -4.331367015838623, -4.151914596557617, -3.9724626541137695, -3.793010711669922, -3.613558530807495, -3.4341063499450684, -3.2546541690826416, -3.075201988220215, -2.895750045776367, -2.7162978649139404, -2.5368456840515137, -2.357393741607666, -2.1779415607452393, -1.9984889030456543, -1.8190367221832275, -1.6395846605300903, -1.4601325988769531, -1.2806804180145264, -1.1012282371520996, -0.9217761754989624, -0.7423241138458252, -0.5628719329833984, -0.38341981172561646, -0.20396769046783447, -0.02451556921005249, 0.1549365520477295, 0.3343886733055115, 0.5138407945632935, 0.6932928562164307, 0.8727450370788574, 1.0521972179412842, 1.2316492795944214, 1.4111013412475586, 1.5905535221099854, 1.770005702972412, 1.9494577646255493, 2.1289098262786865, 2.3083620071411133, 2.48781418800354, 2.667266368865967, 2.8467183113098145, 3.026170492172241, 3.205622673034668, 3.3850746154785156, 3.5645267963409424, 3.743978977203369]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 6.0, 13.0, 11.0, 11.0, 16.0, 21.0, 27.0, 27.0, 29.0, 22.0, 45.0, 31.0, 43.0, 47.0, 53.0, 51.0, 40.0, 51.0, 60.0, 61.0, 36.0, 45.0, 40.0, 35.0, 27.0, 26.0, 23.0, 26.0, 12.0, 13.0, 13.0, 7.0, 7.0, 4.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.6104893684387207, -2.5285751819610596, -2.4466609954833984, -2.3647470474243164, -2.2828328609466553, -2.200918674468994, -2.119004487991333, -2.037090301513672, -1.9551761150360107, -1.8732619285583496, -1.791347861289978, -1.709433674812317, -1.6275194883346558, -1.5456054210662842, -1.463691234588623, -1.381777048110962, -1.2998629808425903, -1.2179487943649292, -1.1360347270965576, -1.0541205406188965, -0.9722063541412354, -0.890292227268219, -0.8083781003952026, -0.7264639139175415, -0.6445497870445251, -0.5626356601715088, -0.48072147369384766, -0.3988073468208313, -0.31689319014549255, -0.2349790334701538, -0.15306490659713745, -0.07115072011947632, 0.010763406753540039, 0.09267755597829819, 0.17459170520305634, 0.2565058469772339, 0.33842000365257263, 0.4203341603279114, 0.5022482872009277, 0.5841624736785889, 0.6660766005516052, 0.7479907274246216, 0.8299049139022827, 0.9118190407752991, 0.9937331676483154, 1.0756473541259766, 1.1575615406036377, 1.2394757270812988, 1.3213897943496704, 1.4033039808273315, 1.4852180480957031, 1.5671322345733643, 1.6490464210510254, 1.7309606075286865, 1.812874674797058, 1.8947888612747192, 1.9767029285430908, 2.058617115020752, 2.140531301498413, 2.222445487976074, 2.3043594360351562, 2.3862736225128174, 2.4681878089904785, 2.5501019954681396, 2.632016181945801]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 5.0, 11.0, 15.0, 28.0, 41.0, 60.0, 86.0, 153.0, 261.0, 450.0, 772.0, 1462.0, 2719.0, 5717.0, 13467.0, 34797.0, 95065.0, 268114.0, 376673.0, 155639.0, 55525.0, 20712.0, 8479.0, 3785.0, 1934.0, 1037.0, 631.0, 351.0, 210.0, 135.0, 67.0, 52.0, 26.0, 24.0, 12.0, 9.0, 9.0, 8.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.366943359375, -0.355560302734375, -0.34417724609375, -0.332794189453125, -0.3214111328125, -0.310028076171875, -0.29864501953125, -0.287261962890625, -0.27587890625, -0.264495849609375, -0.25311279296875, -0.241729736328125, -0.2303466796875, -0.218963623046875, -0.20758056640625, -0.196197509765625, -0.184814453125, -0.173431396484375, -0.16204833984375, -0.150665283203125, -0.1392822265625, -0.127899169921875, -0.11651611328125, -0.105133056640625, -0.09375, -0.082366943359375, -0.07098388671875, -0.059600830078125, -0.0482177734375, -0.036834716796875, -0.02545166015625, -0.014068603515625, -0.002685546875, 0.008697509765625, 0.02008056640625, 0.031463623046875, 0.0428466796875, 0.054229736328125, 0.06561279296875, 0.076995849609375, 0.08837890625, 0.099761962890625, 0.11114501953125, 0.122528076171875, 0.1339111328125, 0.145294189453125, 0.15667724609375, 0.168060302734375, 0.179443359375, 0.190826416015625, 0.20220947265625, 0.213592529296875, 0.2249755859375, 0.236358642578125, 0.24774169921875, 0.259124755859375, 0.2705078125, 0.281890869140625, 0.29327392578125, 0.304656982421875, 0.3160400390625, 0.327423095703125, 0.33880615234375, 0.350189208984375, 0.361572265625]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 6.0, 2.0, 6.0, 13.0, 8.0, 22.0, 15.0, 40.0, 39.0, 52.0, 52.0, 61.0, 57.0, 78.0, 83.0, 66.0, 62.0, 69.0, 55.0, 44.0, 31.0, 45.0, 31.0, 17.0, 14.0, 19.0, 8.0, 6.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-0.443359375, -0.43247222900390625, -0.4215850830078125, -0.41069793701171875, -0.399810791015625, -0.38892364501953125, -0.3780364990234375, -0.36714935302734375, -0.35626220703125, -0.34537506103515625, -0.3344879150390625, -0.32360076904296875, -0.312713623046875, -0.30182647705078125, -0.2909393310546875, -0.28005218505859375, -0.2691650390625, -0.25827789306640625, -0.2473907470703125, -0.23650360107421875, -0.225616455078125, -0.21472930908203125, -0.2038421630859375, -0.19295501708984375, -0.18206787109375, -0.17118072509765625, -0.1602935791015625, -0.14940643310546875, -0.138519287109375, -0.12763214111328125, -0.1167449951171875, -0.10585784912109375, -0.094970703125, -0.08408355712890625, -0.0731964111328125, -0.06230926513671875, -0.051422119140625, -0.04053497314453125, -0.0296478271484375, -0.01876068115234375, -0.00787353515625, 0.00301361083984375, 0.0139007568359375, 0.02478790283203125, 0.035675048828125, 0.04656219482421875, 0.0574493408203125, 0.06833648681640625, 0.0792236328125, 0.09011077880859375, 0.1009979248046875, 0.11188507080078125, 0.122772216796875, 0.13365936279296875, 0.1445465087890625, 0.15543365478515625, 0.16632080078125, 0.17720794677734375, 0.1880950927734375, 0.19898223876953125, 0.209869384765625, 0.22075653076171875, 0.2316436767578125, 0.24253082275390625, 0.25341796875]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 2.0, 6.0, 9.0, 13.0, 14.0, 18.0, 42.0, 44.0, 51.0, 85.0, 134.0, 185.0, 247.0, 450.0, 801.0, 1558.0, 3628.0, 11636.0, 57150.0, 548437.0, 358834.0, 48379.0, 10120.0, 3245.0, 1494.0, 700.0, 456.0, 258.0, 171.0, 117.0, 75.0, 63.0, 22.0, 23.0, 22.0, 15.0, 15.0, 13.0, 10.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.568359375, -0.5487289428710938, -0.5290985107421875, -0.5094680786132812, -0.489837646484375, -0.47020721435546875, -0.4505767822265625, -0.43094635009765625, -0.41131591796875, -0.39168548583984375, -0.3720550537109375, -0.35242462158203125, -0.332794189453125, -0.31316375732421875, -0.2935333251953125, -0.27390289306640625, -0.2542724609375, -0.23464202880859375, -0.2150115966796875, -0.19538116455078125, -0.175750732421875, -0.15612030029296875, -0.1364898681640625, -0.11685943603515625, -0.09722900390625, -0.07759857177734375, -0.0579681396484375, -0.03833770751953125, -0.018707275390625, 0.00092315673828125, 0.0205535888671875, 0.04018402099609375, 0.059814453125, 0.07944488525390625, 0.0990753173828125, 0.11870574951171875, 0.138336181640625, 0.15796661376953125, 0.1775970458984375, 0.19722747802734375, 0.21685791015625, 0.23648834228515625, 0.2561187744140625, 0.27574920654296875, 0.295379638671875, 0.31501007080078125, 0.3346405029296875, 0.35427093505859375, 0.3739013671875, 0.39353179931640625, 0.4131622314453125, 0.43279266357421875, 0.452423095703125, 0.47205352783203125, 0.4916839599609375, 0.5113143920898438, 0.53094482421875, 0.5505752563476562, 0.5702056884765625, 0.5898361206054688, 0.609466552734375, 0.6290969848632812, 0.6487274169921875, 0.6683578491210938, 0.68798828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 4.0, 3.0, 3.0, 7.0, 5.0, 13.0, 6.0, 4.0, 17.0, 9.0, 15.0, 17.0, 22.0, 27.0, 46.0, 45.0, 34.0, 48.0, 55.0, 46.0, 51.0, 52.0, 50.0, 61.0, 47.0, 42.0, 43.0, 38.0, 31.0, 34.0, 33.0, 18.0, 9.0, 18.0, 15.0, 10.0, 5.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.025390625, -0.9954681396484375, -0.965545654296875, -0.9356231689453125, -0.90570068359375, -0.8757781982421875, -0.845855712890625, -0.8159332275390625, -0.7860107421875, -0.7560882568359375, -0.726165771484375, -0.6962432861328125, -0.66632080078125, -0.6363983154296875, -0.606475830078125, -0.5765533447265625, -0.546630859375, -0.5167083740234375, -0.486785888671875, -0.4568634033203125, -0.42694091796875, -0.3970184326171875, -0.367095947265625, -0.3371734619140625, -0.3072509765625, -0.2773284912109375, -0.247406005859375, -0.2174835205078125, -0.18756103515625, -0.1576385498046875, -0.127716064453125, -0.0977935791015625, -0.06787109375, -0.0379486083984375, -0.008026123046875, 0.0218963623046875, 0.05181884765625, 0.0817413330078125, 0.111663818359375, 0.1415863037109375, 0.1715087890625, 0.2014312744140625, 0.231353759765625, 0.2612762451171875, 0.29119873046875, 0.3211212158203125, 0.351043701171875, 0.3809661865234375, 0.410888671875, 0.4408111572265625, 0.470733642578125, 0.5006561279296875, 0.53057861328125, 0.5605010986328125, 0.590423583984375, 0.6203460693359375, 0.6502685546875, 0.6801910400390625, 0.710113525390625, 0.7400360107421875, 0.76995849609375, 0.7998809814453125, 0.829803466796875, 0.8597259521484375, 0.8896484375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 1.0, 4.0, 6.0, 2.0, 5.0, 9.0, 9.0, 13.0, 21.0, 21.0, 53.0, 72.0, 93.0, 169.0, 309.0, 568.0, 1099.0, 2533.0, 7329.0, 28186.0, 150627.0, 700438.0, 122062.0, 24068.0, 6397.0, 2334.0, 958.0, 486.0, 255.0, 153.0, 79.0, 47.0, 45.0, 28.0, 18.0, 12.0, 11.0, 10.0, 8.0, 3.0, 1.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.2276611328125, -0.2206439971923828, -0.21362686157226562, -0.20660972595214844, -0.19959259033203125, -0.19257545471191406, -0.18555831909179688, -0.1785411834716797, -0.1715240478515625, -0.1645069122314453, -0.15748977661132812, -0.15047264099121094, -0.14345550537109375, -0.13643836975097656, -0.12942123413085938, -0.12240409851074219, -0.115386962890625, -0.10836982727050781, -0.10135269165039062, -0.09433555603027344, -0.08731842041015625, -0.08030128479003906, -0.07328414916992188, -0.06626701354980469, -0.0592498779296875, -0.05223274230957031, -0.045215606689453125, -0.03819847106933594, -0.03118133544921875, -0.024164199829101562, -0.017147064208984375, -0.010129928588867188, -0.00311279296875, 0.0039043426513671875, 0.010921478271484375, 0.017938613891601562, 0.02495574951171875, 0.03197288513183594, 0.038990020751953125, 0.04600715637207031, 0.0530242919921875, 0.06004142761230469, 0.06705856323242188, 0.07407569885253906, 0.08109283447265625, 0.08810997009277344, 0.09512710571289062, 0.10214424133300781, 0.109161376953125, 0.11617851257324219, 0.12319564819335938, 0.13021278381347656, 0.13722991943359375, 0.14424705505371094, 0.15126419067382812, 0.1582813262939453, 0.1652984619140625, 0.1723155975341797, 0.17933273315429688, 0.18634986877441406, 0.19336700439453125, 0.20038414001464844, 0.20740127563476562, 0.2144184112548828, 0.221435546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 8.0, 5.0, 15.0, 15.0, 14.0, 18.0, 30.0, 31.0, 29.0, 60.0, 84.0, 120.0, 115.0, 126.0, 88.0, 57.0, 37.0, 31.0, 27.0, 23.0, 16.0, 16.0, 16.0, 4.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-6.431341171264648e-05, -6.24489039182663e-05, -6.058439612388611e-05, -5.871988832950592e-05, -5.685538053512573e-05, -5.4990872740745544e-05, -5.3126364946365356e-05, -5.126185715198517e-05, -4.939734935760498e-05, -4.753284156322479e-05, -4.5668333768844604e-05, -4.3803825974464417e-05, -4.193931818008423e-05, -4.007481038570404e-05, -3.821030259132385e-05, -3.6345794796943665e-05, -3.4481287002563477e-05, -3.261677920818329e-05, -3.07522714138031e-05, -2.8887763619422913e-05, -2.7023255825042725e-05, -2.5158748030662537e-05, -2.329424023628235e-05, -2.142973244190216e-05, -1.9565224647521973e-05, -1.7700716853141785e-05, -1.5836209058761597e-05, -1.3971701264381409e-05, -1.210719347000122e-05, -1.0242685675621033e-05, -8.378177881240845e-06, -6.513670086860657e-06, -4.649162292480469e-06, -2.7846544981002808e-06, -9.201467037200928e-07, 9.443610906600952e-07, 2.808868885040283e-06, 4.673376679420471e-06, 6.537884473800659e-06, 8.402392268180847e-06, 1.0266900062561035e-05, 1.2131407856941223e-05, 1.3995915651321411e-05, 1.58604234457016e-05, 1.7724931240081787e-05, 1.9589439034461975e-05, 2.1453946828842163e-05, 2.331845462322235e-05, 2.518296241760254e-05, 2.7047470211982727e-05, 2.8911978006362915e-05, 3.07764858007431e-05, 3.264099359512329e-05, 3.450550138950348e-05, 3.637000918388367e-05, 3.8234516978263855e-05, 4.009902477264404e-05, 4.196353256702423e-05, 4.382804036140442e-05, 4.569254815578461e-05, 4.7557055950164795e-05, 4.942156374454498e-05, 5.128607153892517e-05, 5.315057933330536e-05, 5.501508712768555e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 6.0, 9.0, 13.0, 19.0, 33.0, 46.0, 69.0, 84.0, 168.0, 220.0, 494.0, 1010.0, 2313.0, 6545.0, 27309.0, 197107.0, 711139.0, 80090.0, 14353.0, 4231.0, 1610.0, 756.0, 354.0, 201.0, 135.0, 80.0, 55.0, 25.0, 21.0, 18.0, 13.0, 9.0, 7.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.29296875, -0.28551292419433594, -0.2780570983886719, -0.2706012725830078, -0.26314544677734375, -0.2556896209716797, -0.24823379516601562, -0.24077796936035156, -0.2333221435546875, -0.22586631774902344, -0.21841049194335938, -0.2109546661376953, -0.20349884033203125, -0.1960430145263672, -0.18858718872070312, -0.18113136291503906, -0.173675537109375, -0.16621971130371094, -0.15876388549804688, -0.1513080596923828, -0.14385223388671875, -0.1363964080810547, -0.12894058227539062, -0.12148475646972656, -0.1140289306640625, -0.10657310485839844, -0.09911727905273438, -0.09166145324707031, -0.08420562744140625, -0.07674980163574219, -0.06929397583007812, -0.06183815002441406, -0.05438232421875, -0.04692649841308594, -0.039470672607421875, -0.03201484680175781, -0.02455902099609375, -0.017103195190429688, -0.009647369384765625, -0.0021915435791015625, 0.0052642822265625, 0.012720108032226562, 0.020175933837890625, 0.027631759643554688, 0.03508758544921875, 0.04254341125488281, 0.049999237060546875, 0.05745506286621094, 0.064910888671875, 0.07236671447753906, 0.07982254028320312, 0.08727836608886719, 0.09473419189453125, 0.10219001770019531, 0.10964584350585938, 0.11710166931152344, 0.1245574951171875, 0.13201332092285156, 0.13946914672851562, 0.1469249725341797, 0.15438079833984375, 0.1618366241455078, 0.16929244995117188, 0.17674827575683594, 0.1842041015625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 3.0, 5.0, 3.0, 7.0, 2.0, 8.0, 11.0, 8.0, 13.0, 21.0, 32.0, 22.0, 44.0, 51.0, 79.0, 101.0, 114.0, 108.0, 92.0, 69.0, 48.0, 38.0, 34.0, 15.0, 14.0, 14.0, 14.0, 5.0, 7.0, 2.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.211669921875, -0.203125, -0.194580078125, -0.18603515625, -0.177490234375, -0.1689453125, -0.160400390625, -0.15185546875, -0.143310546875, -0.134765625, -0.126220703125, -0.11767578125, -0.109130859375, -0.1005859375, -0.092041015625, -0.08349609375, -0.074951171875, -0.06640625, -0.057861328125, -0.04931640625, -0.040771484375, -0.0322265625, -0.023681640625, -0.01513671875, -0.006591796875, 0.001953125, 0.010498046875, 0.01904296875, 0.027587890625, 0.0361328125, 0.044677734375, 0.05322265625, 0.061767578125, 0.0703125, 0.078857421875, 0.08740234375, 0.095947265625, 0.1044921875, 0.113037109375, 0.12158203125, 0.130126953125, 0.138671875, 0.147216796875, 0.15576171875, 0.164306640625, 0.1728515625, 0.181396484375, 0.18994140625, 0.198486328125, 0.20703125, 0.215576171875, 0.22412109375, 0.232666015625, 0.2412109375, 0.249755859375, 0.25830078125, 0.266845703125, 0.275390625, 0.283935546875, 0.29248046875, 0.301025390625, 0.3095703125, 0.318115234375, 0.32666015625, 0.335205078125]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 6.0, 5.0, 7.0, 26.0, 61.0, 117.0, 247.0, 247.0, 138.0, 68.0, 26.0, 26.0, 7.0, 7.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.209273338317871, -8.022273063659668, -7.835272789001465, -7.6482720375061035, -7.4612717628479, -7.274271488189697, -7.087270736694336, -6.900270462036133, -6.71327018737793, -6.526269912719727, -6.339269638061523, -6.152268886566162, -5.965268611907959, -5.778268337249756, -5.5912675857543945, -5.404267311096191, -5.217267036437988, -5.030266761779785, -4.843266487121582, -4.656265735626221, -4.469265460968018, -4.2822651863098145, -4.095264434814453, -3.90826416015625, -3.721263885498047, -3.5342636108398438, -3.3472630977630615, -3.1602625846862793, -2.973262310028076, -2.786262035369873, -2.599261522293091, -2.4122610092163086, -2.2252607345581055, -2.0382604598999023, -1.8512599468231201, -1.6642595529556274, -1.4772591590881348, -1.290258765220642, -1.1032583713531494, -0.9162579774856567, -0.7292575836181641, -0.5422571897506714, -0.3552567958831787, -0.16825640201568604, 0.01874399185180664, 0.20574438571929932, 0.392744779586792, 0.5797451734542847, 0.7667455673217773, 0.95374596118927, 1.1407463550567627, 1.3277467489242554, 1.514747142791748, 1.7017475366592407, 1.8887479305267334, 2.0757484436035156, 2.2627487182617188, 2.449748992919922, 2.636749505996704, 2.8237500190734863, 3.0107502937316895, 3.1977505683898926, 3.384751081466675, 3.571751594543457, 3.75875186920166]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 7.0, 2.0, 7.0, 6.0, 8.0, 9.0, 12.0, 5.0, 15.0, 17.0, 23.0, 12.0, 24.0, 39.0, 20.0, 30.0, 52.0, 40.0, 60.0, 57.0, 70.0, 96.0, 63.0, 50.0, 39.0, 45.0, 29.0, 28.0, 20.0, 23.0, 16.0, 11.0, 12.0, 14.0, 13.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0, 5.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.66599178314209, -3.538444757461548, -3.4108974933624268, -3.2833504676818848, -3.1558032035827637, -3.0282561779022217, -2.9007091522216797, -2.7731618881225586, -2.6456148624420166, -2.5180678367614746, -2.3905205726623535, -2.2629735469818115, -2.1354265213012695, -2.0078792572021484, -1.8803322315216064, -1.752785086631775, -1.6252379417419434, -1.4976907968521118, -1.3701436519622803, -1.2425966262817383, -1.1150494813919067, -0.9875023365020752, -0.8599552512168884, -0.7324081659317017, -0.6048610210418701, -0.47731390595436096, -0.3497667908668518, -0.22221967577934265, -0.0946725606918335, 0.03287458419799805, 0.16042166948318481, 0.2879687547683716, 0.4155158996582031, 0.5430630445480347, 0.6706101298332214, 0.7981572151184082, 0.9257043600082397, 1.0532515048980713, 1.1807985305786133, 1.3083456754684448, 1.4358928203582764, 1.563439965248108, 1.6909871101379395, 1.8185341358184814, 1.946081280708313, 2.0736284255981445, 2.2011754512786865, 2.3287224769592285, 2.4562697410583496, 2.5838167667388916, 2.7113640308380127, 2.8389110565185547, 2.966458320617676, 3.0940053462982178, 3.2215523719787598, 3.349099636077881, 3.476646661758423, 3.604193687438965, 3.731740951538086, 3.859287977218628, 3.98683500289917, 4.114382266998291, 4.241929531097412, 4.369476318359375, 4.497023582458496]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 5.0, 1.0, 2.0, 6.0, 10.0, 11.0, 17.0, 31.0, 68.0, 98.0, 176.0, 340.0, 793.0, 1809.0, 5322.0, 27005.0, 425272.0, 3361231.0, 337511.0, 25448.0, 5712.0, 1922.0, 721.0, 349.0, 179.0, 108.0, 56.0, 33.0, 15.0, 14.0, 7.0, 7.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.48876953125, -0.47669219970703125, -0.4646148681640625, -0.45253753662109375, -0.440460205078125, -0.42838287353515625, -0.4163055419921875, -0.40422821044921875, -0.39215087890625, -0.38007354736328125, -0.3679962158203125, -0.35591888427734375, -0.343841552734375, -0.33176422119140625, -0.3196868896484375, -0.30760955810546875, -0.2955322265625, -0.28345489501953125, -0.2713775634765625, -0.25930023193359375, -0.247222900390625, -0.23514556884765625, -0.2230682373046875, -0.21099090576171875, -0.19891357421875, -0.18683624267578125, -0.1747589111328125, -0.16268157958984375, -0.150604248046875, -0.13852691650390625, -0.1264495849609375, -0.11437225341796875, -0.102294921875, -0.09021759033203125, -0.0781402587890625, -0.06606292724609375, -0.053985595703125, -0.04190826416015625, -0.0298309326171875, -0.01775360107421875, -0.00567626953125, 0.00640106201171875, 0.0184783935546875, 0.03055572509765625, 0.042633056640625, 0.05471038818359375, 0.0667877197265625, 0.07886505126953125, 0.0909423828125, 0.10301971435546875, 0.1150970458984375, 0.12717437744140625, 0.139251708984375, 0.15132904052734375, 0.1634063720703125, 0.17548370361328125, 0.18756103515625, 0.19963836669921875, 0.2117156982421875, 0.22379302978515625, 0.235870361328125, 0.24794769287109375, 0.2600250244140625, 0.27210235595703125, 0.2841796875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 6.0, 7.0, 7.0, 11.0, 21.0, 35.0, 38.0, 35.0, 63.0, 69.0, 72.0, 81.0, 72.0, 82.0, 66.0, 50.0, 65.0, 39.0, 49.0, 38.0, 20.0, 21.0, 16.0, 12.0, 8.0, 9.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.44140625, -0.4303321838378906, -0.41925811767578125, -0.4081840515136719, -0.3971099853515625, -0.3860359191894531, -0.37496185302734375, -0.3638877868652344, -0.352813720703125, -0.3417396545410156, -0.33066558837890625, -0.3195915222167969, -0.3085174560546875, -0.2974433898925781, -0.28636932373046875, -0.2752952575683594, -0.26422119140625, -0.2531471252441406, -0.24207305908203125, -0.23099899291992188, -0.2199249267578125, -0.20885086059570312, -0.19777679443359375, -0.18670272827148438, -0.175628662109375, -0.16455459594726562, -0.15348052978515625, -0.14240646362304688, -0.1313323974609375, -0.12025833129882812, -0.10918426513671875, -0.09811019897460938, -0.0870361328125, -0.07596206665039062, -0.06488800048828125, -0.053813934326171875, -0.0427398681640625, -0.031665802001953125, -0.02059173583984375, -0.009517669677734375, 0.001556396484375, 0.012630462646484375, 0.02370452880859375, 0.034778594970703125, 0.0458526611328125, 0.056926727294921875, 0.06800079345703125, 0.07907485961914062, 0.09014892578125, 0.10122299194335938, 0.11229705810546875, 0.12337112426757812, 0.1344451904296875, 0.14551925659179688, 0.15659332275390625, 0.16766738891601562, 0.178741455078125, 0.18981552124023438, 0.20088958740234375, 0.21196365356445312, 0.2230377197265625, 0.23411178588867188, 0.24518585205078125, 0.2562599182128906, 0.267333984375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 3.0, 7.0, 7.0, 19.0, 23.0, 46.0, 117.0, 189.0, 432.0, 1061.0, 3214.0, 17211.0, 536841.0, 3572547.0, 52842.0, 6840.0, 1751.0, 608.0, 248.0, 121.0, 60.0, 37.0, 26.0, 10.0, 11.0, 5.0, 3.0, 1.0, 4.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70263671875, -0.68267822265625, -0.6627197265625, -0.64276123046875, -0.622802734375, -0.60284423828125, -0.5828857421875, -0.56292724609375, -0.54296875, -0.52301025390625, -0.5030517578125, -0.48309326171875, -0.463134765625, -0.44317626953125, -0.4232177734375, -0.40325927734375, -0.38330078125, -0.36334228515625, -0.3433837890625, -0.32342529296875, -0.303466796875, -0.28350830078125, -0.2635498046875, -0.24359130859375, -0.2236328125, -0.20367431640625, -0.1837158203125, -0.16375732421875, -0.143798828125, -0.12384033203125, -0.1038818359375, -0.08392333984375, -0.06396484375, -0.04400634765625, -0.0240478515625, -0.00408935546875, 0.015869140625, 0.03582763671875, 0.0557861328125, 0.07574462890625, 0.095703125, 0.11566162109375, 0.1356201171875, 0.15557861328125, 0.175537109375, 0.19549560546875, 0.2154541015625, 0.23541259765625, 0.25537109375, 0.27532958984375, 0.2952880859375, 0.31524658203125, 0.335205078125, 0.35516357421875, 0.3751220703125, 0.39508056640625, 0.4150390625, 0.43499755859375, 0.4549560546875, 0.47491455078125, 0.494873046875, 0.51483154296875, 0.5347900390625, 0.55474853515625, 0.57470703125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 9.0, 14.0, 10.0, 15.0, 18.0, 14.0, 49.0, 49.0, 85.0, 164.0, 216.0, 415.0, 661.0, 730.0, 568.0, 400.0, 250.0, 130.0, 70.0, 51.0, 31.0, 26.0, 15.0, 13.0, 18.0, 9.0, 11.0, 3.0, 2.0, 6.0, 2.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-0.359375, -0.3482704162597656, -0.33716583251953125, -0.3260612487792969, -0.3149566650390625, -0.3038520812988281, -0.29274749755859375, -0.2816429138183594, -0.270538330078125, -0.2594337463378906, -0.24832916259765625, -0.23722457885742188, -0.2261199951171875, -0.21501541137695312, -0.20391082763671875, -0.19280624389648438, -0.18170166015625, -0.17059707641601562, -0.15949249267578125, -0.14838790893554688, -0.1372833251953125, -0.12617874145507812, -0.11507415771484375, -0.10396957397460938, -0.092864990234375, -0.08176040649414062, -0.07065582275390625, -0.059551239013671875, -0.0484466552734375, -0.037342071533203125, -0.02623748779296875, -0.015132904052734375, -0.0040283203125, 0.007076263427734375, 0.01818084716796875, 0.029285430908203125, 0.0403900146484375, 0.051494598388671875, 0.06259918212890625, 0.07370376586914062, 0.084808349609375, 0.09591293334960938, 0.10701751708984375, 0.11812210083007812, 0.1292266845703125, 0.14033126831054688, 0.15143585205078125, 0.16254043579101562, 0.17364501953125, 0.18474960327148438, 0.19585418701171875, 0.20695877075195312, 0.2180633544921875, 0.22916793823242188, 0.24027252197265625, 0.2513771057128906, 0.262481689453125, 0.2735862731933594, 0.28469085693359375, 0.2957954406738281, 0.3069000244140625, 0.3180046081542969, 0.32910919189453125, 0.3402137756347656, 0.351318359375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 7.0, 6.0, 28.0, 76.0, 152.0, 253.0, 219.0, 124.0, 66.0, 18.0, 9.0, 4.0, 6.0, 8.0, 3.0, 0.0, 6.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.645571231842041, -4.503230571746826, -4.360889911651611, -4.218548774719238, -4.076208114624023, -3.9338674545288086, -3.7915267944335938, -3.649186134338379, -3.506845235824585, -3.36450457572937, -3.222163677215576, -3.0798230171203613, -2.9374823570251465, -2.7951414585113525, -2.6528007984161377, -2.5104598999023438, -2.368119239807129, -2.225778579711914, -2.08343768119812, -1.9410970211029053, -1.7987562417984009, -1.6564154624938965, -1.5140748023986816, -1.3717340230941772, -1.2293932437896729, -1.0870524644851685, -0.9447117447853088, -0.8023710250854492, -0.6600302457809448, -0.5176894664764404, -0.3753487467765808, -0.2330080270767212, -0.0906672477722168, 0.05167350172996521, 0.19401425123214722, 0.3363550007343292, 0.47869575023651123, 0.6210365295410156, 0.7633772492408752, 0.9057179689407349, 1.0480587482452393, 1.1903995275497437, 1.332740306854248, 1.475080966949463, 1.6174217462539673, 1.7597625255584717, 1.9021031856536865, 2.0444440841674805, 2.1867847442626953, 2.32912540435791, 2.471466302871704, 2.613806962966919, 2.756147861480713, 2.8984885215759277, 3.0408291816711426, 3.1831698417663574, 3.3255107402801514, 3.467851400375366, 3.61019229888916, 3.752532958984375, 3.89487361907959, 4.037214279174805, 4.179555416107178, 4.321896076202393, 4.464236736297607]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 2.0, 8.0, 6.0, 7.0, 7.0, 11.0, 13.0, 13.0, 16.0, 15.0, 18.0, 26.0, 29.0, 26.0, 41.0, 30.0, 31.0, 38.0, 50.0, 41.0, 42.0, 40.0, 46.0, 51.0, 44.0, 33.0, 34.0, 39.0, 36.0, 29.0, 32.0, 23.0, 17.0, 16.0, 18.0, 17.0, 6.0, 6.0, 7.0, 7.0, 3.0, 8.0, 6.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-1.4055123329162598, -1.3603719472885132, -1.3152316808700562, -1.2700912952423096, -1.224950909614563, -1.1798105239868164, -1.1346702575683594, -1.0895298719406128, -1.0443894863128662, -0.9992491602897644, -0.9541087746620178, -0.908968448638916, -0.8638280630111694, -0.8186877369880676, -0.7735474109649658, -0.7284070253372192, -0.6832666993141174, -0.6381263732910156, -0.592985987663269, -0.5478456616401672, -0.5027052760124207, -0.45756494998931885, -0.41242459416389465, -0.36728423833847046, -0.32214388251304626, -0.27700352668762207, -0.23186317086219788, -0.18672282993793488, -0.14158247411251068, -0.09644211828708649, -0.051301777362823486, -0.006161421537399292, 0.0389789342880249, 0.0841192901134491, 0.1292596459388733, 0.1743999868631363, 0.21954034268856049, 0.2646806836128235, 0.3098210394382477, 0.3549613952636719, 0.40010175108909607, 0.44524210691452026, 0.49038246273994446, 0.5355228185653687, 0.5806631445884705, 0.625803530216217, 0.6709438562393188, 0.7160842418670654, 0.7612245678901672, 0.806364893913269, 0.8515052795410156, 0.8966456055641174, 0.941785991191864, 0.9869263172149658, 1.0320667028427124, 1.077207088470459, 1.122347354888916, 1.1674877405166626, 1.2126280069351196, 1.2577683925628662, 1.3029087781906128, 1.3480491638183594, 1.3931894302368164, 1.438329815864563, 1.4834702014923096]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 7.0, 7.0, 18.0, 30.0, 57.0, 79.0, 135.0, 212.0, 429.0, 900.0, 1945.0, 5089.0, 16827.0, 70095.0, 329515.0, 466711.0, 117927.0, 26229.0, 7362.0, 2641.0, 1093.0, 558.0, 273.0, 164.0, 86.0, 55.0, 33.0, 19.0, 17.0, 11.0, 11.0, 7.0, 7.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45166015625, -0.4371681213378906, -0.42267608642578125, -0.4081840515136719, -0.3936920166015625, -0.3791999816894531, -0.36470794677734375, -0.3502159118652344, -0.335723876953125, -0.3212318420410156, -0.30673980712890625, -0.2922477722167969, -0.2777557373046875, -0.2632637023925781, -0.24877166748046875, -0.23427963256835938, -0.21978759765625, -0.20529556274414062, -0.19080352783203125, -0.17631149291992188, -0.1618194580078125, -0.14732742309570312, -0.13283538818359375, -0.11834335327148438, -0.103851318359375, -0.08935928344726562, -0.07486724853515625, -0.060375213623046875, -0.0458831787109375, -0.031391143798828125, -0.01689910888671875, -0.002407073974609375, 0.0120849609375, 0.026576995849609375, 0.04106903076171875, 0.055561065673828125, 0.0700531005859375, 0.08454513549804688, 0.09903717041015625, 0.11352920532226562, 0.128021240234375, 0.14251327514648438, 0.15700531005859375, 0.17149734497070312, 0.1859893798828125, 0.20048141479492188, 0.21497344970703125, 0.22946548461914062, 0.24395751953125, 0.2584495544433594, 0.27294158935546875, 0.2874336242675781, 0.3019256591796875, 0.3164176940917969, 0.33090972900390625, 0.3454017639160156, 0.359893798828125, 0.3743858337402344, 0.38887786865234375, 0.4033699035644531, 0.4178619384765625, 0.4323539733886719, 0.44684600830078125, 0.4613380432128906, 0.475830078125]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 8.0, 13.0, 14.0, 17.0, 23.0, 36.0, 37.0, 67.0, 68.0, 92.0, 79.0, 78.0, 86.0, 43.0, 63.0, 66.0, 47.0, 37.0, 28.0, 30.0, 18.0, 14.0, 9.0, 14.0, 6.0, 6.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.44189453125, -0.4307861328125, -0.419677734375, -0.4085693359375, -0.3974609375, -0.3863525390625, -0.375244140625, -0.3641357421875, -0.35302734375, -0.3419189453125, -0.330810546875, -0.3197021484375, -0.30859375, -0.2974853515625, -0.286376953125, -0.2752685546875, -0.26416015625, -0.2530517578125, -0.241943359375, -0.2308349609375, -0.2197265625, -0.2086181640625, -0.197509765625, -0.1864013671875, -0.17529296875, -0.1641845703125, -0.153076171875, -0.1419677734375, -0.130859375, -0.1197509765625, -0.108642578125, -0.0975341796875, -0.08642578125, -0.0753173828125, -0.064208984375, -0.0531005859375, -0.0419921875, -0.0308837890625, -0.019775390625, -0.0086669921875, 0.00244140625, 0.0135498046875, 0.024658203125, 0.0357666015625, 0.046875, 0.0579833984375, 0.069091796875, 0.0802001953125, 0.09130859375, 0.1024169921875, 0.113525390625, 0.1246337890625, 0.1357421875, 0.1468505859375, 0.157958984375, 0.1690673828125, 0.18017578125, 0.1912841796875, 0.202392578125, 0.2135009765625, 0.224609375, 0.2357177734375, 0.246826171875, 0.2579345703125, 0.26904296875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 7.0, 6.0, 11.0, 5.0, 13.0, 20.0, 15.0, 23.0, 55.0, 77.0, 120.0, 197.0, 493.0, 1289.0, 4521.0, 22773.0, 176302.0, 722752.0, 100403.0, 14334.0, 3248.0, 1019.0, 351.0, 183.0, 112.0, 69.0, 36.0, 27.0, 25.0, 20.0, 9.0, 10.0, 10.0, 5.0, 4.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.6650390625, -0.645111083984375, -0.62518310546875, -0.605255126953125, -0.5853271484375, -0.565399169921875, -0.54547119140625, -0.525543212890625, -0.505615234375, -0.485687255859375, -0.46575927734375, -0.445831298828125, -0.4259033203125, -0.405975341796875, -0.38604736328125, -0.366119384765625, -0.34619140625, -0.326263427734375, -0.30633544921875, -0.286407470703125, -0.2664794921875, -0.246551513671875, -0.22662353515625, -0.206695556640625, -0.186767578125, -0.166839599609375, -0.14691162109375, -0.126983642578125, -0.1070556640625, -0.087127685546875, -0.06719970703125, -0.047271728515625, -0.02734375, -0.007415771484375, 0.01251220703125, 0.032440185546875, 0.0523681640625, 0.072296142578125, 0.09222412109375, 0.112152099609375, 0.132080078125, 0.152008056640625, 0.17193603515625, 0.191864013671875, 0.2117919921875, 0.231719970703125, 0.25164794921875, 0.271575927734375, 0.29150390625, 0.311431884765625, 0.33135986328125, 0.351287841796875, 0.3712158203125, 0.391143798828125, 0.41107177734375, 0.430999755859375, 0.450927734375, 0.470855712890625, 0.49078369140625, 0.510711669921875, 0.5306396484375, 0.550567626953125, 0.57049560546875, 0.590423583984375, 0.6103515625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 3.0, 7.0, 4.0, 3.0, 7.0, 12.0, 13.0, 16.0, 19.0, 26.0, 24.0, 46.0, 37.0, 40.0, 52.0, 61.0, 34.0, 55.0, 59.0, 49.0, 60.0, 49.0, 57.0, 51.0, 39.0, 29.0, 35.0, 32.0, 18.0, 23.0, 10.0, 10.0, 11.0, 4.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.9365234375, -0.90771484375, -0.87890625, -0.85009765625, -0.8212890625, -0.79248046875, -0.763671875, -0.73486328125, -0.7060546875, -0.67724609375, -0.6484375, -0.61962890625, -0.5908203125, -0.56201171875, -0.533203125, -0.50439453125, -0.4755859375, -0.44677734375, -0.41796875, -0.38916015625, -0.3603515625, -0.33154296875, -0.302734375, -0.27392578125, -0.2451171875, -0.21630859375, -0.1875, -0.15869140625, -0.1298828125, -0.10107421875, -0.072265625, -0.04345703125, -0.0146484375, 0.01416015625, 0.04296875, 0.07177734375, 0.1005859375, 0.12939453125, 0.158203125, 0.18701171875, 0.2158203125, 0.24462890625, 0.2734375, 0.30224609375, 0.3310546875, 0.35986328125, 0.388671875, 0.41748046875, 0.4462890625, 0.47509765625, 0.50390625, 0.53271484375, 0.5615234375, 0.59033203125, 0.619140625, 0.64794921875, 0.6767578125, 0.70556640625, 0.734375, 0.76318359375, 0.7919921875, 0.82080078125, 0.849609375, 0.87841796875, 0.9072265625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 8.0, 10.0, 14.0, 39.0, 100.0, 238.0, 837.0, 3923.0, 25942.0, 627158.0, 363545.0, 22097.0, 3415.0, 837.0, 230.0, 93.0, 38.0, 19.0, 8.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3486328125, -0.33866119384765625, -0.3286895751953125, -0.31871795654296875, -0.308746337890625, -0.29877471923828125, -0.2888031005859375, -0.27883148193359375, -0.26885986328125, -0.25888824462890625, -0.2489166259765625, -0.23894500732421875, -0.228973388671875, -0.21900177001953125, -0.2090301513671875, -0.19905853271484375, -0.1890869140625, -0.17911529541015625, -0.1691436767578125, -0.15917205810546875, -0.149200439453125, -0.13922882080078125, -0.1292572021484375, -0.11928558349609375, -0.10931396484375, -0.09934234619140625, -0.0893707275390625, -0.07939910888671875, -0.069427490234375, -0.05945587158203125, -0.0494842529296875, -0.03951263427734375, -0.029541015625, -0.01956939697265625, -0.0095977783203125, 0.00037384033203125, 0.010345458984375, 0.02031707763671875, 0.0302886962890625, 0.04026031494140625, 0.05023193359375, 0.06020355224609375, 0.0701751708984375, 0.08014678955078125, 0.090118408203125, 0.10009002685546875, 0.1100616455078125, 0.12003326416015625, 0.1300048828125, 0.13997650146484375, 0.1499481201171875, 0.15991973876953125, 0.169891357421875, 0.17986297607421875, 0.1898345947265625, 0.19980621337890625, 0.20977783203125, 0.21974945068359375, 0.2297210693359375, 0.23969268798828125, 0.249664306640625, 0.25963592529296875, 0.2696075439453125, 0.27957916259765625, 0.28955078125]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 9.0, 12.0, 18.0, 39.0, 65.0, 128.0, 182.0, 192.0, 147.0, 94.0, 49.0, 18.0, 17.0, 8.0, 3.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.840726852416992e-05, -9.588897228240967e-05, -9.337067604064941e-05, -9.085237979888916e-05, -8.83340835571289e-05, -8.581578731536865e-05, -8.32974910736084e-05, -8.077919483184814e-05, -7.826089859008789e-05, -7.574260234832764e-05, -7.322430610656738e-05, -7.070600986480713e-05, -6.818771362304688e-05, -6.566941738128662e-05, -6.315112113952637e-05, -6.063282489776611e-05, -5.811452865600586e-05, -5.5596232414245605e-05, -5.307793617248535e-05, -5.05596399307251e-05, -4.8041343688964844e-05, -4.552304744720459e-05, -4.3004751205444336e-05, -4.048645496368408e-05, -3.796815872192383e-05, -3.5449862480163574e-05, -3.293156623840332e-05, -3.0413269996643066e-05, -2.7894973754882812e-05, -2.537667751312256e-05, -2.2858381271362305e-05, -2.034008502960205e-05, -1.7821788787841797e-05, -1.5303492546081543e-05, -1.2785196304321289e-05, -1.0266900062561035e-05, -7.748603820800781e-06, -5.230307579040527e-06, -2.7120113372802734e-06, -1.9371509552001953e-07, 2.3245811462402344e-06, 4.842877388000488e-06, 7.361173629760742e-06, 9.879469871520996e-06, 1.239776611328125e-05, 1.4916062355041504e-05, 1.7434358596801758e-05, 1.9952654838562012e-05, 2.2470951080322266e-05, 2.498924732208252e-05, 2.7507543563842773e-05, 3.0025839805603027e-05, 3.254413604736328e-05, 3.5062432289123535e-05, 3.758072853088379e-05, 4.009902477264404e-05, 4.26173210144043e-05, 4.513561725616455e-05, 4.7653913497924805e-05, 5.017220973968506e-05, 5.269050598144531e-05, 5.5208802223205566e-05, 5.772709846496582e-05, 6.0245394706726074e-05, 6.276369094848633e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 9.0, 16.0, 29.0, 85.0, 220.0, 806.0, 4964.0, 84317.0, 910197.0, 43711.0, 3308.0, 553.0, 189.0, 71.0, 41.0, 17.0, 13.0, 8.0, 1.0, 0.0, 4.0, 0.0, 2.0], "bins": [-0.64697265625, -0.6338768005371094, -0.6207809448242188, -0.6076850891113281, -0.5945892333984375, -0.5814933776855469, -0.5683975219726562, -0.5553016662597656, -0.542205810546875, -0.5291099548339844, -0.5160140991210938, -0.5029182434082031, -0.4898223876953125, -0.4767265319824219, -0.46363067626953125, -0.4505348205566406, -0.43743896484375, -0.4243431091308594, -0.41124725341796875, -0.3981513977050781, -0.3850555419921875, -0.3719596862792969, -0.35886383056640625, -0.3457679748535156, -0.332672119140625, -0.3195762634277344, -0.30648040771484375, -0.2933845520019531, -0.2802886962890625, -0.2671928405761719, -0.25409698486328125, -0.24100112915039062, -0.2279052734375, -0.21480941772460938, -0.20171356201171875, -0.18861770629882812, -0.1755218505859375, -0.16242599487304688, -0.14933013916015625, -0.13623428344726562, -0.123138427734375, -0.11004257202148438, -0.09694671630859375, -0.08385086059570312, -0.0707550048828125, -0.057659149169921875, -0.04456329345703125, -0.031467437744140625, -0.01837158203125, -0.005275726318359375, 0.00782012939453125, 0.020915985107421875, 0.0340118408203125, 0.047107696533203125, 0.06020355224609375, 0.07329940795898438, 0.086395263671875, 0.09949111938476562, 0.11258697509765625, 0.12568283081054688, 0.1387786865234375, 0.15187454223632812, 0.16497039794921875, 0.17806625366210938, 0.191162109375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 2.0, 5.0, 5.0, 4.0, 15.0, 12.0, 19.0, 30.0, 46.0, 50.0, 63.0, 87.0, 119.0, 126.0, 108.0, 83.0, 56.0, 39.0, 38.0, 22.0, 17.0, 13.0, 8.0, 8.0, 7.0, 7.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.159912109375, -0.15304183959960938, -0.14617156982421875, -0.13930130004882812, -0.1324310302734375, -0.12556076049804688, -0.11869049072265625, -0.11182022094726562, -0.104949951171875, -0.09807968139648438, -0.09120941162109375, -0.08433914184570312, -0.0774688720703125, -0.07059860229492188, -0.06372833251953125, -0.056858062744140625, -0.04998779296875, -0.043117523193359375, -0.03624725341796875, -0.029376983642578125, -0.0225067138671875, -0.015636444091796875, -0.00876617431640625, -0.001895904541015625, 0.004974365234375, 0.011844635009765625, 0.01871490478515625, 0.025585174560546875, 0.0324554443359375, 0.039325714111328125, 0.04619598388671875, 0.053066253662109375, 0.0599365234375, 0.06680679321289062, 0.07367706298828125, 0.08054733276367188, 0.0874176025390625, 0.09428787231445312, 0.10115814208984375, 0.10802841186523438, 0.114898681640625, 0.12176895141601562, 0.12863922119140625, 0.13550949096679688, 0.1423797607421875, 0.14925003051757812, 0.15612030029296875, 0.16299057006835938, 0.16986083984375, 0.17673110961914062, 0.18360137939453125, 0.19047164916992188, 0.1973419189453125, 0.20421218872070312, 0.21108245849609375, 0.21795272827148438, 0.224822998046875, 0.23169326782226562, 0.23856353759765625, 0.24543380737304688, 0.2523040771484375, 0.2591743469238281, 0.26604461669921875, 0.2729148864746094, 0.27978515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 12.0, 11.0, 25.0, 73.0, 135.0, 342.0, 231.0, 107.0, 29.0, 13.0, 10.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.509293556213379, -7.320627212524414, -7.131961345672607, -6.943295001983643, -6.754628658294678, -6.565962791442871, -6.377296447753906, -6.188630104064941, -5.999963760375977, -5.811297416687012, -5.622631549835205, -5.43396520614624, -5.245298862457275, -5.056632995605469, -4.867966651916504, -4.679300308227539, -4.490634441375732, -4.301968097686768, -4.113302230834961, -3.924635887145996, -3.7359695434570312, -3.5473034381866455, -3.3586373329162598, -3.169970989227295, -2.981304883956909, -2.7926387786865234, -2.6039724349975586, -2.415306329727173, -2.226640224456787, -2.0379738807678223, -1.8493077754974365, -1.6606415510177612, -1.471975326538086, -1.2833091020584106, -1.0946428775787354, -0.9059767723083496, -0.7173105478286743, -0.528644323348999, -0.3399782180786133, -0.151311993598938, 0.037354230880737305, 0.2260204255580902, 0.4146866202354431, 0.6033527851104736, 0.7920190095901489, 0.9806852340698242, 1.16935133934021, 1.3580175638198853, 1.5466837882995605, 1.7353500127792358, 1.9240162372589111, 2.112682342529297, 2.3013486862182617, 2.4900147914886475, 2.678680896759033, 2.867347240447998, 3.056013345718384, 3.2446794509887695, 3.4333457946777344, 3.62201189994812, 3.810678005218506, 3.9993443489074707, 4.188010215759277, 4.376676559448242, 4.565342903137207]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 1.0, 8.0, 9.0, 6.0, 11.0, 12.0, 15.0, 21.0, 9.0, 32.0, 26.0, 28.0, 32.0, 31.0, 32.0, 45.0, 50.0, 85.0, 62.0, 54.0, 56.0, 50.0, 38.0, 39.0, 38.0, 23.0, 23.0, 25.0, 20.0, 19.0, 12.0, 19.0, 10.0, 9.0, 10.0, 7.0, 6.0, 6.0, 5.0, 4.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.7817845344543457, -2.687992572784424, -2.594200849533081, -2.500408887863159, -2.4066169261932373, -2.3128252029418945, -2.2190332412719727, -2.125241279602051, -2.031449317932129, -1.9376574754714966, -1.8438655138015747, -1.7500736713409424, -1.6562817096710205, -1.5624898672103882, -1.4686980247497559, -1.374906063079834, -1.2811143398284912, -1.1873224973678589, -1.093530535697937, -0.9997386932373047, -0.9059467911720276, -0.8121548891067505, -0.7183630466461182, -0.6245711445808411, -0.530779242515564, -0.43698734045028687, -0.34319546818733215, -0.24940359592437744, -0.15561169385910034, -0.06181979179382324, 0.03197205066680908, 0.12576395273208618, 0.21955561637878418, 0.3133475184440613, 0.407139390707016, 0.5009312629699707, 0.5947231650352478, 0.6885150671005249, 0.7823069095611572, 0.8760988116264343, 0.9698907136917114, 1.0636825561523438, 1.1574745178222656, 1.251266360282898, 1.3450582027435303, 1.4388501644134521, 1.5326420068740845, 1.6264338493347168, 1.7202258110046387, 1.814017653465271, 1.9078096151351929, 2.001601457595825, 2.095393419265747, 2.18918514251709, 2.2829771041870117, 2.3767690658569336, 2.4705610275268555, 2.5643529891967773, 2.65814471244812, 2.751936674118042, 2.845728635787964, 2.9395203590393066, 3.0333123207092285, 3.1271042823791504, 3.220896005630493]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 10.0, 15.0, 17.0, 30.0, 39.0, 80.0, 146.0, 257.0, 641.0, 1567.0, 4711.0, 22805.0, 248263.0, 3074168.0, 775774.0, 51850.0, 9573.0, 2636.0, 944.0, 386.0, 181.0, 77.0, 38.0, 23.0, 18.0, 3.0, 2.0, 2.0, 7.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.4921875, -0.4809226989746094, -0.46965789794921875, -0.4583930969238281, -0.4471282958984375, -0.4358634948730469, -0.42459869384765625, -0.4133338928222656, -0.402069091796875, -0.3908042907714844, -0.37953948974609375, -0.3682746887207031, -0.3570098876953125, -0.3457450866699219, -0.33448028564453125, -0.3232154846191406, -0.31195068359375, -0.3006858825683594, -0.28942108154296875, -0.2781562805175781, -0.2668914794921875, -0.2556266784667969, -0.24436187744140625, -0.23309707641601562, -0.221832275390625, -0.21056747436523438, -0.19930267333984375, -0.18803787231445312, -0.1767730712890625, -0.16550827026367188, -0.15424346923828125, -0.14297866821289062, -0.1317138671875, -0.12044906616210938, -0.10918426513671875, -0.09791946411132812, -0.0866546630859375, -0.07538986206054688, -0.06412506103515625, -0.052860260009765625, -0.041595458984375, -0.030330657958984375, -0.01906585693359375, -0.007801055908203125, 0.0034637451171875, 0.014728546142578125, 0.02599334716796875, 0.037258148193359375, 0.04852294921875, 0.059787750244140625, 0.07105255126953125, 0.08231735229492188, 0.0935821533203125, 0.10484695434570312, 0.11611175537109375, 0.12737655639648438, 0.138641357421875, 0.14990615844726562, 0.16117095947265625, 0.17243576049804688, 0.1837005615234375, 0.19496536254882812, 0.20623016357421875, 0.21749496459960938, 0.228759765625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 7.0, 11.0, 14.0, 24.0, 36.0, 32.0, 35.0, 58.0, 58.0, 77.0, 92.0, 64.0, 76.0, 79.0, 65.0, 64.0, 52.0, 45.0, 20.0, 24.0, 25.0, 11.0, 8.0, 6.0, 10.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.4423828125, -0.4312477111816406, -0.42011260986328125, -0.4089775085449219, -0.3978424072265625, -0.3867073059082031, -0.37557220458984375, -0.3644371032714844, -0.353302001953125, -0.3421669006347656, -0.33103179931640625, -0.3198966979980469, -0.3087615966796875, -0.2976264953613281, -0.28649139404296875, -0.2753562927246094, -0.26422119140625, -0.2530860900878906, -0.24195098876953125, -0.23081588745117188, -0.2196807861328125, -0.20854568481445312, -0.19741058349609375, -0.18627548217773438, -0.175140380859375, -0.16400527954101562, -0.15287017822265625, -0.14173507690429688, -0.1305999755859375, -0.11946487426757812, -0.10832977294921875, -0.09719467163085938, -0.0860595703125, -0.07492446899414062, -0.06378936767578125, -0.052654266357421875, -0.0415191650390625, -0.030384063720703125, -0.01924896240234375, -0.008113861083984375, 0.003021240234375, 0.014156341552734375, 0.02529144287109375, 0.036426544189453125, 0.0475616455078125, 0.058696746826171875, 0.06983184814453125, 0.08096694946289062, 0.09210205078125, 0.10323715209960938, 0.11437225341796875, 0.12550735473632812, 0.1366424560546875, 0.14777755737304688, 0.15891265869140625, 0.17004776000976562, 0.181182861328125, 0.19231796264648438, 0.20345306396484375, 0.21458816528320312, 0.2257232666015625, 0.23685836791992188, 0.24799346923828125, 0.2591285705566406, 0.270263671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 13.0, 20.0, 29.0, 52.0, 75.0, 157.0, 388.0, 1133.0, 6598.0, 204461.0, 3936347.0, 40485.0, 3208.0, 793.0, 284.0, 101.0, 60.0, 24.0, 17.0, 11.0, 10.0, 9.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68212890625, -0.6562042236328125, -0.630279541015625, -0.6043548583984375, -0.57843017578125, -0.5525054931640625, -0.526580810546875, -0.5006561279296875, -0.4747314453125, -0.4488067626953125, -0.422882080078125, -0.3969573974609375, -0.37103271484375, -0.3451080322265625, -0.319183349609375, -0.2932586669921875, -0.267333984375, -0.2414093017578125, -0.215484619140625, -0.1895599365234375, -0.16363525390625, -0.1377105712890625, -0.111785888671875, -0.0858612060546875, -0.0599365234375, -0.0340118408203125, -0.008087158203125, 0.0178375244140625, 0.04376220703125, 0.0696868896484375, 0.095611572265625, 0.1215362548828125, 0.1474609375, 0.1733856201171875, 0.199310302734375, 0.2252349853515625, 0.25115966796875, 0.2770843505859375, 0.303009033203125, 0.3289337158203125, 0.3548583984375, 0.3807830810546875, 0.406707763671875, 0.4326324462890625, 0.45855712890625, 0.4844818115234375, 0.510406494140625, 0.5363311767578125, 0.562255859375, 0.5881805419921875, 0.614105224609375, 0.6400299072265625, 0.66595458984375, 0.6918792724609375, 0.717803955078125, 0.7437286376953125, 0.7696533203125, 0.7955780029296875, 0.821502685546875, 0.8474273681640625, 0.87335205078125, 0.8992767333984375, 0.925201416015625, 0.9511260986328125, 0.97705078125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 10.0, 16.0, 21.0, 26.0, 56.0, 87.0, 193.0, 420.0, 835.0, 1070.0, 664.0, 294.0, 147.0, 76.0, 55.0, 33.0, 20.0, 16.0, 5.0, 8.0, 4.0, 4.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.494140625, -0.4783477783203125, -0.462554931640625, -0.4467620849609375, -0.43096923828125, -0.4151763916015625, -0.399383544921875, -0.3835906982421875, -0.3677978515625, -0.3520050048828125, -0.336212158203125, -0.3204193115234375, -0.30462646484375, -0.2888336181640625, -0.273040771484375, -0.2572479248046875, -0.241455078125, -0.2256622314453125, -0.209869384765625, -0.1940765380859375, -0.17828369140625, -0.1624908447265625, -0.146697998046875, -0.1309051513671875, -0.1151123046875, -0.0993194580078125, -0.083526611328125, -0.0677337646484375, -0.05194091796875, -0.0361480712890625, -0.020355224609375, -0.0045623779296875, 0.01123046875, 0.0270233154296875, 0.042816162109375, 0.0586090087890625, 0.07440185546875, 0.0901947021484375, 0.105987548828125, 0.1217803955078125, 0.1375732421875, 0.1533660888671875, 0.169158935546875, 0.1849517822265625, 0.20074462890625, 0.2165374755859375, 0.232330322265625, 0.2481231689453125, 0.263916015625, 0.2797088623046875, 0.295501708984375, 0.3112945556640625, 0.32708740234375, 0.3428802490234375, 0.358673095703125, 0.3744659423828125, 0.3902587890625, 0.4060516357421875, 0.421844482421875, 0.4376373291015625, 0.45343017578125, 0.4692230224609375, 0.485015869140625, 0.5008087158203125, 0.5166015625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 5.0, 15.0, 16.0, 34.0, 126.0, 240.0, 304.0, 169.0, 63.0, 17.0, 9.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.195561170578003, -3.027519702911377, -2.85947847366333, -2.691437244415283, -2.5233957767486572, -2.3553543090820312, -2.1873130798339844, -2.0192718505859375, -1.8512303829193115, -1.683189034461975, -1.5151476860046387, -1.3471063375473022, -1.1790649890899658, -1.0110236406326294, -0.842982292175293, -0.6749409437179565, -0.5068995952606201, -0.3388582468032837, -0.17081689834594727, -0.00277554988861084, 0.16526579856872559, 0.333307147026062, 0.5013484954833984, 0.6693898439407349, 0.8374311923980713, 1.0054725408554077, 1.1735138893127441, 1.3415552377700806, 1.509596586227417, 1.6776379346847534, 1.8456792831420898, 2.0137205123901367, 2.1817617416381836, 2.3498029708862305, 2.5178444385528564, 2.6858859062194824, 2.8539271354675293, 3.021968364715576, 3.190009832382202, 3.358051300048828, 3.526092529296875, 3.694133758544922, 3.862175226211548, 4.030216693878174, 4.198257923126221, 4.366299152374268, 4.534340858459473, 4.7023820877075195, 4.870423316955566, 5.038464546203613, 5.20650577545166, 5.374547481536865, 5.542588710784912, 5.710629940032959, 5.878671646118164, 6.046712875366211, 6.214754104614258, 6.382795333862305, 6.550836563110352, 6.718878269195557, 6.8869194984436035, 7.05496072769165, 7.2230024337768555, 7.391043663024902, 7.559084892272949]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 3.0, 2.0, 2.0, 11.0, 3.0, 8.0, 8.0, 11.0, 10.0, 9.0, 11.0, 22.0, 20.0, 28.0, 28.0, 19.0, 36.0, 16.0, 37.0, 38.0, 35.0, 48.0, 64.0, 49.0, 43.0, 39.0, 41.0, 44.0, 42.0, 38.0, 26.0, 34.0, 22.0, 22.0, 21.0, 21.0, 18.0, 20.0, 13.0, 7.0, 9.0, 9.0, 5.0, 5.0, 2.0, 2.0, 1.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.5893402099609375, -1.5412148237228394, -1.4930894374847412, -1.4449641704559326, -1.3968387842178345, -1.3487133979797363, -1.3005880117416382, -1.25246262550354, -1.2043373584747314, -1.1562119722366333, -1.1080865859985352, -1.0599613189697266, -1.0118359327316284, -0.9637105464935303, -0.9155851602554321, -0.867459774017334, -0.8193343877792358, -0.7712090015411377, -0.7230836749076843, -0.6749582886695862, -0.6268329620361328, -0.5787075757980347, -0.5305821895599365, -0.48245683312416077, -0.434331476688385, -0.38620612025260925, -0.3380807638168335, -0.28995537757873535, -0.2418300211429596, -0.19370466470718384, -0.1455792784690857, -0.09745392203330994, -0.04932856559753418, -0.001203201711177826, 0.04692216217517853, 0.09504753351211548, 0.14317288994789124, 0.191298246383667, 0.23942363262176514, 0.2875489890575409, 0.33567434549331665, 0.3837997019290924, 0.43192505836486816, 0.4800504446029663, 0.5281758308410645, 0.5763011574745178, 0.624426543712616, 0.6725518703460693, 0.7206772565841675, 0.7688026428222656, 0.816927969455719, 0.8650533556938171, 0.9131786823272705, 0.9613040685653687, 1.0094294548034668, 1.057554841041565, 1.105680227279663, 1.1538056135177612, 1.2019309997558594, 1.250056266784668, 1.2981816530227661, 1.3463070392608643, 1.3944324254989624, 1.4425578117370605, 1.4906830787658691]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 2.0, 3.0, 7.0, 9.0, 18.0, 26.0, 31.0, 66.0, 115.0, 187.0, 414.0, 770.0, 1824.0, 4886.0, 15485.0, 59653.0, 291319.0, 507328.0, 124441.0, 28598.0, 8274.0, 2850.0, 1139.0, 508.0, 253.0, 150.0, 70.0, 54.0, 29.0, 19.0, 11.0, 9.0, 8.0, 4.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.54248046875, -0.5279121398925781, -0.5133438110351562, -0.4987754821777344, -0.4842071533203125, -0.4696388244628906, -0.45507049560546875, -0.4405021667480469, -0.425933837890625, -0.4113655090332031, -0.39679718017578125, -0.3822288513183594, -0.3676605224609375, -0.3530921936035156, -0.33852386474609375, -0.3239555358886719, -0.30938720703125, -0.2948188781738281, -0.28025054931640625, -0.2656822204589844, -0.2511138916015625, -0.23654556274414062, -0.22197723388671875, -0.20740890502929688, -0.192840576171875, -0.17827224731445312, -0.16370391845703125, -0.14913558959960938, -0.1345672607421875, -0.11999893188476562, -0.10543060302734375, -0.09086227416992188, -0.0762939453125, -0.061725616455078125, -0.04715728759765625, -0.032588958740234375, -0.0180206298828125, -0.003452301025390625, 0.01111602783203125, 0.025684356689453125, 0.040252685546875, 0.054821014404296875, 0.06938934326171875, 0.08395767211914062, 0.0985260009765625, 0.11309432983398438, 0.12766265869140625, 0.14223098754882812, 0.15679931640625, 0.17136764526367188, 0.18593597412109375, 0.20050430297851562, 0.2150726318359375, 0.22964096069335938, 0.24420928955078125, 0.2587776184082031, 0.273345947265625, 0.2879142761230469, 0.30248260498046875, 0.3170509338378906, 0.3316192626953125, 0.3461875915527344, 0.36075592041015625, 0.3753242492675781, 0.389892578125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 5.0, 6.0, 13.0, 13.0, 19.0, 32.0, 26.0, 47.0, 58.0, 50.0, 84.0, 81.0, 68.0, 84.0, 62.0, 68.0, 60.0, 68.0, 48.0, 33.0, 21.0, 17.0, 11.0, 13.0, 5.0, 3.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.44140625, -0.43033599853515625, -0.4192657470703125, -0.40819549560546875, -0.397125244140625, -0.38605499267578125, -0.3749847412109375, -0.36391448974609375, -0.35284423828125, -0.34177398681640625, -0.3307037353515625, -0.31963348388671875, -0.308563232421875, -0.29749298095703125, -0.2864227294921875, -0.27535247802734375, -0.2642822265625, -0.25321197509765625, -0.2421417236328125, -0.23107147216796875, -0.220001220703125, -0.20893096923828125, -0.1978607177734375, -0.18679046630859375, -0.17572021484375, -0.16464996337890625, -0.1535797119140625, -0.14250946044921875, -0.131439208984375, -0.12036895751953125, -0.1092987060546875, -0.09822845458984375, -0.087158203125, -0.07608795166015625, -0.0650177001953125, -0.05394744873046875, -0.042877197265625, -0.03180694580078125, -0.0207366943359375, -0.00966644287109375, 0.00140380859375, 0.01247406005859375, 0.0235443115234375, 0.03461456298828125, 0.045684814453125, 0.05675506591796875, 0.0678253173828125, 0.07889556884765625, 0.0899658203125, 0.10103607177734375, 0.1121063232421875, 0.12317657470703125, 0.134246826171875, 0.14531707763671875, 0.1563873291015625, 0.16745758056640625, 0.17852783203125, 0.18959808349609375, 0.2006683349609375, 0.21173858642578125, 0.222808837890625, 0.23387908935546875, 0.2449493408203125, 0.25601959228515625, 0.26708984375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 6.0, 7.0, 6.0, 10.0, 7.0, 10.0, 16.0, 27.0, 48.0, 73.0, 99.0, 157.0, 249.0, 433.0, 796.0, 1832.0, 5260.0, 20084.0, 102847.0, 690132.0, 182536.0, 31521.0, 7644.0, 2411.0, 1049.0, 496.0, 286.0, 190.0, 103.0, 79.0, 55.0, 38.0, 16.0, 15.0, 7.0, 8.0, 2.0, 1.0, 1.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.453125, -0.43730926513671875, -0.4214935302734375, -0.40567779541015625, -0.389862060546875, -0.37404632568359375, -0.3582305908203125, -0.34241485595703125, -0.32659912109375, -0.31078338623046875, -0.2949676513671875, -0.27915191650390625, -0.263336181640625, -0.24752044677734375, -0.2317047119140625, -0.21588897705078125, -0.2000732421875, -0.18425750732421875, -0.1684417724609375, -0.15262603759765625, -0.136810302734375, -0.12099456787109375, -0.1051788330078125, -0.08936309814453125, -0.07354736328125, -0.05773162841796875, -0.0419158935546875, -0.02610015869140625, -0.010284423828125, 0.00553131103515625, 0.0213470458984375, 0.03716278076171875, 0.052978515625, 0.06879425048828125, 0.0846099853515625, 0.10042572021484375, 0.116241455078125, 0.13205718994140625, 0.1478729248046875, 0.16368865966796875, 0.17950439453125, 0.19532012939453125, 0.2111358642578125, 0.22695159912109375, 0.242767333984375, 0.25858306884765625, 0.2743988037109375, 0.29021453857421875, 0.3060302734375, 0.32184600830078125, 0.3376617431640625, 0.35347747802734375, 0.369293212890625, 0.38510894775390625, 0.4009246826171875, 0.41674041748046875, 0.43255615234375, 0.44837188720703125, 0.4641876220703125, 0.48000335693359375, 0.495819091796875, 0.5116348266601562, 0.5274505615234375, 0.5432662963867188, 0.55908203125]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 11.0, 8.0, 12.0, 11.0, 4.0, 13.0, 15.0, 27.0, 17.0, 20.0, 34.0, 35.0, 47.0, 47.0, 40.0, 51.0, 56.0, 60.0, 61.0, 59.0, 52.0, 44.0, 37.0, 39.0, 30.0, 31.0, 29.0, 22.0, 14.0, 16.0, 9.0, 10.0, 17.0, 2.0, 11.0, 4.0, 1.0, 2.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.72509765625, -0.6989593505859375, -0.672821044921875, -0.6466827392578125, -0.62054443359375, -0.5944061279296875, -0.568267822265625, -0.5421295166015625, -0.5159912109375, -0.4898529052734375, -0.463714599609375, -0.4375762939453125, -0.41143798828125, -0.3852996826171875, -0.359161376953125, -0.3330230712890625, -0.306884765625, -0.2807464599609375, -0.254608154296875, -0.2284698486328125, -0.20233154296875, -0.1761932373046875, -0.150054931640625, -0.1239166259765625, -0.0977783203125, -0.0716400146484375, -0.045501708984375, -0.0193634033203125, 0.00677490234375, 0.0329132080078125, 0.059051513671875, 0.0851898193359375, 0.111328125, 0.1374664306640625, 0.163604736328125, 0.1897430419921875, 0.21588134765625, 0.2420196533203125, 0.268157958984375, 0.2942962646484375, 0.3204345703125, 0.3465728759765625, 0.372711181640625, 0.3988494873046875, 0.42498779296875, 0.4511260986328125, 0.477264404296875, 0.5034027099609375, 0.529541015625, 0.5556793212890625, 0.581817626953125, 0.6079559326171875, 0.63409423828125, 0.6602325439453125, 0.686370849609375, 0.7125091552734375, 0.7386474609375, 0.7647857666015625, 0.790924072265625, 0.8170623779296875, 0.84320068359375, 0.8693389892578125, 0.895477294921875, 0.9216156005859375, 0.94775390625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 5.0, 10.0, 6.0, 29.0, 38.0, 39.0, 80.0, 162.0, 223.0, 451.0, 937.0, 1938.0, 4610.0, 11937.0, 37385.0, 154142.0, 684370.0, 107124.0, 28454.0, 9588.0, 3665.0, 1594.0, 770.0, 403.0, 237.0, 130.0, 80.0, 35.0, 32.0, 21.0, 17.0, 9.0, 9.0, 4.0, 3.0, 4.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.116943359375, -0.11233711242675781, -0.10773086547851562, -0.10312461853027344, -0.09851837158203125, -0.09391212463378906, -0.08930587768554688, -0.08469963073730469, -0.0800933837890625, -0.07548713684082031, -0.07088088989257812, -0.06627464294433594, -0.06166839599609375, -0.05706214904785156, -0.052455902099609375, -0.04784965515136719, -0.043243408203125, -0.03863716125488281, -0.034030914306640625, -0.029424667358398438, -0.02481842041015625, -0.020212173461914062, -0.015605926513671875, -0.010999679565429688, -0.0063934326171875, -0.0017871856689453125, 0.002819061279296875, 0.0074253082275390625, 0.01203155517578125, 0.016637802124023438, 0.021244049072265625, 0.025850296020507812, 0.03045654296875, 0.03506278991699219, 0.039669036865234375, 0.04427528381347656, 0.04888153076171875, 0.05348777770996094, 0.058094024658203125, 0.06270027160644531, 0.0673065185546875, 0.07191276550292969, 0.07651901245117188, 0.08112525939941406, 0.08573150634765625, 0.09033775329589844, 0.09494400024414062, 0.09955024719238281, 0.104156494140625, 0.10876274108886719, 0.11336898803710938, 0.11797523498535156, 0.12258148193359375, 0.12718772888183594, 0.13179397583007812, 0.1364002227783203, 0.1410064697265625, 0.1456127166748047, 0.15021896362304688, 0.15482521057128906, 0.15943145751953125, 0.16403770446777344, 0.16864395141601562, 0.1732501983642578, 0.1778564453125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 6.0, 3.0, 5.0, 7.0, 4.0, 10.0, 9.0, 10.0, 28.0, 24.0, 34.0, 32.0, 44.0, 49.0, 75.0, 96.0, 100.0, 98.0, 89.0, 63.0, 50.0, 43.0, 19.0, 15.0, 17.0, 9.0, 13.0, 7.0, 6.0, 8.0, 4.0, 3.0, 4.0, 8.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.559755325317383e-05, -4.428531974554062e-05, -4.297308623790741e-05, -4.16608527302742e-05, -4.034861922264099e-05, -3.903638571500778e-05, -3.772415220737457e-05, -3.6411918699741364e-05, -3.5099685192108154e-05, -3.3787451684474945e-05, -3.2475218176841736e-05, -3.1162984669208527e-05, -2.9850751161575317e-05, -2.8538517653942108e-05, -2.72262841463089e-05, -2.591405063867569e-05, -2.460181713104248e-05, -2.328958362340927e-05, -2.1977350115776062e-05, -2.0665116608142853e-05, -1.9352883100509644e-05, -1.8040649592876434e-05, -1.6728416085243225e-05, -1.5416182577610016e-05, -1.4103949069976807e-05, -1.2791715562343597e-05, -1.1479482054710388e-05, -1.0167248547077179e-05, -8.85501503944397e-06, -7.5427815318107605e-06, -6.230548024177551e-06, -4.918314516544342e-06, -3.606081008911133e-06, -2.2938475012779236e-06, -9.816139936447144e-07, 3.3061951398849487e-07, 1.642853021621704e-06, 2.9550865292549133e-06, 4.2673200368881226e-06, 5.579553544521332e-06, 6.891787052154541e-06, 8.20402055978775e-06, 9.51625406742096e-06, 1.0828487575054169e-05, 1.2140721082687378e-05, 1.3452954590320587e-05, 1.4765188097953796e-05, 1.6077421605587006e-05, 1.7389655113220215e-05, 1.8701888620853424e-05, 2.0014122128486633e-05, 2.1326355636119843e-05, 2.2638589143753052e-05, 2.395082265138626e-05, 2.526305615901947e-05, 2.657528966665268e-05, 2.788752317428589e-05, 2.9199756681919098e-05, 3.0511990189552307e-05, 3.1824223697185516e-05, 3.3136457204818726e-05, 3.4448690712451935e-05, 3.5760924220085144e-05, 3.707315772771835e-05, 3.838539123535156e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 10.0, 2.0, 5.0, 7.0, 10.0, 14.0, 26.0, 40.0, 47.0, 83.0, 146.0, 232.0, 420.0, 733.0, 1427.0, 3113.0, 7694.0, 21814.0, 75484.0, 565928.0, 280271.0, 60482.0, 18359.0, 6555.0, 2785.0, 1258.0, 672.0, 372.0, 214.0, 115.0, 84.0, 44.0, 37.0, 31.0, 12.0, 10.0, 11.0, 3.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1552734375, -0.15095043182373047, -0.14662742614746094, -0.1423044204711914, -0.13798141479492188, -0.13365840911865234, -0.1293354034423828, -0.12501239776611328, -0.12068939208984375, -0.11636638641357422, -0.11204338073730469, -0.10772037506103516, -0.10339736938476562, -0.0990743637084961, -0.09475135803222656, -0.09042835235595703, -0.0861053466796875, -0.08178234100341797, -0.07745933532714844, -0.0731363296508789, -0.06881332397460938, -0.06449031829833984, -0.06016731262207031, -0.05584430694580078, -0.05152130126953125, -0.04719829559326172, -0.04287528991699219, -0.038552284240722656, -0.034229278564453125, -0.029906272888183594, -0.025583267211914062, -0.02126026153564453, -0.016937255859375, -0.012614250183105469, -0.008291244506835938, -0.003968238830566406, 0.000354766845703125, 0.004677772521972656, 0.009000778198242188, 0.013323783874511719, 0.01764678955078125, 0.02196979522705078, 0.026292800903320312, 0.030615806579589844, 0.034938812255859375, 0.039261817932128906, 0.04358482360839844, 0.04790782928466797, 0.0522308349609375, 0.05655384063720703, 0.06087684631347656, 0.0651998519897461, 0.06952285766601562, 0.07384586334228516, 0.07816886901855469, 0.08249187469482422, 0.08681488037109375, 0.09113788604736328, 0.09546089172363281, 0.09978389739990234, 0.10410690307617188, 0.1084299087524414, 0.11275291442871094, 0.11707592010498047, 0.12139892578125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 2.0, 5.0, 4.0, 7.0, 10.0, 12.0, 24.0, 32.0, 26.0, 43.0, 41.0, 58.0, 74.0, 93.0, 105.0, 84.0, 89.0, 53.0, 43.0, 47.0, 26.0, 29.0, 27.0, 14.0, 6.0, 10.0, 9.0, 3.0, 6.0, 9.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1378173828125, -0.1328277587890625, -0.127838134765625, -0.1228485107421875, -0.11785888671875, -0.1128692626953125, -0.107879638671875, -0.1028900146484375, -0.097900390625, -0.0929107666015625, -0.087921142578125, -0.0829315185546875, -0.07794189453125, -0.0729522705078125, -0.067962646484375, -0.0629730224609375, -0.0579833984375, -0.0529937744140625, -0.048004150390625, -0.0430145263671875, -0.03802490234375, -0.0330352783203125, -0.028045654296875, -0.0230560302734375, -0.01806640625, -0.0130767822265625, -0.008087158203125, -0.0030975341796875, 0.00189208984375, 0.0068817138671875, 0.011871337890625, 0.0168609619140625, 0.0218505859375, 0.0268402099609375, 0.031829833984375, 0.0368194580078125, 0.04180908203125, 0.0467987060546875, 0.051788330078125, 0.0567779541015625, 0.061767578125, 0.0667572021484375, 0.071746826171875, 0.0767364501953125, 0.08172607421875, 0.0867156982421875, 0.091705322265625, 0.0966949462890625, 0.1016845703125, 0.1066741943359375, 0.111663818359375, 0.1166534423828125, 0.12164306640625, 0.1266326904296875, 0.131622314453125, 0.1366119384765625, 0.1416015625, 0.1465911865234375, 0.151580810546875, 0.1565704345703125, 0.16156005859375, 0.1665496826171875, 0.171539306640625, 0.1765289306640625, 0.1815185546875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 1.0, 7.0, 4.0, 8.0, 14.0, 30.0, 54.0, 98.0, 129.0, 297.0, 140.0, 83.0, 67.0, 21.0, 14.0, 18.0, 7.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.140110015869141, -4.020340442657471, -3.90057110786438, -3.78080153465271, -3.66103196144104, -3.541262626647949, -3.4214930534362793, -3.3017234802246094, -3.1819539070129395, -3.0621843338012695, -2.9424149990081787, -2.822645425796509, -2.702875852584839, -2.583106517791748, -2.463336944580078, -2.343567371368408, -2.2237977981567383, -2.1040282249450684, -1.984258770942688, -1.8644893169403076, -1.7447197437286377, -1.6249502897262573, -1.505180835723877, -1.385411262512207, -1.2656419277191162, -1.1458724737167358, -1.026102900505066, -0.9063334465026855, -0.7865638732910156, -0.6667944192886353, -0.5470249056816101, -0.42725539207458496, -0.30748581886291504, -0.1877163052558899, -0.06794680655002594, 0.05182269215583801, 0.17159220576286316, 0.2913616895675659, 0.41113120317459106, 0.5309007167816162, 0.6506702303886414, 0.7704397439956665, 0.8902092576026917, 1.0099787712097168, 1.1297482252120972, 1.2495176792144775, 1.3692872524261475, 1.4890568256378174, 1.6088262796401978, 1.7285957336425781, 1.848365306854248, 1.9681347608566284, 2.087904214859009, 2.2076737880706787, 2.3274433612823486, 2.4472126960754395, 2.5669822692871094, 2.6867518424987793, 2.80652117729187, 2.92629075050354, 3.04606032371521, 3.165829658508301, 3.2855992317199707, 3.4053688049316406, 3.5251383781433105]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 5.0, 8.0, 1.0, 9.0, 6.0, 12.0, 4.0, 16.0, 11.0, 21.0, 22.0, 17.0, 35.0, 27.0, 27.0, 24.0, 44.0, 38.0, 58.0, 72.0, 103.0, 85.0, 57.0, 36.0, 35.0, 26.0, 29.0, 27.0, 26.0, 17.0, 17.0, 18.0, 16.0, 15.0, 13.0, 6.0, 5.0, 5.0, 3.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.2381529808044434, -3.147207260131836, -3.0562615394592285, -2.965315818786621, -2.8743698596954346, -2.783424139022827, -2.6924784183502197, -2.6015326976776123, -2.510586977005005, -2.4196412563323975, -2.32869553565979, -2.2377495765686035, -2.146803855895996, -2.0558581352233887, -1.9649124145507812, -1.8739666938781738, -1.7830208539962769, -1.6920751333236694, -1.6011292934417725, -1.510183572769165, -1.4192378520965576, -1.3282921314239502, -1.2373462915420532, -1.1464005708694458, -1.0554547309875488, -0.9645089507102966, -0.8735632300376892, -0.782617449760437, -0.6916717290878296, -0.6007259488105774, -0.5097801685333252, -0.4188344478607178, -0.32788872718811035, -0.23694297671318054, -0.14599721133708954, -0.055051445960998535, 0.035894304513931274, 0.12684005498886108, 0.21778583526611328, 0.3087315559387207, 0.3996773362159729, 0.4906230866909027, 0.5815688371658325, 0.6725146174430847, 0.7634603977203369, 0.8544061183929443, 0.9453518986701965, 1.0362975597381592, 1.1272433996200562, 1.2181891202926636, 1.3091349601745605, 1.400080680847168, 1.4910264015197754, 1.5819721221923828, 1.6729179620742798, 1.7638636827468872, 1.8548095226287842, 1.9457552433013916, 2.036700963973999, 2.1276469230651855, 2.218592643737793, 2.3095383644104004, 2.400484085083008, 2.4914298057556152, 2.5823755264282227]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 8.0, 7.0, 15.0, 13.0, 30.0, 49.0, 59.0, 95.0, 169.0, 267.0, 540.0, 1010.0, 2885.0, 12507.0, 147681.0, 3028739.0, 944556.0, 45490.0, 6696.0, 1828.0, 720.0, 355.0, 219.0, 126.0, 73.0, 51.0, 31.0, 25.0, 12.0, 5.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.568359375, -0.5544204711914062, -0.5404815673828125, -0.5265426635742188, -0.512603759765625, -0.49866485595703125, -0.4847259521484375, -0.47078704833984375, -0.45684814453125, -0.44290924072265625, -0.4289703369140625, -0.41503143310546875, -0.401092529296875, -0.38715362548828125, -0.3732147216796875, -0.35927581787109375, -0.3453369140625, -0.33139801025390625, -0.3174591064453125, -0.30352020263671875, -0.289581298828125, -0.27564239501953125, -0.2617034912109375, -0.24776458740234375, -0.23382568359375, -0.21988677978515625, -0.2059478759765625, -0.19200897216796875, -0.178070068359375, -0.16413116455078125, -0.1501922607421875, -0.13625335693359375, -0.122314453125, -0.10837554931640625, -0.0944366455078125, -0.08049774169921875, -0.066558837890625, -0.05261993408203125, -0.0386810302734375, -0.02474212646484375, -0.01080322265625, 0.00313568115234375, 0.0170745849609375, 0.03101348876953125, 0.044952392578125, 0.05889129638671875, 0.0728302001953125, 0.08676910400390625, 0.1007080078125, 0.11464691162109375, 0.1285858154296875, 0.14252471923828125, 0.156463623046875, 0.17040252685546875, 0.1843414306640625, 0.19828033447265625, 0.21221923828125, 0.22615814208984375, 0.2400970458984375, 0.25403594970703125, 0.267974853515625, 0.28191375732421875, 0.2958526611328125, 0.30979156494140625, 0.32373046875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 4.0, 6.0, 10.0, 15.0, 21.0, 24.0, 33.0, 48.0, 36.0, 64.0, 55.0, 71.0, 86.0, 83.0, 64.0, 66.0, 59.0, 53.0, 63.0, 38.0, 22.0, 35.0, 20.0, 9.0, 5.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.4365234375, -0.42540740966796875, -0.4142913818359375, -0.40317535400390625, -0.392059326171875, -0.38094329833984375, -0.3698272705078125, -0.35871124267578125, -0.34759521484375, -0.33647918701171875, -0.3253631591796875, -0.31424713134765625, -0.303131103515625, -0.29201507568359375, -0.2808990478515625, -0.26978302001953125, -0.2586669921875, -0.24755096435546875, -0.2364349365234375, -0.22531890869140625, -0.214202880859375, -0.20308685302734375, -0.1919708251953125, -0.18085479736328125, -0.16973876953125, -0.15862274169921875, -0.1475067138671875, -0.13639068603515625, -0.125274658203125, -0.11415863037109375, -0.1030426025390625, -0.09192657470703125, -0.080810546875, -0.06969451904296875, -0.0585784912109375, -0.04746246337890625, -0.036346435546875, -0.02523040771484375, -0.0141143798828125, -0.00299835205078125, 0.00811767578125, 0.01923370361328125, 0.0303497314453125, 0.04146575927734375, 0.052581787109375, 0.06369781494140625, 0.0748138427734375, 0.08592987060546875, 0.0970458984375, 0.10816192626953125, 0.1192779541015625, 0.13039398193359375, 0.141510009765625, 0.15262603759765625, 0.1637420654296875, 0.17485809326171875, 0.18597412109375, 0.19709014892578125, 0.2082061767578125, 0.21932220458984375, 0.230438232421875, 0.24155426025390625, 0.2526702880859375, 0.26378631591796875, 0.27490234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 6.0, 9.0, 16.0, 33.0, 93.0, 286.0, 942.0, 5851.0, 1017280.0, 3159892.0, 8151.0, 1110.0, 371.0, 134.0, 50.0, 22.0, 9.0, 10.0, 7.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.3076171875, -1.26922607421875, -1.2308349609375, -1.19244384765625, -1.154052734375, -1.11566162109375, -1.0772705078125, -1.03887939453125, -1.00048828125, -0.96209716796875, -0.9237060546875, -0.88531494140625, -0.846923828125, -0.80853271484375, -0.7701416015625, -0.73175048828125, -0.693359375, -0.65496826171875, -0.6165771484375, -0.57818603515625, -0.539794921875, -0.50140380859375, -0.4630126953125, -0.42462158203125, -0.38623046875, -0.34783935546875, -0.3094482421875, -0.27105712890625, -0.232666015625, -0.19427490234375, -0.1558837890625, -0.11749267578125, -0.0791015625, -0.04071044921875, -0.0023193359375, 0.03607177734375, 0.074462890625, 0.11285400390625, 0.1512451171875, 0.18963623046875, 0.22802734375, 0.26641845703125, 0.3048095703125, 0.34320068359375, 0.381591796875, 0.41998291015625, 0.4583740234375, 0.49676513671875, 0.53515625, 0.57354736328125, 0.6119384765625, 0.65032958984375, 0.688720703125, 0.72711181640625, 0.7655029296875, 0.80389404296875, 0.84228515625, 0.88067626953125, 0.9190673828125, 0.95745849609375, 0.995849609375, 1.03424072265625, 1.0726318359375, 1.11102294921875, 1.1494140625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 10.0, 13.0, 23.0, 23.0, 55.0, 137.0, 301.0, 769.0, 1261.0, 888.0, 326.0, 131.0, 58.0, 31.0, 26.0, 8.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.65087890625, -0.6280288696289062, -0.6051788330078125, -0.5823287963867188, -0.559478759765625, -0.5366287231445312, -0.5137786865234375, -0.49092864990234375, -0.46807861328125, -0.44522857666015625, -0.4223785400390625, -0.39952850341796875, -0.376678466796875, -0.35382843017578125, -0.3309783935546875, -0.30812835693359375, -0.2852783203125, -0.26242828369140625, -0.2395782470703125, -0.21672821044921875, -0.193878173828125, -0.17102813720703125, -0.1481781005859375, -0.12532806396484375, -0.10247802734375, -0.07962799072265625, -0.0567779541015625, -0.03392791748046875, -0.011077880859375, 0.01177215576171875, 0.0346221923828125, 0.05747222900390625, 0.080322265625, 0.10317230224609375, 0.1260223388671875, 0.14887237548828125, 0.171722412109375, 0.19457244873046875, 0.2174224853515625, 0.24027252197265625, 0.26312255859375, 0.28597259521484375, 0.3088226318359375, 0.33167266845703125, 0.354522705078125, 0.37737274169921875, 0.4002227783203125, 0.42307281494140625, 0.4459228515625, 0.46877288818359375, 0.4916229248046875, 0.5144729614257812, 0.537322998046875, 0.5601730346679688, 0.5830230712890625, 0.6058731079101562, 0.62872314453125, 0.6515731811523438, 0.6744232177734375, 0.6972732543945312, 0.720123291015625, 0.7429733276367188, 0.7658233642578125, 0.7886734008789062, 0.8115234375]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 4.0, 13.0, 24.0, 67.0, 129.0, 258.0, 250.0, 139.0, 71.0, 32.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.293276786804199, -4.113205909729004, -3.9331345558166504, -3.753063678741455, -3.5729925632476807, -3.3929214477539062, -3.212850332260132, -3.0327792167663574, -2.852708339691162, -2.6726372241973877, -2.4925661087036133, -2.312495231628418, -2.1324241161346436, -1.9523530006408691, -1.7722818851470947, -1.5922108888626099, -1.412139654159546, -1.2320685386657715, -1.0519975423812866, -0.8719264268875122, -0.6918553709983826, -0.5117843151092529, -0.3317131996154785, -0.15164220333099365, 0.02842891216278076, 0.2084999829530716, 0.3885710537433624, 0.5686421394348145, 0.7487131953239441, 0.9287842512130737, 1.1088553667068481, 1.288926362991333, 1.4689974784851074, 1.6490685939788818, 1.8291395902633667, 2.0092105865478516, 2.189281702041626, 2.3693528175354004, 2.549423933029175, 2.729495048522949, 2.9095659255981445, 3.089637041091919, 3.2697081565856934, 3.4497790336608887, 3.629850149154663, 3.8099212646484375, 3.989992380142212, 4.170063495635986, 4.35013484954834, 4.530205726623535, 4.710277080535889, 4.890347957611084, 5.0704193115234375, 5.250490188598633, 5.430561065673828, 5.610632419586182, 5.790703296661377, 5.970774173736572, 6.150845527648926, 6.330916404724121, 6.510987758636475, 6.69105863571167, 6.871129989624023, 7.051200866699219, 7.231271743774414]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 2.0, 3.0, 10.0, 10.0, 8.0, 10.0, 17.0, 8.0, 23.0, 19.0, 20.0, 28.0, 31.0, 30.0, 31.0, 31.0, 33.0, 33.0, 29.0, 38.0, 42.0, 31.0, 37.0, 37.0, 46.0, 43.0, 40.0, 33.0, 28.0, 32.0, 24.0, 32.0, 21.0, 21.0, 18.0, 20.0, 10.0, 19.0, 13.0, 5.0, 13.0, 6.0, 5.0, 3.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.8792067766189575, -1.8227035999298096, -1.7662004232406616, -1.7096972465515137, -1.6531941890716553, -1.5966910123825073, -1.5401878356933594, -1.4836846590042114, -1.4271814823150635, -1.3706783056259155, -1.3141751289367676, -1.2576720714569092, -1.2011688947677612, -1.1446657180786133, -1.0881625413894653, -1.0316593647003174, -0.975156307220459, -0.918653130531311, -0.8621500134468079, -0.8056468367576599, -0.7491437196731567, -0.6926405429840088, -0.6361373662948608, -0.5796341896057129, -0.5231310725212097, -0.46662792563438416, -0.4101247787475586, -0.35362160205841064, -0.2971184551715851, -0.24061530828475952, -0.18411213159561157, -0.127608984708786, -0.07110595703125, -0.014602802693843842, 0.04190035164356232, 0.09840351343154907, 0.15490666031837463, 0.2114098072052002, 0.26791298389434814, 0.3244161307811737, 0.38091927766799927, 0.43742242455482483, 0.4939255714416504, 0.5504287481307983, 0.6069319248199463, 0.6634350419044495, 0.7199382185935974, 0.7764413356781006, 0.8329445123672485, 0.8894476890563965, 0.9459508061408997, 1.0024540424346924, 1.0589570999145508, 1.1154602766036987, 1.1719634532928467, 1.2284666299819946, 1.2849698066711426, 1.3414729833602905, 1.3979761600494385, 1.4544792175292969, 1.5109823942184448, 1.5674855709075928, 1.6239887475967407, 1.6804919242858887, 1.736994981765747]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 4.0, 11.0, 24.0, 23.0, 27.0, 53.0, 88.0, 142.0, 262.0, 546.0, 1100.0, 2653.0, 6970.0, 21470.0, 81967.0, 391703.0, 417786.0, 88365.0, 22941.0, 7314.0, 2746.0, 1172.0, 542.0, 276.0, 140.0, 83.0, 51.0, 25.0, 22.0, 15.0, 11.0, 9.0, 8.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44921875, -0.43318939208984375, -0.4171600341796875, -0.40113067626953125, -0.385101318359375, -0.36907196044921875, -0.3530426025390625, -0.33701324462890625, -0.32098388671875, -0.30495452880859375, -0.2889251708984375, -0.27289581298828125, -0.256866455078125, -0.24083709716796875, -0.2248077392578125, -0.20877838134765625, -0.1927490234375, -0.17671966552734375, -0.1606903076171875, -0.14466094970703125, -0.128631591796875, -0.11260223388671875, -0.0965728759765625, -0.08054351806640625, -0.06451416015625, -0.04848480224609375, -0.0324554443359375, -0.01642608642578125, -0.000396728515625, 0.01563262939453125, 0.0316619873046875, 0.04769134521484375, 0.063720703125, 0.07975006103515625, 0.0957794189453125, 0.11180877685546875, 0.127838134765625, 0.14386749267578125, 0.1598968505859375, 0.17592620849609375, 0.19195556640625, 0.20798492431640625, 0.2240142822265625, 0.24004364013671875, 0.256072998046875, 0.27210235595703125, 0.2881317138671875, 0.30416107177734375, 0.3201904296875, 0.33621978759765625, 0.3522491455078125, 0.36827850341796875, 0.384307861328125, 0.40033721923828125, 0.4163665771484375, 0.43239593505859375, 0.44842529296875, 0.46445465087890625, 0.4804840087890625, 0.49651336669921875, 0.512542724609375, 0.5285720825195312, 0.5446014404296875, 0.5606307983398438, 0.57666015625]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 7.0, 7.0, 11.0, 12.0, 18.0, 24.0, 30.0, 37.0, 39.0, 55.0, 67.0, 70.0, 71.0, 67.0, 79.0, 78.0, 76.0, 48.0, 51.0, 42.0, 31.0, 27.0, 18.0, 13.0, 10.0, 10.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.439208984375, -0.4280967712402344, -0.41698455810546875, -0.4058723449707031, -0.3947601318359375, -0.3836479187011719, -0.37253570556640625, -0.3614234924316406, -0.350311279296875, -0.3391990661621094, -0.32808685302734375, -0.3169746398925781, -0.3058624267578125, -0.2947502136230469, -0.28363800048828125, -0.2725257873535156, -0.26141357421875, -0.2503013610839844, -0.23918914794921875, -0.22807693481445312, -0.2169647216796875, -0.20585250854492188, -0.19474029541015625, -0.18362808227539062, -0.172515869140625, -0.16140365600585938, -0.15029144287109375, -0.13917922973632812, -0.1280670166015625, -0.11695480346679688, -0.10584259033203125, -0.09473037719726562, -0.0836181640625, -0.07250595092773438, -0.06139373779296875, -0.050281524658203125, -0.0391693115234375, -0.028057098388671875, -0.01694488525390625, -0.005832672119140625, 0.005279541015625, 0.016391754150390625, 0.02750396728515625, 0.038616180419921875, 0.0497283935546875, 0.060840606689453125, 0.07195281982421875, 0.08306503295898438, 0.09417724609375, 0.10528945922851562, 0.11640167236328125, 0.12751388549804688, 0.1386260986328125, 0.14973831176757812, 0.16085052490234375, 0.17196273803710938, 0.183074951171875, 0.19418716430664062, 0.20529937744140625, 0.21641159057617188, 0.2275238037109375, 0.23863601684570312, 0.24974822998046875, 0.2608604431152344, 0.27197265625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 8.0, 8.0, 15.0, 19.0, 31.0, 40.0, 53.0, 89.0, 135.0, 200.0, 292.0, 437.0, 735.0, 1395.0, 3421.0, 11841.0, 61443.0, 693580.0, 229871.0, 32226.0, 7160.0, 2496.0, 1144.0, 599.0, 417.0, 284.0, 191.0, 125.0, 94.0, 68.0, 32.0, 32.0, 18.0, 11.0, 10.0, 9.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.50732421875, -0.4890899658203125, -0.470855712890625, -0.4526214599609375, -0.43438720703125, -0.4161529541015625, -0.397918701171875, -0.3796844482421875, -0.3614501953125, -0.3432159423828125, -0.324981689453125, -0.3067474365234375, -0.28851318359375, -0.2702789306640625, -0.252044677734375, -0.2338104248046875, -0.215576171875, -0.1973419189453125, -0.179107666015625, -0.1608734130859375, -0.14263916015625, -0.1244049072265625, -0.106170654296875, -0.0879364013671875, -0.0697021484375, -0.0514678955078125, -0.033233642578125, -0.0149993896484375, 0.00323486328125, 0.0214691162109375, 0.039703369140625, 0.0579376220703125, 0.076171875, 0.0944061279296875, 0.112640380859375, 0.1308746337890625, 0.14910888671875, 0.1673431396484375, 0.185577392578125, 0.2038116455078125, 0.2220458984375, 0.2402801513671875, 0.258514404296875, 0.2767486572265625, 0.29498291015625, 0.3132171630859375, 0.331451416015625, 0.3496856689453125, 0.367919921875, 0.3861541748046875, 0.404388427734375, 0.4226226806640625, 0.44085693359375, 0.4590911865234375, 0.477325439453125, 0.4955596923828125, 0.5137939453125, 0.5320281982421875, 0.550262451171875, 0.5684967041015625, 0.58673095703125, 0.6049652099609375, 0.623199462890625, 0.6414337158203125, 0.65966796875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 8.0, 10.0, 8.0, 9.0, 11.0, 14.0, 16.0, 18.0, 26.0, 29.0, 34.0, 44.0, 42.0, 41.0, 40.0, 53.0, 51.0, 65.0, 58.0, 39.0, 47.0, 46.0, 43.0, 26.0, 34.0, 38.0, 24.0, 17.0, 22.0, 13.0, 18.0, 9.0, 15.0, 7.0, 10.0, 3.0, 4.0, 2.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.8505859375, -0.8237838745117188, -0.7969818115234375, -0.7701797485351562, -0.743377685546875, -0.7165756225585938, -0.6897735595703125, -0.6629714965820312, -0.63616943359375, -0.6093673706054688, -0.5825653076171875, -0.5557632446289062, -0.528961181640625, -0.5021591186523438, -0.4753570556640625, -0.44855499267578125, -0.4217529296875, -0.39495086669921875, -0.3681488037109375, -0.34134674072265625, -0.314544677734375, -0.28774261474609375, -0.2609405517578125, -0.23413848876953125, -0.20733642578125, -0.18053436279296875, -0.1537322998046875, -0.12693023681640625, -0.100128173828125, -0.07332611083984375, -0.0465240478515625, -0.01972198486328125, 0.007080078125, 0.03388214111328125, 0.0606842041015625, 0.08748626708984375, 0.114288330078125, 0.14109039306640625, 0.1678924560546875, 0.19469451904296875, 0.22149658203125, 0.24829864501953125, 0.2751007080078125, 0.30190277099609375, 0.328704833984375, 0.35550689697265625, 0.3823089599609375, 0.40911102294921875, 0.4359130859375, 0.46271514892578125, 0.4895172119140625, 0.5163192749023438, 0.543121337890625, 0.5699234008789062, 0.5967254638671875, 0.6235275268554688, 0.65032958984375, 0.6771316528320312, 0.7039337158203125, 0.7307357788085938, 0.757537841796875, 0.7843399047851562, 0.8111419677734375, 0.8379440307617188, 0.86474609375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 5.0, 4.0, 3.0, 4.0, 5.0, 5.0, 7.0, 9.0, 9.0, 15.0, 22.0, 20.0, 48.0, 59.0, 88.0, 169.0, 350.0, 735.0, 1974.0, 8205.0, 55199.0, 844342.0, 118658.0, 13786.0, 3010.0, 948.0, 352.0, 196.0, 102.0, 63.0, 30.0, 33.0, 22.0, 16.0, 13.0, 10.0, 14.0, 6.0, 6.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2108154296875, -0.20415496826171875, -0.1974945068359375, -0.19083404541015625, -0.184173583984375, -0.17751312255859375, -0.1708526611328125, -0.16419219970703125, -0.15753173828125, -0.15087127685546875, -0.1442108154296875, -0.13755035400390625, -0.130889892578125, -0.12422943115234375, -0.1175689697265625, -0.11090850830078125, -0.104248046875, -0.09758758544921875, -0.0909271240234375, -0.08426666259765625, -0.077606201171875, -0.07094573974609375, -0.0642852783203125, -0.05762481689453125, -0.05096435546875, -0.04430389404296875, -0.0376434326171875, -0.03098297119140625, -0.024322509765625, -0.01766204833984375, -0.0110015869140625, -0.00434112548828125, 0.0023193359375, 0.00897979736328125, 0.0156402587890625, 0.02230072021484375, 0.028961181640625, 0.03562164306640625, 0.0422821044921875, 0.04894256591796875, 0.05560302734375, 0.06226348876953125, 0.0689239501953125, 0.07558441162109375, 0.082244873046875, 0.08890533447265625, 0.0955657958984375, 0.10222625732421875, 0.10888671875, 0.11554718017578125, 0.1222076416015625, 0.12886810302734375, 0.135528564453125, 0.14218902587890625, 0.1488494873046875, 0.15550994873046875, 0.16217041015625, 0.16883087158203125, 0.1754913330078125, 0.18215179443359375, 0.188812255859375, 0.19547271728515625, 0.2021331787109375, 0.20879364013671875, 0.2154541015625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 7.0, 2.0, 4.0, 7.0, 6.0, 9.0, 13.0, 16.0, 22.0, 17.0, 33.0, 33.0, 38.0, 51.0, 52.0, 81.0, 86.0, 93.0, 80.0, 75.0, 56.0, 36.0, 29.0, 14.0, 20.0, 18.0, 26.0, 10.0, 12.0, 11.0, 7.0, 5.0, 4.0, 4.0, 6.0, 2.0, 5.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.236532211303711e-05, -3.1297095119953156e-05, -3.02288681268692e-05, -2.9160641133785248e-05, -2.8092414140701294e-05, -2.702418714761734e-05, -2.5955960154533386e-05, -2.4887733161449432e-05, -2.381950616836548e-05, -2.2751279175281525e-05, -2.168305218219757e-05, -2.0614825189113617e-05, -1.9546598196029663e-05, -1.847837120294571e-05, -1.7410144209861755e-05, -1.63419172167778e-05, -1.5273690223693848e-05, -1.4205463230609894e-05, -1.313723623752594e-05, -1.2069009244441986e-05, -1.1000782251358032e-05, -9.932555258274078e-06, -8.864328265190125e-06, -7.79610127210617e-06, -6.727874279022217e-06, -5.659647285938263e-06, -4.591420292854309e-06, -3.5231932997703552e-06, -2.4549663066864014e-06, -1.3867393136024475e-06, -3.1851232051849365e-07, 7.497146725654602e-07, 1.817941665649414e-06, 2.886168658733368e-06, 3.954395651817322e-06, 5.022622644901276e-06, 6.0908496379852295e-06, 7.159076631069183e-06, 8.227303624153137e-06, 9.295530617237091e-06, 1.0363757610321045e-05, 1.1431984603404999e-05, 1.2500211596488953e-05, 1.3568438589572906e-05, 1.463666558265686e-05, 1.5704892575740814e-05, 1.6773119568824768e-05, 1.7841346561908722e-05, 1.8909573554992676e-05, 1.997780054807663e-05, 2.1046027541160583e-05, 2.2114254534244537e-05, 2.318248152732849e-05, 2.4250708520412445e-05, 2.53189355134964e-05, 2.6387162506580353e-05, 2.7455389499664307e-05, 2.852361649274826e-05, 2.9591843485832214e-05, 3.066007047891617e-05, 3.172829747200012e-05, 3.2796524465084076e-05, 3.386475145816803e-05, 3.4932978451251984e-05, 3.600120544433594e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 9.0, 12.0, 12.0, 27.0, 36.0, 56.0, 62.0, 128.0, 174.0, 300.0, 520.0, 934.0, 2038.0, 4775.0, 14544.0, 58097.0, 641149.0, 263905.0, 42356.0, 11412.0, 4142.0, 1692.0, 878.0, 472.0, 249.0, 169.0, 122.0, 87.0, 60.0, 33.0, 25.0, 21.0, 19.0, 9.0, 5.0, 8.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1619873046875, -0.15759754180908203, -0.15320777893066406, -0.1488180160522461, -0.14442825317382812, -0.14003849029541016, -0.1356487274169922, -0.13125896453857422, -0.12686920166015625, -0.12247943878173828, -0.11808967590332031, -0.11369991302490234, -0.10931015014648438, -0.1049203872680664, -0.10053062438964844, -0.09614086151123047, -0.0917510986328125, -0.08736133575439453, -0.08297157287597656, -0.0785818099975586, -0.07419204711914062, -0.06980228424072266, -0.06541252136230469, -0.06102275848388672, -0.05663299560546875, -0.05224323272705078, -0.04785346984863281, -0.043463706970214844, -0.039073944091796875, -0.034684181213378906, -0.030294418334960938, -0.02590465545654297, -0.021514892578125, -0.01712512969970703, -0.012735366821289062, -0.008345603942871094, -0.003955841064453125, 0.00043392181396484375, 0.0048236846923828125, 0.009213447570800781, 0.01360321044921875, 0.01799297332763672, 0.022382736206054688, 0.026772499084472656, 0.031162261962890625, 0.035552024841308594, 0.03994178771972656, 0.04433155059814453, 0.0487213134765625, 0.05311107635498047, 0.05750083923339844, 0.061890602111816406, 0.06628036499023438, 0.07067012786865234, 0.07505989074707031, 0.07944965362548828, 0.08383941650390625, 0.08822917938232422, 0.09261894226074219, 0.09700870513916016, 0.10139846801757812, 0.1057882308959961, 0.11017799377441406, 0.11456775665283203, 0.11895751953125]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 4.0, 3.0, 4.0, 5.0, 8.0, 7.0, 8.0, 12.0, 12.0, 22.0, 27.0, 31.0, 45.0, 56.0, 81.0, 83.0, 118.0, 97.0, 88.0, 74.0, 43.0, 37.0, 26.0, 18.0, 24.0, 16.0, 9.0, 9.0, 10.0, 2.0, 8.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.1727294921875, -0.1677875518798828, -0.16284561157226562, -0.15790367126464844, -0.15296173095703125, -0.14801979064941406, -0.14307785034179688, -0.1381359100341797, -0.1331939697265625, -0.1282520294189453, -0.12331008911132812, -0.11836814880371094, -0.11342620849609375, -0.10848426818847656, -0.10354232788085938, -0.09860038757324219, -0.093658447265625, -0.08871650695800781, -0.08377456665039062, -0.07883262634277344, -0.07389068603515625, -0.06894874572753906, -0.06400680541992188, -0.05906486511230469, -0.0541229248046875, -0.04918098449707031, -0.044239044189453125, -0.03929710388183594, -0.03435516357421875, -0.029413223266601562, -0.024471282958984375, -0.019529342651367188, -0.01458740234375, -0.009645462036132812, -0.004703521728515625, 0.0002384185791015625, 0.00518035888671875, 0.010122299194335938, 0.015064239501953125, 0.020006179809570312, 0.0249481201171875, 0.029890060424804688, 0.034832000732421875, 0.03977394104003906, 0.04471588134765625, 0.04965782165527344, 0.054599761962890625, 0.05954170227050781, 0.064483642578125, 0.06942558288574219, 0.07436752319335938, 0.07930946350097656, 0.08425140380859375, 0.08919334411621094, 0.09413528442382812, 0.09907722473144531, 0.1040191650390625, 0.10896110534667969, 0.11390304565429688, 0.11884498596191406, 0.12378692626953125, 0.12872886657714844, 0.13367080688476562, 0.1386127471923828, 0.1435546875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 12.0, 22.0, 40.0, 86.0, 192.0, 373.0, 143.0, 58.0, 26.0, 27.0, 6.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.559589385986328, -6.392940044403076, -6.226290225982666, -6.059640884399414, -5.892991542816162, -5.72634220123291, -5.5596923828125, -5.393043041229248, -5.226393699645996, -5.059744358062744, -4.893094539642334, -4.726445198059082, -4.55979585647583, -4.393146514892578, -4.226496696472168, -4.059847354888916, -3.893197536468506, -3.726547956466675, -3.559898614883423, -3.393249034881592, -3.22659969329834, -3.059950113296509, -2.8933005332946777, -2.726651191711426, -2.5600016117095947, -2.3933520317077637, -2.2267026901245117, -2.0600531101226807, -1.8934036493301392, -1.7267541885375977, -1.5601046085357666, -1.393455147743225, -1.2268052101135254, -1.0601557493209839, -0.8935062289237976, -0.7268567085266113, -0.5602072477340698, -0.3935577869415283, -0.22690826654434204, -0.06025874614715576, 0.10639071464538574, 0.27304020524024963, 0.4396896958351135, 0.6063392162322998, 0.7729886770248413, 0.9396381378173828, 1.1062877178192139, 1.2729371786117554, 1.4395866394042969, 1.6062361001968384, 1.7728855609893799, 1.939535140991211, 2.106184482574463, 2.272834062576294, 2.439483642578125, 2.606132984161377, 2.772782564163208, 2.939432144165039, 3.106081485748291, 3.272731065750122, 3.439380645751953, 3.606029987335205, 3.772679567337036, 3.939329147338867, 4.105978488922119]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 5.0, 3.0, 3.0, 11.0, 6.0, 14.0, 10.0, 9.0, 21.0, 26.0, 22.0, 29.0, 33.0, 30.0, 50.0, 51.0, 95.0, 129.0, 111.0, 79.0, 50.0, 35.0, 28.0, 26.0, 24.0, 19.0, 21.0, 8.0, 17.0, 10.0, 7.0, 9.0, 4.0, 0.0, 8.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.768167495727539, -3.636963367462158, -3.5057592391967773, -3.3745553493499756, -3.2433512210845947, -3.112147092819214, -2.980943202972412, -2.8497390747070312, -2.7185349464416504, -2.5873308181762695, -2.4561266899108887, -2.324922800064087, -2.193718671798706, -2.062514543533325, -1.9313105344772339, -1.8001065254211426, -1.6689023971557617, -1.5376982688903809, -1.4064942598342896, -1.2752902507781982, -1.1440861225128174, -1.0128819942474365, -0.8816779851913452, -0.7504739165306091, -0.619269847869873, -0.48806577920913696, -0.3568617105484009, -0.2256576418876648, -0.09445357322692871, 0.03675049543380737, 0.16795456409454346, 0.29915863275527954, 0.43036317825317383, 0.5615672469139099, 0.692771315574646, 0.8239753842353821, 0.9551794528961182, 1.086383581161499, 1.2175875902175903, 1.3487915992736816, 1.4799957275390625, 1.6111998558044434, 1.7424038648605347, 1.873607873916626, 2.004812002182007, 2.1360161304473877, 2.2672200202941895, 2.3984241485595703, 2.529628276824951, 2.660832405090332, 2.792036533355713, 2.9232404232025146, 3.0544445514678955, 3.1856486797332764, 3.316852569580078, 3.448056697845459, 3.57926082611084, 3.7104649543762207, 3.8416690826416016, 3.9728729724884033, 4.104077339172363, 4.235280990600586, 4.366485118865967, 4.497689247131348, 4.6288933753967285]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 5.0, 9.0, 7.0, 8.0, 17.0, 12.0, 35.0, 48.0, 60.0, 115.0, 211.0, 381.0, 748.0, 1485.0, 3489.0, 10819.0, 48024.0, 384612.0, 2269542.0, 1275836.0, 160071.0, 26508.0, 7384.0, 2703.0, 1080.0, 499.0, 238.0, 139.0, 88.0, 47.0, 14.0, 19.0, 6.0, 8.0, 4.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45849609375, -0.44532012939453125, -0.4321441650390625, -0.41896820068359375, -0.405792236328125, -0.39261627197265625, -0.3794403076171875, -0.36626434326171875, -0.35308837890625, -0.33991241455078125, -0.3267364501953125, -0.31356048583984375, -0.300384521484375, -0.28720855712890625, -0.2740325927734375, -0.26085662841796875, -0.2476806640625, -0.23450469970703125, -0.2213287353515625, -0.20815277099609375, -0.194976806640625, -0.18180084228515625, -0.1686248779296875, -0.15544891357421875, -0.14227294921875, -0.12909698486328125, -0.1159210205078125, -0.10274505615234375, -0.089569091796875, -0.07639312744140625, -0.0632171630859375, -0.05004119873046875, -0.036865234375, -0.02368927001953125, -0.0105133056640625, 0.00266265869140625, 0.015838623046875, 0.02901458740234375, 0.0421905517578125, 0.05536651611328125, 0.06854248046875, 0.08171844482421875, 0.0948944091796875, 0.10807037353515625, 0.121246337890625, 0.13442230224609375, 0.1475982666015625, 0.16077423095703125, 0.1739501953125, 0.18712615966796875, 0.2003021240234375, 0.21347808837890625, 0.226654052734375, 0.23983001708984375, 0.2530059814453125, 0.26618194580078125, 0.27935791015625, 0.29253387451171875, 0.3057098388671875, 0.31888580322265625, 0.332061767578125, 0.34523773193359375, 0.3584136962890625, 0.37158966064453125, 0.384765625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 6.0, 7.0, 9.0, 11.0, 20.0, 14.0, 32.0, 39.0, 48.0, 47.0, 58.0, 84.0, 76.0, 89.0, 67.0, 80.0, 58.0, 53.0, 55.0, 41.0, 24.0, 25.0, 23.0, 10.0, 9.0, 6.0, 7.0, 4.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.43994140625, -0.4288063049316406, -0.41767120361328125, -0.4065361022949219, -0.3954010009765625, -0.3842658996582031, -0.37313079833984375, -0.3619956970214844, -0.350860595703125, -0.3397254943847656, -0.32859039306640625, -0.3174552917480469, -0.3063201904296875, -0.2951850891113281, -0.28404998779296875, -0.2729148864746094, -0.26177978515625, -0.2506446838378906, -0.23950958251953125, -0.22837448120117188, -0.2172393798828125, -0.20610427856445312, -0.19496917724609375, -0.18383407592773438, -0.172698974609375, -0.16156387329101562, -0.15042877197265625, -0.13929367065429688, -0.1281585693359375, -0.11702346801757812, -0.10588836669921875, -0.09475326538085938, -0.0836181640625, -0.07248306274414062, -0.06134796142578125, -0.050212860107421875, -0.0390777587890625, -0.027942657470703125, -0.01680755615234375, -0.005672454833984375, 0.005462646484375, 0.016597747802734375, 0.02773284912109375, 0.038867950439453125, 0.0500030517578125, 0.061138153076171875, 0.07227325439453125, 0.08340835571289062, 0.09454345703125, 0.10567855834960938, 0.11681365966796875, 0.12794876098632812, 0.1390838623046875, 0.15021896362304688, 0.16135406494140625, 0.17248916625976562, 0.183624267578125, 0.19475936889648438, 0.20589447021484375, 0.21702957153320312, 0.2281646728515625, 0.23929977416992188, 0.25043487548828125, 0.2615699768066406, 0.272705078125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 4.0, 7.0, 11.0, 14.0, 15.0, 35.0, 36.0, 60.0, 110.0, 162.0, 280.0, 662.0, 1647.0, 6833.0, 292322.0, 3868374.0, 19027.0, 2846.0, 871.0, 435.0, 204.0, 119.0, 66.0, 48.0, 29.0, 22.0, 10.0, 11.0, 10.0, 4.0, 3.0, 2.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.6708984375, -1.623443603515625, -1.57598876953125, -1.528533935546875, -1.4810791015625, -1.433624267578125, -1.38616943359375, -1.338714599609375, -1.291259765625, -1.243804931640625, -1.19635009765625, -1.148895263671875, -1.1014404296875, -1.053985595703125, -1.00653076171875, -0.959075927734375, -0.91162109375, -0.864166259765625, -0.81671142578125, -0.769256591796875, -0.7218017578125, -0.674346923828125, -0.62689208984375, -0.579437255859375, -0.531982421875, -0.484527587890625, -0.43707275390625, -0.389617919921875, -0.3421630859375, -0.294708251953125, -0.24725341796875, -0.199798583984375, -0.15234375, -0.104888916015625, -0.05743408203125, -0.009979248046875, 0.0374755859375, 0.084930419921875, 0.13238525390625, 0.179840087890625, 0.227294921875, 0.274749755859375, 0.32220458984375, 0.369659423828125, 0.4171142578125, 0.464569091796875, 0.51202392578125, 0.559478759765625, 0.60693359375, 0.654388427734375, 0.70184326171875, 0.749298095703125, 0.7967529296875, 0.844207763671875, 0.89166259765625, 0.939117431640625, 0.986572265625, 1.034027099609375, 1.08148193359375, 1.128936767578125, 1.1763916015625, 1.223846435546875, 1.27130126953125, 1.318756103515625, 1.3662109375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 8.0, 8.0, 12.0, 18.0, 23.0, 43.0, 62.0, 103.0, 172.0, 266.0, 441.0, 724.0, 756.0, 530.0, 367.0, 171.0, 127.0, 71.0, 55.0, 41.0, 22.0, 13.0, 14.0, 7.0, 4.0, 3.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.66943359375, -0.6415786743164062, -0.6137237548828125, -0.5858688354492188, -0.558013916015625, -0.5301589965820312, -0.5023040771484375, -0.47444915771484375, -0.44659423828125, -0.41873931884765625, -0.3908843994140625, -0.36302947998046875, -0.335174560546875, -0.30731964111328125, -0.2794647216796875, -0.25160980224609375, -0.2237548828125, -0.19589996337890625, -0.1680450439453125, -0.14019012451171875, -0.112335205078125, -0.08448028564453125, -0.0566253662109375, -0.02877044677734375, -0.00091552734375, 0.02693939208984375, 0.0547943115234375, 0.08264923095703125, 0.110504150390625, 0.13835906982421875, 0.1662139892578125, 0.19406890869140625, 0.221923828125, 0.24977874755859375, 0.2776336669921875, 0.30548858642578125, 0.333343505859375, 0.36119842529296875, 0.3890533447265625, 0.41690826416015625, 0.44476318359375, 0.47261810302734375, 0.5004730224609375, 0.5283279418945312, 0.556182861328125, 0.5840377807617188, 0.6118927001953125, 0.6397476196289062, 0.6676025390625, 0.6954574584960938, 0.7233123779296875, 0.7511672973632812, 0.779022216796875, 0.8068771362304688, 0.8347320556640625, 0.8625869750976562, 0.89044189453125, 0.9182968139648438, 0.9461517333984375, 0.9740066528320312, 1.001861572265625, 1.0297164916992188, 1.0575714111328125, 1.0854263305664062, 1.11328125]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 4.0, 3.0, 7.0, 15.0, 11.0, 20.0, 36.0, 65.0, 157.0, 207.0, 205.0, 107.0, 70.0, 43.0, 17.0, 8.0, 8.0, 8.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.789063930511475, -7.518535614013672, -7.248007297515869, -6.977478981018066, -6.706951141357422, -6.436422824859619, -6.165894508361816, -5.895366191864014, -5.624837875366211, -5.354309558868408, -5.0837812423706055, -4.813253402709961, -4.542725086212158, -4.2721967697143555, -4.001668453216553, -3.73114013671875, -3.4606122970581055, -3.1900839805603027, -2.919555902481079, -2.6490275859832764, -2.3784995079040527, -2.10797119140625, -1.8374428749084473, -1.566914677619934, -1.296386480331421, -1.0258582830429077, -0.7553300261497498, -0.4848017692565918, -0.2142735719680786, 0.05625462532043457, 0.3267829418182373, 0.5973111391067505, 0.8678388595581055, 1.1383670568466187, 1.4088952541351318, 1.6794235706329346, 1.9499517679214478, 2.220479965209961, 2.4910082817077637, 2.7615365982055664, 3.03206467628479, 3.3025929927825928, 3.5731210708618164, 3.843649387359619, 4.114177703857422, 4.384705543518066, 4.655234336853027, 4.925762176513672, 5.196290493011475, 5.466818809509277, 5.73734712600708, 6.007875442504883, 6.278403282165527, 6.54893159866333, 6.819459915161133, 7.0899882316589355, 7.360516548156738, 7.631044864654541, 7.901573181152344, 8.172101020812988, 8.44262981414795, 8.713157653808594, 8.983686447143555, 9.2542142868042, 9.524742126464844]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 1.0, 6.0, 2.0, 7.0, 9.0, 11.0, 13.0, 24.0, 15.0, 18.0, 36.0, 27.0, 34.0, 36.0, 40.0, 54.0, 52.0, 68.0, 68.0, 75.0, 61.0, 62.0, 54.0, 36.0, 34.0, 32.0, 24.0, 20.0, 13.0, 14.0, 12.0, 4.0, 13.0, 11.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.177767276763916, -5.024965286254883, -4.87216329574585, -4.719361305236816, -4.566559314727783, -4.41375732421875, -4.260955333709717, -4.108153343200684, -3.9553511142730713, -3.802549123764038, -3.649747133255005, -3.4969451427459717, -3.3441429138183594, -3.191340923309326, -3.038538932800293, -2.8857369422912598, -2.7329349517822266, -2.5801329612731934, -2.42733097076416, -2.274528980255127, -2.1217269897460938, -1.968924880027771, -1.8161227703094482, -1.663320779800415, -1.5105187892913818, -1.3577167987823486, -1.2049148082733154, -1.0521126985549927, -0.8993107080459595, -0.7465087175369263, -0.5937066674232483, -0.4409046173095703, -0.2881021499633789, -0.13530012965202332, 0.017501890659332275, 0.17030391097068787, 0.32310593128204346, 0.47590792179107666, 0.6287099719047546, 0.7815120220184326, 0.9343140125274658, 1.087116003036499, 1.2399179935455322, 1.392720103263855, 1.5455220937728882, 1.6983240842819214, 1.8511261940002441, 2.0039281845092773, 2.1567301750183105, 2.3095321655273438, 2.462334156036377, 2.61513614654541, 2.7679381370544434, 2.9207401275634766, 3.073542356491089, 3.226344347000122, 3.3791463375091553, 3.5319483280181885, 3.6847503185272217, 3.837552309036255, 3.990354537963867, 4.1431565284729, 4.295958518981934, 4.448760509490967, 4.6015625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 4.0, 9.0, 9.0, 18.0, 13.0, 30.0, 26.0, 57.0, 84.0, 139.0, 255.0, 551.0, 1042.0, 2550.0, 7612.0, 33396.0, 298388.0, 633568.0, 53878.0, 10828.0, 3438.0, 1359.0, 577.0, 300.0, 149.0, 108.0, 51.0, 37.0, 24.0, 19.0, 8.0, 6.0, 8.0, 4.0, 0.0, 5.0, 6.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5908203125, -0.5712127685546875, -0.551605224609375, -0.5319976806640625, -0.51239013671875, -0.4927825927734375, -0.473175048828125, -0.4535675048828125, -0.4339599609375, -0.4143524169921875, -0.394744873046875, -0.3751373291015625, -0.35552978515625, -0.3359222412109375, -0.316314697265625, -0.2967071533203125, -0.277099609375, -0.2574920654296875, -0.237884521484375, -0.2182769775390625, -0.19866943359375, -0.1790618896484375, -0.159454345703125, -0.1398468017578125, -0.1202392578125, -0.1006317138671875, -0.081024169921875, -0.0614166259765625, -0.04180908203125, -0.0222015380859375, -0.002593994140625, 0.0170135498046875, 0.03662109375, 0.0562286376953125, 0.075836181640625, 0.0954437255859375, 0.11505126953125, 0.1346588134765625, 0.154266357421875, 0.1738739013671875, 0.1934814453125, 0.2130889892578125, 0.232696533203125, 0.2523040771484375, 0.27191162109375, 0.2915191650390625, 0.311126708984375, 0.3307342529296875, 0.350341796875, 0.3699493408203125, 0.389556884765625, 0.4091644287109375, 0.42877197265625, 0.4483795166015625, 0.467987060546875, 0.4875946044921875, 0.5072021484375, 0.5268096923828125, 0.546417236328125, 0.5660247802734375, 0.58563232421875, 0.6052398681640625, 0.624847412109375, 0.6444549560546875, 0.6640625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 8.0, 10.0, 14.0, 9.0, 27.0, 29.0, 42.0, 50.0, 76.0, 73.0, 81.0, 61.0, 80.0, 81.0, 78.0, 67.0, 56.0, 38.0, 40.0, 21.0, 23.0, 14.0, 10.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.443115234375, -0.4283714294433594, -0.41362762451171875, -0.3988838195800781, -0.3841400146484375, -0.3693962097167969, -0.35465240478515625, -0.3399085998535156, -0.325164794921875, -0.3104209899902344, -0.29567718505859375, -0.2809333801269531, -0.2661895751953125, -0.2514457702636719, -0.23670196533203125, -0.22195816040039062, -0.20721435546875, -0.19247055053710938, -0.17772674560546875, -0.16298294067382812, -0.1482391357421875, -0.13349533081054688, -0.11875152587890625, -0.10400772094726562, -0.089263916015625, -0.07452011108398438, -0.05977630615234375, -0.045032501220703125, -0.0302886962890625, -0.015544891357421875, -0.00080108642578125, 0.013942718505859375, 0.0286865234375, 0.043430328369140625, 0.05817413330078125, 0.07291793823242188, 0.0876617431640625, 0.10240554809570312, 0.11714935302734375, 0.13189315795898438, 0.146636962890625, 0.16138076782226562, 0.17612457275390625, 0.19086837768554688, 0.2056121826171875, 0.22035598754882812, 0.23509979248046875, 0.24984359741210938, 0.26458740234375, 0.2793312072753906, 0.29407501220703125, 0.3088188171386719, 0.3235626220703125, 0.3383064270019531, 0.35305023193359375, 0.3677940368652344, 0.382537841796875, 0.3972816467285156, 0.41202545166015625, 0.4267692565917969, 0.4415130615234375, 0.4562568664550781, 0.47100067138671875, 0.4857444763183594, 0.50048828125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 7.0, 2.0, 8.0, 9.0, 5.0, 17.0, 24.0, 26.0, 41.0, 71.0, 99.0, 139.0, 215.0, 392.0, 719.0, 1700.0, 6218.0, 43978.0, 909437.0, 72842.0, 8596.0, 2096.0, 838.0, 405.0, 209.0, 130.0, 99.0, 66.0, 51.0, 24.0, 18.0, 11.0, 19.0, 12.0, 11.0, 6.0, 7.0, 2.0, 2.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.58447265625, -0.56329345703125, -0.5421142578125, -0.52093505859375, -0.499755859375, -0.47857666015625, -0.4573974609375, -0.43621826171875, -0.4150390625, -0.39385986328125, -0.3726806640625, -0.35150146484375, -0.330322265625, -0.30914306640625, -0.2879638671875, -0.26678466796875, -0.24560546875, -0.22442626953125, -0.2032470703125, -0.18206787109375, -0.160888671875, -0.13970947265625, -0.1185302734375, -0.09735107421875, -0.076171875, -0.05499267578125, -0.0338134765625, -0.01263427734375, 0.008544921875, 0.02972412109375, 0.0509033203125, 0.07208251953125, 0.09326171875, 0.11444091796875, 0.1356201171875, 0.15679931640625, 0.177978515625, 0.19915771484375, 0.2203369140625, 0.24151611328125, 0.2626953125, 0.28387451171875, 0.3050537109375, 0.32623291015625, 0.347412109375, 0.36859130859375, 0.3897705078125, 0.41094970703125, 0.43212890625, 0.45330810546875, 0.4744873046875, 0.49566650390625, 0.516845703125, 0.53802490234375, 0.5592041015625, 0.58038330078125, 0.6015625, 0.62274169921875, 0.6439208984375, 0.66510009765625, 0.686279296875, 0.70745849609375, 0.7286376953125, 0.74981689453125, 0.77099609375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 6.0, 10.0, 14.0, 17.0, 20.0, 17.0, 23.0, 26.0, 40.0, 27.0, 50.0, 68.0, 88.0, 93.0, 106.0, 85.0, 55.0, 51.0, 42.0, 38.0, 28.0, 23.0, 15.0, 15.0, 10.0, 10.0, 3.0, 12.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3525390625, -1.305908203125, -1.25927734375, -1.212646484375, -1.166015625, -1.119384765625, -1.07275390625, -1.026123046875, -0.9794921875, -0.932861328125, -0.88623046875, -0.839599609375, -0.79296875, -0.746337890625, -0.69970703125, -0.653076171875, -0.6064453125, -0.559814453125, -0.51318359375, -0.466552734375, -0.419921875, -0.373291015625, -0.32666015625, -0.280029296875, -0.2333984375, -0.186767578125, -0.14013671875, -0.093505859375, -0.046875, -0.000244140625, 0.04638671875, 0.093017578125, 0.1396484375, 0.186279296875, 0.23291015625, 0.279541015625, 0.326171875, 0.372802734375, 0.41943359375, 0.466064453125, 0.5126953125, 0.559326171875, 0.60595703125, 0.652587890625, 0.69921875, 0.745849609375, 0.79248046875, 0.839111328125, 0.8857421875, 0.932373046875, 0.97900390625, 1.025634765625, 1.072265625, 1.118896484375, 1.16552734375, 1.212158203125, 1.2587890625, 1.305419921875, 1.35205078125, 1.398681640625, 1.4453125, 1.491943359375, 1.53857421875, 1.585205078125, 1.6318359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 4.0, 3.0, 0.0, 4.0, 5.0, 8.0, 7.0, 7.0, 15.0, 11.0, 30.0, 40.0, 55.0, 116.0, 260.0, 638.0, 2243.0, 17997.0, 997083.0, 26053.0, 2614.0, 728.0, 298.0, 122.0, 74.0, 49.0, 25.0, 17.0, 9.0, 7.0, 6.0, 4.0, 8.0, 2.0, 2.0, 6.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25390625, -0.2461071014404297, -0.23830795288085938, -0.23050880432128906, -0.22270965576171875, -0.21491050720214844, -0.20711135864257812, -0.1993122100830078, -0.1915130615234375, -0.1837139129638672, -0.17591476440429688, -0.16811561584472656, -0.16031646728515625, -0.15251731872558594, -0.14471817016601562, -0.1369190216064453, -0.129119873046875, -0.12132072448730469, -0.11352157592773438, -0.10572242736816406, -0.09792327880859375, -0.09012413024902344, -0.08232498168945312, -0.07452583312988281, -0.0667266845703125, -0.05892753601074219, -0.051128387451171875, -0.04332923889160156, -0.03553009033203125, -0.027730941772460938, -0.019931793212890625, -0.012132644653320312, -0.00433349609375, 0.0034656524658203125, 0.011264801025390625, 0.019063949584960938, 0.02686309814453125, 0.03466224670410156, 0.042461395263671875, 0.05026054382324219, 0.0580596923828125, 0.06585884094238281, 0.07365798950195312, 0.08145713806152344, 0.08925628662109375, 0.09705543518066406, 0.10485458374023438, 0.11265373229980469, 0.120452880859375, 0.1282520294189453, 0.13605117797851562, 0.14385032653808594, 0.15164947509765625, 0.15944862365722656, 0.16724777221679688, 0.1750469207763672, 0.1828460693359375, 0.1906452178955078, 0.19844436645507812, 0.20624351501464844, 0.21404266357421875, 0.22184181213378906, 0.22964096069335938, 0.2374401092529297, 0.2452392578125]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 1.0, 1.0, 3.0, 4.0, 4.0, 4.0, 8.0, 7.0, 8.0, 11.0, 17.0, 25.0, 17.0, 27.0, 42.0, 51.0, 64.0, 64.0, 89.0, 117.0, 87.0, 71.0, 60.0, 40.0, 43.0, 23.0, 25.0, 20.0, 7.0, 7.0, 14.0, 8.0, 10.0, 5.0, 3.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.956390380859375e-05, -2.8653070330619812e-05, -2.7742236852645874e-05, -2.6831403374671936e-05, -2.5920569896697998e-05, -2.500973641872406e-05, -2.4098902940750122e-05, -2.3188069462776184e-05, -2.2277235984802246e-05, -2.1366402506828308e-05, -2.045556902885437e-05, -1.9544735550880432e-05, -1.8633902072906494e-05, -1.7723068594932556e-05, -1.6812235116958618e-05, -1.590140163898468e-05, -1.4990568161010742e-05, -1.4079734683036804e-05, -1.3168901205062866e-05, -1.2258067727088928e-05, -1.134723424911499e-05, -1.0436400771141052e-05, -9.525567293167114e-06, -8.614733815193176e-06, -7.703900337219238e-06, -6.7930668592453e-06, -5.882233381271362e-06, -4.971399903297424e-06, -4.060566425323486e-06, -3.1497329473495483e-06, -2.2388994693756104e-06, -1.3280659914016724e-06, -4.172325134277344e-07, 4.936009645462036e-07, 1.4044344425201416e-06, 2.3152679204940796e-06, 3.2261013984680176e-06, 4.1369348764419556e-06, 5.0477683544158936e-06, 5.9586018323898315e-06, 6.8694353103637695e-06, 7.780268788337708e-06, 8.691102266311646e-06, 9.601935744285583e-06, 1.0512769222259521e-05, 1.142360270023346e-05, 1.2334436178207397e-05, 1.3245269656181335e-05, 1.4156103134155273e-05, 1.5066936612129211e-05, 1.597777009010315e-05, 1.6888603568077087e-05, 1.7799437046051025e-05, 1.8710270524024963e-05, 1.96211040019989e-05, 2.053193747997284e-05, 2.1442770957946777e-05, 2.2353604435920715e-05, 2.3264437913894653e-05, 2.417527139186859e-05, 2.508610486984253e-05, 2.5996938347816467e-05, 2.6907771825790405e-05, 2.7818605303764343e-05, 2.872943878173828e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 6.0, 5.0, 12.0, 4.0, 4.0, 11.0, 14.0, 17.0, 17.0, 35.0, 59.0, 93.0, 118.0, 238.0, 427.0, 986.0, 2646.0, 7921.0, 32234.0, 791966.0, 180390.0, 21615.0, 5849.0, 2009.0, 902.0, 404.0, 217.0, 110.0, 69.0, 46.0, 27.0, 29.0, 16.0, 13.0, 11.0, 5.0, 6.0, 6.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0867919921875, -0.08398056030273438, -0.08116912841796875, -0.07835769653320312, -0.0755462646484375, -0.07273483276367188, -0.06992340087890625, -0.06711196899414062, -0.064300537109375, -0.061489105224609375, -0.05867767333984375, -0.055866241455078125, -0.0530548095703125, -0.050243377685546875, -0.04743194580078125, -0.044620513916015625, -0.04180908203125, -0.038997650146484375, -0.03618621826171875, -0.033374786376953125, -0.0305633544921875, -0.027751922607421875, -0.02494049072265625, -0.022129058837890625, -0.019317626953125, -0.016506195068359375, -0.01369476318359375, -0.010883331298828125, -0.0080718994140625, -0.005260467529296875, -0.00244903564453125, 0.000362396240234375, 0.003173828125, 0.005985260009765625, 0.00879669189453125, 0.011608123779296875, 0.0144195556640625, 0.017230987548828125, 0.02004241943359375, 0.022853851318359375, 0.025665283203125, 0.028476715087890625, 0.03128814697265625, 0.034099578857421875, 0.0369110107421875, 0.039722442626953125, 0.04253387451171875, 0.045345306396484375, 0.04815673828125, 0.050968170166015625, 0.05377960205078125, 0.056591033935546875, 0.0594024658203125, 0.062213897705078125, 0.06502532958984375, 0.06783676147460938, 0.070648193359375, 0.07345962524414062, 0.07627105712890625, 0.07908248901367188, 0.0818939208984375, 0.08470535278320312, 0.08751678466796875, 0.09032821655273438, 0.0931396484375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 8.0, 5.0, 5.0, 8.0, 12.0, 22.0, 30.0, 41.0, 85.0, 125.0, 244.0, 171.0, 86.0, 54.0, 32.0, 17.0, 19.0, 13.0, 11.0, 9.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.180419921875, -0.17488670349121094, -0.16935348510742188, -0.1638202667236328, -0.15828704833984375, -0.1527538299560547, -0.14722061157226562, -0.14168739318847656, -0.1361541748046875, -0.13062095642089844, -0.12508773803710938, -0.11955451965332031, -0.11402130126953125, -0.10848808288574219, -0.10295486450195312, -0.09742164611816406, -0.091888427734375, -0.08635520935058594, -0.08082199096679688, -0.07528877258300781, -0.06975555419921875, -0.06422233581542969, -0.058689117431640625, -0.05315589904785156, -0.0476226806640625, -0.04208946228027344, -0.036556243896484375, -0.031023025512695312, -0.02548980712890625, -0.019956588745117188, -0.014423370361328125, -0.008890151977539062, -0.00335693359375, 0.0021762847900390625, 0.007709503173828125, 0.013242721557617188, 0.01877593994140625, 0.024309158325195312, 0.029842376708984375, 0.03537559509277344, 0.0409088134765625, 0.04644203186035156, 0.051975250244140625, 0.05750846862792969, 0.06304168701171875, 0.06857490539550781, 0.07410812377929688, 0.07964134216308594, 0.085174560546875, 0.09070777893066406, 0.09624099731445312, 0.10177421569824219, 0.10730743408203125, 0.11284065246582031, 0.11837387084960938, 0.12390708923339844, 0.1294403076171875, 0.13497352600097656, 0.14050674438476562, 0.1460399627685547, 0.15157318115234375, 0.1571063995361328, 0.16263961791992188, 0.16817283630371094, 0.1737060546875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 9.0, 14.0, 19.0, 41.0, 135.0, 504.0, 165.0, 56.0, 25.0, 16.0, 10.0, 6.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.413158416748047, -5.20941686630249, -5.005674839019775, -4.801933288574219, -4.598191261291504, -4.394449710845947, -4.190708160400391, -3.986966133117676, -3.783224582672119, -3.5794827938079834, -3.3757410049438477, -3.171999454498291, -2.9682576656341553, -2.7645158767700195, -2.560774087905884, -2.357032299041748, -2.1532905101776123, -1.9495487213134766, -1.7458070516586304, -1.5420652627944946, -1.3383235931396484, -1.1345818042755127, -0.930840015411377, -0.7270983457565308, -0.523356556892395, -0.31961482763290405, -0.1158730685710907, 0.08786869049072266, 0.2916104197502136, 0.4953521490097046, 0.6990939378738403, 0.9028356075286865, 1.1065773963928223, 1.310319185256958, 1.5140608549118042, 1.71780264377594, 1.9215443134307861, 2.125286102294922, 2.3290278911590576, 2.5327696800231934, 2.73651123046875, 2.9402530193328857, 3.1439948081970215, 3.347736358642578, 3.551478147506714, 3.7552199363708496, 3.9589617252349854, 4.162703514099121, 4.366445541381836, 4.570187091827393, 4.773929119110107, 4.977670669555664, 5.181412696838379, 5.3851542472839355, 5.588895797729492, 5.792637825012207, 5.996379375457764, 6.20012092590332, 6.403862953186035, 6.607604503631592, 6.811346530914307, 7.015088081359863, 7.218830108642578, 7.422571659088135, 7.626313209533691]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 6.0, 2.0, 7.0, 3.0, 6.0, 7.0, 6.0, 18.0, 9.0, 18.0, 14.0, 18.0, 24.0, 28.0, 31.0, 63.0, 109.0, 124.0, 133.0, 108.0, 54.0, 28.0, 29.0, 20.0, 19.0, 8.0, 14.0, 13.0, 14.0, 9.0, 10.0, 10.0, 13.0, 10.0, 6.0, 5.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.9889779090881348, -2.8852453231811523, -2.781512975692749, -2.6777803897857666, -2.574047803878784, -2.470315456390381, -2.3665828704833984, -2.262850284576416, -2.1591179370880127, -2.0553853511810303, -1.9516528844833374, -1.8479204177856445, -1.7441879510879517, -1.6404554843902588, -1.5367228984832764, -1.4329904317855835, -1.329257845878601, -1.2255253791809082, -1.1217927932739258, -1.018060326576233, -0.91432785987854, -0.8105953335762024, -0.7068628072738647, -0.6031303405761719, -0.49939781427383423, -0.39566531777381897, -0.2919328212738037, -0.18820029497146606, -0.0844677984714508, 0.019264698028564453, 0.1229972243309021, 0.22672969102859497, 0.3304622173309326, 0.4341947138309479, 0.5379272103309631, 0.6416597366333008, 0.7453922033309937, 0.8491247296333313, 0.952857255935669, 1.0565897226333618, 1.1603221893310547, 1.2640546560287476, 1.36778724193573, 1.4715197086334229, 1.5752521753311157, 1.6789846420288086, 1.782717227935791, 1.8864496946334839, 1.9901822805404663, 2.093914747238159, 2.1976473331451416, 2.301379680633545, 2.4051122665405273, 2.5088448524475098, 2.612577438354492, 2.7163097858428955, 2.820042371749878, 2.9237749576568604, 3.0275073051452637, 3.131239891052246, 3.2349724769592285, 3.338704824447632, 3.4424374103546143, 3.5461697578430176, 3.64990234375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 4.0, 8.0, 10.0, 14.0, 10.0, 19.0, 23.0, 33.0, 25.0, 39.0, 45.0, 54.0, 246.0, 182.0, 55.0, 37.0, 35.0, 27.0, 28.0, 21.0, 19.0, 12.0, 6.0, 10.0, 8.0, 6.0, 6.0, 4.0, 4.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.366455078125, -0.3562660217285156, -0.34607696533203125, -0.3358879089355469, -0.3256988525390625, -0.3155097961425781, -0.30532073974609375, -0.2951316833496094, -0.284942626953125, -0.2747535705566406, -0.26456451416015625, -0.2543754577636719, -0.2441864013671875, -0.23399734497070312, -0.22380828857421875, -0.21361923217773438, -0.20343017578125, -0.19324111938476562, -0.18305206298828125, -0.17286300659179688, -0.1626739501953125, -0.15248489379882812, -0.14229583740234375, -0.13210678100585938, -0.121917724609375, -0.11172866821289062, -0.10153961181640625, -0.09135055541992188, -0.0811614990234375, -0.07097244262695312, -0.06078338623046875, -0.050594329833984375, -0.0404052734375, -0.030216217041015625, -0.02002716064453125, -0.009838104248046875, 0.0003509521484375, 0.010540008544921875, 0.02072906494140625, 0.030918121337890625, 0.041107177734375, 0.051296234130859375, 0.06148529052734375, 0.07167434692382812, 0.0818634033203125, 0.09205245971679688, 0.10224151611328125, 0.11243057250976562, 0.12261962890625, 0.13280868530273438, 0.14299774169921875, 0.15318679809570312, 0.1633758544921875, 0.17356491088867188, 0.18375396728515625, 0.19394302368164062, 0.204132080078125, 0.21432113647460938, 0.22451019287109375, 0.23469924926757812, 0.2448883056640625, 0.2550773620605469, 0.26526641845703125, 0.2754554748535156, 0.28564453125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 11.0, 6.0, 10.0, 14.0, 24.0, 34.0, 54.0, 82.0, 188.0, 428.0, 1302.0, 7673.0, 8353401.0, 21995.0, 2243.0, 606.0, 211.0, 109.0, 70.0, 42.0, 27.0, 15.0, 10.0, 14.0, 7.0, 1.0, 5.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-3.2009358406066895, -3.0998992919921875, -2.9988627433776855, -2.8978259563446045, -2.7967894077301025, -2.6957528591156006, -2.5947160720825195, -2.4936795234680176, -2.3926429748535156, -2.2916064262390137, -2.1905698776245117, -2.0895330905914307, -1.9884965419769287, -1.8874599933624268, -1.7864233255386353, -1.6853866577148438, -1.5843501091003418, -1.4833135604858398, -1.3822768926620483, -1.2812402248382568, -1.1802036762237549, -1.079167127609253, -0.9781304597854614, -0.8770938515663147, -0.776057243347168, -0.6750206351280212, -0.5739840269088745, -0.4729474186897278, -0.37191081047058105, -0.2708742022514343, -0.1698375940322876, -0.06880098581314087, 0.03223562240600586, 0.1332722306251526, 0.23430883884429932, 0.33534544706344604, 0.4363820552825928, 0.5374186635017395, 0.6384552717208862, 0.739491879940033, 0.8405284881591797, 0.9415650963783264, 1.0426017045974731, 1.1436383724212646, 1.2446749210357666, 1.3457114696502686, 1.44674813747406, 1.5477848052978516, 1.6488213539123535, 1.7498579025268555, 1.850894570350647, 1.9519312381744385, 2.0529677867889404, 2.1540043354034424, 2.2550411224365234, 2.3560776710510254, 2.4571142196655273, 2.5581507682800293, 2.6591873168945312, 2.7602241039276123, 2.8612606525421143, 2.962297201156616, 3.0633339881896973, 3.164370536804199, 3.265407085418701]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 7.0, 6.0, 8.0, 6.0, 3.0, 7.0, 3.0, 5.0, 2.0, 2.0, 5.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.642054557800293, -3.5252161026000977, -3.4083776473999023, -3.291539192199707, -3.1747007369995117, -3.0578622817993164, -2.941023826599121, -2.824185371398926, -2.7073469161987305, -2.590508460998535, -2.47367000579834, -2.3568315505981445, -2.239993095397949, -2.123154640197754, -2.0063161849975586, -1.8894778490066528, -1.772639513015747, -1.6558010578155518, -1.5389626026153564, -1.4221241474151611, -1.3052856922149658, -1.1884472370147705, -1.0716089010238647, -0.9547704458236694, -0.8379319906234741, -0.7210935354232788, -0.6042550802230835, -0.48741668462753296, -0.37057822942733765, -0.25373977422714233, -0.1369013786315918, -0.020062923431396484, 0.09677553176879883, 0.21361397206783295, 0.33045241236686707, 0.44729083776474, 0.5641292929649353, 0.6809677481651306, 0.7978061437606812, 0.9146445989608765, 1.0314830541610718, 1.148321509361267, 1.2651599645614624, 1.3819983005523682, 1.4988367557525635, 1.6156752109527588, 1.732513666152954, 1.8493521213531494, 1.9661905765533447, 2.08302903175354, 2.1998674869537354, 2.3167059421539307, 2.433544397354126, 2.5503828525543213, 2.6672210693359375, 2.784059524536133, 2.900897979736328, 3.0177364349365234, 3.1345748901367188, 3.251413345336914, 3.3682518005371094, 3.4850902557373047, 3.6019287109375, 3.7187671661376953, 3.8356056213378906]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 4.0, 2.0, 4.0, 2.0, 8.0, 12.0, 11.0, 21.0, 26.0, 49.0, 53.0, 91.0, 95.0, 149.0, 276.0, 367.0, 687.0, 1155.0, 2159.0, 4449.0, 9143.0, 20658.0, 48624.0, 114610.0, 164646.0, 89187.0, 36980.0, 16123.0, 7149.0, 3415.0, 1733.0, 957.0, 483.0, 297.0, 221.0, 110.0, 84.0, 45.0, 40.0, 42.0, 25.0, 17.0, 18.0, 8.0, 6.0, 8.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 4.0, 0.0, 2.0], "bins": [-1.3154296875, -1.2759857177734375, -1.236541748046875, -1.1970977783203125, -1.15765380859375, -1.1182098388671875, -1.078765869140625, -1.0393218994140625, -0.9998779296875, -0.9604339599609375, -0.920989990234375, -0.8815460205078125, -0.84210205078125, -0.8026580810546875, -0.763214111328125, -0.7237701416015625, -0.684326171875, -0.6448822021484375, -0.605438232421875, -0.5659942626953125, -0.52655029296875, -0.4871063232421875, -0.447662353515625, -0.4082183837890625, -0.3687744140625, -0.3293304443359375, -0.289886474609375, -0.2504425048828125, -0.21099853515625, -0.1715545654296875, -0.132110595703125, -0.0926666259765625, -0.05322265625, -0.0137786865234375, 0.025665283203125, 0.0651092529296875, 0.10455322265625, 0.1439971923828125, 0.183441162109375, 0.2228851318359375, 0.2623291015625, 0.3017730712890625, 0.341217041015625, 0.3806610107421875, 0.42010498046875, 0.4595489501953125, 0.498992919921875, 0.5384368896484375, 0.577880859375, 0.6173248291015625, 0.656768798828125, 0.6962127685546875, 0.73565673828125, 0.7751007080078125, 0.814544677734375, 0.8539886474609375, 0.8934326171875, 0.9328765869140625, 0.972320556640625, 1.0117645263671875, 1.05120849609375, 1.0906524658203125, 1.130096435546875, 1.1695404052734375, 1.208984375]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 4.0, 10.0, 21.0, 22.0, 39.0, 33.0, 55.0, 60.0, 79.0, 99.0, 100.0, 109.0, 78.0, 64.0, 78.0, 46.0, 25.0, 21.0, 20.0, 14.0, 9.0, 3.0, 5.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.377197265625, -0.3625831604003906, -0.34796905517578125, -0.3333549499511719, -0.3187408447265625, -0.3041267395019531, -0.28951263427734375, -0.2748985290527344, -0.260284423828125, -0.24567031860351562, -0.23105621337890625, -0.21644210815429688, -0.2018280029296875, -0.18721389770507812, -0.17259979248046875, -0.15798568725585938, -0.14337158203125, -0.12875747680664062, -0.11414337158203125, -0.09952926635742188, -0.0849151611328125, -0.07030105590820312, -0.05568695068359375, -0.041072845458984375, -0.026458740234375, -0.011844635009765625, 0.00276947021484375, 0.017383575439453125, 0.0319976806640625, 0.046611785888671875, 0.06122589111328125, 0.07583999633789062, 0.0904541015625, 0.10506820678710938, 0.11968231201171875, 0.13429641723632812, 0.1489105224609375, 0.16352462768554688, 0.17813873291015625, 0.19275283813476562, 0.207366943359375, 0.22198104858398438, 0.23659515380859375, 0.2512092590332031, 0.2658233642578125, 0.2804374694824219, 0.29505157470703125, 0.3096656799316406, 0.32427978515625, 0.3388938903808594, 0.35350799560546875, 0.3681221008300781, 0.3827362060546875, 0.3973503112792969, 0.41196441650390625, 0.4265785217285156, 0.441192626953125, 0.4558067321777344, 0.47042083740234375, 0.4850349426269531, 0.4996490478515625, 0.5142631530761719, 0.5288772583007812, 0.5434913635253906, 0.55810546875]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 0.0, 5.0, 2.0, 5.0, 2.0, 8.0, 15.0, 52.0, 94.0, 117.0, 79.0, 55.0, 15.0, 10.0, 13.0, 2.0, 3.0, 3.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.205970048904419, -2.1148102283477783, -2.023650646209717, -1.9324908256530762, -1.8413312435150146, -1.750171422958374, -1.659011721611023, -1.5678520202636719, -1.4766923189163208, -1.3855326175689697, -1.2943729162216187, -1.2032132148742676, -1.112053394317627, -1.0208938121795654, -0.9297339916229248, -0.8385742902755737, -0.7474145889282227, -0.6562548875808716, -0.5650951862335205, -0.47393542528152466, -0.3827757239341736, -0.2916160225868225, -0.20045626163482666, -0.10929656028747559, -0.01813685894012451, 0.07302285730838776, 0.16418257355690002, 0.2553423047065735, 0.34650200605392456, 0.43766170740127563, 0.5288214683532715, 0.6199811697006226, 0.7111411094665527, 0.8023008108139038, 0.8934605121612549, 0.9846202731132507, 1.075779914855957, 1.1669397354125977, 1.2580994367599487, 1.3492591381072998, 1.4404188394546509, 1.531578540802002, 1.622738242149353, 1.713897943496704, 1.8050577640533447, 1.8962173461914062, 1.9873771667480469, 2.0785369873046875, 2.169696569442749, 2.2608563899993896, 2.352015972137451, 2.443175792694092, 2.5343353748321533, 2.625495195388794, 2.7166547775268555, 2.807814598083496, 2.8989744186401367, 2.9901342391967773, 3.081293821334839, 3.1724536418914795, 3.263613224029541, 3.3547730445861816, 3.4459328651428223, 3.537092447280884, 3.6282520294189453]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 6.0, 8.0, 22.0, 37.0, 66.0, 87.0, 84.0, 60.0, 31.0, 22.0, 8.0, 9.0, 2.0, 5.0, 4.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7852325439453125, -1.7204234600067139, -1.6556144952774048, -1.5908054113388062, -1.525996446609497, -1.4611873626708984, -1.3963782787322998, -1.3315691947937012, -1.266760230064392, -1.2019511461257935, -1.1371421813964844, -1.0723330974578857, -1.007524013519287, -0.942715048789978, -0.8779059648513794, -0.8130969405174255, -0.7482879161834717, -0.6834788918495178, -0.618669867515564, -0.5538607835769653, -0.4890517592430115, -0.4242427349090576, -0.35943368077278137, -0.2946246266365051, -0.22981560230255127, -0.16500656306743622, -0.10019752383232117, -0.035388484597206116, 0.029420554637908936, 0.09422957897186279, 0.15903863310813904, 0.22384768724441528, 0.28865671157836914, 0.353465735912323, 0.41827479004859924, 0.4830838441848755, 0.5478928685188293, 0.6127018928527832, 0.6775109767913818, 0.7423200011253357, 0.8071290254592896, 0.8719380497932434, 0.9367470741271973, 1.001556158065796, 1.0663652420043945, 1.1311742067337036, 1.1959832906723022, 1.2607922554016113, 1.32560133934021, 1.3904104232788086, 1.4552193880081177, 1.5200284719467163, 1.5848374366760254, 1.649646520614624, 1.7144556045532227, 1.7792646884918213, 1.8440736532211304, 1.908882737159729, 1.973691701889038, 2.0385007858276367, 2.1033098697662354, 2.168118953704834, 2.2329277992248535, 2.297736883163452, 2.362545967102051]}, "train/train_runtime": 5167.2788, "train/train_samples_per_second": 5.523, "train/train_steps_per_second": 0.086, "train/total_flos": 0.0, "train/train_loss": 4.383164462487259, "eval/loss": 4.685743808746338, "eval/wer": 2.314676715589052, "eval/runtime": 1113.6363, "eval/samples_per_second": 2.372, "eval/steps_per_second": 0.297, "_wandb": {"runtime": 6665}}