{"train/loss": 3.4805, "train/learning_rate": 3.1152647975077885e-07, "train/epoch": 1.0, "train/global_step": 1784, "_runtime": 9938, "_timestamp": 1646164834, "_step": 1788, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 8.0, 17.0, 19.0, 52.0, 108.0, 280.0, 250.0, 111.0, 44.0, 41.0, 26.0, 16.0, 8.0, 5.0, 4.0, 2.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-254.1670684814453, -248.654052734375, -243.14105224609375, -237.62803649902344, -232.1150360107422, -226.60202026367188, -221.08901977539062, -215.5760040283203, -210.06298828125, -204.5499725341797, -199.03697204589844, -193.52395629882812, -188.01095581054688, -182.49794006347656, -176.98492431640625, -171.471923828125, -165.95892333984375, -160.44590759277344, -154.9329071044922, -149.41989135742188, -143.90689086914062, -138.3938751220703, -132.880859375, -127.36785888671875, -121.85485076904297, -116.34184265136719, -110.8288345336914, -105.31582641601562, -99.80281066894531, -94.28981018066406, -88.77679443359375, -83.26378631591797, -77.75078582763672, -72.23777770996094, -66.72476959228516, -61.21175765991211, -55.69874954223633, -50.18574142456055, -44.6727294921875, -39.15972137451172, -33.64671325683594, -28.133705139160156, -22.620695114135742, -17.107685089111328, -11.594676971435547, -6.081668853759766, -0.5686569213867188, 4.9443511962890625, 10.457359313964844, 15.970368385314941, 21.48337745666504, 26.996387481689453, 32.509395599365234, 38.022403717041016, 43.53541564941406, 49.048423767089844, 54.561431884765625, 60.074440002441406, 65.58744812011719, 71.1004638671875, 76.61346435546875, 82.12648010253906, 87.63948822021484, 93.15249633789062, 98.6655044555664]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 4.0, 1.0, 4.0, 0.0, 1.0, 6.0, 3.0, 9.0, 11.0, 8.0, 13.0, 8.0, 13.0, 12.0, 23.0, 17.0, 23.0, 24.0, 26.0, 21.0, 23.0, 43.0, 67.0, 77.0, 103.0, 92.0, 79.0, 66.0, 38.0, 29.0, 19.0, 15.0, 20.0, 20.0, 13.0, 11.0, 11.0, 10.0, 8.0, 11.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-328.735595703125, -319.05816650390625, -309.3807373046875, -299.70330810546875, -290.02587890625, -280.34844970703125, -270.6710205078125, -260.9935607910156, -251.31613159179688, -241.63870239257812, -231.96127319335938, -222.28384399414062, -212.6063995361328, -202.92897033691406, -193.2515411376953, -183.5740966796875, -173.8966827392578, -164.21925354003906, -154.5418243408203, -144.8643798828125, -135.18695068359375, -125.509521484375, -115.83209228515625, -106.15465545654297, -96.47722625732422, -86.79979705810547, -77.12236022949219, -67.44493103027344, -57.76749801635742, -48.090065002441406, -38.412635803222656, -28.735198974609375, -19.057769775390625, -9.380337715148926, 0.29709434509277344, 9.974525451660156, 19.651958465576172, 29.329391479492188, 39.00682067871094, 48.68425750732422, 58.36168670654297, 68.03911590576172, 77.716552734375, 87.39398193359375, 97.0714111328125, 106.74884796142578, 116.42627716064453, 126.10371398925781, 135.78114318847656, 145.4585723876953, 155.13600158691406, 164.81344604492188, 174.49087524414062, 184.16830444335938, 193.84573364257812, 203.52316284179688, 213.20059204101562, 222.87802124023438, 232.55545043945312, 242.23287963867188, 251.9103240966797, 261.5877685546875, 271.26519775390625, 280.942626953125, 290.62005615234375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 2.0, 0.0, 2.0, 4.0, 2.0, 1.0, 6.0, 7.0, 12.0, 11.0, 11.0, 8.0, 17.0, 19.0, 18.0, 19.0, 30.0, 16.0, 30.0, 29.0, 35.0, 72.0, 65.0, 79.0, 86.0, 75.0, 73.0, 55.0, 36.0, 33.0, 18.0, 19.0, 20.0, 18.0, 14.0, 10.0, 6.0, 11.0, 10.0, 7.0, 4.0, 4.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.234375, -9.9219970703125, -9.609619140625, -9.2972412109375, -8.98486328125, -8.6724853515625, -8.360107421875, -8.0477294921875, -7.7353515625, -7.4229736328125, -7.110595703125, -6.7982177734375, -6.48583984375, -6.1734619140625, -5.861083984375, -5.5487060546875, -5.236328125, -4.9239501953125, -4.611572265625, -4.2991943359375, -3.98681640625, -3.6744384765625, -3.362060546875, -3.0496826171875, -2.7373046875, -2.4249267578125, -2.112548828125, -1.8001708984375, -1.48779296875, -1.1754150390625, -0.863037109375, -0.5506591796875, -0.23828125, 0.0740966796875, 0.386474609375, 0.6988525390625, 1.01123046875, 1.3236083984375, 1.635986328125, 1.9483642578125, 2.2607421875, 2.5731201171875, 2.885498046875, 3.1978759765625, 3.51025390625, 3.8226318359375, 4.135009765625, 4.4473876953125, 4.759765625, 5.0721435546875, 5.384521484375, 5.6968994140625, 6.00927734375, 6.3216552734375, 6.634033203125, 6.9464111328125, 7.2587890625, 7.5711669921875, 7.883544921875, 8.1959228515625, 8.50830078125, 8.8206787109375, 9.133056640625, 9.4454345703125, 9.7578125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 2.0, 8.0, 7.0, 11.0, 15.0, 17.0, 28.0, 26.0, 45.0, 56.0, 58.0, 123.0, 160.0, 206.0, 339.0, 539.0, 915.0, 1751.0, 3869.0, 9968.0, 40686.0, 3829855.0, 278658.0, 16287.0, 5380.0, 2248.0, 1170.0, 611.0, 389.0, 238.0, 173.0, 111.0, 90.0, 63.0, 41.0, 33.0, 29.0, 13.0, 14.0, 14.0, 9.0, 8.0, 6.0, 5.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-73.9375, -71.6787109375, -69.419921875, -67.1611328125, -64.90234375, -62.6435546875, -60.384765625, -58.1259765625, -55.8671875, -53.6083984375, -51.349609375, -49.0908203125, -46.83203125, -44.5732421875, -42.314453125, -40.0556640625, -37.796875, -35.5380859375, -33.279296875, -31.0205078125, -28.76171875, -26.5029296875, -24.244140625, -21.9853515625, -19.7265625, -17.4677734375, -15.208984375, -12.9501953125, -10.69140625, -8.4326171875, -6.173828125, -3.9150390625, -1.65625, 0.6025390625, 2.861328125, 5.1201171875, 7.37890625, 9.6376953125, 11.896484375, 14.1552734375, 16.4140625, 18.6728515625, 20.931640625, 23.1904296875, 25.44921875, 27.7080078125, 29.966796875, 32.2255859375, 34.484375, 36.7431640625, 39.001953125, 41.2607421875, 43.51953125, 45.7783203125, 48.037109375, 50.2958984375, 52.5546875, 54.8134765625, 57.072265625, 59.3310546875, 61.58984375, 63.8486328125, 66.107421875, 68.3662109375, 70.625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 4.0, 3.0, 5.0, 2.0, 3.0, 4.0, 11.0, 9.0, 13.0, 16.0, 20.0, 27.0, 32.0, 38.0, 65.0, 83.0, 129.0, 271.0, 571.0, 910.0, 781.0, 413.0, 233.0, 125.0, 82.0, 50.0, 38.0, 30.0, 21.0, 19.0, 10.0, 9.0, 13.0, 9.0, 7.0, 6.0, 6.0, 4.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-39.8125, -38.70068359375, -37.5888671875, -36.47705078125, -35.365234375, -34.25341796875, -33.1416015625, -32.02978515625, -30.91796875, -29.80615234375, -28.6943359375, -27.58251953125, -26.470703125, -25.35888671875, -24.2470703125, -23.13525390625, -22.0234375, -20.91162109375, -19.7998046875, -18.68798828125, -17.576171875, -16.46435546875, -15.3525390625, -14.24072265625, -13.12890625, -12.01708984375, -10.9052734375, -9.79345703125, -8.681640625, -7.56982421875, -6.4580078125, -5.34619140625, -4.234375, -3.12255859375, -2.0107421875, -0.89892578125, 0.212890625, 1.32470703125, 2.4365234375, 3.54833984375, 4.66015625, 5.77197265625, 6.8837890625, 7.99560546875, 9.107421875, 10.21923828125, 11.3310546875, 12.44287109375, 13.5546875, 14.66650390625, 15.7783203125, 16.89013671875, 18.001953125, 19.11376953125, 20.2255859375, 21.33740234375, 22.44921875, 23.56103515625, 24.6728515625, 25.78466796875, 26.896484375, 28.00830078125, 29.1201171875, 30.23193359375, 31.34375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 9.0, 6.0, 14.0, 9.0, 18.0, 15.0, 21.0, 29.0, 42.0, 41.0, 63.0, 83.0, 113.0, 168.0, 251.0, 484.0, 1171.0, 5046.0, 40401.0, 3845028.0, 283300.0, 13704.0, 2394.0, 745.0, 391.0, 188.0, 138.0, 86.0, 79.0, 55.0, 38.0, 36.0, 26.0, 20.0, 14.0, 15.0, 11.0, 13.0, 6.0, 5.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.4375, -106.9609375, -103.484375, -100.0078125, -96.53125, -93.0546875, -89.578125, -86.1015625, -82.625, -79.1484375, -75.671875, -72.1953125, -68.71875, -65.2421875, -61.765625, -58.2890625, -54.8125, -51.3359375, -47.859375, -44.3828125, -40.90625, -37.4296875, -33.953125, -30.4765625, -27.0, -23.5234375, -20.046875, -16.5703125, -13.09375, -9.6171875, -6.140625, -2.6640625, 0.8125, 4.2890625, 7.765625, 11.2421875, 14.71875, 18.1953125, 21.671875, 25.1484375, 28.625, 32.1015625, 35.578125, 39.0546875, 42.53125, 46.0078125, 49.484375, 52.9609375, 56.4375, 59.9140625, 63.390625, 66.8671875, 70.34375, 73.8203125, 77.296875, 80.7734375, 84.25, 87.7265625, 91.203125, 94.6796875, 98.15625, 101.6328125, 105.109375, 108.5859375, 112.0625]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 1.0, 6.0, 5.0, 12.0, 8.0, 11.0, 11.0, 27.0, 35.0, 58.0, 88.0, 100.0, 134.0, 157.0, 120.0, 83.0, 48.0, 30.0, 25.0, 22.0, 13.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-51.20794677734375, -48.859764099121094, -46.51158142089844, -44.16339874267578, -41.815216064453125, -39.46703338623047, -37.11885070800781, -34.770668029785156, -32.4224853515625, -30.074302673339844, -27.726119995117188, -25.37793731689453, -23.029754638671875, -20.68157196044922, -18.333389282226562, -15.985206604003906, -13.63702392578125, -11.288841247558594, -8.940658569335938, -6.592475891113281, -4.244293212890625, -1.8961105346679688, 0.4520721435546875, 2.8002548217773438, 5.1484375, 7.496620178222656, 9.844802856445312, 12.192985534667969, 14.541168212890625, 16.88935089111328, 19.237533569335938, 21.585716247558594, 23.93390655517578, 26.282089233398438, 28.630271911621094, 30.97845458984375, 33.326637268066406, 35.67481994628906, 38.02300262451172, 40.371185302734375, 42.71936798095703, 45.06755065917969, 47.415733337402344, 49.763916015625, 52.112098693847656, 54.46028137207031, 56.80846405029297, 59.156646728515625, 61.50482940673828, 63.85301208496094, 66.2011947631836, 68.54937744140625, 70.8975601196289, 73.24574279785156, 75.59392547607422, 77.94210815429688, 80.29029083251953, 82.63847351074219, 84.98665618896484, 87.3348388671875, 89.68302154541016, 92.03120422363281, 94.37938690185547, 96.72756958007812, 99.07575225830078]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 7.0, 6.0, 4.0, 6.0, 2.0, 8.0, 5.0, 10.0, 9.0, 9.0, 12.0, 19.0, 23.0, 22.0, 25.0, 28.0, 28.0, 26.0, 35.0, 34.0, 35.0, 29.0, 35.0, 33.0, 40.0, 47.0, 40.0, 39.0, 31.0, 37.0, 35.0, 33.0, 33.0, 33.0, 24.0, 27.0, 24.0, 23.0, 15.0, 17.0, 17.0, 9.0, 6.0, 5.0, 6.0, 1.0, 4.0, 4.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0], "bins": [-96.27719116210938, -93.53274536132812, -90.78829956054688, -88.04385375976562, -85.29940795898438, -82.55496215820312, -79.81051635742188, -77.06607055664062, -74.32162475585938, -71.57717895507812, -68.83273315429688, -66.08828735351562, -63.343841552734375, -60.599395751953125, -57.85495376586914, -55.11050796508789, -52.366065979003906, -49.621620178222656, -46.877174377441406, -44.132728576660156, -41.388282775878906, -38.643836975097656, -35.89939498901367, -33.15494918823242, -30.410503387451172, -27.666057586669922, -24.921611785888672, -22.177167892456055, -19.432722091674805, -16.688276290893555, -13.943832397460938, -11.199386596679688, -8.454940795898438, -5.710495471954346, -2.966050148010254, -0.2216053009033203, 2.5228404998779297, 5.26728630065918, 8.011730194091797, 10.756175994873047, 13.500621795654297, 16.245067596435547, 18.989513397216797, 21.733957290649414, 24.478403091430664, 27.222848892211914, 29.96729278564453, 32.71173858642578, 35.45618438720703, 38.20063018798828, 40.94507598876953, 43.68952178955078, 46.43396759033203, 49.17841339111328, 51.922855377197266, 54.667301177978516, 57.411746978759766, 60.156192779541016, 62.900638580322266, 65.64508056640625, 68.3895263671875, 71.13397216796875, 73.87841796875, 76.62286376953125, 79.3673095703125]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 11.0, 10.0, 13.0, 10.0, 20.0, 15.0, 18.0, 16.0, 26.0, 24.0, 27.0, 37.0, 44.0, 49.0, 54.0, 84.0, 64.0, 72.0, 65.0, 67.0, 59.0, 31.0, 34.0, 14.0, 16.0, 13.0, 18.0, 17.0, 14.0, 6.0, 5.0, 0.0, 10.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-10.2734375, -9.971923828125, -9.67041015625, -9.368896484375, -9.0673828125, -8.765869140625, -8.46435546875, -8.162841796875, -7.861328125, -7.559814453125, -7.25830078125, -6.956787109375, -6.6552734375, -6.353759765625, -6.05224609375, -5.750732421875, -5.44921875, -5.147705078125, -4.84619140625, -4.544677734375, -4.2431640625, -3.941650390625, -3.64013671875, -3.338623046875, -3.037109375, -2.735595703125, -2.43408203125, -2.132568359375, -1.8310546875, -1.529541015625, -1.22802734375, -0.926513671875, -0.625, -0.323486328125, -0.02197265625, 0.279541015625, 0.5810546875, 0.882568359375, 1.18408203125, 1.485595703125, 1.787109375, 2.088623046875, 2.39013671875, 2.691650390625, 2.9931640625, 3.294677734375, 3.59619140625, 3.897705078125, 4.19921875, 4.500732421875, 4.80224609375, 5.103759765625, 5.4052734375, 5.706787109375, 6.00830078125, 6.309814453125, 6.611328125, 6.912841796875, 7.21435546875, 7.515869140625, 7.8173828125, 8.118896484375, 8.42041015625, 8.721923828125, 9.0234375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 6.0, 18.0, 16.0, 26.0, 38.0, 44.0, 60.0, 84.0, 124.0, 188.0, 239.0, 340.0, 540.0, 723.0, 1042.0, 1484.0, 2157.0, 3172.0, 4801.0, 7321.0, 11238.0, 18346.0, 31834.0, 60447.0, 130418.0, 262386.0, 252306.0, 120841.0, 57405.0, 30192.0, 17940.0, 11047.0, 7083.0, 4607.0, 3076.0, 2217.0, 1391.0, 947.0, 732.0, 483.0, 326.0, 251.0, 174.0, 134.0, 95.0, 62.0, 45.0, 34.0, 19.0, 19.0, 15.0, 7.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0], "bins": [-1.185546875, -1.1484527587890625, -1.111358642578125, -1.0742645263671875, -1.03717041015625, -1.0000762939453125, -0.962982177734375, -0.9258880615234375, -0.8887939453125, -0.8516998291015625, -0.814605712890625, -0.7775115966796875, -0.74041748046875, -0.7033233642578125, -0.666229248046875, -0.6291351318359375, -0.592041015625, -0.5549468994140625, -0.517852783203125, -0.4807586669921875, -0.44366455078125, -0.4065704345703125, -0.369476318359375, -0.3323822021484375, -0.2952880859375, -0.2581939697265625, -0.221099853515625, -0.1840057373046875, -0.14691162109375, -0.1098175048828125, -0.072723388671875, -0.0356292724609375, 0.00146484375, 0.0385589599609375, 0.075653076171875, 0.1127471923828125, 0.14984130859375, 0.1869354248046875, 0.224029541015625, 0.2611236572265625, 0.2982177734375, 0.3353118896484375, 0.372406005859375, 0.4095001220703125, 0.44659423828125, 0.4836883544921875, 0.520782470703125, 0.5578765869140625, 0.594970703125, 0.6320648193359375, 0.669158935546875, 0.7062530517578125, 0.74334716796875, 0.7804412841796875, 0.817535400390625, 0.8546295166015625, 0.8917236328125, 0.9288177490234375, 0.965911865234375, 1.0030059814453125, 1.04010009765625, 1.0771942138671875, 1.114288330078125, 1.1513824462890625, 1.1884765625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 7.0, 6.0, 12.0, 11.0, 10.0, 15.0, 15.0, 16.0, 22.0, 28.0, 26.0, 29.0, 29.0, 35.0, 30.0, 36.0, 45.0, 40.0, 38.0, 40.0, 1071.0, 34.0, 32.0, 39.0, 25.0, 42.0, 26.0, 24.0, 32.0, 29.0, 28.0, 19.0, 25.0, 23.0, 13.0, 15.0, 12.0, 8.0, 12.0, 5.0, 6.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.56640625, -4.422607421875, -4.27880859375, -4.135009765625, -3.9912109375, -3.847412109375, -3.70361328125, -3.559814453125, -3.416015625, -3.272216796875, -3.12841796875, -2.984619140625, -2.8408203125, -2.697021484375, -2.55322265625, -2.409423828125, -2.265625, -2.121826171875, -1.97802734375, -1.834228515625, -1.6904296875, -1.546630859375, -1.40283203125, -1.259033203125, -1.115234375, -0.971435546875, -0.82763671875, -0.683837890625, -0.5400390625, -0.396240234375, -0.25244140625, -0.108642578125, 0.03515625, 0.178955078125, 0.32275390625, 0.466552734375, 0.6103515625, 0.754150390625, 0.89794921875, 1.041748046875, 1.185546875, 1.329345703125, 1.47314453125, 1.616943359375, 1.7607421875, 1.904541015625, 2.04833984375, 2.192138671875, 2.3359375, 2.479736328125, 2.62353515625, 2.767333984375, 2.9111328125, 3.054931640625, 3.19873046875, 3.342529296875, 3.486328125, 3.630126953125, 3.77392578125, 3.917724609375, 4.0615234375, 4.205322265625, 4.34912109375, 4.492919921875, 4.63671875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 4.0, 4.0, 2.0, 6.0, 7.0, 8.0, 24.0, 30.0, 45.0, 79.0, 81.0, 120.0, 170.0, 240.0, 363.0, 568.0, 816.0, 1206.0, 1775.0, 2704.0, 4202.0, 6254.0, 10045.0, 15284.0, 24306.0, 39418.0, 65242.0, 108011.0, 172210.0, 1251262.0, 150025.0, 93137.0, 55945.0, 34130.0, 21241.0, 13224.0, 8507.0, 5678.0, 3608.0, 2371.0, 1565.0, 1042.0, 684.0, 459.0, 355.0, 211.0, 128.0, 115.0, 70.0, 46.0, 35.0, 24.0, 18.0, 16.0, 11.0, 5.0, 8.0, 0.0, 1.0, 3.0], "bins": [-0.6181640625, -0.5996246337890625, -0.581085205078125, -0.5625457763671875, -0.54400634765625, -0.5254669189453125, -0.506927490234375, -0.4883880615234375, -0.4698486328125, -0.4513092041015625, -0.432769775390625, -0.4142303466796875, -0.39569091796875, -0.3771514892578125, -0.358612060546875, -0.3400726318359375, -0.321533203125, -0.3029937744140625, -0.284454345703125, -0.2659149169921875, -0.24737548828125, -0.2288360595703125, -0.210296630859375, -0.1917572021484375, -0.1732177734375, -0.1546783447265625, -0.136138916015625, -0.1175994873046875, -0.09906005859375, -0.0805206298828125, -0.061981201171875, -0.0434417724609375, -0.02490234375, -0.0063629150390625, 0.012176513671875, 0.0307159423828125, 0.04925537109375, 0.0677947998046875, 0.086334228515625, 0.1048736572265625, 0.1234130859375, 0.1419525146484375, 0.160491943359375, 0.1790313720703125, 0.19757080078125, 0.2161102294921875, 0.234649658203125, 0.2531890869140625, 0.271728515625, 0.2902679443359375, 0.308807373046875, 0.3273468017578125, 0.34588623046875, 0.3644256591796875, 0.382965087890625, 0.4015045166015625, 0.4200439453125, 0.4385833740234375, 0.457122802734375, 0.4756622314453125, 0.49420166015625, 0.5127410888671875, 0.531280517578125, 0.5498199462890625, 0.568359375]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0, 2.0, 5.0, 2.0, 5.0, 8.0, 7.0, 11.0, 16.0, 15.0, 15.0, 27.0, 44.0, 41.0, 57.0, 70.0, 80.0, 87.0, 71.0, 73.0, 69.0, 58.0, 45.0, 39.0, 28.0, 28.0, 21.0, 19.0, 15.0, 9.0, 10.0, 4.0, 10.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.0063323974609375, -0.0061487555503845215, -0.005965113639831543, -0.0057814717292785645, -0.005597829818725586, -0.005414187908172607, -0.005230545997619629, -0.00504690408706665, -0.004863262176513672, -0.004679620265960693, -0.004495978355407715, -0.004312336444854736, -0.004128694534301758, -0.003945052623748779, -0.0037614107131958008, -0.0035777688026428223, -0.0033941268920898438, -0.0032104849815368652, -0.0030268430709838867, -0.002843201160430908, -0.0026595592498779297, -0.002475917339324951, -0.0022922754287719727, -0.002108633518218994, -0.0019249916076660156, -0.0017413496971130371, -0.0015577077865600586, -0.00137406587600708, -0.0011904239654541016, -0.001006782054901123, -0.0008231401443481445, -0.000639498233795166, -0.0004558563232421875, -0.000272214412689209, -8.857250213623047e-05, 9.506940841674805e-05, 0.00027871131896972656, 0.0004623532295227051, 0.0006459951400756836, 0.0008296370506286621, 0.0010132789611816406, 0.0011969208717346191, 0.0013805627822875977, 0.0015642046928405762, 0.0017478466033935547, 0.0019314885139465332, 0.0021151304244995117, 0.0022987723350524902, 0.0024824142456054688, 0.0026660561561584473, 0.0028496980667114258, 0.0030333399772644043, 0.003216981887817383, 0.0034006237983703613, 0.00358426570892334, 0.0037679076194763184, 0.003951549530029297, 0.004135191440582275, 0.004318833351135254, 0.004502475261688232, 0.004686117172241211, 0.0048697590827941895, 0.005053400993347168, 0.0052370429039001465, 0.005420684814453125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 6.0, 8.0, 8.0, 5.0, 3.0, 10.0, 12.0, 15.0, 25.0, 19.0, 35.0, 43.0, 42.0, 83.0, 111.0, 112.0, 205.0, 284.0, 534.0, 1481.0, 1022864.0, 20674.0, 798.0, 323.0, 225.0, 154.0, 110.0, 88.0, 68.0, 44.0, 41.0, 29.0, 28.0, 19.0, 9.0, 4.0, 8.0, 7.0, 4.0, 6.0, 6.0, 3.0, 1.0, 3.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10498046875, -0.10167598724365234, -0.09837150573730469, -0.09506702423095703, -0.09176254272460938, -0.08845806121826172, -0.08515357971191406, -0.0818490982055664, -0.07854461669921875, -0.0752401351928711, -0.07193565368652344, -0.06863117218017578, -0.06532669067382812, -0.06202220916748047, -0.05871772766113281, -0.055413246154785156, -0.0521087646484375, -0.048804283142089844, -0.04549980163574219, -0.04219532012939453, -0.038890838623046875, -0.03558635711669922, -0.03228187561035156, -0.028977394104003906, -0.02567291259765625, -0.022368431091308594, -0.019063949584960938, -0.01575946807861328, -0.012454986572265625, -0.009150505065917969, -0.0058460235595703125, -0.0025415420532226562, 0.000762939453125, 0.004067420959472656, 0.0073719024658203125, 0.010676383972167969, 0.013980865478515625, 0.01728534698486328, 0.020589828491210938, 0.023894309997558594, 0.02719879150390625, 0.030503273010253906, 0.03380775451660156, 0.03711223602294922, 0.040416717529296875, 0.04372119903564453, 0.04702568054199219, 0.050330162048339844, 0.0536346435546875, 0.056939125061035156, 0.06024360656738281, 0.06354808807373047, 0.06685256958007812, 0.07015705108642578, 0.07346153259277344, 0.0767660140991211, 0.08007049560546875, 0.0833749771118164, 0.08667945861816406, 0.08998394012451172, 0.09328842163085938, 0.09659290313720703, 0.09989738464355469, 0.10320186614990234, 0.10650634765625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 33.0, 981.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06518911570310593, -0.0632871463894844, -0.061385173350572586, -0.05948320031166077, -0.05758122727274895, -0.05567925423383713, -0.05377728492021561, -0.05187531188130379, -0.04997333884239197, -0.04807136580348015, -0.04616939648985863, -0.04426742345094681, -0.04236545041203499, -0.04046347737312317, -0.03856150805950165, -0.03665953502058983, -0.03475756198167801, -0.03285558894276619, -0.03095361776649952, -0.02905164659023285, -0.02714967355132103, -0.02524770237505436, -0.02334573119878769, -0.02144375815987587, -0.01954178884625435, -0.01763981766998768, -0.01573784463107586, -0.013835873454809189, -0.01193390041589737, -0.0100319292396307, -0.008129957132041454, -0.0062279850244522095, -0.00432601198554039, -0.002424039877951145, -0.000522068003192544, 0.0013799038715660572, 0.003281875979155302, 0.00518384762108326, 0.007085819728672504, 0.00898779183626175, 0.010889763943850994, 0.012791736051440239, 0.014693708159029484, 0.01659568026661873, 0.0184976514428854, 0.02039962261915207, 0.02230159565806389, 0.024203568696975708, 0.026105539873242378, 0.02800751104950905, 0.029909484088420868, 0.03181145712733269, 0.03371342644095421, 0.03561539947986603, 0.03751737251877785, 0.03941934555768967, 0.04132131487131119, 0.04322328791022301, 0.04512525722384453, 0.04702723026275635, 0.04892920330166817, 0.05083117634057999, 0.05273314565420151, 0.05463511869311333, 0.056537091732025146]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 4.0, 7.0, 10.0, 11.0, 13.0, 20.0, 27.0, 33.0, 54.0, 44.0, 57.0, 58.0, 48.0, 77.0, 65.0, 81.0, 66.0, 59.0, 54.0, 47.0, 35.0, 25.0, 22.0, 23.0, 18.0, 10.0, 12.0, 10.0, 6.0, 5.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004211902618408203, -0.004020778462290764, -0.0038296543061733246, -0.0036385301500558853, -0.003447405993938446, -0.0032562818378210068, -0.0030651576817035675, -0.0028740335255861282, -0.002682909369468689, -0.0024917852133512497, -0.0023006610572338104, -0.002109536901116371, -0.0019184127449989319, -0.0017272885888814926, -0.0015361644327640533, -0.001345040276646614, -0.0011539161205291748, -0.0009627919644117355, -0.0007716678082942963, -0.000580543652176857, -0.0003894194960594177, -0.00019829533994197845, -7.1711838245391846e-06, 0.00018395297229290009, 0.00037507712841033936, 0.0005662012845277786, 0.0007573254406452179, 0.0009484495967626572, 0.0011395737528800964, 0.0013306979089975357, 0.001521822065114975, 0.0017129462212324142, 0.0019040703773498535, 0.002095194533467293, 0.002286318689584732, 0.0024774428457021713, 0.0026685670018196106, 0.00285969115793705, 0.003050815314054489, 0.0032419394701719284, 0.0034330636262893677, 0.003624187782406807, 0.003815311938524246, 0.0040064360946416855, 0.004197560250759125, 0.004388684406876564, 0.004579808562994003, 0.0047709327191114426, 0.004962056875228882, 0.005153181031346321, 0.00534430518746376, 0.0055354293435812, 0.005726553499698639, 0.005917677655816078, 0.0061088018119335175, 0.006299925968050957, 0.006491050124168396, 0.006682174280285835, 0.0068732984364032745, 0.007064422592520714, 0.007255546748638153, 0.007446670904755592, 0.007637795060873032, 0.007828919216990471, 0.00802004337310791]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 0.0, 3.0, 1.0, 4.0, 5.0, 6.0, 11.0, 10.0, 13.0, 10.0, 20.0, 15.0, 18.0, 16.0, 26.0, 24.0, 27.0, 37.0, 44.0, 49.0, 54.0, 84.0, 64.0, 72.0, 65.0, 67.0, 59.0, 31.0, 34.0, 14.0, 16.0, 13.0, 18.0, 17.0, 14.0, 6.0, 5.0, 0.0, 10.0, 8.0, 5.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0], "bins": [-10.2734375, -9.971923828125, -9.67041015625, -9.368896484375, -9.0673828125, -8.765869140625, -8.46435546875, -8.162841796875, -7.861328125, -7.559814453125, -7.25830078125, -6.956787109375, -6.6552734375, -6.353759765625, -6.05224609375, -5.750732421875, -5.44921875, -5.147705078125, -4.84619140625, -4.544677734375, -4.2431640625, -3.941650390625, -3.64013671875, -3.338623046875, -3.037109375, -2.735595703125, -2.43408203125, -2.132568359375, -1.8310546875, -1.529541015625, -1.22802734375, -0.926513671875, -0.625, -0.323486328125, -0.02197265625, 0.279541015625, 0.5810546875, 0.882568359375, 1.18408203125, 1.485595703125, 1.787109375, 2.088623046875, 2.39013671875, 2.691650390625, 2.9931640625, 3.294677734375, 3.59619140625, 3.897705078125, 4.19921875, 4.500732421875, 4.80224609375, 5.103759765625, 5.4052734375, 5.706787109375, 6.00830078125, 6.309814453125, 6.611328125, 6.912841796875, 7.21435546875, 7.515869140625, 7.8173828125, 8.118896484375, 8.42041015625, 8.721923828125, 9.0234375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 6.0, 3.0, 7.0, 10.0, 13.0, 12.0, 21.0, 43.0, 57.0, 84.0, 106.0, 123.0, 151.0, 239.0, 390.0, 525.0, 715.0, 1089.0, 1541.0, 2357.0, 3712.0, 5885.0, 10908.0, 22385.0, 56508.0, 270048.0, 528212.0, 81037.0, 28779.0, 13629.0, 7365.0, 4239.0, 2621.0, 1770.0, 1249.0, 814.0, 535.0, 384.0, 273.0, 193.0, 143.0, 115.0, 72.0, 56.0, 30.0, 32.0, 23.0, 23.0, 13.0, 8.0, 4.0, 3.0, 2.0, 4.0, 0.0, 2.0, 1.0], "bins": [-27.8125, -26.9736328125, -26.134765625, -25.2958984375, -24.45703125, -23.6181640625, -22.779296875, -21.9404296875, -21.1015625, -20.2626953125, -19.423828125, -18.5849609375, -17.74609375, -16.9072265625, -16.068359375, -15.2294921875, -14.390625, -13.5517578125, -12.712890625, -11.8740234375, -11.03515625, -10.1962890625, -9.357421875, -8.5185546875, -7.6796875, -6.8408203125, -6.001953125, -5.1630859375, -4.32421875, -3.4853515625, -2.646484375, -1.8076171875, -0.96875, -0.1298828125, 0.708984375, 1.5478515625, 2.38671875, 3.2255859375, 4.064453125, 4.9033203125, 5.7421875, 6.5810546875, 7.419921875, 8.2587890625, 9.09765625, 9.9365234375, 10.775390625, 11.6142578125, 12.453125, 13.2919921875, 14.130859375, 14.9697265625, 15.80859375, 16.6474609375, 17.486328125, 18.3251953125, 19.1640625, 20.0029296875, 20.841796875, 21.6806640625, 22.51953125, 23.3583984375, 24.197265625, 25.0361328125, 25.875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 6.0, 10.0, 6.0, 9.0, 10.0, 19.0, 19.0, 16.0, 23.0, 29.0, 26.0, 34.0, 46.0, 36.0, 41.0, 64.0, 62.0, 113.0, 162.0, 1397.0, 239.0, 124.0, 85.0, 68.0, 54.0, 48.0, 36.0, 40.0, 25.0, 15.0, 30.0, 14.0, 22.0, 18.0, 13.0, 7.0, 13.0, 16.0, 10.0, 7.0, 7.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-25.6875, -24.880126953125, -24.07275390625, -23.265380859375, -22.4580078125, -21.650634765625, -20.84326171875, -20.035888671875, -19.228515625, -18.421142578125, -17.61376953125, -16.806396484375, -15.9990234375, -15.191650390625, -14.38427734375, -13.576904296875, -12.76953125, -11.962158203125, -11.15478515625, -10.347412109375, -9.5400390625, -8.732666015625, -7.92529296875, -7.117919921875, -6.310546875, -5.503173828125, -4.69580078125, -3.888427734375, -3.0810546875, -2.273681640625, -1.46630859375, -0.658935546875, 0.1484375, 0.955810546875, 1.76318359375, 2.570556640625, 3.3779296875, 4.185302734375, 4.99267578125, 5.800048828125, 6.607421875, 7.414794921875, 8.22216796875, 9.029541015625, 9.8369140625, 10.644287109375, 11.45166015625, 12.259033203125, 13.06640625, 13.873779296875, 14.68115234375, 15.488525390625, 16.2958984375, 17.103271484375, 17.91064453125, 18.718017578125, 19.525390625, 20.332763671875, 21.14013671875, 21.947509765625, 22.7548828125, 23.562255859375, 24.36962890625, 25.177001953125, 25.984375]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 3.0, 4.0, 2.0, 6.0, 4.0, 2.0, 7.0, 8.0, 10.0, 18.0, 16.0, 11.0, 18.0, 22.0, 22.0, 26.0, 36.0, 47.0, 82.0, 140.0, 278.0, 1068.0, 16341.0, 3030881.0, 93448.0, 2232.0, 417.0, 180.0, 79.0, 66.0, 40.0, 35.0, 25.0, 22.0, 20.0, 13.0, 14.0, 18.0, 4.0, 10.0, 8.0, 8.0, 5.0, 6.0, 3.0, 4.0, 2.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.3125, -108.767578125, -105.22265625, -101.677734375, -98.1328125, -94.587890625, -91.04296875, -87.498046875, -83.953125, -80.408203125, -76.86328125, -73.318359375, -69.7734375, -66.228515625, -62.68359375, -59.138671875, -55.59375, -52.048828125, -48.50390625, -44.958984375, -41.4140625, -37.869140625, -34.32421875, -30.779296875, -27.234375, -23.689453125, -20.14453125, -16.599609375, -13.0546875, -9.509765625, -5.96484375, -2.419921875, 1.125, 4.669921875, 8.21484375, 11.759765625, 15.3046875, 18.849609375, 22.39453125, 25.939453125, 29.484375, 33.029296875, 36.57421875, 40.119140625, 43.6640625, 47.208984375, 50.75390625, 54.298828125, 57.84375, 61.388671875, 64.93359375, 68.478515625, 72.0234375, 75.568359375, 79.11328125, 82.658203125, 86.203125, 89.748046875, 93.29296875, 96.837890625, 100.3828125, 103.927734375, 107.47265625, 111.017578125, 114.5625]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 42.0, 868.0, 105.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.68983840942383, -23.963428497314453, -9.237020492553711, 5.489387512207031, 20.215797424316406, 34.942203521728516, 49.66861343383789, 64.39501953125, 79.12142944335938, 93.84783935546875, 108.57424926757812, 123.3006591796875, 138.02706909179688, 152.75347900390625, 167.47988891601562, 182.206298828125, 196.93270874023438, 211.65911865234375, 226.38552856445312, 241.1119384765625, 255.83834838867188, 270.56475830078125, 285.2911682128906, 300.017578125, 314.7439880371094, 329.47039794921875, 344.1968078613281, 358.9232177734375, 373.6496276855469, 388.37603759765625, 403.1024475097656, 417.828857421875, 432.5552673339844, 447.28167724609375, 462.0080871582031, 476.7344970703125, 491.4609069824219, 506.18731689453125, 520.9136962890625, 535.64013671875, 550.3665161132812, 565.0928955078125, 579.8193359375, 594.5457153320312, 609.2721557617188, 623.99853515625, 638.7249755859375, 653.4513549804688, 668.1777954101562, 682.9041748046875, 697.630615234375, 712.3569946289062, 727.0834350585938, 741.809814453125, 756.5362548828125, 771.2626342773438, 785.9890747070312, 800.7154541015625, 815.44189453125, 830.1682739257812, 844.8947143554688, 859.62109375, 874.3475341796875, 889.0739135742188, 903.8003540039062]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 6.0, 5.0, 6.0, 2.0, 9.0, 11.0, 5.0, 17.0, 16.0, 18.0, 23.0, 26.0, 26.0, 33.0, 29.0, 50.0, 28.0, 34.0, 34.0, 32.0, 34.0, 43.0, 45.0, 50.0, 45.0, 40.0, 31.0, 45.0, 33.0, 28.0, 28.0, 29.0, 26.0, 20.0, 26.0, 14.0, 13.0, 12.0, 3.0, 4.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-88.4848861694336, -85.51607513427734, -82.54727172851562, -79.57846069335938, -76.60964965820312, -73.6408462524414, -70.67203521728516, -67.70323181152344, -64.73442077636719, -61.7656135559082, -58.79680633544922, -55.82799530029297, -52.859188079833984, -49.890380859375, -46.92156982421875, -43.952762603759766, -40.98395538330078, -38.0151481628418, -35.04634094238281, -32.07752990722656, -29.108722686767578, -26.139915466308594, -23.171106338500977, -20.20229721069336, -17.233489990234375, -14.264681816101074, -11.295873641967773, -8.327065467834473, -5.358257293701172, -2.389449119567871, 0.5793590545654297, 3.548168182373047, 6.516975402832031, 9.485783576965332, 12.454591751098633, 15.423399925231934, 18.392208099365234, 21.36101531982422, 24.329824447631836, 27.298633575439453, 30.267440795898438, 33.23624801635742, 36.205055236816406, 39.173866271972656, 42.14267349243164, 45.111480712890625, 48.080291748046875, 51.04909896850586, 54.017906188964844, 56.98671340942383, 59.95552062988281, 62.92433166503906, 65.89314270019531, 68.86194610595703, 71.83075714111328, 74.799560546875, 77.76837158203125, 80.7371826171875, 83.70598602294922, 86.67479705810547, 89.64360046386719, 92.61241149902344, 95.58122253417969, 98.55003356933594, 101.51883697509766]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 3.0, 9.0, 2.0, 7.0, 15.0, 11.0, 15.0, 15.0, 20.0, 17.0, 19.0, 21.0, 25.0, 39.0, 45.0, 50.0, 54.0, 57.0, 71.0, 77.0, 74.0, 58.0, 62.0, 51.0, 32.0, 20.0, 21.0, 22.0, 16.0, 17.0, 13.0, 5.0, 5.0, 4.0, 7.0, 4.0, 6.0, 4.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.4375, -11.096923828125, -10.75634765625, -10.415771484375, -10.0751953125, -9.734619140625, -9.39404296875, -9.053466796875, -8.712890625, -8.372314453125, -8.03173828125, -7.691162109375, -7.3505859375, -7.010009765625, -6.66943359375, -6.328857421875, -5.98828125, -5.647705078125, -5.30712890625, -4.966552734375, -4.6259765625, -4.285400390625, -3.94482421875, -3.604248046875, -3.263671875, -2.923095703125, -2.58251953125, -2.241943359375, -1.9013671875, -1.560791015625, -1.22021484375, -0.879638671875, -0.5390625, -0.198486328125, 0.14208984375, 0.482666015625, 0.8232421875, 1.163818359375, 1.50439453125, 1.844970703125, 2.185546875, 2.526123046875, 2.86669921875, 3.207275390625, 3.5478515625, 3.888427734375, 4.22900390625, 4.569580078125, 4.91015625, 5.250732421875, 5.59130859375, 5.931884765625, 6.2724609375, 6.613037109375, 6.95361328125, 7.294189453125, 7.634765625, 7.975341796875, 8.31591796875, 8.656494140625, 8.9970703125, 9.337646484375, 9.67822265625, 10.018798828125, 10.359375]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 4.0, 2.0, 5.0, 2.0, 6.0, 7.0, 8.0, 13.0, 15.0, 15.0, 27.0, 30.0, 42.0, 53.0, 76.0, 111.0, 245.0, 438.0, 1046.0, 2529.0, 7849.0, 44036.0, 3920242.0, 200139.0, 11441.0, 3314.0, 1281.0, 567.0, 275.0, 170.0, 87.0, 55.0, 35.0, 28.0, 21.0, 15.0, 8.0, 12.0, 7.0, 9.0, 6.0, 4.0, 5.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-76.0625, -73.8037109375, -71.544921875, -69.2861328125, -67.02734375, -64.7685546875, -62.509765625, -60.2509765625, -57.9921875, -55.7333984375, -53.474609375, -51.2158203125, -48.95703125, -46.6982421875, -44.439453125, -42.1806640625, -39.921875, -37.6630859375, -35.404296875, -33.1455078125, -30.88671875, -28.6279296875, -26.369140625, -24.1103515625, -21.8515625, -19.5927734375, -17.333984375, -15.0751953125, -12.81640625, -10.5576171875, -8.298828125, -6.0400390625, -3.78125, -1.5224609375, 0.736328125, 2.9951171875, 5.25390625, 7.5126953125, 9.771484375, 12.0302734375, 14.2890625, 16.5478515625, 18.806640625, 21.0654296875, 23.32421875, 25.5830078125, 27.841796875, 30.1005859375, 32.359375, 34.6181640625, 36.876953125, 39.1357421875, 41.39453125, 43.6533203125, 45.912109375, 48.1708984375, 50.4296875, 52.6884765625, 54.947265625, 57.2060546875, 59.46484375, 61.7236328125, 63.982421875, 66.2412109375, 68.5]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 5.0, 6.0, 10.0, 7.0, 11.0, 16.0, 14.0, 20.0, 49.0, 46.0, 78.0, 156.0, 308.0, 652.0, 1034.0, 751.0, 397.0, 162.0, 87.0, 76.0, 46.0, 27.0, 21.0, 13.0, 20.0, 14.0, 13.0, 9.0, 3.0, 6.0, 3.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-38.5625, -37.41650390625, -36.2705078125, -35.12451171875, -33.978515625, -32.83251953125, -31.6865234375, -30.54052734375, -29.39453125, -28.24853515625, -27.1025390625, -25.95654296875, -24.810546875, -23.66455078125, -22.5185546875, -21.37255859375, -20.2265625, -19.08056640625, -17.9345703125, -16.78857421875, -15.642578125, -14.49658203125, -13.3505859375, -12.20458984375, -11.05859375, -9.91259765625, -8.7666015625, -7.62060546875, -6.474609375, -5.32861328125, -4.1826171875, -3.03662109375, -1.890625, -0.74462890625, 0.4013671875, 1.54736328125, 2.693359375, 3.83935546875, 4.9853515625, 6.13134765625, 7.27734375, 8.42333984375, 9.5693359375, 10.71533203125, 11.861328125, 13.00732421875, 14.1533203125, 15.29931640625, 16.4453125, 17.59130859375, 18.7373046875, 19.88330078125, 21.029296875, 22.17529296875, 23.3212890625, 24.46728515625, 25.61328125, 26.75927734375, 27.9052734375, 29.05126953125, 30.197265625, 31.34326171875, 32.4892578125, 33.63525390625, 34.78125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 8.0, 7.0, 8.0, 11.0, 19.0, 23.0, 25.0, 66.0, 131.0, 278.0, 511.0, 1422.0, 4692.0, 22261.0, 362192.0, 3720072.0, 68306.0, 9988.0, 2600.0, 876.0, 364.0, 163.0, 105.0, 44.0, 29.0, 29.0, 19.0, 12.0, 8.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-87.3125, -84.6875, -82.0625, -79.4375, -76.8125, -74.1875, -71.5625, -68.9375, -66.3125, -63.6875, -61.0625, -58.4375, -55.8125, -53.1875, -50.5625, -47.9375, -45.3125, -42.6875, -40.0625, -37.4375, -34.8125, -32.1875, -29.5625, -26.9375, -24.3125, -21.6875, -19.0625, -16.4375, -13.8125, -11.1875, -8.5625, -5.9375, -3.3125, -0.6875, 1.9375, 4.5625, 7.1875, 9.8125, 12.4375, 15.0625, 17.6875, 20.3125, 22.9375, 25.5625, 28.1875, 30.8125, 33.4375, 36.0625, 38.6875, 41.3125, 43.9375, 46.5625, 49.1875, 51.8125, 54.4375, 57.0625, 59.6875, 62.3125, 64.9375, 67.5625, 70.1875, 72.8125, 75.4375, 78.0625, 80.6875]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 8.0, 38.0, 63.0, 186.0, 318.0, 227.0, 95.0, 31.0, 15.0, 10.0, 2.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-251.1020050048828, -245.06678771972656, -239.03158569335938, -232.99636840820312, -226.96115112304688, -220.92593383789062, -214.89073181152344, -208.8555145263672, -202.8203125, -196.78509521484375, -190.74989318847656, -184.7146759033203, -178.67945861816406, -172.64425659179688, -166.60903930664062, -160.57382202148438, -154.53860473632812, -148.50338745117188, -142.4681854248047, -136.43296813964844, -130.3977508544922, -124.36254119873047, -118.32733154296875, -112.2921142578125, -106.25690460205078, -100.22169494628906, -94.18647766113281, -88.1512680053711, -82.11605834960938, -76.08084106445312, -70.0456314086914, -64.01042175292969, -57.9752197265625, -51.940006256103516, -45.90479278564453, -39.86958312988281, -33.83436965942383, -27.799156188964844, -21.763946533203125, -15.72873306274414, -9.693519592285156, -3.6583070755004883, 2.3769054412841797, 8.412117004394531, 14.447330474853516, 20.4825439453125, 26.51775360107422, 32.5529670715332, 38.58818054199219, 44.62339401245117, 50.658607482910156, 56.693817138671875, 62.72903060913086, 68.76424407958984, 74.79945373535156, 80.83467102050781, 86.86988067626953, 92.90509033203125, 98.9403076171875, 104.97551727294922, 111.01072692871094, 117.04594421386719, 123.0811538696289, 129.11636352539062, 135.15158081054688]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 4.0, 8.0, 13.0, 9.0, 14.0, 12.0, 24.0, 16.0, 20.0, 16.0, 26.0, 25.0, 32.0, 29.0, 29.0, 35.0, 28.0, 35.0, 40.0, 43.0, 39.0, 46.0, 34.0, 40.0, 40.0, 31.0, 37.0, 33.0, 35.0, 25.0, 29.0, 19.0, 21.0, 16.0, 17.0, 11.0, 10.0, 10.0, 9.0, 6.0, 5.0, 8.0, 6.0, 0.0, 8.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-83.43560791015625, -80.85160827636719, -78.26760864257812, -75.68360900878906, -73.099609375, -70.51560974121094, -67.93161010742188, -65.34761047363281, -62.763607025146484, -60.17960739135742, -57.59560775756836, -55.0116081237793, -52.42760467529297, -49.843605041503906, -47.259605407714844, -44.67560577392578, -42.09160614013672, -39.507606506347656, -36.923606872558594, -34.33960723876953, -31.755605697631836, -29.171606063842773, -26.587604522705078, -24.003604888916016, -21.419605255126953, -18.83560562133789, -16.251605987548828, -13.667604446411133, -11.08360481262207, -8.499605178833008, -5.915604591369629, -3.33160400390625, -0.7476043701171875, 1.8363957405090332, 4.420395851135254, 7.004395961761475, 9.588396072387695, 12.172395706176758, 14.756396293640137, 17.340396881103516, 19.924396514892578, 22.50839614868164, 25.092395782470703, 27.6763973236084, 30.26039695739746, 32.844398498535156, 35.42839813232422, 38.01239776611328, 40.596397399902344, 43.180397033691406, 45.76439666748047, 48.34839630126953, 50.932395935058594, 53.516395568847656, 56.100399017333984, 58.68439865112305, 61.26839828491211, 63.85239791870117, 66.4364013671875, 69.02040100097656, 71.60440063476562, 74.18840026855469, 76.77239990234375, 79.35639953613281, 81.94039916992188]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 8.0, 10.0, 12.0, 17.0, 16.0, 12.0, 22.0, 20.0, 29.0, 43.0, 48.0, 42.0, 43.0, 51.0, 70.0, 63.0, 73.0, 82.0, 56.0, 42.0, 32.0, 29.0, 27.0, 25.0, 18.0, 16.0, 10.0, 11.0, 6.0, 6.0, 7.0, 4.0, 6.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.0703125, -10.7454833984375, -10.420654296875, -10.0958251953125, -9.77099609375, -9.4461669921875, -9.121337890625, -8.7965087890625, -8.4716796875, -8.1468505859375, -7.822021484375, -7.4971923828125, -7.17236328125, -6.8475341796875, -6.522705078125, -6.1978759765625, -5.873046875, -5.5482177734375, -5.223388671875, -4.8985595703125, -4.57373046875, -4.2489013671875, -3.924072265625, -3.5992431640625, -3.2744140625, -2.9495849609375, -2.624755859375, -2.2999267578125, -1.97509765625, -1.6502685546875, -1.325439453125, -1.0006103515625, -0.67578125, -0.3509521484375, -0.026123046875, 0.2987060546875, 0.62353515625, 0.9483642578125, 1.273193359375, 1.5980224609375, 1.9228515625, 2.2476806640625, 2.572509765625, 2.8973388671875, 3.22216796875, 3.5469970703125, 3.871826171875, 4.1966552734375, 4.521484375, 4.8463134765625, 5.171142578125, 5.4959716796875, 5.82080078125, 6.1456298828125, 6.470458984375, 6.7952880859375, 7.1201171875, 7.4449462890625, 7.769775390625, 8.0946044921875, 8.41943359375, 8.7442626953125, 9.069091796875, 9.3939208984375, 9.71875]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 4.0, 1.0, 3.0, 8.0, 7.0, 9.0, 20.0, 23.0, 27.0, 58.0, 72.0, 122.0, 167.0, 250.0, 354.0, 530.0, 767.0, 1170.0, 1826.0, 2850.0, 4442.0, 7092.0, 12205.0, 22085.0, 42091.0, 90378.0, 212546.0, 321599.0, 171651.0, 73756.0, 35133.0, 18943.0, 10773.0, 6255.0, 3942.0, 2469.0, 1674.0, 1069.0, 684.0, 476.0, 327.0, 232.0, 151.0, 86.0, 87.0, 37.0, 41.0, 18.0, 20.0, 13.0, 7.0, 3.0, 6.0, 3.0, 4.0, 0.0, 1.0, 2.0], "bins": [-1.4951171875, -1.4503173828125, -1.405517578125, -1.3607177734375, -1.31591796875, -1.2711181640625, -1.226318359375, -1.1815185546875, -1.13671875, -1.0919189453125, -1.047119140625, -1.0023193359375, -0.95751953125, -0.9127197265625, -0.867919921875, -0.8231201171875, -0.7783203125, -0.7335205078125, -0.688720703125, -0.6439208984375, -0.59912109375, -0.5543212890625, -0.509521484375, -0.4647216796875, -0.419921875, -0.3751220703125, -0.330322265625, -0.2855224609375, -0.24072265625, -0.1959228515625, -0.151123046875, -0.1063232421875, -0.0615234375, -0.0167236328125, 0.028076171875, 0.0728759765625, 0.11767578125, 0.1624755859375, 0.207275390625, 0.2520751953125, 0.296875, 0.3416748046875, 0.386474609375, 0.4312744140625, 0.47607421875, 0.5208740234375, 0.565673828125, 0.6104736328125, 0.6552734375, 0.7000732421875, 0.744873046875, 0.7896728515625, 0.83447265625, 0.8792724609375, 0.924072265625, 0.9688720703125, 1.013671875, 1.0584716796875, 1.103271484375, 1.1480712890625, 1.19287109375, 1.2376708984375, 1.282470703125, 1.3272705078125, 1.3720703125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 9.0, 2.0, 7.0, 6.0, 8.0, 9.0, 10.0, 15.0, 16.0, 17.0, 17.0, 23.0, 26.0, 18.0, 37.0, 40.0, 29.0, 31.0, 41.0, 25.0, 33.0, 64.0, 36.0, 1055.0, 40.0, 37.0, 36.0, 32.0, 41.0, 31.0, 24.0, 25.0, 22.0, 31.0, 26.0, 16.0, 13.0, 10.0, 13.0, 10.0, 8.0, 8.0, 6.0, 5.0, 2.0, 5.0, 2.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0], "bins": [-5.05859375, -4.9053955078125, -4.752197265625, -4.5989990234375, -4.44580078125, -4.2926025390625, -4.139404296875, -3.9862060546875, -3.8330078125, -3.6798095703125, -3.526611328125, -3.3734130859375, -3.22021484375, -3.0670166015625, -2.913818359375, -2.7606201171875, -2.607421875, -2.4542236328125, -2.301025390625, -2.1478271484375, -1.99462890625, -1.8414306640625, -1.688232421875, -1.5350341796875, -1.3818359375, -1.2286376953125, -1.075439453125, -0.9222412109375, -0.76904296875, -0.6158447265625, -0.462646484375, -0.3094482421875, -0.15625, -0.0030517578125, 0.150146484375, 0.3033447265625, 0.45654296875, 0.6097412109375, 0.762939453125, 0.9161376953125, 1.0693359375, 1.2225341796875, 1.375732421875, 1.5289306640625, 1.68212890625, 1.8353271484375, 1.988525390625, 2.1417236328125, 2.294921875, 2.4481201171875, 2.601318359375, 2.7545166015625, 2.90771484375, 3.0609130859375, 3.214111328125, 3.3673095703125, 3.5205078125, 3.6737060546875, 3.826904296875, 3.9801025390625, 4.13330078125, 4.2864990234375, 4.439697265625, 4.5928955078125, 4.74609375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 5.0, 9.0, 19.0, 20.0, 22.0, 32.0, 49.0, 72.0, 100.0, 123.0, 240.0, 279.0, 442.0, 596.0, 875.0, 1305.0, 1752.0, 2631.0, 3893.0, 5702.0, 8242.0, 12401.0, 19155.0, 29883.0, 47558.0, 77440.0, 125213.0, 482230.0, 933916.0, 127114.0, 78151.0, 48267.0, 30164.0, 19622.0, 12749.0, 8451.0, 5783.0, 3843.0, 2696.0, 1869.0, 1297.0, 857.0, 624.0, 421.0, 315.0, 218.0, 142.0, 111.0, 80.0, 54.0, 34.0, 25.0, 19.0, 11.0, 4.0, 6.0, 4.0, 5.0, 3.0, 1.0], "bins": [-0.6259765625, -0.6064224243164062, -0.5868682861328125, -0.5673141479492188, -0.547760009765625, -0.5282058715820312, -0.5086517333984375, -0.48909759521484375, -0.46954345703125, -0.44998931884765625, -0.4304351806640625, -0.41088104248046875, -0.391326904296875, -0.37177276611328125, -0.3522186279296875, -0.33266448974609375, -0.3131103515625, -0.29355621337890625, -0.2740020751953125, -0.25444793701171875, -0.234893798828125, -0.21533966064453125, -0.1957855224609375, -0.17623138427734375, -0.15667724609375, -0.13712310791015625, -0.1175689697265625, -0.09801483154296875, -0.078460693359375, -0.05890655517578125, -0.0393524169921875, -0.01979827880859375, -0.000244140625, 0.01930999755859375, 0.0388641357421875, 0.05841827392578125, 0.077972412109375, 0.09752655029296875, 0.1170806884765625, 0.13663482666015625, 0.15618896484375, 0.17574310302734375, 0.1952972412109375, 0.21485137939453125, 0.234405517578125, 0.25395965576171875, 0.2735137939453125, 0.29306793212890625, 0.3126220703125, 0.33217620849609375, 0.3517303466796875, 0.37128448486328125, 0.390838623046875, 0.41039276123046875, 0.4299468994140625, 0.44950103759765625, 0.46905517578125, 0.48860931396484375, 0.5081634521484375, 0.5277175903320312, 0.547271728515625, 0.5668258666992188, 0.5863800048828125, 0.6059341430664062, 0.62548828125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 13.0, 14.0, 14.0, 13.0, 25.0, 26.0, 34.0, 46.0, 64.0, 73.0, 88.0, 93.0, 87.0, 95.0, 65.0, 49.0, 48.0, 43.0, 14.0, 19.0, 16.0, 16.0, 9.0, 3.0, 4.0, 3.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0074462890625, -0.00719761848449707, -0.006948947906494141, -0.006700277328491211, -0.006451606750488281, -0.0062029361724853516, -0.005954265594482422, -0.005705595016479492, -0.0054569244384765625, -0.005208253860473633, -0.004959583282470703, -0.0047109127044677734, -0.004462242126464844, -0.004213571548461914, -0.003964900970458984, -0.0037162303924560547, -0.003467559814453125, -0.0032188892364501953, -0.0029702186584472656, -0.002721548080444336, -0.0024728775024414062, -0.0022242069244384766, -0.001975536346435547, -0.0017268657684326172, -0.0014781951904296875, -0.0012295246124267578, -0.0009808540344238281, -0.0007321834564208984, -0.00048351287841796875, -0.00023484230041503906, 1.3828277587890625e-05, 0.0002624988555908203, 0.00051116943359375, 0.0007598400115966797, 0.0010085105895996094, 0.001257181167602539, 0.0015058517456054688, 0.0017545223236083984, 0.002003192901611328, 0.002251863479614258, 0.0025005340576171875, 0.002749204635620117, 0.002997875213623047, 0.0032465457916259766, 0.0034952163696289062, 0.003743886947631836, 0.003992557525634766, 0.004241228103637695, 0.004489898681640625, 0.004738569259643555, 0.004987239837646484, 0.005235910415649414, 0.005484580993652344, 0.0057332515716552734, 0.005981922149658203, 0.006230592727661133, 0.0064792633056640625, 0.006727933883666992, 0.006976604461669922, 0.0072252750396728516, 0.007473945617675781, 0.007722616195678711, 0.00797128677368164, 0.00821995735168457, 0.0084686279296875]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 2.0, 7.0, 11.0, 5.0, 8.0, 15.0, 23.0, 26.0, 27.0, 27.0, 47.0, 60.0, 92.0, 127.0, 199.0, 328.0, 803.0, 11635.0, 1024063.0, 9304.0, 767.0, 312.0, 176.0, 124.0, 103.0, 47.0, 44.0, 35.0, 31.0, 11.0, 13.0, 15.0, 12.0, 7.0, 6.0, 7.0, 5.0, 4.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.158447265625, -0.15385055541992188, -0.14925384521484375, -0.14465713500976562, -0.1400604248046875, -0.13546371459960938, -0.13086700439453125, -0.12627029418945312, -0.121673583984375, -0.11707687377929688, -0.11248016357421875, -0.10788345336914062, -0.1032867431640625, -0.09869003295898438, -0.09409332275390625, -0.08949661254882812, -0.08489990234375, -0.08030319213867188, -0.07570648193359375, -0.07110977172851562, -0.0665130615234375, -0.061916351318359375, -0.05731964111328125, -0.052722930908203125, -0.048126220703125, -0.043529510498046875, -0.03893280029296875, -0.034336090087890625, -0.0297393798828125, -0.025142669677734375, -0.02054595947265625, -0.015949249267578125, -0.0113525390625, -0.006755828857421875, -0.00215911865234375, 0.002437591552734375, 0.0070343017578125, 0.011631011962890625, 0.01622772216796875, 0.020824432373046875, 0.025421142578125, 0.030017852783203125, 0.03461456298828125, 0.039211273193359375, 0.0438079833984375, 0.048404693603515625, 0.05300140380859375, 0.057598114013671875, 0.06219482421875, 0.06679153442382812, 0.07138824462890625, 0.07598495483398438, 0.0805816650390625, 0.08517837524414062, 0.08977508544921875, 0.09437179565429688, 0.098968505859375, 0.10356521606445312, 0.10816192626953125, 0.11275863647460938, 0.1173553466796875, 0.12195205688476562, 0.12654876708984375, 0.13114547729492188, 0.1357421875]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 15.0, 815.0, 181.0, 7.0], "bins": [-0.1300075352191925, -0.12790335714817047, -0.12579917907714844, -0.1236949935555458, -0.12159080803394318, -0.11948662996292114, -0.11738245189189911, -0.11527826637029648, -0.11317408829927444, -0.11106991022825241, -0.10896572470664978, -0.10686154663562775, -0.10475736111402512, -0.10265318304300308, -0.10054899752140045, -0.09844481945037842, -0.09634064137935638, -0.09423646330833435, -0.09213227778673172, -0.09002809971570969, -0.08792391419410706, -0.08581973612308502, -0.08371555805206299, -0.08161137253046036, -0.07950718700885773, -0.0774030089378357, -0.07529882341623306, -0.07319464534521103, -0.0710904598236084, -0.06898628175258636, -0.06688210368156433, -0.0647779181599617, -0.06267374008893967, -0.060569558292627335, -0.058465376496315, -0.05636119842529297, -0.05425701662898064, -0.052152834832668304, -0.05004865303635597, -0.04794447124004364, -0.04584028944373131, -0.043736107647418976, -0.041631925851106644, -0.03952774405479431, -0.03742356598377228, -0.035319384187459946, -0.033215202391147614, -0.03111102059483528, -0.029006842523813248, -0.026902660727500916, -0.024798480793833733, -0.0226942989975214, -0.020590119063854218, -0.018485937267541885, -0.016381755471229553, -0.014277574606239796, -0.012173393741250038, -0.01006921287626028, -0.007965032011270523, -0.005860850214958191, -0.0037566693499684334, -0.0016524884849786758, 0.0004516933113336563, 0.002555874176323414, 0.004660055506974459]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 6.0, 13.0, 10.0, 4.0, 12.0, 18.0, 23.0, 21.0, 18.0, 25.0, 28.0, 34.0, 24.0, 29.0, 28.0, 32.0, 45.0, 44.0, 32.0, 51.0, 27.0, 49.0, 43.0, 43.0, 37.0, 36.0, 27.0, 27.0, 23.0, 29.0, 25.0, 27.0, 16.0, 17.0, 21.0, 8.0, 7.0, 10.0, 8.0, 5.0, 3.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.003438889980316162, -0.0033280132338404655, -0.003217136487364769, -0.0031062597408890724, -0.002995382994413376, -0.0028845062479376793, -0.0027736295014619827, -0.002662752754986286, -0.0025518760085105896, -0.002440999262034893, -0.0023301225155591965, -0.0022192457690835, -0.0021083690226078033, -0.0019974922761321068, -0.0018866155296564102, -0.0017757387831807137, -0.001664862036705017, -0.0015539852902293205, -0.001443108543753624, -0.0013322317972779274, -0.0012213550508022308, -0.0011104783043265343, -0.0009996015578508377, -0.0008887248113751411, -0.0007778480648994446, -0.000666971318423748, -0.0005560945719480515, -0.0004452178254723549, -0.0003343410789966583, -0.00022346433252096176, -0.0001125875860452652, -1.710839569568634e-06, 0.00010916590690612793, 0.0002200426533818245, 0.00033091939985752106, 0.0004417961463332176, 0.0005526728928089142, 0.0006635496392846107, 0.0007744263857603073, 0.0008853031322360039, 0.0009961798787117004, 0.001107056625187397, 0.0012179333716630936, 0.0013288101181387901, 0.0014396868646144867, 0.0015505636110901833, 0.0016614403575658798, 0.0017723171040415764, 0.001883193850517273, 0.0019940705969929695, 0.002104947343468666, 0.0022158240899443626, 0.002326700836420059, 0.0024375775828957558, 0.0025484543293714523, 0.002659331075847149, 0.0027702078223228455, 0.002881084568798542, 0.0029919613152742386, 0.003102838061749935, 0.0032137148082256317, 0.0033245915547013283, 0.003435468301177025, 0.0035463450476527214, 0.003657221794128418]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 5.0, 6.0, 9.0, 8.0, 10.0, 12.0, 17.0, 16.0, 12.0, 22.0, 20.0, 29.0, 43.0, 48.0, 42.0, 42.0, 52.0, 70.0, 63.0, 73.0, 82.0, 56.0, 42.0, 32.0, 29.0, 27.0, 25.0, 18.0, 16.0, 10.0, 11.0, 6.0, 6.0, 7.0, 4.0, 6.0, 6.0, 4.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-11.0703125, -10.7454833984375, -10.420654296875, -10.0958251953125, -9.77099609375, -9.4461669921875, -9.121337890625, -8.7965087890625, -8.4716796875, -8.1468505859375, -7.822021484375, -7.4971923828125, -7.17236328125, -6.8475341796875, -6.522705078125, -6.1978759765625, -5.873046875, -5.5482177734375, -5.223388671875, -4.8985595703125, -4.57373046875, -4.2489013671875, -3.924072265625, -3.5992431640625, -3.2744140625, -2.9495849609375, -2.624755859375, -2.2999267578125, -1.97509765625, -1.6502685546875, -1.325439453125, -1.0006103515625, -0.67578125, -0.3509521484375, -0.026123046875, 0.2987060546875, 0.62353515625, 0.9483642578125, 1.273193359375, 1.5980224609375, 1.9228515625, 2.2476806640625, 2.572509765625, 2.8973388671875, 3.22216796875, 3.5469970703125, 3.871826171875, 4.1966552734375, 4.521484375, 4.8463134765625, 5.171142578125, 5.4959716796875, 5.82080078125, 6.1456298828125, 6.470458984375, 6.7952880859375, 7.1201171875, 7.4449462890625, 7.769775390625, 8.0946044921875, 8.41943359375, 8.7442626953125, 9.069091796875, 9.3939208984375, 9.71875]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 4.0, 4.0, 4.0, 4.0, 5.0, 10.0, 14.0, 19.0, 28.0, 47.0, 58.0, 86.0, 100.0, 155.0, 191.0, 259.0, 408.0, 592.0, 794.0, 1351.0, 2153.0, 3904.0, 7965.0, 23276.0, 126887.0, 767699.0, 78603.0, 17875.0, 6872.0, 3338.0, 1985.0, 1249.0, 810.0, 530.0, 382.0, 249.0, 184.0, 113.0, 95.0, 66.0, 56.0, 28.0, 24.0, 20.0, 14.0, 12.0, 11.0, 5.0, 7.0, 5.0, 3.0, 4.0, 4.0, 0.0, 1.0], "bins": [-20.65625, -20.0556640625, -19.455078125, -18.8544921875, -18.25390625, -17.6533203125, -17.052734375, -16.4521484375, -15.8515625, -15.2509765625, -14.650390625, -14.0498046875, -13.44921875, -12.8486328125, -12.248046875, -11.6474609375, -11.046875, -10.4462890625, -9.845703125, -9.2451171875, -8.64453125, -8.0439453125, -7.443359375, -6.8427734375, -6.2421875, -5.6416015625, -5.041015625, -4.4404296875, -3.83984375, -3.2392578125, -2.638671875, -2.0380859375, -1.4375, -0.8369140625, -0.236328125, 0.3642578125, 0.96484375, 1.5654296875, 2.166015625, 2.7666015625, 3.3671875, 3.9677734375, 4.568359375, 5.1689453125, 5.76953125, 6.3701171875, 6.970703125, 7.5712890625, 8.171875, 8.7724609375, 9.373046875, 9.9736328125, 10.57421875, 11.1748046875, 11.775390625, 12.3759765625, 12.9765625, 13.5771484375, 14.177734375, 14.7783203125, 15.37890625, 15.9794921875, 16.580078125, 17.1806640625, 17.78125]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 8.0, 17.0, 9.0, 7.0, 22.0, 25.0, 19.0, 22.0, 32.0, 31.0, 24.0, 46.0, 34.0, 43.0, 42.0, 54.0, 88.0, 355.0, 1591.0, 123.0, 51.0, 40.0, 44.0, 45.0, 27.0, 31.0, 26.0, 44.0, 25.0, 19.0, 17.0, 13.0, 14.0, 13.0, 7.0, 5.0, 11.0, 4.0, 3.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.96875, -34.8818359375, -33.794921875, -32.7080078125, -31.62109375, -30.5341796875, -29.447265625, -28.3603515625, -27.2734375, -26.1865234375, -25.099609375, -24.0126953125, -22.92578125, -21.8388671875, -20.751953125, -19.6650390625, -18.578125, -17.4912109375, -16.404296875, -15.3173828125, -14.23046875, -13.1435546875, -12.056640625, -10.9697265625, -9.8828125, -8.7958984375, -7.708984375, -6.6220703125, -5.53515625, -4.4482421875, -3.361328125, -2.2744140625, -1.1875, -0.1005859375, 0.986328125, 2.0732421875, 3.16015625, 4.2470703125, 5.333984375, 6.4208984375, 7.5078125, 8.5947265625, 9.681640625, 10.7685546875, 11.85546875, 12.9423828125, 14.029296875, 15.1162109375, 16.203125, 17.2900390625, 18.376953125, 19.4638671875, 20.55078125, 21.6376953125, 22.724609375, 23.8115234375, 24.8984375, 25.9853515625, 27.072265625, 28.1591796875, 29.24609375, 30.3330078125, 31.419921875, 32.5068359375, 33.59375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 4.0, 3.0, 8.0, 4.0, 6.0, 12.0, 9.0, 17.0, 19.0, 16.0, 24.0, 37.0, 63.0, 64.0, 61.0, 106.0, 163.0, 325.0, 843.0, 2232.0, 8037.0, 61823.0, 3028387.0, 33913.0, 6129.0, 1832.0, 706.0, 284.0, 148.0, 99.0, 71.0, 50.0, 44.0, 33.0, 25.0, 21.0, 17.0, 13.0, 18.0, 13.0, 11.0, 2.0, 8.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.0625, -67.8310546875, -65.599609375, -63.3681640625, -61.13671875, -58.9052734375, -56.673828125, -54.4423828125, -52.2109375, -49.9794921875, -47.748046875, -45.5166015625, -43.28515625, -41.0537109375, -38.822265625, -36.5908203125, -34.359375, -32.1279296875, -29.896484375, -27.6650390625, -25.43359375, -23.2021484375, -20.970703125, -18.7392578125, -16.5078125, -14.2763671875, -12.044921875, -9.8134765625, -7.58203125, -5.3505859375, -3.119140625, -0.8876953125, 1.34375, 3.5751953125, 5.806640625, 8.0380859375, 10.26953125, 12.5009765625, 14.732421875, 16.9638671875, 19.1953125, 21.4267578125, 23.658203125, 25.8896484375, 28.12109375, 30.3525390625, 32.583984375, 34.8154296875, 37.046875, 39.2783203125, 41.509765625, 43.7412109375, 45.97265625, 48.2041015625, 50.435546875, 52.6669921875, 54.8984375, 57.1298828125, 59.361328125, 61.5927734375, 63.82421875, 66.0556640625, 68.287109375, 70.5185546875, 72.75]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [11.0, 973.0, 34.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.40872573852539, -14.626548767089844, 9.155628204345703, 32.937801361083984, 56.7199821472168, 80.50216674804688, 104.28433227539062, 128.06651306152344, 151.84869384765625, 175.63087463378906, 199.41305541992188, 223.19522094726562, 246.97740173339844, 270.75958251953125, 294.541748046875, 318.32391357421875, 342.1061096191406, 365.8882751464844, 389.67047119140625, 413.45263671875, 437.23480224609375, 461.0169982910156, 484.7991638183594, 508.58135986328125, 532.363525390625, 556.1456909179688, 579.9278564453125, 603.7100830078125, 627.4922485351562, 651.2744140625, 675.0565795898438, 698.8387451171875, 722.6209716796875, 746.4031372070312, 770.185302734375, 793.967529296875, 817.7496948242188, 841.5318603515625, 865.3140258789062, 889.09619140625, 912.87841796875, 936.6605834960938, 960.4427490234375, 984.2249755859375, 1008.0071411132812, 1031.789306640625, 1055.571533203125, 1079.3536376953125, 1103.1357421875, 1126.91796875, 1150.7000732421875, 1174.4822998046875, 1198.264404296875, 1222.046630859375, 1245.828857421875, 1269.6109619140625, 1293.3931884765625, 1317.1754150390625, 1340.95751953125, 1364.73974609375, 1388.5218505859375, 1412.3040771484375, 1436.086181640625, 1459.868408203125, 1483.650634765625]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 17.0, 16.0, 6.0, 8.0, 14.0, 16.0, 19.0, 22.0, 20.0, 30.0, 30.0, 37.0, 27.0, 37.0, 44.0, 35.0, 40.0, 25.0, 38.0, 45.0, 34.0, 34.0, 33.0, 28.0, 38.0, 38.0, 26.0, 33.0, 25.0, 25.0, 20.0, 17.0, 11.0, 25.0, 15.0, 12.0, 7.0, 8.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-100.50743103027344, -97.37393951416016, -94.2404556274414, -91.10696411132812, -87.97348022460938, -84.8399887084961, -81.70649719238281, -78.57301330566406, -75.43952178955078, -72.3060302734375, -69.17254638671875, -66.03905487060547, -62.90556716918945, -59.77207946777344, -56.63859176635742, -53.505104064941406, -50.37161636352539, -47.238128662109375, -44.10464096069336, -40.971153259277344, -37.83766174316406, -34.70417404174805, -31.57068634033203, -28.437196731567383, -25.303709030151367, -22.17022132873535, -19.036731719970703, -15.903244018554688, -12.769755363464355, -9.636266708374023, -6.502779006958008, -3.3692893981933594, -0.23580169677734375, 2.897686719894409, 6.031175136566162, 9.164663314819336, 12.298151969909668, 15.431640625, 18.565128326416016, 21.698617935180664, 24.83210563659668, 27.965593338012695, 31.099082946777344, 34.23257064819336, 37.366058349609375, 40.499549865722656, 43.633033752441406, 46.76652526855469, 49.9000129699707, 53.03350067138672, 56.166988372802734, 59.30047607421875, 62.43396759033203, 65.56745910644531, 68.70094299316406, 71.83443450927734, 74.9679183959961, 78.10140991210938, 81.23489379882812, 84.3683853149414, 87.50186920166016, 90.63536071777344, 93.76884460449219, 96.90233612060547, 100.03582763671875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 4.0, 7.0, 5.0, 5.0, 6.0, 8.0, 7.0, 16.0, 19.0, 16.0, 16.0, 19.0, 30.0, 24.0, 42.0, 37.0, 40.0, 44.0, 59.0, 59.0, 71.0, 66.0, 63.0, 55.0, 57.0, 36.0, 33.0, 26.0, 22.0, 21.0, 12.0, 16.0, 7.0, 7.0, 6.0, 5.0, 5.0, 7.0, 8.0, 5.0, 1.0, 7.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-11.3671875, -11.03369140625, -10.7001953125, -10.36669921875, -10.033203125, -9.69970703125, -9.3662109375, -9.03271484375, -8.69921875, -8.36572265625, -8.0322265625, -7.69873046875, -7.365234375, -7.03173828125, -6.6982421875, -6.36474609375, -6.03125, -5.69775390625, -5.3642578125, -5.03076171875, -4.697265625, -4.36376953125, -4.0302734375, -3.69677734375, -3.36328125, -3.02978515625, -2.6962890625, -2.36279296875, -2.029296875, -1.69580078125, -1.3623046875, -1.02880859375, -0.6953125, -0.36181640625, -0.0283203125, 0.30517578125, 0.638671875, 0.97216796875, 1.3056640625, 1.63916015625, 1.97265625, 2.30615234375, 2.6396484375, 2.97314453125, 3.306640625, 3.64013671875, 3.9736328125, 4.30712890625, 4.640625, 4.97412109375, 5.3076171875, 5.64111328125, 5.974609375, 6.30810546875, 6.6416015625, 6.97509765625, 7.30859375, 7.64208984375, 7.9755859375, 8.30908203125, 8.642578125, 8.97607421875, 9.3095703125, 9.64306640625, 9.9765625]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 6.0, 5.0, 10.0, 8.0, 11.0, 19.0, 23.0, 30.0, 54.0, 58.0, 108.0, 147.0, 228.0, 386.0, 624.0, 1138.0, 2163.0, 4442.0, 10333.0, 31791.0, 774644.0, 3251072.0, 91259.0, 14207.0, 5710.0, 2607.0, 1298.0, 720.0, 422.0, 258.0, 165.0, 79.0, 77.0, 52.0, 36.0, 26.0, 11.0, 21.0, 10.0, 9.0, 8.0, 4.0, 3.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.1875, -39.947265625, -38.70703125, -37.466796875, -36.2265625, -34.986328125, -33.74609375, -32.505859375, -31.265625, -30.025390625, -28.78515625, -27.544921875, -26.3046875, -25.064453125, -23.82421875, -22.583984375, -21.34375, -20.103515625, -18.86328125, -17.623046875, -16.3828125, -15.142578125, -13.90234375, -12.662109375, -11.421875, -10.181640625, -8.94140625, -7.701171875, -6.4609375, -5.220703125, -3.98046875, -2.740234375, -1.5, -0.259765625, 0.98046875, 2.220703125, 3.4609375, 4.701171875, 5.94140625, 7.181640625, 8.421875, 9.662109375, 10.90234375, 12.142578125, 13.3828125, 14.623046875, 15.86328125, 17.103515625, 18.34375, 19.583984375, 20.82421875, 22.064453125, 23.3046875, 24.544921875, 25.78515625, 27.025390625, 28.265625, 29.505859375, 30.74609375, 31.986328125, 33.2265625, 34.466796875, 35.70703125, 36.947265625, 38.1875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 7.0, 2.0, 5.0, 5.0, 9.0, 7.0, 6.0, 19.0, 16.0, 21.0, 21.0, 33.0, 30.0, 43.0, 75.0, 118.0, 180.0, 413.0, 591.0, 758.0, 630.0, 379.0, 226.0, 124.0, 81.0, 56.0, 40.0, 28.0, 26.0, 22.0, 10.0, 22.0, 8.0, 12.0, 8.0, 10.0, 6.0, 5.0, 3.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.53125, -22.6796875, -21.828125, -20.9765625, -20.125, -19.2734375, -18.421875, -17.5703125, -16.71875, -15.8671875, -15.015625, -14.1640625, -13.3125, -12.4609375, -11.609375, -10.7578125, -9.90625, -9.0546875, -8.203125, -7.3515625, -6.5, -5.6484375, -4.796875, -3.9453125, -3.09375, -2.2421875, -1.390625, -0.5390625, 0.3125, 1.1640625, 2.015625, 2.8671875, 3.71875, 4.5703125, 5.421875, 6.2734375, 7.125, 7.9765625, 8.828125, 9.6796875, 10.53125, 11.3828125, 12.234375, 13.0859375, 13.9375, 14.7890625, 15.640625, 16.4921875, 17.34375, 18.1953125, 19.046875, 19.8984375, 20.75, 21.6015625, 22.453125, 23.3046875, 24.15625, 25.0078125, 25.859375, 26.7109375, 27.5625, 28.4140625, 29.265625, 30.1171875, 30.96875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 3.0, 11.0, 4.0, 10.0, 13.0, 22.0, 29.0, 57.0, 49.0, 99.0, 163.0, 247.0, 399.0, 817.0, 1568.0, 3360.0, 7678.0, 20301.0, 69365.0, 660917.0, 3173090.0, 194305.0, 38642.0, 12887.0, 5284.0, 2359.0, 1135.0, 579.0, 299.0, 192.0, 120.0, 97.0, 65.0, 37.0, 24.0, 12.0, 12.0, 7.0, 9.0, 5.0, 4.0, 2.0, 2.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.96875, -34.650390625, -33.33203125, -32.013671875, -30.6953125, -29.376953125, -28.05859375, -26.740234375, -25.421875, -24.103515625, -22.78515625, -21.466796875, -20.1484375, -18.830078125, -17.51171875, -16.193359375, -14.875, -13.556640625, -12.23828125, -10.919921875, -9.6015625, -8.283203125, -6.96484375, -5.646484375, -4.328125, -3.009765625, -1.69140625, -0.373046875, 0.9453125, 2.263671875, 3.58203125, 4.900390625, 6.21875, 7.537109375, 8.85546875, 10.173828125, 11.4921875, 12.810546875, 14.12890625, 15.447265625, 16.765625, 18.083984375, 19.40234375, 20.720703125, 22.0390625, 23.357421875, 24.67578125, 25.994140625, 27.3125, 28.630859375, 29.94921875, 31.267578125, 32.5859375, 33.904296875, 35.22265625, 36.541015625, 37.859375, 39.177734375, 40.49609375, 41.814453125, 43.1328125, 44.451171875, 45.76953125, 47.087890625, 48.40625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 7.0, 27.0, 81.0, 275.0, 378.0, 152.0, 57.0, 20.0, 7.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-246.1268310546875, -237.38064575195312, -228.6344451904297, -219.8882598876953, -211.14205932617188, -202.3958740234375, -193.64968872070312, -184.90350341796875, -176.1573028564453, -167.41111755371094, -158.6649169921875, -149.91873168945312, -141.17254638671875, -132.4263458251953, -123.68016052246094, -114.93396759033203, -106.18777465820312, -97.44158172607422, -88.69538879394531, -79.94920349121094, -71.20301055908203, -62.456817626953125, -53.710628509521484, -44.964439392089844, -36.21824645996094, -27.472055435180664, -18.72586441040039, -9.979673385620117, -1.2334823608398438, 7.5127105712890625, 16.258899688720703, 25.005088806152344, 33.751251220703125, 42.49744415283203, 51.24363327026367, 59.98982238769531, 68.73601531982422, 77.48220825195312, 86.2283935546875, 94.9745864868164, 103.72077941894531, 112.46697235107422, 121.21316528320312, 129.9593505859375, 138.70553588867188, 147.4517364501953, 156.1979217529297, 164.94412231445312, 173.6903076171875, 182.43649291992188, 191.1826934814453, 199.9288787841797, 208.67507934570312, 217.4212646484375, 226.16744995117188, 234.91363525390625, 243.6598358154297, 252.40602111816406, 261.1522216796875, 269.8984069824219, 278.64459228515625, 287.39080810546875, 296.1369934082031, 304.8831787109375, 313.6293640136719]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 6.0, 1.0, 3.0, 6.0, 5.0, 9.0, 5.0, 10.0, 13.0, 16.0, 19.0, 23.0, 24.0, 24.0, 22.0, 34.0, 37.0, 33.0, 43.0, 47.0, 36.0, 49.0, 33.0, 38.0, 39.0, 44.0, 41.0, 21.0, 32.0, 34.0, 29.0, 30.0, 26.0, 21.0, 25.0, 15.0, 19.0, 14.0, 9.0, 19.0, 16.0, 5.0, 7.0, 10.0, 3.0, 3.0, 5.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-88.31908416748047, -85.6746826171875, -83.03028869628906, -80.38589477539062, -77.74149322509766, -75.09709167480469, -72.45269775390625, -69.80830383300781, -67.16390228271484, -64.51950073242188, -61.87510681152344, -59.230709075927734, -56.58631134033203, -53.94191360473633, -51.297515869140625, -48.65311813354492, -46.00872039794922, -43.364322662353516, -40.71992492675781, -38.07552719116211, -35.431129455566406, -32.7867317199707, -30.142333984375, -27.497936248779297, -24.853538513183594, -22.20914077758789, -19.564743041992188, -16.920345306396484, -14.275947570800781, -11.631549835205078, -8.987152099609375, -6.342754364013672, -3.6983489990234375, -1.0539512634277344, 1.5904464721679688, 4.234844207763672, 6.879241943359375, 9.523639678955078, 12.168037414550781, 14.812435150146484, 17.456832885742188, 20.10123062133789, 22.745628356933594, 25.390026092529297, 28.034423828125, 30.678821563720703, 33.323219299316406, 35.96761703491211, 38.61201477050781, 41.256412506103516, 43.90081024169922, 46.54520797729492, 49.189605712890625, 51.83400344848633, 54.47840118408203, 57.122798919677734, 59.76719665527344, 62.41159439086914, 65.05599212646484, 67.70039367675781, 70.34478759765625, 72.98918151855469, 75.63358306884766, 78.27798461914062, 80.92237854003906]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 8.0, 7.0, 13.0, 17.0, 22.0, 20.0, 17.0, 26.0, 34.0, 33.0, 39.0, 44.0, 60.0, 45.0, 64.0, 57.0, 69.0, 53.0, 45.0, 45.0, 35.0, 47.0, 35.0, 29.0, 21.0, 14.0, 10.0, 6.0, 5.0, 10.0, 10.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.8984375, -10.570068359375, -10.24169921875, -9.913330078125, -9.5849609375, -9.256591796875, -8.92822265625, -8.599853515625, -8.271484375, -7.943115234375, -7.61474609375, -7.286376953125, -6.9580078125, -6.629638671875, -6.30126953125, -5.972900390625, -5.64453125, -5.316162109375, -4.98779296875, -4.659423828125, -4.3310546875, -4.002685546875, -3.67431640625, -3.345947265625, -3.017578125, -2.689208984375, -2.36083984375, -2.032470703125, -1.7041015625, -1.375732421875, -1.04736328125, -0.718994140625, -0.390625, -0.062255859375, 0.26611328125, 0.594482421875, 0.9228515625, 1.251220703125, 1.57958984375, 1.907958984375, 2.236328125, 2.564697265625, 2.89306640625, 3.221435546875, 3.5498046875, 3.878173828125, 4.20654296875, 4.534912109375, 4.86328125, 5.191650390625, 5.52001953125, 5.848388671875, 6.1767578125, 6.505126953125, 6.83349609375, 7.161865234375, 7.490234375, 7.818603515625, 8.14697265625, 8.475341796875, 8.8037109375, 9.132080078125, 9.46044921875, 9.788818359375, 10.1171875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 6.0, 4.0, 7.0, 12.0, 22.0, 18.0, 33.0, 52.0, 80.0, 97.0, 138.0, 186.0, 260.0, 361.0, 528.0, 742.0, 1032.0, 1428.0, 2045.0, 3067.0, 4300.0, 6546.0, 10278.0, 15941.0, 26144.0, 43446.0, 74776.0, 134874.0, 221942.0, 207578.0, 119500.0, 67131.0, 38980.0, 23328.0, 14451.0, 9469.0, 6055.0, 4149.0, 2820.0, 1943.0, 1429.0, 971.0, 667.0, 500.0, 364.0, 232.0, 186.0, 117.0, 95.0, 66.0, 59.0, 40.0, 22.0, 25.0, 12.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-1.1103515625, -1.0755462646484375, -1.040740966796875, -1.0059356689453125, -0.97113037109375, -0.9363250732421875, -0.901519775390625, -0.8667144775390625, -0.8319091796875, -0.7971038818359375, -0.762298583984375, -0.7274932861328125, -0.69268798828125, -0.6578826904296875, -0.623077392578125, -0.5882720947265625, -0.553466796875, -0.5186614990234375, -0.483856201171875, -0.4490509033203125, -0.41424560546875, -0.3794403076171875, -0.344635009765625, -0.3098297119140625, -0.2750244140625, -0.2402191162109375, -0.205413818359375, -0.1706085205078125, -0.13580322265625, -0.1009979248046875, -0.066192626953125, -0.0313873291015625, 0.00341796875, 0.0382232666015625, 0.073028564453125, 0.1078338623046875, 0.14263916015625, 0.1774444580078125, 0.212249755859375, 0.2470550537109375, 0.2818603515625, 0.3166656494140625, 0.351470947265625, 0.3862762451171875, 0.42108154296875, 0.4558868408203125, 0.490692138671875, 0.5254974365234375, 0.560302734375, 0.5951080322265625, 0.629913330078125, 0.6647186279296875, 0.69952392578125, 0.7343292236328125, 0.769134521484375, 0.8039398193359375, 0.8387451171875, 0.8735504150390625, 0.908355712890625, 0.9431610107421875, 0.97796630859375, 1.0127716064453125, 1.047576904296875, 1.0823822021484375, 1.1171875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 7.0, 10.0, 8.0, 5.0, 8.0, 12.0, 15.0, 21.0, 16.0, 19.0, 29.0, 27.0, 29.0, 30.0, 32.0, 36.0, 33.0, 42.0, 33.0, 30.0, 1074.0, 34.0, 44.0, 39.0, 49.0, 34.0, 32.0, 24.0, 30.0, 33.0, 32.0, 18.0, 20.0, 18.0, 15.0, 12.0, 13.0, 9.0, 11.0, 13.0, 7.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.26171875, -5.09661865234375, -4.9315185546875, -4.76641845703125, -4.601318359375, -4.43621826171875, -4.2711181640625, -4.10601806640625, -3.94091796875, -3.77581787109375, -3.6107177734375, -3.44561767578125, -3.280517578125, -3.11541748046875, -2.9503173828125, -2.78521728515625, -2.6201171875, -2.45501708984375, -2.2899169921875, -2.12481689453125, -1.959716796875, -1.79461669921875, -1.6295166015625, -1.46441650390625, -1.29931640625, -1.13421630859375, -0.9691162109375, -0.80401611328125, -0.638916015625, -0.47381591796875, -0.3087158203125, -0.14361572265625, 0.021484375, 0.18658447265625, 0.3516845703125, 0.51678466796875, 0.681884765625, 0.84698486328125, 1.0120849609375, 1.17718505859375, 1.34228515625, 1.50738525390625, 1.6724853515625, 1.83758544921875, 2.002685546875, 2.16778564453125, 2.3328857421875, 2.49798583984375, 2.6630859375, 2.82818603515625, 2.9932861328125, 3.15838623046875, 3.323486328125, 3.48858642578125, 3.6536865234375, 3.81878662109375, 3.98388671875, 4.14898681640625, 4.3140869140625, 4.47918701171875, 4.644287109375, 4.80938720703125, 4.9744873046875, 5.13958740234375, 5.3046875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 8.0, 13.0, 17.0, 20.0, 32.0, 51.0, 66.0, 126.0, 158.0, 247.0, 381.0, 591.0, 899.0, 1429.0, 2114.0, 3394.0, 5392.0, 8580.0, 14164.0, 24307.0, 42070.0, 74483.0, 131884.0, 478216.0, 994125.0, 133425.0, 75433.0, 42635.0, 24482.0, 14548.0, 8734.0, 5471.0, 3481.0, 2131.0, 1403.0, 887.0, 628.0, 333.0, 262.0, 178.0, 111.0, 65.0, 67.0, 31.0, 26.0, 19.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.82861328125, -0.8035125732421875, -0.778411865234375, -0.7533111572265625, -0.72821044921875, -0.7031097412109375, -0.678009033203125, -0.6529083251953125, -0.6278076171875, -0.6027069091796875, -0.577606201171875, -0.5525054931640625, -0.52740478515625, -0.5023040771484375, -0.477203369140625, -0.4521026611328125, -0.427001953125, -0.4019012451171875, -0.376800537109375, -0.3516998291015625, -0.32659912109375, -0.3014984130859375, -0.276397705078125, -0.2512969970703125, -0.2261962890625, -0.2010955810546875, -0.175994873046875, -0.1508941650390625, -0.12579345703125, -0.1006927490234375, -0.075592041015625, -0.0504913330078125, -0.025390625, -0.0002899169921875, 0.024810791015625, 0.0499114990234375, 0.07501220703125, 0.1001129150390625, 0.125213623046875, 0.1503143310546875, 0.1754150390625, 0.2005157470703125, 0.225616455078125, 0.2507171630859375, 0.27581787109375, 0.3009185791015625, 0.326019287109375, 0.3511199951171875, 0.376220703125, 0.4013214111328125, 0.426422119140625, 0.4515228271484375, 0.47662353515625, 0.5017242431640625, 0.526824951171875, 0.5519256591796875, 0.5770263671875, 0.6021270751953125, 0.627227783203125, 0.6523284912109375, 0.67742919921875, 0.7025299072265625, 0.727630615234375, 0.7527313232421875, 0.77783203125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 3.0, 3.0, 4.0, 1.0, 6.0, 13.0, 10.0, 13.0, 16.0, 24.0, 27.0, 38.0, 45.0, 47.0, 71.0, 90.0, 112.0, 95.0, 82.0, 57.0, 48.0, 41.0, 16.0, 18.0, 24.0, 18.0, 16.0, 11.0, 14.0, 8.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00861358642578125, -0.00835716724395752, -0.008100748062133789, -0.007844328880310059, -0.007587909698486328, -0.007331490516662598, -0.007075071334838867, -0.006818652153015137, -0.006562232971191406, -0.006305813789367676, -0.006049394607543945, -0.005792975425720215, -0.005536556243896484, -0.005280137062072754, -0.0050237178802490234, -0.004767298698425293, -0.0045108795166015625, -0.004254460334777832, -0.0039980411529541016, -0.003741621971130371, -0.0034852027893066406, -0.00322878360748291, -0.0029723644256591797, -0.0027159452438354492, -0.0024595260620117188, -0.0022031068801879883, -0.0019466876983642578, -0.0016902685165405273, -0.0014338493347167969, -0.0011774301528930664, -0.0009210109710693359, -0.0006645917892456055, -0.000408172607421875, -0.00015175342559814453, 0.00010466575622558594, 0.0003610849380493164, 0.0006175041198730469, 0.0008739233016967773, 0.0011303424835205078, 0.0013867616653442383, 0.0016431808471679688, 0.0018996000289916992, 0.0021560192108154297, 0.00241243839263916, 0.0026688575744628906, 0.002925276756286621, 0.0031816959381103516, 0.003438115119934082, 0.0036945343017578125, 0.003950953483581543, 0.0042073726654052734, 0.004463791847229004, 0.004720211029052734, 0.004976630210876465, 0.005233049392700195, 0.005489468574523926, 0.005745887756347656, 0.006002306938171387, 0.006258726119995117, 0.006515145301818848, 0.006771564483642578, 0.007027983665466309, 0.007284402847290039, 0.0075408220291137695, 0.0077972412109375]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 6.0, 5.0, 7.0, 11.0, 12.0, 8.0, 14.0, 19.0, 21.0, 28.0, 31.0, 61.0, 67.0, 66.0, 104.0, 143.0, 257.0, 515.0, 2864.0, 952007.0, 89949.0, 1226.0, 399.0, 199.0, 111.0, 89.0, 61.0, 47.0, 47.0, 35.0, 27.0, 23.0, 19.0, 20.0, 14.0, 7.0, 9.0, 4.0, 3.0, 3.0, 2.0, 4.0, 3.0, 0.0, 4.0, 3.0, 1.0, 3.0], "bins": [-0.1671142578125, -0.16245079040527344, -0.15778732299804688, -0.1531238555908203, -0.14846038818359375, -0.1437969207763672, -0.13913345336914062, -0.13446998596191406, -0.1298065185546875, -0.12514305114746094, -0.12047958374023438, -0.11581611633300781, -0.11115264892578125, -0.10648918151855469, -0.10182571411132812, -0.09716224670410156, -0.092498779296875, -0.08783531188964844, -0.08317184448242188, -0.07850837707519531, -0.07384490966796875, -0.06918144226074219, -0.06451797485351562, -0.05985450744628906, -0.0551910400390625, -0.05052757263183594, -0.045864105224609375, -0.04120063781738281, -0.03653717041015625, -0.03187370300292969, -0.027210235595703125, -0.022546768188476562, -0.01788330078125, -0.013219833374023438, -0.008556365966796875, -0.0038928985595703125, 0.00077056884765625, 0.0054340362548828125, 0.010097503662109375, 0.014760971069335938, 0.0194244384765625, 0.024087905883789062, 0.028751373291015625, 0.03341484069824219, 0.03807830810546875, 0.04274177551269531, 0.047405242919921875, 0.05206871032714844, 0.056732177734375, 0.06139564514160156, 0.06605911254882812, 0.07072257995605469, 0.07538604736328125, 0.08004951477050781, 0.08471298217773438, 0.08937644958496094, 0.0940399169921875, 0.09870338439941406, 0.10336685180664062, 0.10803031921386719, 0.11269378662109375, 0.11735725402832031, 0.12202072143554688, 0.12668418884277344, 0.13134765625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 14.0, 767.0, 230.0, 5.0, 1.0], "bins": [-0.14893925189971924, -0.14648935198783875, -0.14403945207595825, -0.14158955216407776, -0.13913966715335846, -0.13668976724147797, -0.13423986732959747, -0.13178996741771698, -0.1293400675058365, -0.126890167593956, -0.1244402751326561, -0.1219903752207756, -0.11954047530889511, -0.11709058284759521, -0.11464068293571472, -0.11219078302383423, -0.10974089056253433, -0.10729099065065384, -0.10484109818935394, -0.10239119827747345, -0.09994129836559296, -0.09749139845371246, -0.09504150599241257, -0.09259160608053207, -0.09014171361923218, -0.08769181370735168, -0.08524192124605179, -0.0827920213341713, -0.0803421214222908, -0.0778922289609909, -0.07544232904911041, -0.07299242913722992, -0.07054253667593002, -0.06809263676404953, -0.06564274430274963, -0.06319284439086914, -0.06074294447898865, -0.05829304829239845, -0.05584315210580826, -0.053393252193927765, -0.05094335600733757, -0.048493459820747375, -0.04604355990886688, -0.04359366372227669, -0.04114376753568649, -0.038693867623806, -0.036243971437215805, -0.03379407525062561, -0.03134417533874512, -0.028894277289509773, -0.02644437924027443, -0.023994483053684235, -0.02154458500444889, -0.019094686955213547, -0.016644790768623352, -0.014194892719388008, -0.01174499373883009, -0.00929509662091732, -0.006845198571681976, -0.00439530098810792, -0.001945403404533863, 0.0005044946447014809, 0.00295439176261425, 0.0054042888805270195, 0.007854186929762363]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 6.0, 8.0, 11.0, 10.0, 7.0, 5.0, 5.0, 15.0, 8.0, 14.0, 18.0, 16.0, 21.0, 31.0, 30.0, 21.0, 24.0, 23.0, 30.0, 38.0, 33.0, 31.0, 28.0, 45.0, 29.0, 27.0, 33.0, 39.0, 38.0, 36.0, 31.0, 23.0, 35.0, 33.0, 24.0, 27.0, 18.0, 23.0, 25.0, 18.0, 16.0, 12.0, 6.0, 8.0, 14.0, 8.0, 2.0, 2.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0038304924964904785, -0.003705178387463093, -0.003579864278435707, -0.0034545501694083214, -0.0033292360603809357, -0.00320392195135355, -0.0030786078423261642, -0.0029532937332987785, -0.002827979624271393, -0.002702665515244007, -0.0025773514062166214, -0.0024520372971892357, -0.00232672318816185, -0.0022014090791344643, -0.0020760949701070786, -0.0019507808610796928, -0.0018254667520523071, -0.0017001526430249214, -0.0015748385339975357, -0.00144952442497015, -0.0013242103159427643, -0.0011988962069153786, -0.0010735820978879929, -0.0009482679888606071, -0.0008229538798332214, -0.0006976397708058357, -0.00057232566177845, -0.0004470115527510643, -0.0003216974437236786, -0.00019638333469629288, -7.106922566890717e-05, 5.4244883358478546e-05, 0.00017955899238586426, 0.00030487310141324997, 0.0004301872104406357, 0.0005555013194680214, 0.0006808154284954071, 0.0008061295375227928, 0.0009314436465501785, 0.0010567577555775642, 0.00118207186460495, 0.0013073859736323357, 0.0014327000826597214, 0.001558014191687107, 0.0016833283007144928, 0.0018086424097418785, 0.0019339565187692642, 0.00205927062779665, 0.0021845847368240356, 0.0023098988458514214, 0.002435212954878807, 0.0025605270639061928, 0.0026858411729335785, 0.002811155281960964, 0.00293646939098835, 0.0030617835000157356, 0.0031870976090431213, 0.003312411718070507, 0.0034377258270978928, 0.0035630399361252785, 0.003688354045152664, 0.00381366815418005, 0.003938982263207436, 0.004064296372234821, 0.004189610481262207]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 4.0, 9.0, 9.0, 8.0, 7.0, 13.0, 17.0, 22.0, 20.0, 17.0, 26.0, 34.0, 33.0, 39.0, 44.0, 60.0, 45.0, 64.0, 57.0, 69.0, 53.0, 45.0, 45.0, 35.0, 47.0, 35.0, 29.0, 21.0, 14.0, 10.0, 6.0, 5.0, 10.0, 10.0, 8.0, 8.0, 4.0, 3.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.8984375, -10.570068359375, -10.24169921875, -9.913330078125, -9.5849609375, -9.256591796875, -8.92822265625, -8.599853515625, -8.271484375, -7.943115234375, -7.61474609375, -7.286376953125, -6.9580078125, -6.629638671875, -6.30126953125, -5.972900390625, -5.64453125, -5.316162109375, -4.98779296875, -4.659423828125, -4.3310546875, -4.002685546875, -3.67431640625, -3.345947265625, -3.017578125, -2.689208984375, -2.36083984375, -2.032470703125, -1.7041015625, -1.375732421875, -1.04736328125, -0.718994140625, -0.390625, -0.062255859375, 0.26611328125, 0.594482421875, 0.9228515625, 1.251220703125, 1.57958984375, 1.907958984375, 2.236328125, 2.564697265625, 2.89306640625, 3.221435546875, 3.5498046875, 3.878173828125, 4.20654296875, 4.534912109375, 4.86328125, 5.191650390625, 5.52001953125, 5.848388671875, 6.1767578125, 6.505126953125, 6.83349609375, 7.161865234375, 7.490234375, 7.818603515625, 8.14697265625, 8.475341796875, 8.8037109375, 9.132080078125, 9.46044921875, 9.788818359375, 10.1171875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 5.0, 10.0, 15.0, 19.0, 14.0, 33.0, 43.0, 50.0, 73.0, 111.0, 153.0, 213.0, 272.0, 421.0, 663.0, 952.0, 1565.0, 2742.0, 5209.0, 12235.0, 37259.0, 210956.0, 654152.0, 83007.0, 20911.0, 7756.0, 3763.0, 2058.0, 1275.0, 843.0, 557.0, 353.0, 256.0, 194.0, 119.0, 85.0, 51.0, 43.0, 33.0, 25.0, 15.0, 18.0, 12.0, 8.0, 4.0, 2.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0], "bins": [-16.5, -16.0184326171875, -15.536865234375, -15.0552978515625, -14.57373046875, -14.0921630859375, -13.610595703125, -13.1290283203125, -12.6474609375, -12.1658935546875, -11.684326171875, -11.2027587890625, -10.72119140625, -10.2396240234375, -9.758056640625, -9.2764892578125, -8.794921875, -8.3133544921875, -7.831787109375, -7.3502197265625, -6.86865234375, -6.3870849609375, -5.905517578125, -5.4239501953125, -4.9423828125, -4.4608154296875, -3.979248046875, -3.4976806640625, -3.01611328125, -2.5345458984375, -2.052978515625, -1.5714111328125, -1.08984375, -0.6082763671875, -0.126708984375, 0.3548583984375, 0.83642578125, 1.3179931640625, 1.799560546875, 2.2811279296875, 2.7626953125, 3.2442626953125, 3.725830078125, 4.2073974609375, 4.68896484375, 5.1705322265625, 5.652099609375, 6.1336669921875, 6.615234375, 7.0968017578125, 7.578369140625, 8.0599365234375, 8.54150390625, 9.0230712890625, 9.504638671875, 9.9862060546875, 10.4677734375, 10.9493408203125, 11.430908203125, 11.9124755859375, 12.39404296875, 12.8756103515625, 13.357177734375, 13.8387451171875, 14.3203125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 12.0, 4.0, 10.0, 11.0, 18.0, 16.0, 21.0, 14.0, 22.0, 39.0, 24.0, 49.0, 37.0, 40.0, 46.0, 58.0, 86.0, 225.0, 1694.0, 156.0, 69.0, 62.0, 45.0, 31.0, 40.0, 28.0, 38.0, 25.0, 22.0, 28.0, 18.0, 11.0, 11.0, 11.0, 9.0, 3.0, 8.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.71875, -35.50732421875, -34.2958984375, -33.08447265625, -31.873046875, -30.66162109375, -29.4501953125, -28.23876953125, -27.02734375, -25.81591796875, -24.6044921875, -23.39306640625, -22.181640625, -20.97021484375, -19.7587890625, -18.54736328125, -17.3359375, -16.12451171875, -14.9130859375, -13.70166015625, -12.490234375, -11.27880859375, -10.0673828125, -8.85595703125, -7.64453125, -6.43310546875, -5.2216796875, -4.01025390625, -2.798828125, -1.58740234375, -0.3759765625, 0.83544921875, 2.046875, 3.25830078125, 4.4697265625, 5.68115234375, 6.892578125, 8.10400390625, 9.3154296875, 10.52685546875, 11.73828125, 12.94970703125, 14.1611328125, 15.37255859375, 16.583984375, 17.79541015625, 19.0068359375, 20.21826171875, 21.4296875, 22.64111328125, 23.8525390625, 25.06396484375, 26.275390625, 27.48681640625, 28.6982421875, 29.90966796875, 31.12109375, 32.33251953125, 33.5439453125, 34.75537109375, 35.966796875, 37.17822265625, 38.3896484375, 39.60107421875, 40.8125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 7.0, 0.0, 4.0, 3.0, 6.0, 5.0, 12.0, 10.0, 15.0, 23.0, 28.0, 28.0, 53.0, 57.0, 79.0, 139.0, 266.0, 665.0, 2412.0, 19540.0, 2893719.0, 219074.0, 7158.0, 1332.0, 442.0, 210.0, 107.0, 91.0, 58.0, 37.0, 21.0, 21.0, 16.0, 21.0, 12.0, 13.0, 8.0, 7.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-67.0, -65.017578125, -63.03515625, -61.052734375, -59.0703125, -57.087890625, -55.10546875, -53.123046875, -51.140625, -49.158203125, -47.17578125, -45.193359375, -43.2109375, -41.228515625, -39.24609375, -37.263671875, -35.28125, -33.298828125, -31.31640625, -29.333984375, -27.3515625, -25.369140625, -23.38671875, -21.404296875, -19.421875, -17.439453125, -15.45703125, -13.474609375, -11.4921875, -9.509765625, -7.52734375, -5.544921875, -3.5625, -1.580078125, 0.40234375, 2.384765625, 4.3671875, 6.349609375, 8.33203125, 10.314453125, 12.296875, 14.279296875, 16.26171875, 18.244140625, 20.2265625, 22.208984375, 24.19140625, 26.173828125, 28.15625, 30.138671875, 32.12109375, 34.103515625, 36.0859375, 38.068359375, 40.05078125, 42.033203125, 44.015625, 45.998046875, 47.98046875, 49.962890625, 51.9453125, 53.927734375, 55.91015625, 57.892578125, 59.875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 9.0, 8.0, 56.0, 189.0, 351.0, 260.0, 107.0, 24.0, 10.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.969234466552734, -60.372314453125, -56.775394439697266, -53.17847442626953, -49.58155059814453, -45.9846305847168, -42.38771057128906, -38.79078674316406, -35.193870544433594, -31.59695053100586, -28.000028610229492, -24.403108596801758, -20.80618667602539, -17.209266662597656, -13.612346649169922, -10.015424728393555, -6.4185028076171875, -2.821582078933716, 0.7753386497497559, 4.372259140014648, 7.969180107116699, 11.56610107421875, 15.163021087646484, 18.75994300842285, 22.356863021850586, 25.95378303527832, 29.550704956054688, 33.14762496948242, 36.744544982910156, 40.341468811035156, 43.938385009765625, 47.535308837890625, 51.132225036621094, 54.72914505004883, 58.32606506347656, 61.92298889160156, 65.51990509033203, 69.11682891845703, 72.7137451171875, 76.3106689453125, 79.9075927734375, 83.5045166015625, 87.10143280029297, 90.69835662841797, 94.29527282714844, 97.89219665527344, 101.48912048339844, 105.0860366821289, 108.68295288085938, 112.27987670898438, 115.87679290771484, 119.47371673583984, 123.07063293457031, 126.66755676269531, 130.2644805908203, 133.8614044189453, 137.4583282470703, 141.0552520751953, 144.6521759033203, 148.24908447265625, 151.84600830078125, 155.44293212890625, 159.03985595703125, 162.63677978515625, 166.2336883544922]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 1.0, 4.0, 4.0, 9.0, 8.0, 10.0, 10.0, 14.0, 10.0, 12.0, 21.0, 35.0, 27.0, 31.0, 26.0, 30.0, 37.0, 41.0, 43.0, 29.0, 30.0, 39.0, 37.0, 35.0, 43.0, 34.0, 47.0, 37.0, 28.0, 28.0, 23.0, 27.0, 27.0, 27.0, 20.0, 18.0, 9.0, 17.0, 13.0, 16.0, 11.0, 4.0, 6.0, 4.0, 4.0, 3.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 3.0], "bins": [-111.24638366699219, -107.84172058105469, -104.43705749511719, -101.03239440917969, -97.62772369384766, -94.22306060791016, -90.81839752197266, -87.41373443603516, -84.00907135009766, -80.60440826416016, -77.19974517822266, -73.79507446289062, -70.39041137695312, -66.98574829101562, -63.581085205078125, -60.176422119140625, -56.77175521850586, -53.36709213256836, -49.962425231933594, -46.557762145996094, -43.153099060058594, -39.748435974121094, -36.34376907348633, -32.93910598754883, -29.534440994262695, -26.129776000976562, -22.725112915039062, -19.32044792175293, -15.915783882141113, -12.511119842529297, -9.106454849243164, -5.701791763305664, -2.2971267700195312, 1.1075375080108643, 4.51220178604126, 7.916866302490234, 11.32153034210205, 14.726194381713867, 18.130859375, 21.5355224609375, 24.940187454223633, 28.344852447509766, 31.749515533447266, 35.15418243408203, 38.55884552001953, 41.96350860595703, 45.36817169189453, 48.77283477783203, 52.1775016784668, 55.5821647644043, 58.98683166503906, 62.39149475097656, 65.79615783691406, 69.20082092285156, 72.60548400878906, 76.01014709472656, 79.4148178100586, 82.8194808959961, 86.2241439819336, 89.62881469726562, 93.03347778320312, 96.43814086914062, 99.84280395507812, 103.24746704101562, 106.65213012695312]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 5.0, 1.0, 2.0, 4.0, 7.0, 5.0, 8.0, 13.0, 7.0, 9.0, 14.0, 19.0, 20.0, 21.0, 27.0, 27.0, 32.0, 31.0, 55.0, 34.0, 54.0, 55.0, 58.0, 65.0, 56.0, 47.0, 45.0, 37.0, 40.0, 39.0, 35.0, 23.0, 24.0, 13.0, 12.0, 6.0, 10.0, 5.0, 10.0, 5.0, 5.0, 8.0, 5.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-11.203125, -10.8714599609375, -10.539794921875, -10.2081298828125, -9.87646484375, -9.5447998046875, -9.213134765625, -8.8814697265625, -8.5498046875, -8.2181396484375, -7.886474609375, -7.5548095703125, -7.22314453125, -6.8914794921875, -6.559814453125, -6.2281494140625, -5.896484375, -5.5648193359375, -5.233154296875, -4.9014892578125, -4.56982421875, -4.2381591796875, -3.906494140625, -3.5748291015625, -3.2431640625, -2.9114990234375, -2.579833984375, -2.2481689453125, -1.91650390625, -1.5848388671875, -1.253173828125, -0.9215087890625, -0.58984375, -0.2581787109375, 0.073486328125, 0.4051513671875, 0.73681640625, 1.0684814453125, 1.400146484375, 1.7318115234375, 2.0634765625, 2.3951416015625, 2.726806640625, 3.0584716796875, 3.39013671875, 3.7218017578125, 4.053466796875, 4.3851318359375, 4.716796875, 5.0484619140625, 5.380126953125, 5.7117919921875, 6.04345703125, 6.3751220703125, 6.706787109375, 7.0384521484375, 7.3701171875, 7.7017822265625, 8.033447265625, 8.3651123046875, 8.69677734375, 9.0284423828125, 9.360107421875, 9.6917724609375, 10.0234375]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 5.0, 4.0, 7.0, 15.0, 22.0, 17.0, 31.0, 37.0, 71.0, 96.0, 124.0, 196.0, 313.0, 459.0, 728.0, 1174.0, 1936.0, 3171.0, 5975.0, 11482.0, 27569.0, 229251.0, 3214204.0, 623324.0, 44475.0, 13755.0, 6625.0, 3585.0, 2044.0, 1235.0, 746.0, 499.0, 346.0, 244.0, 157.0, 102.0, 69.0, 67.0, 35.0, 25.0, 25.0, 18.0, 9.0, 6.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.796875, -29.823974609375, -28.85107421875, -27.878173828125, -26.9052734375, -25.932373046875, -24.95947265625, -23.986572265625, -23.013671875, -22.040771484375, -21.06787109375, -20.094970703125, -19.1220703125, -18.149169921875, -17.17626953125, -16.203369140625, -15.23046875, -14.257568359375, -13.28466796875, -12.311767578125, -11.3388671875, -10.365966796875, -9.39306640625, -8.420166015625, -7.447265625, -6.474365234375, -5.50146484375, -4.528564453125, -3.5556640625, -2.582763671875, -1.60986328125, -0.636962890625, 0.3359375, 1.308837890625, 2.28173828125, 3.254638671875, 4.2275390625, 5.200439453125, 6.17333984375, 7.146240234375, 8.119140625, 9.092041015625, 10.06494140625, 11.037841796875, 12.0107421875, 12.983642578125, 13.95654296875, 14.929443359375, 15.90234375, 16.875244140625, 17.84814453125, 18.821044921875, 19.7939453125, 20.766845703125, 21.73974609375, 22.712646484375, 23.685546875, 24.658447265625, 25.63134765625, 26.604248046875, 27.5771484375, 28.550048828125, 29.52294921875, 30.495849609375, 31.46875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 8.0, 6.0, 10.0, 10.0, 13.0, 16.0, 16.0, 19.0, 35.0, 50.0, 47.0, 99.0, 161.0, 284.0, 550.0, 875.0, 781.0, 463.0, 215.0, 116.0, 79.0, 44.0, 29.0, 15.0, 22.0, 23.0, 14.0, 13.0, 6.0, 8.0, 8.0, 13.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.9375, -23.93408203125, -22.9306640625, -21.92724609375, -20.923828125, -19.92041015625, -18.9169921875, -17.91357421875, -16.91015625, -15.90673828125, -14.9033203125, -13.89990234375, -12.896484375, -11.89306640625, -10.8896484375, -9.88623046875, -8.8828125, -7.87939453125, -6.8759765625, -5.87255859375, -4.869140625, -3.86572265625, -2.8623046875, -1.85888671875, -0.85546875, 0.14794921875, 1.1513671875, 2.15478515625, 3.158203125, 4.16162109375, 5.1650390625, 6.16845703125, 7.171875, 8.17529296875, 9.1787109375, 10.18212890625, 11.185546875, 12.18896484375, 13.1923828125, 14.19580078125, 15.19921875, 16.20263671875, 17.2060546875, 18.20947265625, 19.212890625, 20.21630859375, 21.2197265625, 22.22314453125, 23.2265625, 24.22998046875, 25.2333984375, 26.23681640625, 27.240234375, 28.24365234375, 29.2470703125, 30.25048828125, 31.25390625, 32.25732421875, 33.2607421875, 34.26416015625, 35.267578125, 36.27099609375, 37.2744140625, 38.27783203125, 39.28125]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 7.0, 4.0, 10.0, 10.0, 28.0, 13.0, 23.0, 37.0, 41.0, 93.0, 136.0, 260.0, 463.0, 953.0, 2280.0, 6371.0, 20356.0, 94510.0, 2987260.0, 1000242.0, 57987.0, 14681.0, 4917.0, 1796.0, 805.0, 433.0, 211.0, 121.0, 72.0, 47.0, 33.0, 23.0, 17.0, 11.0, 12.0, 8.0, 10.0, 3.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-69.375, -67.54296875, -65.7109375, -63.87890625, -62.046875, -60.21484375, -58.3828125, -56.55078125, -54.71875, -52.88671875, -51.0546875, -49.22265625, -47.390625, -45.55859375, -43.7265625, -41.89453125, -40.0625, -38.23046875, -36.3984375, -34.56640625, -32.734375, -30.90234375, -29.0703125, -27.23828125, -25.40625, -23.57421875, -21.7421875, -19.91015625, -18.078125, -16.24609375, -14.4140625, -12.58203125, -10.75, -8.91796875, -7.0859375, -5.25390625, -3.421875, -1.58984375, 0.2421875, 2.07421875, 3.90625, 5.73828125, 7.5703125, 9.40234375, 11.234375, 13.06640625, 14.8984375, 16.73046875, 18.5625, 20.39453125, 22.2265625, 24.05859375, 25.890625, 27.72265625, 29.5546875, 31.38671875, 33.21875, 35.05078125, 36.8828125, 38.71484375, 40.546875, 42.37890625, 44.2109375, 46.04296875, 47.875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 23.0, 76.0, 255.0, 426.0, 164.0, 50.0, 11.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.32477569580078, -72.90100860595703, -61.47724533081055, -50.05348205566406, -38.62971496582031, -27.205947875976562, -15.782188415527344, -4.358421325683594, 7.065345764160156, 18.489110946655273, 29.91287612915039, 41.336639404296875, 52.760406494140625, 64.18417358398438, 75.6079330444336, 87.03170013427734, 98.4554672241211, 109.87923431396484, 121.30299377441406, 132.7267608642578, 144.15052795410156, 155.5742950439453, 166.998046875, 178.42181396484375, 189.8455810546875, 201.26934814453125, 212.693115234375, 224.11688232421875, 235.5406494140625, 246.96441650390625, 258.38818359375, 269.81195068359375, 281.2357177734375, 292.65948486328125, 304.083251953125, 315.50701904296875, 326.9307861328125, 338.35455322265625, 349.7783203125, 361.20208740234375, 372.6258544921875, 384.04962158203125, 395.473388671875, 406.89715576171875, 418.3209228515625, 429.74468994140625, 441.16845703125, 452.59222412109375, 464.0159606933594, 475.4397277832031, 486.8634948730469, 498.2872619628906, 509.7110290527344, 521.134765625, 532.5585327148438, 543.9822998046875, 555.4060668945312, 566.829833984375, 578.2536010742188, 589.6773681640625, 601.1011352539062, 612.52490234375, 623.9486694335938, 635.3724365234375, 646.7962036132812]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 6.0, 4.0, 9.0, 7.0, 9.0, 8.0, 5.0, 19.0, 19.0, 23.0, 23.0, 14.0, 28.0, 31.0, 38.0, 30.0, 38.0, 39.0, 35.0, 44.0, 38.0, 42.0, 35.0, 37.0, 41.0, 35.0, 44.0, 39.0, 39.0, 28.0, 30.0, 27.0, 20.0, 17.0, 21.0, 16.0, 18.0, 8.0, 8.0, 15.0, 5.0, 6.0, 4.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-95.60651397705078, -92.955810546875, -90.30509948730469, -87.6543960571289, -85.00369262695312, -82.35298156738281, -79.70227813720703, -77.05157470703125, -74.40086364746094, -71.75016021728516, -69.09944915771484, -66.44874572753906, -63.79804229736328, -61.147335052490234, -58.49662780761719, -55.845924377441406, -53.195220947265625, -50.54451370239258, -47.8938102722168, -45.24310302734375, -42.59239959716797, -39.94169235229492, -37.290985107421875, -34.640281677246094, -31.989574432373047, -29.338869094848633, -26.68816375732422, -24.037456512451172, -21.386751174926758, -18.736045837402344, -16.085338592529297, -13.434633255004883, -10.783920288085938, -8.133214950561523, -5.482508659362793, -2.8318028450012207, -0.18109703063964844, 2.4696083068847656, 5.120314598083496, 7.771020889282227, 10.42172622680664, 13.072431564331055, 15.723137855529785, 18.373844146728516, 21.02454948425293, 23.675254821777344, 26.32596206665039, 28.976667404174805, 31.62737274169922, 34.278079986572266, 36.92878341674805, 39.579490661621094, 42.230194091796875, 44.88090133666992, 47.53160858154297, 50.18231201171875, 52.8330192565918, 55.483726501464844, 58.134429931640625, 60.78513717651367, 63.43584442138672, 66.0865478515625, 68.73725128173828, 71.3879623413086, 74.03866577148438]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 8.0, 10.0, 10.0, 13.0, 14.0, 14.0, 20.0, 20.0, 22.0, 28.0, 27.0, 34.0, 36.0, 48.0, 40.0, 50.0, 61.0, 53.0, 68.0, 47.0, 48.0, 40.0, 38.0, 35.0, 49.0, 19.0, 24.0, 15.0, 19.0, 11.0, 16.0, 7.0, 13.0, 6.0, 6.0, 4.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-10.65625, -10.3297119140625, -10.003173828125, -9.6766357421875, -9.35009765625, -9.0235595703125, -8.697021484375, -8.3704833984375, -8.0439453125, -7.7174072265625, -7.390869140625, -7.0643310546875, -6.73779296875, -6.4112548828125, -6.084716796875, -5.7581787109375, -5.431640625, -5.1051025390625, -4.778564453125, -4.4520263671875, -4.12548828125, -3.7989501953125, -3.472412109375, -3.1458740234375, -2.8193359375, -2.4927978515625, -2.166259765625, -1.8397216796875, -1.51318359375, -1.1866455078125, -0.860107421875, -0.5335693359375, -0.20703125, 0.1195068359375, 0.446044921875, 0.7725830078125, 1.09912109375, 1.4256591796875, 1.752197265625, 2.0787353515625, 2.4052734375, 2.7318115234375, 3.058349609375, 3.3848876953125, 3.71142578125, 4.0379638671875, 4.364501953125, 4.6910400390625, 5.017578125, 5.3441162109375, 5.670654296875, 5.9971923828125, 6.32373046875, 6.6502685546875, 6.976806640625, 7.3033447265625, 7.6298828125, 7.9564208984375, 8.282958984375, 8.6094970703125, 8.93603515625, 9.2625732421875, 9.589111328125, 9.9156494140625, 10.2421875]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 3.0, 6.0, 8.0, 13.0, 16.0, 27.0, 29.0, 48.0, 89.0, 96.0, 133.0, 209.0, 280.0, 407.0, 542.0, 816.0, 1119.0, 1564.0, 2261.0, 3373.0, 4885.0, 7411.0, 11764.0, 18823.0, 30548.0, 52299.0, 90433.0, 154708.0, 229833.0, 177486.0, 103611.0, 60232.0, 35162.0, 21050.0, 13157.0, 8323.0, 5546.0, 3804.0, 2558.0, 1738.0, 1192.0, 809.0, 640.0, 432.0, 297.0, 234.0, 157.0, 122.0, 91.0, 58.0, 38.0, 24.0, 19.0, 21.0, 9.0, 8.0, 4.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.1689453125, -1.131988525390625, -1.09503173828125, -1.058074951171875, -1.0211181640625, -0.984161376953125, -0.94720458984375, -0.910247802734375, -0.873291015625, -0.836334228515625, -0.79937744140625, -0.762420654296875, -0.7254638671875, -0.688507080078125, -0.65155029296875, -0.614593505859375, -0.57763671875, -0.540679931640625, -0.50372314453125, -0.466766357421875, -0.4298095703125, -0.392852783203125, -0.35589599609375, -0.318939208984375, -0.281982421875, -0.245025634765625, -0.20806884765625, -0.171112060546875, -0.1341552734375, -0.097198486328125, -0.06024169921875, -0.023284912109375, 0.013671875, 0.050628662109375, 0.08758544921875, 0.124542236328125, 0.1614990234375, 0.198455810546875, 0.23541259765625, 0.272369384765625, 0.309326171875, 0.346282958984375, 0.38323974609375, 0.420196533203125, 0.4571533203125, 0.494110107421875, 0.53106689453125, 0.568023681640625, 0.60498046875, 0.641937255859375, 0.67889404296875, 0.715850830078125, 0.7528076171875, 0.789764404296875, 0.82672119140625, 0.863677978515625, 0.900634765625, 0.937591552734375, 0.97454833984375, 1.011505126953125, 1.0484619140625, 1.085418701171875, 1.12237548828125, 1.159332275390625, 1.1962890625]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 15.0, 9.0, 8.0, 8.0, 12.0, 20.0, 16.0, 23.0, 25.0, 29.0, 27.0, 39.0, 29.0, 30.0, 48.0, 43.0, 46.0, 36.0, 39.0, 1053.0, 35.0, 48.0, 36.0, 39.0, 43.0, 33.0, 32.0, 27.0, 31.0, 24.0, 16.0, 19.0, 9.0, 15.0, 13.0, 7.0, 6.0, 11.0, 3.0, 5.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.62109375, -5.440185546875, -5.25927734375, -5.078369140625, -4.8974609375, -4.716552734375, -4.53564453125, -4.354736328125, -4.173828125, -3.992919921875, -3.81201171875, -3.631103515625, -3.4501953125, -3.269287109375, -3.08837890625, -2.907470703125, -2.7265625, -2.545654296875, -2.36474609375, -2.183837890625, -2.0029296875, -1.822021484375, -1.64111328125, -1.460205078125, -1.279296875, -1.098388671875, -0.91748046875, -0.736572265625, -0.5556640625, -0.374755859375, -0.19384765625, -0.012939453125, 0.16796875, 0.348876953125, 0.52978515625, 0.710693359375, 0.8916015625, 1.072509765625, 1.25341796875, 1.434326171875, 1.615234375, 1.796142578125, 1.97705078125, 2.157958984375, 2.3388671875, 2.519775390625, 2.70068359375, 2.881591796875, 3.0625, 3.243408203125, 3.42431640625, 3.605224609375, 3.7861328125, 3.967041015625, 4.14794921875, 4.328857421875, 4.509765625, 4.690673828125, 4.87158203125, 5.052490234375, 5.2333984375, 5.414306640625, 5.59521484375, 5.776123046875, 5.95703125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 6.0, 8.0, 9.0, 25.0, 30.0, 32.0, 68.0, 108.0, 148.0, 216.0, 342.0, 483.0, 784.0, 1250.0, 1863.0, 3038.0, 4701.0, 7758.0, 12336.0, 20387.0, 33734.0, 58616.0, 101907.0, 171788.0, 1271815.0, 166824.0, 97901.0, 55815.0, 32982.0, 19824.0, 11997.0, 7375.0, 4666.0, 3045.0, 1876.0, 1148.0, 742.0, 502.0, 330.0, 242.0, 137.0, 88.0, 64.0, 39.0, 31.0, 17.0, 13.0, 7.0, 8.0, 9.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.7783203125, -0.7527694702148438, -0.7272186279296875, -0.7016677856445312, -0.676116943359375, -0.6505661010742188, -0.6250152587890625, -0.5994644165039062, -0.57391357421875, -0.5483627319335938, -0.5228118896484375, -0.49726104736328125, -0.471710205078125, -0.44615936279296875, -0.4206085205078125, -0.39505767822265625, -0.3695068359375, -0.34395599365234375, -0.3184051513671875, -0.29285430908203125, -0.267303466796875, -0.24175262451171875, -0.2162017822265625, -0.19065093994140625, -0.16510009765625, -0.13954925537109375, -0.1139984130859375, -0.08844757080078125, -0.062896728515625, -0.03734588623046875, -0.0117950439453125, 0.01375579833984375, 0.039306640625, 0.06485748291015625, 0.0904083251953125, 0.11595916748046875, 0.141510009765625, 0.16706085205078125, 0.1926116943359375, 0.21816253662109375, 0.24371337890625, 0.26926422119140625, 0.2948150634765625, 0.32036590576171875, 0.345916748046875, 0.37146759033203125, 0.3970184326171875, 0.42256927490234375, 0.4481201171875, 0.47367095947265625, 0.4992218017578125, 0.5247726440429688, 0.550323486328125, 0.5758743286132812, 0.6014251708984375, 0.6269760131835938, 0.65252685546875, 0.6780776977539062, 0.7036285400390625, 0.7291793823242188, 0.754730224609375, 0.7802810668945312, 0.8058319091796875, 0.8313827514648438, 0.85693359375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 4.0, 7.0, 7.0, 11.0, 7.0, 14.0, 16.0, 20.0, 27.0, 24.0, 43.0, 41.0, 48.0, 52.0, 72.0, 80.0, 79.0, 59.0, 70.0, 63.0, 55.0, 34.0, 38.0, 25.0, 19.0, 18.0, 15.0, 11.0, 10.0, 5.0, 10.0, 9.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00630950927734375, -0.006094157695770264, -0.005878806114196777, -0.005663454532623291, -0.005448102951049805, -0.005232751369476318, -0.005017399787902832, -0.004802048206329346, -0.004586696624755859, -0.004371345043182373, -0.004155993461608887, -0.0039406418800354, -0.003725290298461914, -0.0035099387168884277, -0.0032945871353149414, -0.003079235553741455, -0.0028638839721679688, -0.0026485323905944824, -0.002433180809020996, -0.0022178292274475098, -0.0020024776458740234, -0.0017871260643005371, -0.0015717744827270508, -0.0013564229011535645, -0.0011410713195800781, -0.0009257197380065918, -0.0007103681564331055, -0.0004950165748596191, -0.0002796649932861328, -6.431341171264648e-05, 0.00015103816986083984, 0.00036638975143432617, 0.0005817413330078125, 0.0007970929145812988, 0.0010124444961547852, 0.0012277960777282715, 0.0014431476593017578, 0.0016584992408752441, 0.0018738508224487305, 0.002089202404022217, 0.002304553985595703, 0.0025199055671691895, 0.0027352571487426758, 0.002950608730316162, 0.0031659603118896484, 0.0033813118934631348, 0.003596663475036621, 0.0038120150566101074, 0.004027366638183594, 0.00424271821975708, 0.004458069801330566, 0.004673421382904053, 0.004888772964477539, 0.005104124546051025, 0.005319476127624512, 0.005534827709197998, 0.005750179290771484, 0.005965530872344971, 0.006180882453918457, 0.006396234035491943, 0.00661158561706543, 0.006826937198638916, 0.007042288780212402, 0.007257640361785889, 0.007472991943359375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 3.0, 3.0, 7.0, 6.0, 11.0, 14.0, 21.0, 29.0, 44.0, 56.0, 76.0, 116.0, 160.0, 280.0, 632.0, 10015.0, 1027356.0, 8335.0, 580.0, 293.0, 141.0, 111.0, 70.0, 56.0, 31.0, 29.0, 31.0, 19.0, 11.0, 4.0, 7.0, 5.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.172607421875, -0.16729354858398438, -0.16197967529296875, -0.15666580200195312, -0.1513519287109375, -0.14603805541992188, -0.14072418212890625, -0.13541030883789062, -0.130096435546875, -0.12478256225585938, -0.11946868896484375, -0.11415481567382812, -0.1088409423828125, -0.10352706909179688, -0.09821319580078125, -0.09289932250976562, -0.08758544921875, -0.08227157592773438, -0.07695770263671875, -0.07164382934570312, -0.0663299560546875, -0.061016082763671875, -0.05570220947265625, -0.050388336181640625, -0.045074462890625, -0.039760589599609375, -0.03444671630859375, -0.029132843017578125, -0.0238189697265625, -0.018505096435546875, -0.01319122314453125, -0.007877349853515625, -0.0025634765625, 0.002750396728515625, 0.00806427001953125, 0.013378143310546875, 0.0186920166015625, 0.024005889892578125, 0.02931976318359375, 0.034633636474609375, 0.039947509765625, 0.045261383056640625, 0.05057525634765625, 0.055889129638671875, 0.0612030029296875, 0.06651687622070312, 0.07183074951171875, 0.07714462280273438, 0.08245849609375, 0.08777236938476562, 0.09308624267578125, 0.09840011596679688, 0.1037139892578125, 0.10902786254882812, 0.11434173583984375, 0.11965560913085938, 0.124969482421875, 0.13028335571289062, 0.13559722900390625, 0.14091110229492188, 0.1462249755859375, 0.15153884887695312, 0.15685272216796875, 0.16216659545898438, 0.16748046875]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 11.0, 779.0, 219.0, 8.0, 0.0, 1.0], "bins": [-0.1506684273481369, -0.14814729988574982, -0.14562615752220154, -0.14310503005981445, -0.14058390259742737, -0.13806277513504028, -0.135541632771492, -0.13302050530910492, -0.13049937784671783, -0.12797825038433075, -0.12545710802078247, -0.12293598055839539, -0.1204148530960083, -0.11789371818304062, -0.11537259072065353, -0.11285145580768585, -0.11033032834529877, -0.10780919343233109, -0.105288065969944, -0.10276693105697632, -0.10024580359458923, -0.09772466868162155, -0.09520354121923447, -0.09268240630626678, -0.0901612713932991, -0.08764013648033142, -0.08511900901794434, -0.08259787410497665, -0.08007674664258957, -0.07755561172962189, -0.0750344842672348, -0.07251334935426712, -0.06999222189188004, -0.06747108697891235, -0.06494995951652527, -0.062428828328847885, -0.0599076971411705, -0.05738656595349312, -0.054865434765815735, -0.05234429985284805, -0.04982317239046097, -0.047302041202783585, -0.0447809100151062, -0.04225977882742882, -0.039738647639751434, -0.03721751645207405, -0.03469638526439667, -0.032175250351428986, -0.0296541228890419, -0.027132991701364517, -0.024611860513687134, -0.02209072932600975, -0.019569598138332367, -0.017048466950654984, -0.01452733390033245, -0.012006202712655067, -0.00948507059365511, -0.006963939405977726, -0.004442807752639055, -0.0019216760993003845, 0.0005994550883769989, 0.0031205862760543823, 0.00564171839505434, 0.008162849582731724, 0.010683980770409107]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 1.0, 0.0, 7.0, 5.0, 4.0, 11.0, 9.0, 7.0, 13.0, 16.0, 13.0, 11.0, 19.0, 25.0, 24.0, 33.0, 35.0, 39.0, 25.0, 35.0, 34.0, 33.0, 35.0, 36.0, 35.0, 42.0, 42.0, 36.0, 43.0, 36.0, 24.0, 29.0, 26.0, 32.0, 24.0, 33.0, 16.0, 17.0, 14.0, 14.0, 14.0, 12.0, 11.0, 16.0, 9.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004801034927368164, -0.004662330262362957, -0.00452362559735775, -0.004384920932352543, -0.004246216267347336, -0.004107511602342129, -0.003968806937336922, -0.0038301022723317146, -0.0036913976073265076, -0.0035526929423213005, -0.0034139882773160934, -0.0032752836123108864, -0.0031365789473056793, -0.0029978742823004723, -0.002859169617295265, -0.002720464952290058, -0.002581760287284851, -0.002443055622279644, -0.002304350957274437, -0.00216564629226923, -0.002026941627264023, -0.0018882369622588158, -0.0017495322972536087, -0.0016108276322484016, -0.0014721229672431946, -0.0013334183022379875, -0.0011947136372327805, -0.0010560089722275734, -0.0009173043072223663, -0.0007785996422171593, -0.0006398949772119522, -0.0005011903122067451, -0.0003624856472015381, -0.00022378098219633102, -8.507631719112396e-05, 5.36283478140831e-05, 0.00019233301281929016, 0.0003310376778244972, 0.0004697423428297043, 0.0006084470078349113, 0.0007471516728401184, 0.0008858563378453255, 0.0010245610028505325, 0.0011632656678557396, 0.0013019703328609467, 0.0014406749978661537, 0.0015793796628713608, 0.0017180843278765678, 0.001856788992881775, 0.001995493657886982, 0.002134198322892189, 0.002272902987897396, 0.002411607652902603, 0.00255031231790781, 0.0026890169829130173, 0.0028277216479182243, 0.0029664263129234314, 0.0031051309779286385, 0.0032438356429338455, 0.0033825403079390526, 0.0035212449729442596, 0.0036599496379494667, 0.0037986543029546738, 0.003937358967959881, 0.004076063632965088]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 2.0, 4.0, 2.0, 8.0, 10.0, 10.0, 13.0, 14.0, 14.0, 20.0, 20.0, 22.0, 28.0, 27.0, 34.0, 36.0, 48.0, 40.0, 50.0, 61.0, 53.0, 68.0, 47.0, 48.0, 40.0, 38.0, 35.0, 49.0, 19.0, 24.0, 15.0, 19.0, 11.0, 16.0, 7.0, 13.0, 6.0, 6.0, 4.0, 10.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-10.65625, -10.3297119140625, -10.003173828125, -9.6766357421875, -9.35009765625, -9.0235595703125, -8.697021484375, -8.3704833984375, -8.0439453125, -7.7174072265625, -7.390869140625, -7.0643310546875, -6.73779296875, -6.4112548828125, -6.084716796875, -5.7581787109375, -5.431640625, -5.1051025390625, -4.778564453125, -4.4520263671875, -4.12548828125, -3.7989501953125, -3.472412109375, -3.1458740234375, -2.8193359375, -2.4927978515625, -2.166259765625, -1.8397216796875, -1.51318359375, -1.1866455078125, -0.860107421875, -0.5335693359375, -0.20703125, 0.1195068359375, 0.446044921875, 0.7725830078125, 1.09912109375, 1.4256591796875, 1.752197265625, 2.0787353515625, 2.4052734375, 2.7318115234375, 3.058349609375, 3.3848876953125, 3.71142578125, 4.0379638671875, 4.364501953125, 4.6910400390625, 5.017578125, 5.3441162109375, 5.670654296875, 5.9971923828125, 6.32373046875, 6.6502685546875, 6.976806640625, 7.3033447265625, 7.6298828125, 7.9564208984375, 8.282958984375, 8.6094970703125, 8.93603515625, 9.2625732421875, 9.589111328125, 9.9156494140625, 10.2421875]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 9.0, 9.0, 8.0, 21.0, 27.0, 21.0, 31.0, 52.0, 53.0, 79.0, 97.0, 138.0, 171.0, 229.0, 299.0, 455.0, 617.0, 942.0, 1381.0, 2217.0, 4193.0, 9225.0, 29436.0, 204233.0, 697053.0, 67266.0, 15721.0, 5982.0, 2951.0, 1769.0, 1115.0, 710.0, 518.0, 406.0, 299.0, 205.0, 162.0, 118.0, 65.0, 65.0, 61.0, 38.0, 19.0, 29.0, 14.0, 13.0, 9.0, 7.0, 7.0, 5.0, 5.0, 2.0, 2.0, 1.0, 2.0], "bins": [-13.484375, -13.078857421875, -12.67333984375, -12.267822265625, -11.8623046875, -11.456787109375, -11.05126953125, -10.645751953125, -10.240234375, -9.834716796875, -9.42919921875, -9.023681640625, -8.6181640625, -8.212646484375, -7.80712890625, -7.401611328125, -6.99609375, -6.590576171875, -6.18505859375, -5.779541015625, -5.3740234375, -4.968505859375, -4.56298828125, -4.157470703125, -3.751953125, -3.346435546875, -2.94091796875, -2.535400390625, -2.1298828125, -1.724365234375, -1.31884765625, -0.913330078125, -0.5078125, -0.102294921875, 0.30322265625, 0.708740234375, 1.1142578125, 1.519775390625, 1.92529296875, 2.330810546875, 2.736328125, 3.141845703125, 3.54736328125, 3.952880859375, 4.3583984375, 4.763916015625, 5.16943359375, 5.574951171875, 5.98046875, 6.385986328125, 6.79150390625, 7.197021484375, 7.6025390625, 8.008056640625, 8.41357421875, 8.819091796875, 9.224609375, 9.630126953125, 10.03564453125, 10.441162109375, 10.8466796875, 11.252197265625, 11.65771484375, 12.063232421875, 12.46875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 5.0, 8.0, 12.0, 13.0, 17.0, 11.0, 12.0, 13.0, 18.0, 28.0, 27.0, 32.0, 37.0, 35.0, 49.0, 53.0, 68.0, 137.0, 1808.0, 163.0, 83.0, 49.0, 51.0, 38.0, 36.0, 27.0, 33.0, 20.0, 24.0, 26.0, 26.0, 12.0, 12.0, 13.0, 8.0, 6.0, 6.0, 9.0, 6.0, 8.0, 2.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-37.40625, -36.29248046875, -35.1787109375, -34.06494140625, -32.951171875, -31.83740234375, -30.7236328125, -29.60986328125, -28.49609375, -27.38232421875, -26.2685546875, -25.15478515625, -24.041015625, -22.92724609375, -21.8134765625, -20.69970703125, -19.5859375, -18.47216796875, -17.3583984375, -16.24462890625, -15.130859375, -14.01708984375, -12.9033203125, -11.78955078125, -10.67578125, -9.56201171875, -8.4482421875, -7.33447265625, -6.220703125, -5.10693359375, -3.9931640625, -2.87939453125, -1.765625, -0.65185546875, 0.4619140625, 1.57568359375, 2.689453125, 3.80322265625, 4.9169921875, 6.03076171875, 7.14453125, 8.25830078125, 9.3720703125, 10.48583984375, 11.599609375, 12.71337890625, 13.8271484375, 14.94091796875, 16.0546875, 17.16845703125, 18.2822265625, 19.39599609375, 20.509765625, 21.62353515625, 22.7373046875, 23.85107421875, 24.96484375, 26.07861328125, 27.1923828125, 28.30615234375, 29.419921875, 30.53369140625, 31.6474609375, 32.76123046875, 33.875]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 3.0, 1.0, 5.0, 8.0, 9.0, 7.0, 5.0, 10.0, 14.0, 7.0, 16.0, 21.0, 35.0, 30.0, 31.0, 59.0, 77.0, 103.0, 180.0, 367.0, 1012.0, 4116.0, 94638.0, 3027201.0, 14352.0, 2013.0, 635.0, 265.0, 145.0, 91.0, 59.0, 40.0, 32.0, 19.0, 16.0, 12.0, 19.0, 12.0, 13.0, 10.0, 5.0, 7.0, 3.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.34375, -50.61474609375, -48.8857421875, -47.15673828125, -45.427734375, -43.69873046875, -41.9697265625, -40.24072265625, -38.51171875, -36.78271484375, -35.0537109375, -33.32470703125, -31.595703125, -29.86669921875, -28.1376953125, -26.40869140625, -24.6796875, -22.95068359375, -21.2216796875, -19.49267578125, -17.763671875, -16.03466796875, -14.3056640625, -12.57666015625, -10.84765625, -9.11865234375, -7.3896484375, -5.66064453125, -3.931640625, -2.20263671875, -0.4736328125, 1.25537109375, 2.984375, 4.71337890625, 6.4423828125, 8.17138671875, 9.900390625, 11.62939453125, 13.3583984375, 15.08740234375, 16.81640625, 18.54541015625, 20.2744140625, 22.00341796875, 23.732421875, 25.46142578125, 27.1904296875, 28.91943359375, 30.6484375, 32.37744140625, 34.1064453125, 35.83544921875, 37.564453125, 39.29345703125, 41.0224609375, 42.75146484375, 44.48046875, 46.20947265625, 47.9384765625, 49.66748046875, 51.396484375, 53.12548828125, 54.8544921875, 56.58349609375, 58.3125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 95.0, 795.0, 118.0, 3.0], "bins": [-491.91143798828125, -483.9143981933594, -475.9173583984375, -467.9203186035156, -459.92327880859375, -451.92626953125, -443.92919921875, -435.93218994140625, -427.9351501464844, -419.9381103515625, -411.9410705566406, -403.94403076171875, -395.9469909667969, -387.949951171875, -379.95294189453125, -371.9559020996094, -363.9588623046875, -355.9618225097656, -347.96478271484375, -339.9677429199219, -331.970703125, -323.97369384765625, -315.97662353515625, -307.9796142578125, -299.9825439453125, -291.9855041503906, -283.98846435546875, -275.9914245605469, -267.994384765625, -259.99737548828125, -252.0003204345703, -244.00328063964844, -236.0062713623047, -228.0092315673828, -220.01219177246094, -212.01516723632812, -204.01812744140625, -196.02108764648438, -188.0240478515625, -180.02700805664062, -172.02996826171875, -164.03292846679688, -156.035888671875, -148.03884887695312, -140.0418243408203, -132.04478454589844, -124.04774475097656, -116.05070495605469, -108.05368041992188, -100.056640625, -92.05960845947266, -84.06256866455078, -76.06553649902344, -68.06849670410156, -60.07145690917969, -52.07442092895508, -44.07738494873047, -36.08034896850586, -28.083311080932617, -20.086273193359375, -12.089237213134766, -4.092201232910156, 3.9048385620117188, 11.901874542236328, 19.89891242980957]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 0.0, 2.0, 1.0, 7.0, 5.0, 3.0, 7.0, 6.0, 7.0, 12.0, 13.0, 19.0, 14.0, 12.0, 26.0, 20.0, 25.0, 27.0, 30.0, 43.0, 27.0, 30.0, 37.0, 44.0, 40.0, 47.0, 37.0, 36.0, 38.0, 37.0, 32.0, 38.0, 43.0, 24.0, 24.0, 16.0, 22.0, 15.0, 21.0, 21.0, 25.0, 9.0, 11.0, 6.0, 7.0, 9.0, 2.0, 5.0, 6.0, 3.0, 7.0, 5.0, 3.0, 3.0], "bins": [-105.17705535888672, -102.18560028076172, -99.19414520263672, -96.20269012451172, -93.21123504638672, -90.21978759765625, -87.22833251953125, -84.23687744140625, -81.24542236328125, -78.25396728515625, -75.26251220703125, -72.27105712890625, -69.27960205078125, -66.28814697265625, -63.296695709228516, -60.30524444580078, -57.313785552978516, -54.322330474853516, -51.330875396728516, -48.33942413330078, -45.34796905517578, -42.35651397705078, -39.36505889892578, -36.37360382080078, -33.38214874267578, -30.39069366455078, -27.399240493774414, -24.407785415649414, -21.416332244873047, -18.424877166748047, -15.433422088623047, -12.44196891784668, -9.450515747070312, -6.459061622619629, -3.467607021331787, -0.4761524200439453, 2.5153017044067383, 5.506755828857422, 8.498210906982422, 11.489664077758789, 14.481119155883789, 17.47257423400879, 20.464027404785156, 23.455482482910156, 26.446937561035156, 29.438390731811523, 32.429847717285156, 35.42129898071289, 38.41275405883789, 41.40420913696289, 44.39566421508789, 47.387115478515625, 50.378570556640625, 53.370025634765625, 56.361480712890625, 59.352935791015625, 62.344390869140625, 65.33584594726562, 68.32730102539062, 71.31875610351562, 74.31021118164062, 77.30166625976562, 80.29312133789062, 83.2845687866211, 86.2760238647461]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 2.0, 1.0, 2.0, 2.0, 8.0, 10.0, 11.0, 11.0, 16.0, 17.0, 18.0, 24.0, 18.0, 30.0, 25.0, 31.0, 35.0, 46.0, 46.0, 45.0, 60.0, 59.0, 60.0, 54.0, 40.0, 40.0, 34.0, 44.0, 28.0, 41.0, 19.0, 16.0, 15.0, 14.0, 15.0, 11.0, 12.0, 9.0, 7.0, 4.0, 7.0, 4.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.3203125, -9.995361328125, -9.67041015625, -9.345458984375, -9.0205078125, -8.695556640625, -8.37060546875, -8.045654296875, -7.720703125, -7.395751953125, -7.07080078125, -6.745849609375, -6.4208984375, -6.095947265625, -5.77099609375, -5.446044921875, -5.12109375, -4.796142578125, -4.47119140625, -4.146240234375, -3.8212890625, -3.496337890625, -3.17138671875, -2.846435546875, -2.521484375, -2.196533203125, -1.87158203125, -1.546630859375, -1.2216796875, -0.896728515625, -0.57177734375, -0.246826171875, 0.078125, 0.403076171875, 0.72802734375, 1.052978515625, 1.3779296875, 1.702880859375, 2.02783203125, 2.352783203125, 2.677734375, 3.002685546875, 3.32763671875, 3.652587890625, 3.9775390625, 4.302490234375, 4.62744140625, 4.952392578125, 5.27734375, 5.602294921875, 5.92724609375, 6.252197265625, 6.5771484375, 6.902099609375, 7.22705078125, 7.552001953125, 7.876953125, 8.201904296875, 8.52685546875, 8.851806640625, 9.1767578125, 9.501708984375, 9.82666015625, 10.151611328125, 10.4765625]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 4.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 14.0, 22.0, 16.0, 37.0, 48.0, 76.0, 121.0, 228.0, 465.0, 901.0, 2005.0, 4749.0, 13385.0, 96449.0, 3554730.0, 487646.0, 21765.0, 6385.0, 2576.0, 1225.0, 613.0, 291.0, 186.0, 111.0, 62.0, 49.0, 29.0, 21.0, 10.0, 3.0, 7.0, 6.0, 4.0, 5.0, 0.0, 3.0, 5.0, 2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-45.3125, -43.9267578125, -42.541015625, -41.1552734375, -39.76953125, -38.3837890625, -36.998046875, -35.6123046875, -34.2265625, -32.8408203125, -31.455078125, -30.0693359375, -28.68359375, -27.2978515625, -25.912109375, -24.5263671875, -23.140625, -21.7548828125, -20.369140625, -18.9833984375, -17.59765625, -16.2119140625, -14.826171875, -13.4404296875, -12.0546875, -10.6689453125, -9.283203125, -7.8974609375, -6.51171875, -5.1259765625, -3.740234375, -2.3544921875, -0.96875, 0.4169921875, 1.802734375, 3.1884765625, 4.57421875, 5.9599609375, 7.345703125, 8.7314453125, 10.1171875, 11.5029296875, 12.888671875, 14.2744140625, 15.66015625, 17.0458984375, 18.431640625, 19.8173828125, 21.203125, 22.5888671875, 23.974609375, 25.3603515625, 26.74609375, 28.1318359375, 29.517578125, 30.9033203125, 32.2890625, 33.6748046875, 35.060546875, 36.4462890625, 37.83203125, 39.2177734375, 40.603515625, 41.9892578125, 43.375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 5.0, 3.0, 6.0, 8.0, 5.0, 10.0, 14.0, 6.0, 9.0, 19.0, 27.0, 25.0, 45.0, 67.0, 95.0, 179.0, 359.0, 641.0, 955.0, 716.0, 364.0, 179.0, 98.0, 57.0, 51.0, 37.0, 21.0, 17.0, 15.0, 11.0, 10.0, 4.0, 7.0, 6.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.53125, -26.53173828125, -25.5322265625, -24.53271484375, -23.533203125, -22.53369140625, -21.5341796875, -20.53466796875, -19.53515625, -18.53564453125, -17.5361328125, -16.53662109375, -15.537109375, -14.53759765625, -13.5380859375, -12.53857421875, -11.5390625, -10.53955078125, -9.5400390625, -8.54052734375, -7.541015625, -6.54150390625, -5.5419921875, -4.54248046875, -3.54296875, -2.54345703125, -1.5439453125, -0.54443359375, 0.455078125, 1.45458984375, 2.4541015625, 3.45361328125, 4.453125, 5.45263671875, 6.4521484375, 7.45166015625, 8.451171875, 9.45068359375, 10.4501953125, 11.44970703125, 12.44921875, 13.44873046875, 14.4482421875, 15.44775390625, 16.447265625, 17.44677734375, 18.4462890625, 19.44580078125, 20.4453125, 21.44482421875, 22.4443359375, 23.44384765625, 24.443359375, 25.44287109375, 26.4423828125, 27.44189453125, 28.44140625, 29.44091796875, 30.4404296875, 31.43994140625, 32.439453125, 33.43896484375, 34.4384765625, 35.43798828125, 36.4375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 5.0, 11.0, 12.0, 22.0, 24.0, 39.0, 58.0, 76.0, 147.0, 216.0, 327.0, 548.0, 1003.0, 1911.0, 3869.0, 8470.0, 21250.0, 72595.0, 645828.0, 3141900.0, 226295.0, 42455.0, 14481.0, 6234.0, 2890.0, 1534.0, 803.0, 488.0, 269.0, 178.0, 124.0, 64.0, 46.0, 37.0, 22.0, 19.0, 13.0, 4.0, 3.0, 3.0, 5.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.65625, -36.49072265625, -35.3251953125, -34.15966796875, -32.994140625, -31.82861328125, -30.6630859375, -29.49755859375, -28.33203125, -27.16650390625, -26.0009765625, -24.83544921875, -23.669921875, -22.50439453125, -21.3388671875, -20.17333984375, -19.0078125, -17.84228515625, -16.6767578125, -15.51123046875, -14.345703125, -13.18017578125, -12.0146484375, -10.84912109375, -9.68359375, -8.51806640625, -7.3525390625, -6.18701171875, -5.021484375, -3.85595703125, -2.6904296875, -1.52490234375, -0.359375, 0.80615234375, 1.9716796875, 3.13720703125, 4.302734375, 5.46826171875, 6.6337890625, 7.79931640625, 8.96484375, 10.13037109375, 11.2958984375, 12.46142578125, 13.626953125, 14.79248046875, 15.9580078125, 17.12353515625, 18.2890625, 19.45458984375, 20.6201171875, 21.78564453125, 22.951171875, 24.11669921875, 25.2822265625, 26.44775390625, 27.61328125, 28.77880859375, 29.9443359375, 31.10986328125, 32.275390625, 33.44091796875, 34.6064453125, 35.77197265625, 36.9375]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 9.0, 16.0, 45.0, 62.0, 159.0, 193.0, 211.0, 168.0, 80.0, 36.0, 16.0, 6.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.83331298828125, -135.94273376464844, -130.05215454101562, -124.16157531738281, -118.27099609375, -112.38041687011719, -106.48983764648438, -100.59925842285156, -94.70867919921875, -88.81809997558594, -82.92752075195312, -77.03694152832031, -71.1463623046875, -65.25578308105469, -59.36520004272461, -53.4746208190918, -47.58403778076172, -41.693458557128906, -35.802879333496094, -29.91229820251465, -24.021718978881836, -18.131139755249023, -12.240558624267578, -6.349979400634766, -0.4594001770019531, 5.431179523468018, 11.321759223937988, 17.212339401245117, 23.10291862487793, 28.993497848510742, 34.88407897949219, 40.774658203125, 46.66523742675781, 52.555816650390625, 58.44639587402344, 64.33697509765625, 70.22755432128906, 76.11813354492188, 82.00871276855469, 87.8992919921875, 93.78987121582031, 99.68045043945312, 105.57102966308594, 111.46160888671875, 117.35218811035156, 123.24276733398438, 129.1333465576172, 135.02392578125, 140.91452026367188, 146.8050994873047, 152.6956787109375, 158.5862579345703, 164.47683715820312, 170.36741638183594, 176.25799560546875, 182.14857482910156, 188.03915405273438, 193.9297332763672, 199.8203125, 205.7108917236328, 211.60147094726562, 217.49205017089844, 223.38262939453125, 229.27320861816406, 235.16378784179688]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 3.0, 7.0, 7.0, 13.0, 7.0, 16.0, 13.0, 19.0, 14.0, 19.0, 18.0, 18.0, 34.0, 40.0, 32.0, 45.0, 34.0, 34.0, 37.0, 34.0, 40.0, 47.0, 45.0, 40.0, 41.0, 35.0, 40.0, 33.0, 26.0, 23.0, 26.0, 28.0, 15.0, 26.0, 19.0, 15.0, 8.0, 11.0, 8.0, 6.0, 6.0, 7.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-76.81509399414062, -74.3446273803711, -71.87415313720703, -69.4036865234375, -66.93321228027344, -64.4627456665039, -61.992279052734375, -59.52180862426758, -57.05133819580078, -54.580867767333984, -52.11039733886719, -49.639930725097656, -47.16946029663086, -44.69898986816406, -42.22852325439453, -39.758052825927734, -37.28758239746094, -34.81711196899414, -32.346641540527344, -29.876174926757812, -27.405704498291016, -24.93523406982422, -22.464765548706055, -19.99429702758789, -17.523826599121094, -15.053357124328613, -12.582887649536133, -10.112418174743652, -7.641948699951172, -5.171479225158691, -2.701009750366211, -0.23054122924804688, 2.23992919921875, 4.7103986740112305, 7.180868148803711, 9.651337623596191, 12.121807098388672, 14.592276573181152, 17.062746047973633, 19.533214569091797, 22.003684997558594, 24.47415542602539, 26.944623947143555, 29.41509246826172, 31.885562896728516, 34.35603332519531, 36.826499938964844, 39.29697036743164, 41.76744079589844, 44.237911224365234, 46.70838165283203, 49.17884826660156, 51.64931869506836, 54.119789123535156, 56.59025573730469, 59.060726165771484, 61.53119659423828, 64.00166320800781, 66.47213745117188, 68.9426040649414, 71.41307067871094, 73.883544921875, 76.35401153564453, 78.82447814941406, 81.29495239257812]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 9.0, 6.0, 11.0, 10.0, 9.0, 16.0, 17.0, 15.0, 22.0, 22.0, 33.0, 27.0, 29.0, 49.0, 37.0, 39.0, 59.0, 56.0, 38.0, 53.0, 58.0, 53.0, 42.0, 35.0, 31.0, 36.0, 26.0, 27.0, 20.0, 24.0, 15.0, 13.0, 9.0, 9.0, 6.0, 3.0, 6.0, 4.0, 6.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.9765625, -9.6607666015625, -9.344970703125, -9.0291748046875, -8.71337890625, -8.3975830078125, -8.081787109375, -7.7659912109375, -7.4501953125, -7.1343994140625, -6.818603515625, -6.5028076171875, -6.18701171875, -5.8712158203125, -5.555419921875, -5.2396240234375, -4.923828125, -4.6080322265625, -4.292236328125, -3.9764404296875, -3.66064453125, -3.3448486328125, -3.029052734375, -2.7132568359375, -2.3974609375, -2.0816650390625, -1.765869140625, -1.4500732421875, -1.13427734375, -0.8184814453125, -0.502685546875, -0.1868896484375, 0.12890625, 0.4447021484375, 0.760498046875, 1.0762939453125, 1.39208984375, 1.7078857421875, 2.023681640625, 2.3394775390625, 2.6552734375, 2.9710693359375, 3.286865234375, 3.6026611328125, 3.91845703125, 4.2342529296875, 4.550048828125, 4.8658447265625, 5.181640625, 5.4974365234375, 5.813232421875, 6.1290283203125, 6.44482421875, 6.7606201171875, 7.076416015625, 7.3922119140625, 7.7080078125, 8.0238037109375, 8.339599609375, 8.6553955078125, 8.97119140625, 9.2869873046875, 9.602783203125, 9.9185791015625, 10.234375]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 8.0, 8.0, 16.0, 24.0, 30.0, 50.0, 49.0, 56.0, 84.0, 103.0, 211.0, 250.0, 302.0, 435.0, 577.0, 861.0, 1105.0, 1550.0, 2134.0, 2973.0, 4112.0, 5888.0, 8509.0, 12735.0, 19994.0, 31104.0, 49934.0, 81938.0, 130359.0, 186549.0, 178077.0, 120865.0, 74997.0, 46115.0, 28688.0, 18375.0, 11967.0, 7856.0, 5649.0, 3892.0, 2800.0, 1932.0, 1406.0, 1083.0, 807.0, 571.0, 401.0, 300.0, 219.0, 168.0, 131.0, 99.0, 62.0, 53.0, 34.0, 24.0, 18.0, 16.0, 14.0, 4.0, 1.0, 1.0], "bins": [-1.064453125, -1.031097412109375, -0.99774169921875, -0.964385986328125, -0.9310302734375, -0.897674560546875, -0.86431884765625, -0.830963134765625, -0.797607421875, -0.764251708984375, -0.73089599609375, -0.697540283203125, -0.6641845703125, -0.630828857421875, -0.59747314453125, -0.564117431640625, -0.53076171875, -0.497406005859375, -0.46405029296875, -0.430694580078125, -0.3973388671875, -0.363983154296875, -0.33062744140625, -0.297271728515625, -0.263916015625, -0.230560302734375, -0.19720458984375, -0.163848876953125, -0.1304931640625, -0.097137451171875, -0.06378173828125, -0.030426025390625, 0.0029296875, 0.036285400390625, 0.06964111328125, 0.102996826171875, 0.1363525390625, 0.169708251953125, 0.20306396484375, 0.236419677734375, 0.269775390625, 0.303131103515625, 0.33648681640625, 0.369842529296875, 0.4031982421875, 0.436553955078125, 0.46990966796875, 0.503265380859375, 0.53662109375, 0.569976806640625, 0.60333251953125, 0.636688232421875, 0.6700439453125, 0.703399658203125, 0.73675537109375, 0.770111083984375, 0.803466796875, 0.836822509765625, 0.87017822265625, 0.903533935546875, 0.9368896484375, 0.970245361328125, 1.00360107421875, 1.036956787109375, 1.0703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 6.0, 4.0, 2.0, 8.0, 5.0, 7.0, 15.0, 12.0, 16.0, 13.0, 21.0, 21.0, 20.0, 27.0, 26.0, 21.0, 39.0, 43.0, 41.0, 31.0, 34.0, 49.0, 1062.0, 43.0, 39.0, 44.0, 36.0, 40.0, 27.0, 28.0, 33.0, 26.0, 30.0, 22.0, 18.0, 24.0, 21.0, 17.0, 7.0, 8.0, 9.0, 8.0, 8.0, 3.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.24609375, -5.070068359375, -4.89404296875, -4.718017578125, -4.5419921875, -4.365966796875, -4.18994140625, -4.013916015625, -3.837890625, -3.661865234375, -3.48583984375, -3.309814453125, -3.1337890625, -2.957763671875, -2.78173828125, -2.605712890625, -2.4296875, -2.253662109375, -2.07763671875, -1.901611328125, -1.7255859375, -1.549560546875, -1.37353515625, -1.197509765625, -1.021484375, -0.845458984375, -0.66943359375, -0.493408203125, -0.3173828125, -0.141357421875, 0.03466796875, 0.210693359375, 0.38671875, 0.562744140625, 0.73876953125, 0.914794921875, 1.0908203125, 1.266845703125, 1.44287109375, 1.618896484375, 1.794921875, 1.970947265625, 2.14697265625, 2.322998046875, 2.4990234375, 2.675048828125, 2.85107421875, 3.027099609375, 3.203125, 3.379150390625, 3.55517578125, 3.731201171875, 3.9072265625, 4.083251953125, 4.25927734375, 4.435302734375, 4.611328125, 4.787353515625, 4.96337890625, 5.139404296875, 5.3154296875, 5.491455078125, 5.66748046875, 5.843505859375, 6.01953125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 2.0, 2.0, 13.0, 10.0, 10.0, 19.0, 28.0, 27.0, 59.0, 79.0, 94.0, 165.0, 207.0, 329.0, 421.0, 644.0, 915.0, 1351.0, 2000.0, 2767.0, 4281.0, 6324.0, 9389.0, 13880.0, 20428.0, 30842.0, 46700.0, 71030.0, 107523.0, 152171.0, 1217361.0, 135336.0, 91901.0, 60933.0, 39823.0, 26412.0, 17422.0, 11559.0, 7999.0, 5283.0, 3547.0, 2509.0, 1631.0, 1080.0, 833.0, 545.0, 398.0, 247.0, 168.0, 126.0, 92.0, 70.0, 46.0, 41.0, 17.0, 21.0, 10.0, 10.0, 5.0, 4.0, 4.0, 3.0], "bins": [-0.64208984375, -0.6222152709960938, -0.6023406982421875, -0.5824661254882812, -0.562591552734375, -0.5427169799804688, -0.5228424072265625, -0.5029678344726562, -0.48309326171875, -0.46321868896484375, -0.4433441162109375, -0.42346954345703125, -0.403594970703125, -0.38372039794921875, -0.3638458251953125, -0.34397125244140625, -0.3240966796875, -0.30422210693359375, -0.2843475341796875, -0.26447296142578125, -0.244598388671875, -0.22472381591796875, -0.2048492431640625, -0.18497467041015625, -0.16510009765625, -0.14522552490234375, -0.1253509521484375, -0.10547637939453125, -0.085601806640625, -0.06572723388671875, -0.0458526611328125, -0.02597808837890625, -0.006103515625, 0.01377105712890625, 0.0336456298828125, 0.05352020263671875, 0.073394775390625, 0.09326934814453125, 0.1131439208984375, 0.13301849365234375, 0.15289306640625, 0.17276763916015625, 0.1926422119140625, 0.21251678466796875, 0.232391357421875, 0.25226593017578125, 0.2721405029296875, 0.29201507568359375, 0.3118896484375, 0.33176422119140625, 0.3516387939453125, 0.37151336669921875, 0.391387939453125, 0.41126251220703125, 0.4311370849609375, 0.45101165771484375, 0.47088623046875, 0.49076080322265625, 0.5106353759765625, 0.5305099487304688, 0.550384521484375, 0.5702590942382812, 0.5901336669921875, 0.6100082397460938, 0.6298828125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 6.0, 7.0, 10.0, 12.0, 9.0, 13.0, 20.0, 20.0, 23.0, 35.0, 48.0, 52.0, 82.0, 102.0, 103.0, 95.0, 69.0, 66.0, 50.0, 27.0, 24.0, 27.0, 17.0, 14.0, 10.0, 11.0, 5.0, 5.0, 8.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00994110107421875, -0.009652495384216309, -0.009363889694213867, -0.009075284004211426, -0.008786678314208984, -0.008498072624206543, -0.008209466934204102, -0.00792086124420166, -0.007632255554199219, -0.007343649864196777, -0.007055044174194336, -0.0067664384841918945, -0.006477832794189453, -0.006189227104187012, -0.00590062141418457, -0.005612015724182129, -0.0053234100341796875, -0.005034804344177246, -0.004746198654174805, -0.004457592964172363, -0.004168987274169922, -0.0038803815841674805, -0.003591775894165039, -0.0033031702041625977, -0.0030145645141601562, -0.002725958824157715, -0.0024373531341552734, -0.002148747444152832, -0.0018601417541503906, -0.0015715360641479492, -0.0012829303741455078, -0.0009943246841430664, -0.000705718994140625, -0.0004171133041381836, -0.0001285076141357422, 0.00016009807586669922, 0.0004487037658691406, 0.000737309455871582, 0.0010259151458740234, 0.0013145208358764648, 0.0016031265258789062, 0.0018917322158813477, 0.002180337905883789, 0.0024689435958862305, 0.002757549285888672, 0.0030461549758911133, 0.0033347606658935547, 0.003623366355895996, 0.0039119720458984375, 0.004200577735900879, 0.00448918342590332, 0.004777789115905762, 0.005066394805908203, 0.0053550004959106445, 0.005643606185913086, 0.005932211875915527, 0.006220817565917969, 0.00650942325592041, 0.0067980289459228516, 0.007086634635925293, 0.007375240325927734, 0.007663846015930176, 0.007952451705932617, 0.008241057395935059, 0.0085296630859375]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 6.0, 6.0, 4.0, 5.0, 5.0, 20.0, 15.0, 19.0, 34.0, 43.0, 75.0, 107.0, 191.0, 285.0, 566.0, 4957.0, 974949.0, 65131.0, 1101.0, 384.0, 222.0, 124.0, 92.0, 60.0, 37.0, 27.0, 20.0, 21.0, 5.0, 9.0, 5.0, 11.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177734375, -0.17176055908203125, -0.1657867431640625, -0.15981292724609375, -0.153839111328125, -0.14786529541015625, -0.1418914794921875, -0.13591766357421875, -0.12994384765625, -0.12397003173828125, -0.1179962158203125, -0.11202239990234375, -0.106048583984375, -0.10007476806640625, -0.0941009521484375, -0.08812713623046875, -0.0821533203125, -0.07617950439453125, -0.0702056884765625, -0.06423187255859375, -0.058258056640625, -0.05228424072265625, -0.0463104248046875, -0.04033660888671875, -0.03436279296875, -0.02838897705078125, -0.0224151611328125, -0.01644134521484375, -0.010467529296875, -0.00449371337890625, 0.0014801025390625, 0.00745391845703125, 0.013427734375, 0.01940155029296875, 0.0253753662109375, 0.03134918212890625, 0.037322998046875, 0.04329681396484375, 0.0492706298828125, 0.05524444580078125, 0.06121826171875, 0.06719207763671875, 0.0731658935546875, 0.07913970947265625, 0.085113525390625, 0.09108734130859375, 0.0970611572265625, 0.10303497314453125, 0.1090087890625, 0.11498260498046875, 0.1209564208984375, 0.12693023681640625, 0.132904052734375, 0.13887786865234375, 0.1448516845703125, 0.15082550048828125, 0.15679931640625, 0.16277313232421875, 0.1687469482421875, 0.17472076416015625, 0.180694580078125, 0.18666839599609375, 0.1926422119140625, 0.19861602783203125, 0.20458984375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 11.0, 222.0, 707.0, 71.0, 8.0], "bins": [-0.1481674164533615, -0.14574740827083588, -0.14332741498947144, -0.1409074068069458, -0.13848741352558136, -0.13606740534305573, -0.13364741206169128, -0.13122740387916565, -0.1288074105978012, -0.12638740241527557, -0.12396740913391113, -0.1215474084019661, -0.11912740767002106, -0.11670740693807602, -0.11428740620613098, -0.11186739802360535, -0.10944739729166031, -0.10702739655971527, -0.10460739582777023, -0.1021873950958252, -0.09976739436388016, -0.09734739363193512, -0.09492739289999008, -0.09250739216804504, -0.09008738398551941, -0.08766738325357437, -0.08524738252162933, -0.0828273817896843, -0.08040738105773926, -0.07798738032579422, -0.07556737959384918, -0.07314737141132355, -0.0707273855805397, -0.06830738484859467, -0.06588738411664963, -0.06346738338470459, -0.06104738265275955, -0.058627381920814514, -0.05620737746357918, -0.05378737673163414, -0.0513673759996891, -0.048947375267744064, -0.046527374535799026, -0.04410737380385399, -0.04168736934661865, -0.039267368614673615, -0.03684736788272858, -0.03442736715078354, -0.0320073664188385, -0.029587365686893463, -0.027167364954948425, -0.024747362360358238, -0.0223273616284132, -0.019907360896468163, -0.017487358301877975, -0.015067357569932938, -0.0126473568379879, -0.010227356106042862, -0.0078073544427752495, -0.005387353245168924, -0.002967352047562599, -0.0005473513156175613, 0.0018726503476500511, 0.004292652010917664, 0.006712652742862701]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 3.0, 5.0, 7.0, 7.0, 6.0, 8.0, 15.0, 8.0, 14.0, 12.0, 20.0, 31.0, 27.0, 29.0, 25.0, 32.0, 41.0, 42.0, 37.0, 34.0, 40.0, 49.0, 41.0, 40.0, 35.0, 37.0, 42.0, 36.0, 39.0, 33.0, 32.0, 26.0, 17.0, 22.0, 23.0, 16.0, 13.0, 14.0, 8.0, 11.0, 5.0, 7.0, 4.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006248652935028076, -0.006037823855876923, -0.005826994776725769, -0.0056161656975746155, -0.005405336618423462, -0.005194507539272308, -0.004983678460121155, -0.004772849380970001, -0.004562020301818848, -0.004351191222667694, -0.0041403621435165405, -0.003929533064365387, -0.0037187039852142334, -0.00350787490606308, -0.0032970458269119263, -0.0030862167477607727, -0.002875387668609619, -0.0026645585894584656, -0.002453729510307312, -0.0022429004311561584, -0.002032071352005005, -0.0018212422728538513, -0.0016104131937026978, -0.0013995841145515442, -0.0011887550354003906, -0.000977925956249237, -0.0007670968770980835, -0.0005562677979469299, -0.00034543871879577637, -0.0001346096396446228, 7.621943950653076e-05, 0.0002870485186576843, 0.0004978775978088379, 0.0007087066769599915, 0.000919535756111145, 0.0011303648352622986, 0.0013411939144134521, 0.0015520229935646057, 0.0017628520727157593, 0.001973681151866913, 0.0021845102310180664, 0.00239533931016922, 0.0026061683893203735, 0.002816997468471527, 0.0030278265476226807, 0.0032386556267738342, 0.003449484705924988, 0.0036603137850761414, 0.003871142864227295, 0.0040819719433784485, 0.004292801022529602, 0.004503630101680756, 0.004714459180831909, 0.004925288259983063, 0.005136117339134216, 0.00534694641828537, 0.0055577754974365234, 0.005768604576587677, 0.005979433655738831, 0.006190262734889984, 0.006401091814041138, 0.006611920893192291, 0.006822749972343445, 0.007033579051494598, 0.007244408130645752]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 3.0, 5.0, 9.0, 6.0, 11.0, 10.0, 9.0, 16.0, 17.0, 15.0, 22.0, 22.0, 33.0, 27.0, 29.0, 49.0, 37.0, 39.0, 59.0, 56.0, 38.0, 53.0, 58.0, 52.0, 43.0, 35.0, 31.0, 36.0, 26.0, 27.0, 20.0, 24.0, 15.0, 13.0, 9.0, 9.0, 6.0, 3.0, 6.0, 4.0, 6.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-9.9765625, -9.6607666015625, -9.344970703125, -9.0291748046875, -8.71337890625, -8.3975830078125, -8.081787109375, -7.7659912109375, -7.4501953125, -7.1343994140625, -6.818603515625, -6.5028076171875, -6.18701171875, -5.8712158203125, -5.555419921875, -5.2396240234375, -4.923828125, -4.6080322265625, -4.292236328125, -3.9764404296875, -3.66064453125, -3.3448486328125, -3.029052734375, -2.7132568359375, -2.3974609375, -2.0816650390625, -1.765869140625, -1.4500732421875, -1.13427734375, -0.8184814453125, -0.502685546875, -0.1868896484375, 0.12890625, 0.4447021484375, 0.760498046875, 1.0762939453125, 1.39208984375, 1.7078857421875, 2.023681640625, 2.3394775390625, 2.6552734375, 2.9710693359375, 3.286865234375, 3.6026611328125, 3.91845703125, 4.2342529296875, 4.550048828125, 4.8658447265625, 5.181640625, 5.4974365234375, 5.813232421875, 6.1290283203125, 6.44482421875, 6.7606201171875, 7.076416015625, 7.3922119140625, 7.7080078125, 8.0238037109375, 8.339599609375, 8.6553955078125, 8.97119140625, 9.2869873046875, 9.602783203125, 9.9185791015625, 10.234375]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 8.0, 8.0, 14.0, 19.0, 23.0, 30.0, 53.0, 76.0, 106.0, 138.0, 214.0, 345.0, 483.0, 774.0, 1219.0, 2003.0, 3761.0, 7378.0, 18414.0, 80399.0, 786125.0, 107586.0, 21218.0, 8221.0, 4052.0, 2163.0, 1294.0, 807.0, 514.0, 346.0, 231.0, 168.0, 104.0, 77.0, 49.0, 33.0, 34.0, 12.0, 16.0, 10.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.28125, -20.5849609375, -19.888671875, -19.1923828125, -18.49609375, -17.7998046875, -17.103515625, -16.4072265625, -15.7109375, -15.0146484375, -14.318359375, -13.6220703125, -12.92578125, -12.2294921875, -11.533203125, -10.8369140625, -10.140625, -9.4443359375, -8.748046875, -8.0517578125, -7.35546875, -6.6591796875, -5.962890625, -5.2666015625, -4.5703125, -3.8740234375, -3.177734375, -2.4814453125, -1.78515625, -1.0888671875, -0.392578125, 0.3037109375, 1.0, 1.6962890625, 2.392578125, 3.0888671875, 3.78515625, 4.4814453125, 5.177734375, 5.8740234375, 6.5703125, 7.2666015625, 7.962890625, 8.6591796875, 9.35546875, 10.0517578125, 10.748046875, 11.4443359375, 12.140625, 12.8369140625, 13.533203125, 14.2294921875, 14.92578125, 15.6220703125, 16.318359375, 17.0146484375, 17.7109375, 18.4072265625, 19.103515625, 19.7998046875, 20.49609375, 21.1923828125, 21.888671875, 22.5849609375, 23.28125]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 0.0, 2.0, 5.0, 2.0, 4.0, 6.0, 6.0, 8.0, 13.0, 20.0, 14.0, 25.0, 21.0, 18.0, 35.0, 31.0, 42.0, 48.0, 56.0, 71.0, 103.0, 282.0, 1604.0, 131.0, 85.0, 60.0, 45.0, 51.0, 45.0, 25.0, 32.0, 21.0, 23.0, 19.0, 19.0, 18.0, 14.0, 5.0, 7.0, 7.0, 10.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 3.0, 1.0, 2.0], "bins": [-40.75, -39.624267578125, -38.49853515625, -37.372802734375, -36.2470703125, -35.121337890625, -33.99560546875, -32.869873046875, -31.744140625, -30.618408203125, -29.49267578125, -28.366943359375, -27.2412109375, -26.115478515625, -24.98974609375, -23.864013671875, -22.73828125, -21.612548828125, -20.48681640625, -19.361083984375, -18.2353515625, -17.109619140625, -15.98388671875, -14.858154296875, -13.732421875, -12.606689453125, -11.48095703125, -10.355224609375, -9.2294921875, -8.103759765625, -6.97802734375, -5.852294921875, -4.7265625, -3.600830078125, -2.47509765625, -1.349365234375, -0.2236328125, 0.902099609375, 2.02783203125, 3.153564453125, 4.279296875, 5.405029296875, 6.53076171875, 7.656494140625, 8.7822265625, 9.907958984375, 11.03369140625, 12.159423828125, 13.28515625, 14.410888671875, 15.53662109375, 16.662353515625, 17.7880859375, 18.913818359375, 20.03955078125, 21.165283203125, 22.291015625, 23.416748046875, 24.54248046875, 25.668212890625, 26.7939453125, 27.919677734375, 29.04541015625, 30.171142578125, 31.296875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 5.0, 5.0, 4.0, 2.0, 1.0, 3.0, 6.0, 10.0, 7.0, 9.0, 4.0, 13.0, 24.0, 19.0, 19.0, 18.0, 27.0, 33.0, 51.0, 79.0, 121.0, 234.0, 553.0, 1495.0, 5098.0, 23486.0, 740817.0, 2335068.0, 29638.0, 5904.0, 1712.0, 596.0, 262.0, 110.0, 60.0, 57.0, 29.0, 22.0, 22.0, 14.0, 14.0, 22.0, 10.0, 7.0, 6.0, 5.0, 5.0, 3.0, 2.0, 3.0, 1.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.875, -46.2275390625, -44.580078125, -42.9326171875, -41.28515625, -39.6376953125, -37.990234375, -36.3427734375, -34.6953125, -33.0478515625, -31.400390625, -29.7529296875, -28.10546875, -26.4580078125, -24.810546875, -23.1630859375, -21.515625, -19.8681640625, -18.220703125, -16.5732421875, -14.92578125, -13.2783203125, -11.630859375, -9.9833984375, -8.3359375, -6.6884765625, -5.041015625, -3.3935546875, -1.74609375, -0.0986328125, 1.548828125, 3.1962890625, 4.84375, 6.4912109375, 8.138671875, 9.7861328125, 11.43359375, 13.0810546875, 14.728515625, 16.3759765625, 18.0234375, 19.6708984375, 21.318359375, 22.9658203125, 24.61328125, 26.2607421875, 27.908203125, 29.5556640625, 31.203125, 32.8505859375, 34.498046875, 36.1455078125, 37.79296875, 39.4404296875, 41.087890625, 42.7353515625, 44.3828125, 46.0302734375, 47.677734375, 49.3251953125, 50.97265625, 52.6201171875, 54.267578125, 55.9150390625, 57.5625]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 10.0, 26.0, 37.0, 77.0, 106.0, 170.0, 207.0, 155.0, 83.0, 66.0, 35.0, 15.0, 14.0, 5.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.27699279785156, -50.88579177856445, -48.494590759277344, -46.10338592529297, -43.71218490600586, -41.32098388671875, -38.929779052734375, -36.538578033447266, -34.147377014160156, -31.756175994873047, -29.364973068237305, -26.973770141601562, -24.582569122314453, -22.191368103027344, -19.8001651763916, -17.40896224975586, -15.01776123046875, -12.626559257507324, -10.235357284545898, -7.844155311584473, -5.452953338623047, -3.061751365661621, -0.6705493927001953, 1.7206535339355469, 4.111854553222656, 6.503056526184082, 8.894258499145508, 11.285460472106934, 13.67666244506836, 16.06786346435547, 18.45906639099121, 20.850269317626953, 23.241470336914062, 25.632671356201172, 28.023874282836914, 30.415077209472656, 32.806278228759766, 35.197479248046875, 37.58868408203125, 39.97988510131836, 42.37108612060547, 44.76228713989258, 47.15348815917969, 49.54469299316406, 51.93589401245117, 54.32709503173828, 56.718299865722656, 59.109500885009766, 61.500701904296875, 63.891902923583984, 66.2831039428711, 68.67430877685547, 71.06550598144531, 73.45671081542969, 75.84791564941406, 78.23912048339844, 80.63031768798828, 83.02152252197266, 85.4127197265625, 87.80392456054688, 90.19512939453125, 92.5863265991211, 94.97753143310547, 97.36872863769531, 99.75993347167969]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 5.0, 4.0, 4.0, 3.0, 2.0, 9.0, 6.0, 14.0, 8.0, 12.0, 12.0, 17.0, 22.0, 27.0, 23.0, 30.0, 20.0, 33.0, 39.0, 40.0, 37.0, 32.0, 35.0, 39.0, 39.0, 37.0, 54.0, 44.0, 33.0, 36.0, 47.0, 27.0, 29.0, 25.0, 28.0, 16.0, 22.0, 21.0, 14.0, 13.0, 8.0, 13.0, 6.0, 5.0, 7.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-110.80199432373047, -107.41445922851562, -104.02693176269531, -100.63939666748047, -97.25186157226562, -93.86433410644531, -90.47679901123047, -87.08926391601562, -83.70173645019531, -80.31420135498047, -76.92667388916016, -73.53913879394531, -70.15160369873047, -66.76406860351562, -63.37654113769531, -59.98900604248047, -56.601470947265625, -53.21393966674805, -49.8264045715332, -46.438873291015625, -43.05133819580078, -39.6638069152832, -36.276275634765625, -32.88874053955078, -29.501209259033203, -26.113676071166992, -22.72614288330078, -19.338611602783203, -15.951078414916992, -12.563545227050781, -9.176013946533203, -5.788480758666992, -2.4009475708007812, 0.9865851402282715, 4.374117851257324, 7.761650085449219, 11.14918327331543, 14.53671646118164, 17.92424774169922, 21.31178092956543, 24.69931411743164, 28.08684730529785, 31.474380493164062, 34.86191177368164, 38.24944305419922, 41.63697814941406, 45.02450942993164, 48.41204071044922, 51.79957580566406, 55.18710708618164, 58.574642181396484, 61.96217346191406, 65.3497085571289, 68.73724365234375, 72.12477111816406, 75.5123062133789, 78.89984130859375, 82.2873764038086, 85.6749038696289, 89.06243896484375, 92.4499740600586, 95.83750915527344, 99.22503662109375, 102.6125717163086, 106.0000991821289]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 7.0, 5.0, 3.0, 4.0, 9.0, 12.0, 12.0, 13.0, 22.0, 13.0, 22.0, 23.0, 34.0, 23.0, 36.0, 31.0, 40.0, 42.0, 56.0, 40.0, 42.0, 53.0, 42.0, 52.0, 50.0, 44.0, 31.0, 33.0, 32.0, 36.0, 25.0, 16.0, 16.0, 14.0, 11.0, 9.0, 5.0, 9.0, 8.0, 6.0, 3.0, 7.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-9.9296875, -9.6097412109375, -9.289794921875, -8.9698486328125, -8.64990234375, -8.3299560546875, -8.010009765625, -7.6900634765625, -7.3701171875, -7.0501708984375, -6.730224609375, -6.4102783203125, -6.09033203125, -5.7703857421875, -5.450439453125, -5.1304931640625, -4.810546875, -4.4906005859375, -4.170654296875, -3.8507080078125, -3.53076171875, -3.2108154296875, -2.890869140625, -2.5709228515625, -2.2509765625, -1.9310302734375, -1.611083984375, -1.2911376953125, -0.97119140625, -0.6512451171875, -0.331298828125, -0.0113525390625, 0.30859375, 0.6285400390625, 0.948486328125, 1.2684326171875, 1.58837890625, 1.9083251953125, 2.228271484375, 2.5482177734375, 2.8681640625, 3.1881103515625, 3.508056640625, 3.8280029296875, 4.14794921875, 4.4678955078125, 4.787841796875, 5.1077880859375, 5.427734375, 5.7476806640625, 6.067626953125, 6.3875732421875, 6.70751953125, 7.0274658203125, 7.347412109375, 7.6673583984375, 7.9873046875, 8.3072509765625, 8.627197265625, 8.9471435546875, 9.26708984375, 9.5870361328125, 9.906982421875, 10.2269287109375, 10.546875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 5.0, 8.0, 11.0, 7.0, 21.0, 25.0, 33.0, 43.0, 65.0, 94.0, 142.0, 224.0, 308.0, 456.0, 677.0, 994.0, 1598.0, 2513.0, 4122.0, 7476.0, 17233.0, 81643.0, 646542.0, 2703633.0, 620354.0, 72907.0, 15806.0, 7021.0, 3642.0, 2226.0, 1425.0, 931.0, 604.0, 433.0, 309.0, 192.0, 155.0, 112.0, 86.0, 60.0, 38.0, 36.0, 26.0, 19.0, 9.0, 13.0, 3.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.625, -18.981201171875, -18.33740234375, -17.693603515625, -17.0498046875, -16.406005859375, -15.76220703125, -15.118408203125, -14.474609375, -13.830810546875, -13.18701171875, -12.543212890625, -11.8994140625, -11.255615234375, -10.61181640625, -9.968017578125, -9.32421875, -8.680419921875, -8.03662109375, -7.392822265625, -6.7490234375, -6.105224609375, -5.46142578125, -4.817626953125, -4.173828125, -3.530029296875, -2.88623046875, -2.242431640625, -1.5986328125, -0.954833984375, -0.31103515625, 0.332763671875, 0.9765625, 1.620361328125, 2.26416015625, 2.907958984375, 3.5517578125, 4.195556640625, 4.83935546875, 5.483154296875, 6.126953125, 6.770751953125, 7.41455078125, 8.058349609375, 8.7021484375, 9.345947265625, 9.98974609375, 10.633544921875, 11.27734375, 11.921142578125, 12.56494140625, 13.208740234375, 13.8525390625, 14.496337890625, 15.14013671875, 15.783935546875, 16.427734375, 17.071533203125, 17.71533203125, 18.359130859375, 19.0029296875, 19.646728515625, 20.29052734375, 20.934326171875, 21.578125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 6.0, 3.0, 1.0, 3.0, 4.0, 6.0, 4.0, 4.0, 8.0, 15.0, 16.0, 19.0, 25.0, 24.0, 27.0, 49.0, 80.0, 125.0, 188.0, 341.0, 533.0, 714.0, 645.0, 464.0, 275.0, 167.0, 95.0, 62.0, 37.0, 30.0, 20.0, 17.0, 11.0, 7.0, 11.0, 11.0, 13.0, 4.0, 4.0, 2.0, 2.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-24.609375, -23.78173828125, -22.9541015625, -22.12646484375, -21.298828125, -20.47119140625, -19.6435546875, -18.81591796875, -17.98828125, -17.16064453125, -16.3330078125, -15.50537109375, -14.677734375, -13.85009765625, -13.0224609375, -12.19482421875, -11.3671875, -10.53955078125, -9.7119140625, -8.88427734375, -8.056640625, -7.22900390625, -6.4013671875, -5.57373046875, -4.74609375, -3.91845703125, -3.0908203125, -2.26318359375, -1.435546875, -0.60791015625, 0.2197265625, 1.04736328125, 1.875, 2.70263671875, 3.5302734375, 4.35791015625, 5.185546875, 6.01318359375, 6.8408203125, 7.66845703125, 8.49609375, 9.32373046875, 10.1513671875, 10.97900390625, 11.806640625, 12.63427734375, 13.4619140625, 14.28955078125, 15.1171875, 15.94482421875, 16.7724609375, 17.60009765625, 18.427734375, 19.25537109375, 20.0830078125, 20.91064453125, 21.73828125, 22.56591796875, 23.3935546875, 24.22119140625, 25.048828125, 25.87646484375, 26.7041015625, 27.53173828125, 28.359375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 7.0, 12.0, 11.0, 25.0, 31.0, 36.0, 71.0, 59.0, 118.0, 228.0, 380.0, 701.0, 1265.0, 2395.0, 4977.0, 11509.0, 31392.0, 130552.0, 1744004.0, 2063849.0, 145910.0, 33916.0, 11978.0, 5285.0, 2528.0, 1280.0, 705.0, 393.0, 243.0, 138.0, 89.0, 56.0, 32.0, 36.0, 17.0, 16.0, 8.0, 6.0, 5.0, 8.0, 4.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.84375, -32.787109375, -31.73046875, -30.673828125, -29.6171875, -28.560546875, -27.50390625, -26.447265625, -25.390625, -24.333984375, -23.27734375, -22.220703125, -21.1640625, -20.107421875, -19.05078125, -17.994140625, -16.9375, -15.880859375, -14.82421875, -13.767578125, -12.7109375, -11.654296875, -10.59765625, -9.541015625, -8.484375, -7.427734375, -6.37109375, -5.314453125, -4.2578125, -3.201171875, -2.14453125, -1.087890625, -0.03125, 1.025390625, 2.08203125, 3.138671875, 4.1953125, 5.251953125, 6.30859375, 7.365234375, 8.421875, 9.478515625, 10.53515625, 11.591796875, 12.6484375, 13.705078125, 14.76171875, 15.818359375, 16.875, 17.931640625, 18.98828125, 20.044921875, 21.1015625, 22.158203125, 23.21484375, 24.271484375, 25.328125, 26.384765625, 27.44140625, 28.498046875, 29.5546875, 30.611328125, 31.66796875, 32.724609375, 33.78125]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 4.0, 14.0, 39.0, 92.0, 238.0, 326.0, 186.0, 68.0, 27.0, 10.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.39427185058594, -103.94099426269531, -95.48771667480469, -87.03443908691406, -78.58116149902344, -70.12788391113281, -61.67461395263672, -53.221336364746094, -44.76805877685547, -36.314781188964844, -27.86150550842285, -19.40822982788086, -10.954952239990234, -2.5016746520996094, 5.95159912109375, 14.404876708984375, 22.858154296875, 31.311431884765625, 39.76470947265625, 48.21798324584961, 56.671260833740234, 65.12454223632812, 73.57781219482422, 82.03108978271484, 90.48436737060547, 98.9376449584961, 107.39092254638672, 115.84419250488281, 124.29747009277344, 132.75074768066406, 141.2040252685547, 149.6573028564453, 158.110595703125, 166.56387329101562, 175.01715087890625, 183.47042846679688, 191.9237060546875, 200.37698364257812, 208.83026123046875, 217.28353881835938, 225.73681640625, 234.19009399414062, 242.64337158203125, 251.09664916992188, 259.5499267578125, 268.0032043457031, 276.45648193359375, 284.9097595214844, 293.363037109375, 301.8163146972656, 310.26959228515625, 318.7228698730469, 327.1761474609375, 335.6294250488281, 344.08270263671875, 352.5359802246094, 360.9892272949219, 369.4425048828125, 377.8957824707031, 386.34906005859375, 394.8023376464844, 403.255615234375, 411.7088928222656, 420.16217041015625, 428.6154479980469]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 13.0, 9.0, 8.0, 15.0, 11.0, 15.0, 13.0, 15.0, 16.0, 22.0, 26.0, 27.0, 42.0, 40.0, 36.0, 59.0, 43.0, 42.0, 37.0, 28.0, 45.0, 38.0, 37.0, 40.0, 40.0, 32.0, 24.0, 23.0, 27.0, 23.0, 21.0, 15.0, 22.0, 8.0, 17.0, 15.0, 11.0, 8.0, 4.0, 10.0, 4.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0], "bins": [-81.27159881591797, -78.85063171386719, -76.4296646118164, -74.00869750976562, -71.58773040771484, -69.16676330566406, -66.74579620361328, -64.3248291015625, -61.90386199951172, -59.48289489746094, -57.061927795410156, -54.640960693359375, -52.219993591308594, -49.79902648925781, -47.37805938720703, -44.95709228515625, -42.53612518310547, -40.11515808105469, -37.694190979003906, -35.273223876953125, -32.852256774902344, -30.431289672851562, -28.01032257080078, -25.58935546875, -23.16838836669922, -20.747421264648438, -18.326454162597656, -15.905487060546875, -13.484519958496094, -11.063552856445312, -8.642585754394531, -6.22161865234375, -3.8006591796875, -1.3796920776367188, 1.0412750244140625, 3.4622421264648438, 5.883209228515625, 8.304176330566406, 10.725143432617188, 13.146110534667969, 15.56707763671875, 17.98804473876953, 20.409011840820312, 22.829978942871094, 25.250946044921875, 27.671913146972656, 30.092880249023438, 32.51384735107422, 34.934814453125, 37.35578155517578, 39.77674865722656, 42.197715759277344, 44.618682861328125, 47.039649963378906, 49.46061706542969, 51.88158416748047, 54.30255126953125, 56.72351837158203, 59.14448547363281, 61.565452575683594, 63.986419677734375, 66.40738677978516, 68.82835388183594, 71.24932098388672, 73.6702880859375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 5.0, 3.0, 10.0, 5.0, 13.0, 10.0, 22.0, 19.0, 9.0, 34.0, 26.0, 30.0, 31.0, 31.0, 39.0, 47.0, 49.0, 52.0, 42.0, 54.0, 51.0, 57.0, 47.0, 38.0, 43.0, 33.0, 25.0, 35.0, 22.0, 22.0, 17.0, 15.0, 9.0, 7.0, 7.0, 11.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.291748046875, -9.95068359375, -9.609619140625, -9.2685546875, -8.927490234375, -8.58642578125, -8.245361328125, -7.904296875, -7.563232421875, -7.22216796875, -6.881103515625, -6.5400390625, -6.198974609375, -5.85791015625, -5.516845703125, -5.17578125, -4.834716796875, -4.49365234375, -4.152587890625, -3.8115234375, -3.470458984375, -3.12939453125, -2.788330078125, -2.447265625, -2.106201171875, -1.76513671875, -1.424072265625, -1.0830078125, -0.741943359375, -0.40087890625, -0.059814453125, 0.28125, 0.622314453125, 0.96337890625, 1.304443359375, 1.6455078125, 1.986572265625, 2.32763671875, 2.668701171875, 3.009765625, 3.350830078125, 3.69189453125, 4.032958984375, 4.3740234375, 4.715087890625, 5.05615234375, 5.397216796875, 5.73828125, 6.079345703125, 6.42041015625, 6.761474609375, 7.1025390625, 7.443603515625, 7.78466796875, 8.125732421875, 8.466796875, 8.807861328125, 9.14892578125, 9.489990234375, 9.8310546875, 10.172119140625, 10.51318359375, 10.854248046875, 11.1953125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 6.0, 5.0, 5.0, 16.0, 13.0, 19.0, 33.0, 49.0, 78.0, 123.0, 141.0, 261.0, 324.0, 447.0, 664.0, 1081.0, 1525.0, 2186.0, 3410.0, 5137.0, 8130.0, 12706.0, 20750.0, 34848.0, 60252.0, 106765.0, 177581.0, 221964.0, 160500.0, 93472.0, 53665.0, 30789.0, 18759.0, 11553.0, 7221.0, 4651.0, 3023.0, 2059.0, 1446.0, 932.0, 613.0, 420.0, 291.0, 206.0, 135.0, 85.0, 77.0, 45.0, 35.0, 26.0, 18.0, 7.0, 5.0, 7.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-1.400390625, -1.35577392578125, -1.3111572265625, -1.26654052734375, -1.221923828125, -1.17730712890625, -1.1326904296875, -1.08807373046875, -1.04345703125, -0.99884033203125, -0.9542236328125, -0.90960693359375, -0.864990234375, -0.82037353515625, -0.7757568359375, -0.73114013671875, -0.6865234375, -0.64190673828125, -0.5972900390625, -0.55267333984375, -0.508056640625, -0.46343994140625, -0.4188232421875, -0.37420654296875, -0.32958984375, -0.28497314453125, -0.2403564453125, -0.19573974609375, -0.151123046875, -0.10650634765625, -0.0618896484375, -0.01727294921875, 0.02734375, 0.07196044921875, 0.1165771484375, 0.16119384765625, 0.205810546875, 0.25042724609375, 0.2950439453125, 0.33966064453125, 0.38427734375, 0.42889404296875, 0.4735107421875, 0.51812744140625, 0.562744140625, 0.60736083984375, 0.6519775390625, 0.69659423828125, 0.7412109375, 0.78582763671875, 0.8304443359375, 0.87506103515625, 0.919677734375, 0.96429443359375, 1.0089111328125, 1.05352783203125, 1.09814453125, 1.14276123046875, 1.1873779296875, 1.23199462890625, 1.276611328125, 1.32122802734375, 1.3658447265625, 1.41046142578125, 1.455078125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 9.0, 3.0, 4.0, 12.0, 8.0, 15.0, 7.0, 28.0, 15.0, 24.0, 14.0, 24.0, 26.0, 28.0, 30.0, 36.0, 20.0, 32.0, 32.0, 44.0, 38.0, 35.0, 1062.0, 35.0, 44.0, 42.0, 40.0, 21.0, 44.0, 26.0, 21.0, 30.0, 25.0, 17.0, 19.0, 9.0, 15.0, 14.0, 13.0, 13.0, 12.0, 10.0, 6.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.2421875, -5.068603515625, -4.89501953125, -4.721435546875, -4.5478515625, -4.374267578125, -4.20068359375, -4.027099609375, -3.853515625, -3.679931640625, -3.50634765625, -3.332763671875, -3.1591796875, -2.985595703125, -2.81201171875, -2.638427734375, -2.46484375, -2.291259765625, -2.11767578125, -1.944091796875, -1.7705078125, -1.596923828125, -1.42333984375, -1.249755859375, -1.076171875, -0.902587890625, -0.72900390625, -0.555419921875, -0.3818359375, -0.208251953125, -0.03466796875, 0.138916015625, 0.3125, 0.486083984375, 0.65966796875, 0.833251953125, 1.0068359375, 1.180419921875, 1.35400390625, 1.527587890625, 1.701171875, 1.874755859375, 2.04833984375, 2.221923828125, 2.3955078125, 2.569091796875, 2.74267578125, 2.916259765625, 3.08984375, 3.263427734375, 3.43701171875, 3.610595703125, 3.7841796875, 3.957763671875, 4.13134765625, 4.304931640625, 4.478515625, 4.652099609375, 4.82568359375, 4.999267578125, 5.1728515625, 5.346435546875, 5.52001953125, 5.693603515625, 5.8671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 6.0, 13.0, 17.0, 26.0, 38.0, 53.0, 80.0, 117.0, 175.0, 245.0, 350.0, 546.0, 833.0, 1133.0, 1710.0, 2665.0, 3997.0, 6266.0, 9328.0, 14682.0, 23558.0, 38428.0, 64266.0, 106372.0, 167493.0, 1250008.0, 154798.0, 96498.0, 58432.0, 35348.0, 21287.0, 13352.0, 8643.0, 5403.0, 3800.0, 2292.0, 1647.0, 1062.0, 683.0, 463.0, 310.0, 238.0, 158.0, 78.0, 87.0, 46.0, 35.0, 27.0, 15.0, 12.0, 9.0, 3.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.8486328125, -0.8232269287109375, -0.797821044921875, -0.7724151611328125, -0.74700927734375, -0.7216033935546875, -0.696197509765625, -0.6707916259765625, -0.6453857421875, -0.6199798583984375, -0.594573974609375, -0.5691680908203125, -0.54376220703125, -0.5183563232421875, -0.492950439453125, -0.4675445556640625, -0.442138671875, -0.4167327880859375, -0.391326904296875, -0.3659210205078125, -0.34051513671875, -0.3151092529296875, -0.289703369140625, -0.2642974853515625, -0.2388916015625, -0.2134857177734375, -0.188079833984375, -0.1626739501953125, -0.13726806640625, -0.1118621826171875, -0.086456298828125, -0.0610504150390625, -0.03564453125, -0.0102386474609375, 0.015167236328125, 0.0405731201171875, 0.06597900390625, 0.0913848876953125, 0.116790771484375, 0.1421966552734375, 0.1676025390625, 0.1930084228515625, 0.218414306640625, 0.2438201904296875, 0.26922607421875, 0.2946319580078125, 0.320037841796875, 0.3454437255859375, 0.370849609375, 0.3962554931640625, 0.421661376953125, 0.4470672607421875, 0.47247314453125, 0.4978790283203125, 0.523284912109375, 0.5486907958984375, 0.5740966796875, 0.5995025634765625, 0.624908447265625, 0.6503143310546875, 0.67572021484375, 0.7011260986328125, 0.726531982421875, 0.7519378662109375, 0.77734375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 10.0, 11.0, 1.0, 11.0, 8.0, 8.0, 11.0, 16.0, 14.0, 27.0, 28.0, 24.0, 38.0, 54.0, 44.0, 69.0, 103.0, 97.0, 74.0, 71.0, 49.0, 45.0, 31.0, 34.0, 18.0, 15.0, 13.0, 7.0, 7.0, 13.0, 6.0, 6.0, 6.0, 5.0, 6.0, 4.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.01247406005859375, -0.012099504470825195, -0.01172494888305664, -0.011350393295288086, -0.010975837707519531, -0.010601282119750977, -0.010226726531982422, -0.009852170944213867, -0.009477615356445312, -0.009103059768676758, -0.008728504180908203, -0.008353948593139648, -0.007979393005371094, -0.007604837417602539, -0.007230281829833984, -0.00685572624206543, -0.006481170654296875, -0.00610661506652832, -0.005732059478759766, -0.005357503890991211, -0.004982948303222656, -0.0046083927154541016, -0.004233837127685547, -0.003859281539916992, -0.0034847259521484375, -0.003110170364379883, -0.002735614776611328, -0.0023610591888427734, -0.0019865036010742188, -0.001611948013305664, -0.0012373924255371094, -0.0008628368377685547, -0.00048828125, -0.00011372566223144531, 0.0002608299255371094, 0.0006353855133056641, 0.0010099411010742188, 0.0013844966888427734, 0.0017590522766113281, 0.002133607864379883, 0.0025081634521484375, 0.002882719039916992, 0.003257274627685547, 0.0036318302154541016, 0.004006385803222656, 0.004380941390991211, 0.004755496978759766, 0.00513005256652832, 0.005504608154296875, 0.00587916374206543, 0.006253719329833984, 0.006628274917602539, 0.007002830505371094, 0.0073773860931396484, 0.007751941680908203, 0.008126497268676758, 0.008501052856445312, 0.008875608444213867, 0.009250164031982422, 0.009624719619750977, 0.009999275207519531, 0.010373830795288086, 0.01074838638305664, 0.011122941970825195, 0.01149749755859375]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 9.0, 12.0, 19.0, 15.0, 20.0, 42.0, 53.0, 65.0, 82.0, 123.0, 205.0, 320.0, 981.0, 17788.0, 989723.0, 36567.0, 1465.0, 350.0, 183.0, 149.0, 102.0, 57.0, 43.0, 36.0, 23.0, 24.0, 16.0, 19.0, 10.0, 8.0, 7.0, 3.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2275390625, -0.2198486328125, -0.212158203125, -0.2044677734375, -0.19677734375, -0.1890869140625, -0.181396484375, -0.1737060546875, -0.166015625, -0.1583251953125, -0.150634765625, -0.1429443359375, -0.13525390625, -0.1275634765625, -0.119873046875, -0.1121826171875, -0.1044921875, -0.0968017578125, -0.089111328125, -0.0814208984375, -0.07373046875, -0.0660400390625, -0.058349609375, -0.0506591796875, -0.04296875, -0.0352783203125, -0.027587890625, -0.0198974609375, -0.01220703125, -0.0045166015625, 0.003173828125, 0.0108642578125, 0.0185546875, 0.0262451171875, 0.033935546875, 0.0416259765625, 0.04931640625, 0.0570068359375, 0.064697265625, 0.0723876953125, 0.080078125, 0.0877685546875, 0.095458984375, 0.1031494140625, 0.11083984375, 0.1185302734375, 0.126220703125, 0.1339111328125, 0.1416015625, 0.1492919921875, 0.156982421875, 0.1646728515625, 0.17236328125, 0.1800537109375, 0.187744140625, 0.1954345703125, 0.203125, 0.2108154296875, 0.218505859375, 0.2261962890625, 0.23388671875, 0.2415771484375, 0.249267578125, 0.2569580078125, 0.2646484375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 25.0, 248.0, 595.0, 125.0, 16.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.13521601259708405, -0.1322910189628601, -0.12936602532863617, -0.12644103169441223, -0.12351604551076889, -0.12059105187654495, -0.11766606569290161, -0.11474107205867767, -0.11181607842445374, -0.1088910847902298, -0.10596609860658646, -0.10304110497236252, -0.10011611133813858, -0.09719111770391464, -0.0942661315202713, -0.09134113788604736, -0.08841614425182343, -0.08549115061759949, -0.08256616443395615, -0.07964117079973221, -0.07671617716550827, -0.07379118353128433, -0.07086619734764099, -0.06794120371341705, -0.06501621752977371, -0.06209122762084007, -0.059166233986616135, -0.056241244077682495, -0.05331625044345856, -0.05039126053452492, -0.04746627062559128, -0.04454127699136734, -0.041616279631853104, -0.038691289722919464, -0.035766296088695526, -0.03284130617976189, -0.02991631254553795, -0.02699132263660431, -0.02406633086502552, -0.02114133909344673, -0.018216347321867943, -0.015291355550289154, -0.012366363778710365, -0.009441372938454151, -0.006516381166875362, -0.0035913893952965736, -0.0006663985550403595, 0.0022585932165384293, 0.005183584988117218, 0.008108576759696007, 0.011033568531274796, 0.01395855937153101, 0.016883552074432373, 0.019808541983366013, 0.0227335337549448, 0.02565852552652359, 0.02858351729810238, 0.03150850906968117, 0.03443349897861481, 0.037358492612838745, 0.040283482521772385, 0.04320847615599632, 0.04613346606492996, 0.0490584596991539, 0.05198344960808754]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 8.0, 8.0, 9.0, 7.0, 14.0, 14.0, 13.0, 15.0, 23.0, 24.0, 28.0, 40.0, 34.0, 42.0, 21.0, 44.0, 45.0, 41.0, 52.0, 39.0, 48.0, 59.0, 33.0, 42.0, 43.0, 32.0, 31.0, 29.0, 22.0, 25.0, 16.0, 21.0, 15.0, 16.0, 11.0, 11.0, 11.0, 5.0, 5.0, 8.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0074086785316467285, -0.007179425098001957, -0.006950171664357185, -0.006720918230712414, -0.006491664797067642, -0.006262411363422871, -0.006033157929778099, -0.0058039044961333275, -0.005574651062488556, -0.005345397628843784, -0.005116144195199013, -0.004886890761554241, -0.00465763732790947, -0.004428383894264698, -0.0041991304606199265, -0.003969877026975155, -0.0037406235933303833, -0.0035113701596856117, -0.00328211672604084, -0.0030528632923960686, -0.002823609858751297, -0.0025943564251065254, -0.002365102991461754, -0.0021358495578169823, -0.0019065961241722107, -0.0016773426905274391, -0.0014480892568826675, -0.001218835823237896, -0.0009895823895931244, -0.0007603289559483528, -0.0005310755223035812, -0.00030182208865880966, -7.256865501403809e-05, 0.0001566847786307335, 0.00038593821227550507, 0.0006151916459202766, 0.0008444450795650482, 0.0010736985132098198, 0.0013029519468545914, 0.001532205380499363, 0.0017614588141441345, 0.001990712247788906, 0.0022199656814336777, 0.0024492191150784492, 0.002678472548723221, 0.0029077259823679924, 0.003136979416012764, 0.0033662328496575356, 0.003595486283302307, 0.0038247397169470787, 0.00405399315059185, 0.004283246584236622, 0.004512500017881393, 0.004741753451526165, 0.004971006885170937, 0.005200260318815708, 0.00542951375246048, 0.005658767186105251, 0.005888020619750023, 0.0061172740533947945, 0.006346527487039566, 0.006575780920684338, 0.006805034354329109, 0.007034287787973881, 0.007263541221618652]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 2.0, 5.0, 3.0, 10.0, 5.0, 13.0, 10.0, 22.0, 18.0, 10.0, 33.0, 26.0, 31.0, 31.0, 31.0, 38.0, 48.0, 49.0, 51.0, 43.0, 54.0, 51.0, 56.0, 48.0, 38.0, 43.0, 33.0, 25.0, 35.0, 22.0, 22.0, 17.0, 15.0, 9.0, 7.0, 7.0, 11.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.6328125, -10.2918701171875, -9.950927734375, -9.6099853515625, -9.26904296875, -8.9281005859375, -8.587158203125, -8.2462158203125, -7.9052734375, -7.5643310546875, -7.223388671875, -6.8824462890625, -6.54150390625, -6.2005615234375, -5.859619140625, -5.5186767578125, -5.177734375, -4.8367919921875, -4.495849609375, -4.1549072265625, -3.81396484375, -3.4730224609375, -3.132080078125, -2.7911376953125, -2.4501953125, -2.1092529296875, -1.768310546875, -1.4273681640625, -1.08642578125, -0.7454833984375, -0.404541015625, -0.0635986328125, 0.27734375, 0.6182861328125, 0.959228515625, 1.3001708984375, 1.64111328125, 1.9820556640625, 2.322998046875, 2.6639404296875, 3.0048828125, 3.3458251953125, 3.686767578125, 4.0277099609375, 4.36865234375, 4.7095947265625, 5.050537109375, 5.3914794921875, 5.732421875, 6.0733642578125, 6.414306640625, 6.7552490234375, 7.09619140625, 7.4371337890625, 7.778076171875, 8.1190185546875, 8.4599609375, 8.8009033203125, 9.141845703125, 9.4827880859375, 9.82373046875, 10.1646728515625, 10.505615234375, 10.8465576171875, 11.1875]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [4.0, 2.0, 3.0, 5.0, 6.0, 3.0, 4.0, 1.0, 7.0, 7.0, 12.0, 23.0, 28.0, 36.0, 39.0, 48.0, 66.0, 113.0, 138.0, 210.0, 236.0, 356.0, 522.0, 730.0, 1045.0, 1615.0, 2536.0, 3978.0, 6383.0, 11465.0, 21668.0, 49421.0, 195198.0, 589794.0, 90840.0, 32837.0, 15684.0, 8782.0, 5080.0, 3160.0, 1953.0, 1376.0, 857.0, 632.0, 438.0, 315.0, 238.0, 179.0, 133.0, 89.0, 61.0, 42.0, 44.0, 31.0, 26.0, 20.0, 14.0, 10.0, 8.0, 11.0, 7.0, 4.0, 1.0, 2.0], "bins": [-19.46875, -18.883544921875, -18.29833984375, -17.713134765625, -17.1279296875, -16.542724609375, -15.95751953125, -15.372314453125, -14.787109375, -14.201904296875, -13.61669921875, -13.031494140625, -12.4462890625, -11.861083984375, -11.27587890625, -10.690673828125, -10.10546875, -9.520263671875, -8.93505859375, -8.349853515625, -7.7646484375, -7.179443359375, -6.59423828125, -6.009033203125, -5.423828125, -4.838623046875, -4.25341796875, -3.668212890625, -3.0830078125, -2.497802734375, -1.91259765625, -1.327392578125, -0.7421875, -0.156982421875, 0.42822265625, 1.013427734375, 1.5986328125, 2.183837890625, 2.76904296875, 3.354248046875, 3.939453125, 4.524658203125, 5.10986328125, 5.695068359375, 6.2802734375, 6.865478515625, 7.45068359375, 8.035888671875, 8.62109375, 9.206298828125, 9.79150390625, 10.376708984375, 10.9619140625, 11.547119140625, 12.13232421875, 12.717529296875, 13.302734375, 13.887939453125, 14.47314453125, 15.058349609375, 15.6435546875, 16.228759765625, 16.81396484375, 17.399169921875, 17.984375]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 3.0, 2.0, 2.0, 5.0, 2.0, 6.0, 3.0, 10.0, 6.0, 9.0, 10.0, 14.0, 24.0, 21.0, 22.0, 16.0, 18.0, 37.0, 40.0, 46.0, 55.0, 63.0, 85.0, 150.0, 1478.0, 344.0, 122.0, 89.0, 63.0, 31.0, 41.0, 35.0, 29.0, 27.0, 25.0, 20.0, 26.0, 12.0, 8.0, 16.0, 4.0, 6.0, 15.0, 7.0, 0.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.78125, -33.65576171875, -32.5302734375, -31.40478515625, -30.279296875, -29.15380859375, -28.0283203125, -26.90283203125, -25.77734375, -24.65185546875, -23.5263671875, -22.40087890625, -21.275390625, -20.14990234375, -19.0244140625, -17.89892578125, -16.7734375, -15.64794921875, -14.5224609375, -13.39697265625, -12.271484375, -11.14599609375, -10.0205078125, -8.89501953125, -7.76953125, -6.64404296875, -5.5185546875, -4.39306640625, -3.267578125, -2.14208984375, -1.0166015625, 0.10888671875, 1.234375, 2.35986328125, 3.4853515625, 4.61083984375, 5.736328125, 6.86181640625, 7.9873046875, 9.11279296875, 10.23828125, 11.36376953125, 12.4892578125, 13.61474609375, 14.740234375, 15.86572265625, 16.9912109375, 18.11669921875, 19.2421875, 20.36767578125, 21.4931640625, 22.61865234375, 23.744140625, 24.86962890625, 25.9951171875, 27.12060546875, 28.24609375, 29.37158203125, 30.4970703125, 31.62255859375, 32.748046875, 33.87353515625, 34.9990234375, 36.12451171875, 37.25]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 4.0, 6.0, 6.0, 9.0, 11.0, 9.0, 18.0, 20.0, 23.0, 36.0, 52.0, 60.0, 73.0, 115.0, 173.0, 385.0, 1368.0, 6561.0, 59855.0, 2935590.0, 128125.0, 10068.0, 1914.0, 492.0, 268.0, 129.0, 81.0, 58.0, 42.0, 36.0, 28.0, 15.0, 15.0, 14.0, 11.0, 7.0, 11.0, 7.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-77.75, -75.50390625, -73.2578125, -71.01171875, -68.765625, -66.51953125, -64.2734375, -62.02734375, -59.78125, -57.53515625, -55.2890625, -53.04296875, -50.796875, -48.55078125, -46.3046875, -44.05859375, -41.8125, -39.56640625, -37.3203125, -35.07421875, -32.828125, -30.58203125, -28.3359375, -26.08984375, -23.84375, -21.59765625, -19.3515625, -17.10546875, -14.859375, -12.61328125, -10.3671875, -8.12109375, -5.875, -3.62890625, -1.3828125, 0.86328125, 3.109375, 5.35546875, 7.6015625, 9.84765625, 12.09375, 14.33984375, 16.5859375, 18.83203125, 21.078125, 23.32421875, 25.5703125, 27.81640625, 30.0625, 32.30859375, 34.5546875, 36.80078125, 39.046875, 41.29296875, 43.5390625, 45.78515625, 48.03125, 50.27734375, 52.5234375, 54.76953125, 57.015625, 59.26171875, 61.5078125, 63.75390625, 66.0]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 14.0, 73.0, 266.0, 384.0, 186.0, 67.0, 14.0, 7.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-368.6368408203125, -361.59356689453125, -354.55029296875, -347.5070495605469, -340.4637756347656, -333.4205017089844, -326.3772277832031, -319.333984375, -312.29071044921875, -305.2474365234375, -298.20416259765625, -291.1609191894531, -284.1176452636719, -277.0743713378906, -270.0310974121094, -262.98785400390625, -255.94456481933594, -248.9012908935547, -241.8580322265625, -234.81475830078125, -227.77149963378906, -220.7282257080078, -213.68496704101562, -206.64169311523438, -199.59841918945312, -192.55514526367188, -185.5118865966797, -178.46861267089844, -171.42535400390625, -164.382080078125, -157.33880615234375, -150.29554748535156, -143.25228881835938, -136.20901489257812, -129.16575622558594, -122.12248229980469, -115.0792236328125, -108.03594970703125, -100.99268341064453, -93.94941711425781, -86.90615844726562, -79.8628921508789, -72.81962585449219, -65.77635192871094, -58.733089447021484, -51.689823150634766, -44.64655303955078, -37.60328674316406, -30.560020446777344, -23.516754150390625, -16.473485946655273, -9.430217742919922, -2.386951446533203, 4.656314849853516, 11.6995849609375, 18.74285125732422, 25.786117553710938, 32.829383850097656, 39.872650146484375, 46.91592025756836, 53.95918655395508, 61.0024528503418, 68.04572296142578, 75.0889892578125, 82.13225555419922]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 2.0, 7.0, 5.0, 13.0, 11.0, 12.0, 13.0, 20.0, 11.0, 23.0, 12.0, 27.0, 38.0, 25.0, 33.0, 43.0, 30.0, 37.0, 34.0, 40.0, 48.0, 47.0, 48.0, 35.0, 27.0, 31.0, 38.0, 38.0, 28.0, 31.0, 29.0, 30.0, 30.0, 22.0, 13.0, 18.0, 12.0, 9.0, 9.0, 7.0, 5.0, 4.0, 1.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.90230560302734, -93.67972564697266, -90.45713806152344, -87.23455810546875, -84.01197814941406, -80.78939819335938, -77.56681823730469, -74.34423065185547, -71.12165069580078, -67.8990707397461, -64.67648315429688, -61.45390319824219, -58.2313232421875, -55.00874328613281, -51.78615951538086, -48.563575744628906, -45.34099578857422, -42.11841583251953, -38.89583206176758, -35.673248291015625, -32.45066833496094, -29.228086471557617, -26.005504608154297, -22.782922744750977, -19.560340881347656, -16.337759017944336, -13.115177154541016, -9.892595291137695, -6.670013427734375, -3.4474315643310547, -0.22484970092773438, 2.997732162475586, 6.2203216552734375, 9.442903518676758, 12.665485382080078, 15.888067245483398, 19.11064910888672, 22.33323097229004, 25.55581283569336, 28.77839469909668, 32.0009765625, 35.22355651855469, 38.44614028930664, 41.668724060058594, 44.89130401611328, 48.11388397216797, 51.33646774291992, 54.559051513671875, 57.78163146972656, 61.00421142578125, 64.22679138183594, 67.44937896728516, 70.67195892333984, 73.89453887939453, 77.11712646484375, 80.33970642089844, 83.56228637695312, 86.78486633300781, 90.0074462890625, 93.23003387451172, 96.4526138305664, 99.6751937866211, 102.89778137207031, 106.120361328125, 109.34294128417969]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 4.0, 3.0, 5.0, 5.0, 2.0, 8.0, 12.0, 10.0, 18.0, 17.0, 26.0, 21.0, 28.0, 37.0, 35.0, 33.0, 54.0, 37.0, 45.0, 54.0, 50.0, 53.0, 55.0, 53.0, 47.0, 42.0, 35.0, 47.0, 28.0, 24.0, 17.0, 26.0, 14.0, 9.0, 7.0, 9.0, 11.0, 11.0, 6.0, 4.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.640625, -11.26416015625, -10.8876953125, -10.51123046875, -10.134765625, -9.75830078125, -9.3818359375, -9.00537109375, -8.62890625, -8.25244140625, -7.8759765625, -7.49951171875, -7.123046875, -6.74658203125, -6.3701171875, -5.99365234375, -5.6171875, -5.24072265625, -4.8642578125, -4.48779296875, -4.111328125, -3.73486328125, -3.3583984375, -2.98193359375, -2.60546875, -2.22900390625, -1.8525390625, -1.47607421875, -1.099609375, -0.72314453125, -0.3466796875, 0.02978515625, 0.40625, 0.78271484375, 1.1591796875, 1.53564453125, 1.912109375, 2.28857421875, 2.6650390625, 3.04150390625, 3.41796875, 3.79443359375, 4.1708984375, 4.54736328125, 4.923828125, 5.30029296875, 5.6767578125, 6.05322265625, 6.4296875, 6.80615234375, 7.1826171875, 7.55908203125, 7.935546875, 8.31201171875, 8.6884765625, 9.06494140625, 9.44140625, 9.81787109375, 10.1943359375, 10.57080078125, 10.947265625, 11.32373046875, 11.7001953125, 12.07666015625, 12.453125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 6.0, 11.0, 9.0, 14.0, 14.0, 28.0, 36.0, 56.0, 68.0, 93.0, 108.0, 165.0, 234.0, 319.0, 417.0, 573.0, 853.0, 1301.0, 1895.0, 2904.0, 4708.0, 8461.0, 18414.0, 65945.0, 437932.0, 2315248.0, 1121977.0, 155314.0, 29889.0, 11277.0, 5809.0, 3420.0, 2082.0, 1385.0, 942.0, 658.0, 425.0, 350.0, 261.0, 181.0, 110.0, 89.0, 83.0, 58.0, 43.0, 29.0, 27.0, 20.0, 15.0, 11.0, 9.0, 8.0, 5.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.734375, -17.137939453125, -16.54150390625, -15.945068359375, -15.3486328125, -14.752197265625, -14.15576171875, -13.559326171875, -12.962890625, -12.366455078125, -11.77001953125, -11.173583984375, -10.5771484375, -9.980712890625, -9.38427734375, -8.787841796875, -8.19140625, -7.594970703125, -6.99853515625, -6.402099609375, -5.8056640625, -5.209228515625, -4.61279296875, -4.016357421875, -3.419921875, -2.823486328125, -2.22705078125, -1.630615234375, -1.0341796875, -0.437744140625, 0.15869140625, 0.755126953125, 1.3515625, 1.947998046875, 2.54443359375, 3.140869140625, 3.7373046875, 4.333740234375, 4.93017578125, 5.526611328125, 6.123046875, 6.719482421875, 7.31591796875, 7.912353515625, 8.5087890625, 9.105224609375, 9.70166015625, 10.298095703125, 10.89453125, 11.490966796875, 12.08740234375, 12.683837890625, 13.2802734375, 13.876708984375, 14.47314453125, 15.069580078125, 15.666015625, 16.262451171875, 16.85888671875, 17.455322265625, 18.0517578125, 18.648193359375, 19.24462890625, 19.841064453125, 20.4375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 5.0, 3.0, 5.0, 3.0, 5.0, 7.0, 7.0, 6.0, 20.0, 19.0, 17.0, 29.0, 34.0, 59.0, 95.0, 134.0, 223.0, 332.0, 628.0, 720.0, 645.0, 388.0, 224.0, 134.0, 97.0, 58.0, 43.0, 30.0, 25.0, 19.0, 11.0, 16.0, 9.0, 7.0, 4.0, 8.0, 7.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.34375, -29.465576171875, -28.58740234375, -27.709228515625, -26.8310546875, -25.952880859375, -25.07470703125, -24.196533203125, -23.318359375, -22.440185546875, -21.56201171875, -20.683837890625, -19.8056640625, -18.927490234375, -18.04931640625, -17.171142578125, -16.29296875, -15.414794921875, -14.53662109375, -13.658447265625, -12.7802734375, -11.902099609375, -11.02392578125, -10.145751953125, -9.267578125, -8.389404296875, -7.51123046875, -6.633056640625, -5.7548828125, -4.876708984375, -3.99853515625, -3.120361328125, -2.2421875, -1.364013671875, -0.48583984375, 0.392333984375, 1.2705078125, 2.148681640625, 3.02685546875, 3.905029296875, 4.783203125, 5.661376953125, 6.53955078125, 7.417724609375, 8.2958984375, 9.174072265625, 10.05224609375, 10.930419921875, 11.80859375, 12.686767578125, 13.56494140625, 14.443115234375, 15.3212890625, 16.199462890625, 17.07763671875, 17.955810546875, 18.833984375, 19.712158203125, 20.59033203125, 21.468505859375, 22.3466796875, 23.224853515625, 24.10302734375, 24.981201171875, 25.859375]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 5.0, 1.0, 3.0, 6.0, 8.0, 16.0, 28.0, 31.0, 57.0, 59.0, 108.0, 148.0, 216.0, 405.0, 678.0, 1199.0, 2273.0, 4266.0, 8707.0, 19847.0, 55775.0, 258609.0, 2553017.0, 1093003.0, 131269.0, 36278.0, 14309.0, 6531.0, 3311.0, 1674.0, 975.0, 549.0, 348.0, 198.0, 123.0, 89.0, 53.0, 32.0, 26.0, 20.0, 11.0, 11.0, 6.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.84375, -26.93994140625, -26.0361328125, -25.13232421875, -24.228515625, -23.32470703125, -22.4208984375, -21.51708984375, -20.61328125, -19.70947265625, -18.8056640625, -17.90185546875, -16.998046875, -16.09423828125, -15.1904296875, -14.28662109375, -13.3828125, -12.47900390625, -11.5751953125, -10.67138671875, -9.767578125, -8.86376953125, -7.9599609375, -7.05615234375, -6.15234375, -5.24853515625, -4.3447265625, -3.44091796875, -2.537109375, -1.63330078125, -0.7294921875, 0.17431640625, 1.078125, 1.98193359375, 2.8857421875, 3.78955078125, 4.693359375, 5.59716796875, 6.5009765625, 7.40478515625, 8.30859375, 9.21240234375, 10.1162109375, 11.02001953125, 11.923828125, 12.82763671875, 13.7314453125, 14.63525390625, 15.5390625, 16.44287109375, 17.3466796875, 18.25048828125, 19.154296875, 20.05810546875, 20.9619140625, 21.86572265625, 22.76953125, 23.67333984375, 24.5771484375, 25.48095703125, 26.384765625, 27.28857421875, 28.1923828125, 29.09619140625, 30.0]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 9.0, 17.0, 39.0, 69.0, 142.0, 244.0, 242.0, 124.0, 64.0, 34.0, 13.0, 4.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-326.5813293457031, -320.16802978515625, -313.7547302246094, -307.3414306640625, -300.9281311035156, -294.51483154296875, -288.1015319824219, -281.688232421875, -275.2749328613281, -268.86163330078125, -262.4483337402344, -256.0350341796875, -249.62173461914062, -243.20843505859375, -236.79513549804688, -230.38185119628906, -223.96856689453125, -217.55526733398438, -211.1419677734375, -204.72866821289062, -198.31536865234375, -191.90206909179688, -185.48876953125, -179.0754852294922, -172.66217041015625, -166.24887084960938, -159.8355712890625, -153.42227172851562, -147.00897216796875, -140.59567260742188, -134.182373046875, -127.76908874511719, -121.35579681396484, -114.94249725341797, -108.5291976928711, -102.11590576171875, -95.70260620117188, -89.289306640625, -82.87600708007812, -76.46270751953125, -70.04940795898438, -63.6361083984375, -57.22281265258789, -50.809513092041016, -44.396217346191406, -37.98291778564453, -31.569618225097656, -25.156322479248047, -18.743026733398438, -12.329729080200195, -5.916430473327637, 0.4968681335449219, 6.910165786743164, 13.323463439941406, 19.73676300048828, 26.15005874633789, 32.563358306884766, 38.97665786743164, 45.38995361328125, 51.803253173828125, 58.216552734375, 64.62985229492188, 71.04315185546875, 77.4564437866211, 83.86974334716797]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 2.0, 8.0, 6.0, 8.0, 11.0, 16.0, 9.0, 18.0, 20.0, 19.0, 21.0, 23.0, 25.0, 29.0, 26.0, 40.0, 37.0, 35.0, 53.0, 51.0, 45.0, 39.0, 46.0, 43.0, 34.0, 37.0, 36.0, 29.0, 36.0, 28.0, 16.0, 24.0, 23.0, 21.0, 12.0, 10.0, 8.0, 14.0, 13.0, 5.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-73.432861328125, -71.07173919677734, -68.71062469482422, -66.34950256347656, -63.988380432128906, -61.627262115478516, -59.266143798828125, -56.90502166748047, -54.54390335083008, -52.18278503417969, -49.82166290283203, -47.46054458618164, -45.09942626953125, -42.738304138183594, -40.3771858215332, -38.01606750488281, -35.654945373535156, -33.293827056884766, -30.93270492553711, -28.57158660888672, -26.210466384887695, -23.849346160888672, -21.48822784423828, -19.127107620239258, -16.765987396240234, -14.404867172241211, -12.043747901916504, -9.682628631591797, -7.321508407592773, -4.96038818359375, -2.599268913269043, -0.23814964294433594, 2.1229705810546875, 4.484090328216553, 6.845210075378418, 9.206329345703125, 11.567449569702148, 13.928569793701172, 16.289688110351562, 18.650808334350586, 21.01192855834961, 23.373048782348633, 25.734169006347656, 28.095287322998047, 30.45640754699707, 32.817527770996094, 35.178646087646484, 37.539764404296875, 39.90088653564453, 42.26200485229492, 44.62312698364258, 46.98424530029297, 49.345367431640625, 51.706485748291016, 54.067604064941406, 56.42872619628906, 58.78984451293945, 61.150962829589844, 63.5120849609375, 65.87320709228516, 68.23432159423828, 70.59544372558594, 72.9565658569336, 75.31768035888672, 77.67880249023438]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 6.0, 12.0, 6.0, 11.0, 22.0, 28.0, 23.0, 31.0, 43.0, 39.0, 31.0, 49.0, 43.0, 52.0, 48.0, 64.0, 57.0, 56.0, 46.0, 39.0, 39.0, 37.0, 28.0, 32.0, 31.0, 23.0, 19.0, 14.0, 14.0, 10.0, 11.0, 11.0, 5.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.280029296875, -9.89599609375, -9.511962890625, -9.1279296875, -8.743896484375, -8.35986328125, -7.975830078125, -7.591796875, -7.207763671875, -6.82373046875, -6.439697265625, -6.0556640625, -5.671630859375, -5.28759765625, -4.903564453125, -4.51953125, -4.135498046875, -3.75146484375, -3.367431640625, -2.9833984375, -2.599365234375, -2.21533203125, -1.831298828125, -1.447265625, -1.063232421875, -0.67919921875, -0.295166015625, 0.0888671875, 0.472900390625, 0.85693359375, 1.240966796875, 1.625, 2.009033203125, 2.39306640625, 2.777099609375, 3.1611328125, 3.545166015625, 3.92919921875, 4.313232421875, 4.697265625, 5.081298828125, 5.46533203125, 5.849365234375, 6.2333984375, 6.617431640625, 7.00146484375, 7.385498046875, 7.76953125, 8.153564453125, 8.53759765625, 8.921630859375, 9.3056640625, 9.689697265625, 10.07373046875, 10.457763671875, 10.841796875, 11.225830078125, 11.60986328125, 11.993896484375, 12.3779296875, 12.761962890625, 13.14599609375, 13.530029296875, 13.9140625]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 2.0, 3.0, 12.0, 6.0, 19.0, 32.0, 32.0, 41.0, 63.0, 109.0, 193.0, 252.0, 356.0, 526.0, 767.0, 1202.0, 1837.0, 2849.0, 4349.0, 7026.0, 11473.0, 19069.0, 32395.0, 56542.0, 99919.0, 170593.0, 230651.0, 170168.0, 99281.0, 56376.0, 32433.0, 19086.0, 11342.0, 7010.0, 4313.0, 2822.0, 1776.0, 1172.0, 784.0, 529.0, 396.0, 267.0, 163.0, 109.0, 73.0, 41.0, 33.0, 20.0, 17.0, 18.0, 9.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.634765625, -1.5811614990234375, -1.527557373046875, -1.4739532470703125, -1.42034912109375, -1.3667449951171875, -1.313140869140625, -1.2595367431640625, -1.2059326171875, -1.1523284912109375, -1.098724365234375, -1.0451202392578125, -0.99151611328125, -0.9379119873046875, -0.884307861328125, -0.8307037353515625, -0.777099609375, -0.7234954833984375, -0.669891357421875, -0.6162872314453125, -0.56268310546875, -0.5090789794921875, -0.455474853515625, -0.4018707275390625, -0.3482666015625, -0.2946624755859375, -0.241058349609375, -0.1874542236328125, -0.13385009765625, -0.0802459716796875, -0.026641845703125, 0.0269622802734375, 0.08056640625, 0.1341705322265625, 0.187774658203125, 0.2413787841796875, 0.29498291015625, 0.3485870361328125, 0.402191162109375, 0.4557952880859375, 0.5093994140625, 0.5630035400390625, 0.616607666015625, 0.6702117919921875, 0.72381591796875, 0.7774200439453125, 0.831024169921875, 0.8846282958984375, 0.938232421875, 0.9918365478515625, 1.045440673828125, 1.0990447998046875, 1.15264892578125, 1.2062530517578125, 1.259857177734375, 1.3134613037109375, 1.3670654296875, 1.4206695556640625, 1.474273681640625, 1.5278778076171875, 1.58148193359375, 1.6350860595703125, 1.688690185546875, 1.7422943115234375, 1.7958984375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 4.0, 3.0, 6.0, 3.0, 11.0, 5.0, 7.0, 12.0, 11.0, 16.0, 14.0, 18.0, 16.0, 27.0, 28.0, 40.0, 39.0, 36.0, 42.0, 35.0, 34.0, 41.0, 35.0, 1058.0, 35.0, 36.0, 35.0, 30.0, 48.0, 28.0, 38.0, 27.0, 32.0, 30.0, 18.0, 19.0, 16.0, 20.0, 12.0, 16.0, 10.0, 11.0, 7.0, 5.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.69140625, -6.4918212890625, -6.292236328125, -6.0926513671875, -5.89306640625, -5.6934814453125, -5.493896484375, -5.2943115234375, -5.0947265625, -4.8951416015625, -4.695556640625, -4.4959716796875, -4.29638671875, -4.0968017578125, -3.897216796875, -3.6976318359375, -3.498046875, -3.2984619140625, -3.098876953125, -2.8992919921875, -2.69970703125, -2.5001220703125, -2.300537109375, -2.1009521484375, -1.9013671875, -1.7017822265625, -1.502197265625, -1.3026123046875, -1.10302734375, -0.9034423828125, -0.703857421875, -0.5042724609375, -0.3046875, -0.1051025390625, 0.094482421875, 0.2940673828125, 0.49365234375, 0.6932373046875, 0.892822265625, 1.0924072265625, 1.2919921875, 1.4915771484375, 1.691162109375, 1.8907470703125, 2.09033203125, 2.2899169921875, 2.489501953125, 2.6890869140625, 2.888671875, 3.0882568359375, 3.287841796875, 3.4874267578125, 3.68701171875, 3.8865966796875, 4.086181640625, 4.2857666015625, 4.4853515625, 4.6849365234375, 4.884521484375, 5.0841064453125, 5.28369140625, 5.4832763671875, 5.682861328125, 5.8824462890625, 6.08203125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 10.0, 17.0, 29.0, 33.0, 41.0, 85.0, 120.0, 194.0, 278.0, 403.0, 642.0, 1039.0, 1591.0, 2607.0, 4137.0, 6715.0, 10921.0, 18210.0, 29683.0, 50187.0, 84048.0, 137713.0, 1233394.0, 202355.0, 124209.0, 74867.0, 44609.0, 26636.0, 16153.0, 9844.0, 6025.0, 3853.0, 2333.0, 1487.0, 914.0, 604.0, 404.0, 256.0, 164.0, 108.0, 81.0, 38.0, 37.0, 22.0, 13.0, 8.0, 12.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.91748046875, -0.8877792358398438, -0.8580780029296875, -0.8283767700195312, -0.798675537109375, -0.7689743041992188, -0.7392730712890625, -0.7095718383789062, -0.67987060546875, -0.6501693725585938, -0.6204681396484375, -0.5907669067382812, -0.561065673828125, -0.5313644409179688, -0.5016632080078125, -0.47196197509765625, -0.4422607421875, -0.41255950927734375, -0.3828582763671875, -0.35315704345703125, -0.323455810546875, -0.29375457763671875, -0.2640533447265625, -0.23435211181640625, -0.20465087890625, -0.17494964599609375, -0.1452484130859375, -0.11554718017578125, -0.085845947265625, -0.05614471435546875, -0.0264434814453125, 0.00325775146484375, 0.032958984375, 0.06266021728515625, 0.0923614501953125, 0.12206268310546875, 0.151763916015625, 0.18146514892578125, 0.2111663818359375, 0.24086761474609375, 0.27056884765625, 0.30027008056640625, 0.3299713134765625, 0.35967254638671875, 0.389373779296875, 0.41907501220703125, 0.4487762451171875, 0.47847747802734375, 0.5081787109375, 0.5378799438476562, 0.5675811767578125, 0.5972824096679688, 0.626983642578125, 0.6566848754882812, 0.6863861083984375, 0.7160873413085938, 0.74578857421875, 0.7754898071289062, 0.8051910400390625, 0.8348922729492188, 0.864593505859375, 0.8942947387695312, 0.9239959716796875, 0.9536972045898438, 0.9833984375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 3.0, 7.0, 5.0, 5.0, 3.0, 15.0, 10.0, 12.0, 15.0, 8.0, 32.0, 28.0, 44.0, 56.0, 59.0, 78.0, 95.0, 83.0, 100.0, 82.0, 41.0, 51.0, 36.0, 26.0, 14.0, 14.0, 16.0, 9.0, 10.0, 18.0, 2.0, 4.0, 8.0, 7.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.01508331298828125, -0.014626264572143555, -0.01416921615600586, -0.013712167739868164, -0.013255119323730469, -0.012798070907592773, -0.012341022491455078, -0.011883974075317383, -0.011426925659179688, -0.010969877243041992, -0.010512828826904297, -0.010055780410766602, -0.009598731994628906, -0.009141683578491211, -0.008684635162353516, -0.00822758674621582, -0.007770538330078125, -0.00731348991394043, -0.006856441497802734, -0.006399393081665039, -0.005942344665527344, -0.0054852962493896484, -0.005028247833251953, -0.004571199417114258, -0.0041141510009765625, -0.003657102584838867, -0.003200054168701172, -0.0027430057525634766, -0.0022859573364257812, -0.001828908920288086, -0.0013718605041503906, -0.0009148120880126953, -0.000457763671875, -7.152557373046875e-07, 0.0004563331604003906, 0.0009133815765380859, 0.0013704299926757812, 0.0018274784088134766, 0.002284526824951172, 0.002741575241088867, 0.0031986236572265625, 0.003655672073364258, 0.004112720489501953, 0.0045697689056396484, 0.005026817321777344, 0.005483865737915039, 0.005940914154052734, 0.00639796257019043, 0.006855010986328125, 0.00731205940246582, 0.007769107818603516, 0.008226156234741211, 0.008683204650878906, 0.009140253067016602, 0.009597301483154297, 0.010054349899291992, 0.010511398315429688, 0.010968446731567383, 0.011425495147705078, 0.011882543563842773, 0.012339591979980469, 0.012796640396118164, 0.01325368881225586, 0.013710737228393555, 0.01416778564453125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 6.0, 12.0, 16.0, 14.0, 18.0, 20.0, 31.0, 40.0, 55.0, 84.0, 113.0, 160.0, 228.0, 472.0, 1412.0, 23985.0, 944489.0, 73329.0, 2556.0, 544.0, 305.0, 183.0, 123.0, 88.0, 66.0, 43.0, 28.0, 29.0, 22.0, 11.0, 9.0, 10.0, 6.0, 8.0, 4.0, 7.0, 5.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.24755859375, -0.2399730682373047, -0.23238754272460938, -0.22480201721191406, -0.21721649169921875, -0.20963096618652344, -0.20204544067382812, -0.1944599151611328, -0.1868743896484375, -0.1792888641357422, -0.17170333862304688, -0.16411781311035156, -0.15653228759765625, -0.14894676208496094, -0.14136123657226562, -0.1337757110595703, -0.126190185546875, -0.11860466003417969, -0.11101913452148438, -0.10343360900878906, -0.09584808349609375, -0.08826255798339844, -0.08067703247070312, -0.07309150695800781, -0.0655059814453125, -0.05792045593261719, -0.050334930419921875, -0.04274940490722656, -0.03516387939453125, -0.027578353881835938, -0.019992828369140625, -0.012407302856445312, -0.00482177734375, 0.0027637481689453125, 0.010349273681640625, 0.017934799194335938, 0.02552032470703125, 0.03310585021972656, 0.040691375732421875, 0.04827690124511719, 0.0558624267578125, 0.06344795227050781, 0.07103347778320312, 0.07861900329589844, 0.08620452880859375, 0.09379005432128906, 0.10137557983398438, 0.10896110534667969, 0.116546630859375, 0.12413215637207031, 0.13171768188476562, 0.13930320739746094, 0.14688873291015625, 0.15447425842285156, 0.16205978393554688, 0.1696453094482422, 0.1772308349609375, 0.1848163604736328, 0.19240188598632812, 0.19998741149902344, 0.20757293701171875, 0.21515846252441406, 0.22274398803710938, 0.2303295135498047, 0.2379150390625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 30.0, 60.0, 291.0, 429.0, 127.0, 44.0, 15.0, 12.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06344835460186005, -0.06029770150780678, -0.05714705213904381, -0.05399639904499054, -0.05084574595093727, -0.047695092856884, -0.04454444348812103, -0.041393790394067764, -0.038243137300014496, -0.03509248420596123, -0.03194183483719826, -0.02879118174314499, -0.02564052864909172, -0.0224898774176836, -0.019339226186275482, -0.016188573092222214, -0.013037923723459244, -0.00988727156072855, -0.0067366198636591434, -0.003585968166589737, -0.0004353160038590431, 0.0027153361588716507, 0.00586598739027977, 0.009016640484333038, 0.012167291715741158, 0.015317943878471851, 0.018468596041202545, 0.021619247272610664, 0.024769898504018784, 0.027920551598072052, 0.03107120282948017, 0.03422185778617859, 0.03737250715494156, 0.04052316024899483, 0.0436738096177578, 0.046824462711811066, 0.049975115805864334, 0.0531257688999176, 0.05627641826868057, 0.05942707136273384, 0.06257772445678711, 0.06572837382555008, 0.06887903064489365, 0.07202968001365662, 0.07518032938241959, 0.07833098620176315, 0.08148163557052612, 0.08463229238986969, 0.08778293430805206, 0.09093358367681503, 0.0940842404961586, 0.09723488986492157, 0.10038553923368454, 0.1035361960530281, 0.10668684542179108, 0.10983750224113464, 0.11298815160989761, 0.11613880097866058, 0.11928945779800415, 0.12244010716676712, 0.1255907565355301, 0.12874141335487366, 0.13189205527305603, 0.1350427120923996, 0.13819336891174316]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 5.0, 1.0, 6.0, 3.0, 3.0, 3.0, 8.0, 8.0, 9.0, 9.0, 5.0, 9.0, 12.0, 18.0, 28.0, 20.0, 25.0, 30.0, 29.0, 33.0, 32.0, 40.0, 40.0, 50.0, 54.0, 36.0, 46.0, 30.0, 43.0, 38.0, 39.0, 40.0, 30.0, 31.0, 32.0, 24.0, 22.0, 18.0, 11.0, 11.0, 13.0, 17.0, 15.0, 11.0, 10.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.008916795253753662, -0.00861247070133686, -0.00830814614892006, -0.008003821596503258, -0.007699497044086456, -0.007395172491669655, -0.007090847939252853, -0.006786523386836052, -0.0064821988344192505, -0.006177874282002449, -0.005873549729585648, -0.005569225177168846, -0.005264900624752045, -0.004960576072335243, -0.004656251519918442, -0.00435192696750164, -0.004047602415084839, -0.0037432778626680374, -0.003438953310251236, -0.0031346287578344345, -0.002830304205417633, -0.0025259796530008316, -0.00222165510058403, -0.0019173305481672287, -0.0016130059957504272, -0.0013086814433336258, -0.0010043568909168243, -0.0007000323385000229, -0.00039570778608322144, -9.138323366641998e-05, 0.00021294131875038147, 0.0005172658711671829, 0.0008215904235839844, 0.0011259149760007858, 0.0014302395284175873, 0.0017345640808343887, 0.00203888863325119, 0.0023432131856679916, 0.002647537738084793, 0.0029518622905015945, 0.003256186842918396, 0.0035605113953351974, 0.003864835947751999, 0.0041691605001688, 0.004473485052585602, 0.004777809605002403, 0.005082134157419205, 0.005386458709836006, 0.005690783262252808, 0.005995107814669609, 0.0062994323670864105, 0.006603756919503212, 0.006908081471920013, 0.007212406024336815, 0.007516730576753616, 0.007821055129170418, 0.00812537968158722, 0.00842970423400402, 0.008734028786420822, 0.009038353338837624, 0.009342677891254425, 0.009647002443671227, 0.009951326996088028, 0.01025565154850483, 0.01055997610092163]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 6.0, 12.0, 6.0, 11.0, 22.0, 28.0, 23.0, 31.0, 43.0, 39.0, 31.0, 49.0, 43.0, 52.0, 48.0, 64.0, 57.0, 56.0, 46.0, 39.0, 39.0, 37.0, 28.0, 32.0, 31.0, 23.0, 19.0, 15.0, 13.0, 10.0, 11.0, 11.0, 5.0, 3.0, 2.0, 1.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6640625, -10.280029296875, -9.89599609375, -9.511962890625, -9.1279296875, -8.743896484375, -8.35986328125, -7.975830078125, -7.591796875, -7.207763671875, -6.82373046875, -6.439697265625, -6.0556640625, -5.671630859375, -5.28759765625, -4.903564453125, -4.51953125, -4.135498046875, -3.75146484375, -3.367431640625, -2.9833984375, -2.599365234375, -2.21533203125, -1.831298828125, -1.447265625, -1.063232421875, -0.67919921875, -0.295166015625, 0.0888671875, 0.472900390625, 0.85693359375, 1.240966796875, 1.625, 2.009033203125, 2.39306640625, 2.777099609375, 3.1611328125, 3.545166015625, 3.92919921875, 4.313232421875, 4.697265625, 5.081298828125, 5.46533203125, 5.849365234375, 6.2333984375, 6.617431640625, 7.00146484375, 7.385498046875, 7.76953125, 8.153564453125, 8.53759765625, 8.921630859375, 9.3056640625, 9.689697265625, 10.07373046875, 10.457763671875, 10.841796875, 11.225830078125, 11.60986328125, 11.993896484375, 12.3779296875, 12.761962890625, 13.14599609375, 13.530029296875, 13.9140625]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 11.0, 7.0, 6.0, 15.0, 22.0, 26.0, 37.0, 74.0, 94.0, 133.0, 198.0, 232.0, 370.0, 570.0, 795.0, 1262.0, 1922.0, 2929.0, 4947.0, 8506.0, 16865.0, 46729.0, 496770.0, 386373.0, 42247.0, 16196.0, 8027.0, 4748.0, 2887.0, 1803.0, 1199.0, 810.0, 527.0, 382.0, 245.0, 172.0, 139.0, 93.0, 55.0, 46.0, 30.0, 20.0, 14.0, 9.0, 7.0, 6.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.1875, -21.447021484375, -20.70654296875, -19.966064453125, -19.2255859375, -18.485107421875, -17.74462890625, -17.004150390625, -16.263671875, -15.523193359375, -14.78271484375, -14.042236328125, -13.3017578125, -12.561279296875, -11.82080078125, -11.080322265625, -10.33984375, -9.599365234375, -8.85888671875, -8.118408203125, -7.3779296875, -6.637451171875, -5.89697265625, -5.156494140625, -4.416015625, -3.675537109375, -2.93505859375, -2.194580078125, -1.4541015625, -0.713623046875, 0.02685546875, 0.767333984375, 1.5078125, 2.248291015625, 2.98876953125, 3.729248046875, 4.4697265625, 5.210205078125, 5.95068359375, 6.691162109375, 7.431640625, 8.172119140625, 8.91259765625, 9.653076171875, 10.3935546875, 11.134033203125, 11.87451171875, 12.614990234375, 13.35546875, 14.095947265625, 14.83642578125, 15.576904296875, 16.3173828125, 17.057861328125, 17.79833984375, 18.538818359375, 19.279296875, 20.019775390625, 20.76025390625, 21.500732421875, 22.2412109375, 22.981689453125, 23.72216796875, 24.462646484375, 25.203125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 6.0, 8.0, 9.0, 8.0, 14.0, 15.0, 25.0, 21.0, 32.0, 26.0, 38.0, 29.0, 43.0, 60.0, 57.0, 70.0, 121.0, 356.0, 1473.0, 146.0, 80.0, 64.0, 43.0, 53.0, 38.0, 44.0, 23.0, 25.0, 31.0, 21.0, 14.0, 12.0, 9.0, 10.0, 9.0, 3.0, 4.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-40.21875, -39.00341796875, -37.7880859375, -36.57275390625, -35.357421875, -34.14208984375, -32.9267578125, -31.71142578125, -30.49609375, -29.28076171875, -28.0654296875, -26.85009765625, -25.634765625, -24.41943359375, -23.2041015625, -21.98876953125, -20.7734375, -19.55810546875, -18.3427734375, -17.12744140625, -15.912109375, -14.69677734375, -13.4814453125, -12.26611328125, -11.05078125, -9.83544921875, -8.6201171875, -7.40478515625, -6.189453125, -4.97412109375, -3.7587890625, -2.54345703125, -1.328125, -0.11279296875, 1.1025390625, 2.31787109375, 3.533203125, 4.74853515625, 5.9638671875, 7.17919921875, 8.39453125, 9.60986328125, 10.8251953125, 12.04052734375, 13.255859375, 14.47119140625, 15.6865234375, 16.90185546875, 18.1171875, 19.33251953125, 20.5478515625, 21.76318359375, 22.978515625, 24.19384765625, 25.4091796875, 26.62451171875, 27.83984375, 29.05517578125, 30.2705078125, 31.48583984375, 32.701171875, 33.91650390625, 35.1318359375, 36.34716796875, 37.5625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 7.0, 4.0, 11.0, 9.0, 12.0, 16.0, 22.0, 21.0, 23.0, 37.0, 53.0, 56.0, 100.0, 138.0, 274.0, 538.0, 2851.0, 27269.0, 2963174.0, 142102.0, 6913.0, 1091.0, 385.0, 179.0, 96.0, 79.0, 58.0, 41.0, 39.0, 29.0, 21.0, 11.0, 12.0, 9.0, 4.0, 1.0, 5.0, 8.0, 3.0, 2.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.1875, -68.419921875, -65.65234375, -62.884765625, -60.1171875, -57.349609375, -54.58203125, -51.814453125, -49.046875, -46.279296875, -43.51171875, -40.744140625, -37.9765625, -35.208984375, -32.44140625, -29.673828125, -26.90625, -24.138671875, -21.37109375, -18.603515625, -15.8359375, -13.068359375, -10.30078125, -7.533203125, -4.765625, -1.998046875, 0.76953125, 3.537109375, 6.3046875, 9.072265625, 11.83984375, 14.607421875, 17.375, 20.142578125, 22.91015625, 25.677734375, 28.4453125, 31.212890625, 33.98046875, 36.748046875, 39.515625, 42.283203125, 45.05078125, 47.818359375, 50.5859375, 53.353515625, 56.12109375, 58.888671875, 61.65625, 64.423828125, 67.19140625, 69.958984375, 72.7265625, 75.494140625, 78.26171875, 81.029296875, 83.796875, 86.564453125, 89.33203125, 92.099609375, 94.8671875, 97.634765625, 100.40234375, 103.169921875, 105.9375]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [6.0, 406.0, 580.0, 19.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.41343307495117, -18.864364624023438, -1.3152961730957031, 16.23377227783203, 33.782840728759766, 51.331912994384766, 68.8809814453125, 86.43003845214844, 103.97911071777344, 121.52818298339844, 139.07723999023438, 156.62631225585938, 174.17538452148438, 191.72445678710938, 209.27352905273438, 226.8225860595703, 244.3716583251953, 261.92071533203125, 279.46978759765625, 297.01885986328125, 314.56793212890625, 332.11700439453125, 349.66607666015625, 367.21514892578125, 384.76422119140625, 402.31329345703125, 419.86236572265625, 437.41143798828125, 454.96051025390625, 472.50958251953125, 490.0586242675781, 507.6076965332031, 525.15673828125, 542.705810546875, 560.2548828125, 577.803955078125, 595.35302734375, 612.902099609375, 630.451171875, 648.000244140625, 665.54931640625, 683.098388671875, 700.6474609375, 718.196533203125, 735.74560546875, 753.294677734375, 770.84375, 788.392822265625, 805.9418334960938, 823.4909057617188, 841.0399780273438, 858.5890502929688, 876.1381225585938, 893.6871948242188, 911.2362670898438, 928.7852783203125, 946.3343505859375, 963.8834228515625, 981.4324951171875, 998.9815673828125, 1016.5306396484375, 1034.0797119140625, 1051.6287841796875, 1069.1778564453125, 1086.7269287109375]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 6.0, 2.0, 3.0, 3.0, 2.0, 5.0, 5.0, 3.0, 5.0, 8.0, 10.0, 9.0, 10.0, 17.0, 23.0, 21.0, 19.0, 30.0, 17.0, 41.0, 32.0, 29.0, 34.0, 44.0, 37.0, 41.0, 44.0, 34.0, 36.0, 38.0, 37.0, 32.0, 38.0, 38.0, 36.0, 30.0, 22.0, 26.0, 31.0, 15.0, 13.0, 19.0, 14.0, 15.0, 8.0, 11.0, 8.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.92601013183594, -78.16325378417969, -75.4004898071289, -72.63773345947266, -69.8749771118164, -67.11221313476562, -64.34945678710938, -61.58669662475586, -58.823936462402344, -56.06117630004883, -53.29841995239258, -50.53565979003906, -47.77289962768555, -45.01013946533203, -42.24738311767578, -39.484622955322266, -36.721866607666016, -33.9591064453125, -31.196348190307617, -28.433589935302734, -25.67082977294922, -22.908071517944336, -20.145313262939453, -17.382553100585938, -14.619794845581055, -11.857035636901855, -9.094276428222656, -6.331518173217773, -3.568758964538574, -0.805999755859375, 1.9567584991455078, 4.719518661499023, 7.482276916503906, 10.245036125183105, 13.007795333862305, 15.770553588867188, 18.533313751220703, 21.296072006225586, 24.05883026123047, 26.821590423583984, 29.584348678588867, 32.34710693359375, 35.109867095947266, 37.87262725830078, 40.63538360595703, 43.39814376831055, 46.16090393066406, 48.92366027832031, 51.68642044067383, 54.449180603027344, 57.211936950683594, 59.97469711303711, 62.737457275390625, 65.50021362304688, 68.26296997070312, 71.0257339477539, 73.78849029541016, 76.5512466430664, 79.31401062011719, 82.07676696777344, 84.83952331542969, 87.60228729248047, 90.36504364013672, 93.1278076171875, 95.89056396484375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 5.0, 2.0, 4.0, 5.0, 7.0, 7.0, 5.0, 13.0, 13.0, 20.0, 28.0, 24.0, 27.0, 24.0, 32.0, 47.0, 47.0, 42.0, 44.0, 49.0, 49.0, 42.0, 45.0, 50.0, 50.0, 41.0, 42.0, 36.0, 30.0, 25.0, 25.0, 18.0, 26.0, 15.0, 16.0, 11.0, 13.0, 8.0, 6.0, 3.0, 2.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1875, -9.81494140625, -9.4423828125, -9.06982421875, -8.697265625, -8.32470703125, -7.9521484375, -7.57958984375, -7.20703125, -6.83447265625, -6.4619140625, -6.08935546875, -5.716796875, -5.34423828125, -4.9716796875, -4.59912109375, -4.2265625, -3.85400390625, -3.4814453125, -3.10888671875, -2.736328125, -2.36376953125, -1.9912109375, -1.61865234375, -1.24609375, -0.87353515625, -0.5009765625, -0.12841796875, 0.244140625, 0.61669921875, 0.9892578125, 1.36181640625, 1.734375, 2.10693359375, 2.4794921875, 2.85205078125, 3.224609375, 3.59716796875, 3.9697265625, 4.34228515625, 4.71484375, 5.08740234375, 5.4599609375, 5.83251953125, 6.205078125, 6.57763671875, 6.9501953125, 7.32275390625, 7.6953125, 8.06787109375, 8.4404296875, 8.81298828125, 9.185546875, 9.55810546875, 9.9306640625, 10.30322265625, 10.67578125, 11.04833984375, 11.4208984375, 11.79345703125, 12.166015625, 12.53857421875, 12.9111328125, 13.28369140625, 13.65625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 4.0, 5.0, 4.0, 9.0, 12.0, 17.0, 19.0, 15.0, 38.0, 43.0, 49.0, 87.0, 130.0, 184.0, 332.0, 742.0, 1738.0, 4852.0, 18097.0, 293602.0, 3677399.0, 174743.0, 14862.0, 4123.0, 1531.0, 693.0, 352.0, 177.0, 121.0, 70.0, 50.0, 46.0, 42.0, 20.0, 17.0, 12.0, 14.0, 11.0, 2.0, 10.0, 2.0, 3.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.5, -37.0439453125, -35.587890625, -34.1318359375, -32.67578125, -31.2197265625, -29.763671875, -28.3076171875, -26.8515625, -25.3955078125, -23.939453125, -22.4833984375, -21.02734375, -19.5712890625, -18.115234375, -16.6591796875, -15.203125, -13.7470703125, -12.291015625, -10.8349609375, -9.37890625, -7.9228515625, -6.466796875, -5.0107421875, -3.5546875, -2.0986328125, -0.642578125, 0.8134765625, 2.26953125, 3.7255859375, 5.181640625, 6.6376953125, 8.09375, 9.5498046875, 11.005859375, 12.4619140625, 13.91796875, 15.3740234375, 16.830078125, 18.2861328125, 19.7421875, 21.1982421875, 22.654296875, 24.1103515625, 25.56640625, 27.0224609375, 28.478515625, 29.9345703125, 31.390625, 32.8466796875, 34.302734375, 35.7587890625, 37.21484375, 38.6708984375, 40.126953125, 41.5830078125, 43.0390625, 44.4951171875, 45.951171875, 47.4072265625, 48.86328125, 50.3193359375, 51.775390625, 53.2314453125, 54.6875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 4.0, 12.0, 18.0, 15.0, 27.0, 36.0, 59.0, 71.0, 116.0, 226.0, 470.0, 798.0, 862.0, 573.0, 327.0, 150.0, 95.0, 48.0, 44.0, 31.0, 16.0, 17.0, 18.0, 9.0, 5.0, 4.0, 7.0, 8.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.21875, -36.162109375, -35.10546875, -34.048828125, -32.9921875, -31.935546875, -30.87890625, -29.822265625, -28.765625, -27.708984375, -26.65234375, -25.595703125, -24.5390625, -23.482421875, -22.42578125, -21.369140625, -20.3125, -19.255859375, -18.19921875, -17.142578125, -16.0859375, -15.029296875, -13.97265625, -12.916015625, -11.859375, -10.802734375, -9.74609375, -8.689453125, -7.6328125, -6.576171875, -5.51953125, -4.462890625, -3.40625, -2.349609375, -1.29296875, -0.236328125, 0.8203125, 1.876953125, 2.93359375, 3.990234375, 5.046875, 6.103515625, 7.16015625, 8.216796875, 9.2734375, 10.330078125, 11.38671875, 12.443359375, 13.5, 14.556640625, 15.61328125, 16.669921875, 17.7265625, 18.783203125, 19.83984375, 20.896484375, 21.953125, 23.009765625, 24.06640625, 25.123046875, 26.1796875, 27.236328125, 28.29296875, 29.349609375, 30.40625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 7.0, 4.0, 5.0, 16.0, 17.0, 21.0, 28.0, 50.0, 81.0, 174.0, 359.0, 1298.0, 6394.0, 59653.0, 3768926.0, 337473.0, 15974.0, 2625.0, 652.0, 224.0, 109.0, 69.0, 37.0, 20.0, 27.0, 11.0, 9.0, 6.0, 1.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.0625, -75.4365234375, -72.810546875, -70.1845703125, -67.55859375, -64.9326171875, -62.306640625, -59.6806640625, -57.0546875, -54.4287109375, -51.802734375, -49.1767578125, -46.55078125, -43.9248046875, -41.298828125, -38.6728515625, -36.046875, -33.4208984375, -30.794921875, -28.1689453125, -25.54296875, -22.9169921875, -20.291015625, -17.6650390625, -15.0390625, -12.4130859375, -9.787109375, -7.1611328125, -4.53515625, -1.9091796875, 0.716796875, 3.3427734375, 5.96875, 8.5947265625, 11.220703125, 13.8466796875, 16.47265625, 19.0986328125, 21.724609375, 24.3505859375, 26.9765625, 29.6025390625, 32.228515625, 34.8544921875, 37.48046875, 40.1064453125, 42.732421875, 45.3583984375, 47.984375, 50.6103515625, 53.236328125, 55.8623046875, 58.48828125, 61.1142578125, 63.740234375, 66.3662109375, 68.9921875, 71.6181640625, 74.244140625, 76.8701171875, 79.49609375, 82.1220703125, 84.748046875, 87.3740234375, 90.0]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 10.0, 46.0, 118.0, 283.0, 339.0, 150.0, 40.0, 15.0, 9.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-380.7870178222656, -370.51727294921875, -360.2475280761719, -349.977783203125, -339.7080383300781, -329.43829345703125, -319.1685485839844, -308.8988037109375, -298.6290588378906, -288.35931396484375, -278.0895690917969, -267.81982421875, -257.5500793457031, -247.28033447265625, -237.01058959960938, -226.7408447265625, -216.47108459472656, -206.2013397216797, -195.9315948486328, -185.66184997558594, -175.39210510253906, -165.1223602294922, -154.85260009765625, -144.58285522460938, -134.3131103515625, -124.04336547851562, -113.77362060546875, -103.50387573242188, -93.234130859375, -82.96438598632812, -72.69463348388672, -62.424888610839844, -52.1551513671875, -41.885406494140625, -31.615659713745117, -21.34591293334961, -11.076168060302734, -0.8064231872558594, 9.463325500488281, 19.733070373535156, 30.00281524658203, 40.272560119628906, 50.54230499267578, 60.81205368041992, 71.08180236816406, 81.35154724121094, 91.62129211425781, 101.89103698730469, 112.16078186035156, 122.43052673339844, 132.7002716064453, 142.9700164794922, 153.23976135253906, 163.50950622558594, 173.77926635742188, 184.04901123046875, 194.31875610351562, 204.5885009765625, 214.85824584960938, 225.12799072265625, 235.39773559570312, 245.66748046875, 255.93722534179688, 266.20697021484375, 276.4767150878906]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 0.0, 3.0, 1.0, 5.0, 4.0, 3.0, 7.0, 6.0, 5.0, 13.0, 16.0, 13.0, 15.0, 21.0, 19.0, 23.0, 21.0, 24.0, 21.0, 31.0, 23.0, 28.0, 30.0, 31.0, 36.0, 34.0, 34.0, 35.0, 23.0, 32.0, 39.0, 32.0, 40.0, 30.0, 25.0, 38.0, 27.0, 20.0, 16.0, 24.0, 19.0, 30.0, 25.0, 17.0, 15.0, 6.0, 16.0, 8.0, 4.0, 8.0, 3.0, 7.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-69.30131530761719, -67.17257690429688, -65.04383850097656, -62.915096282958984, -60.786354064941406, -58.657615661621094, -56.52887725830078, -54.40013885498047, -52.27139663696289, -50.14265823364258, -48.013916015625, -45.88517761230469, -43.756439208984375, -41.6276969909668, -39.498958587646484, -37.370216369628906, -35.241477966308594, -33.11273956298828, -30.983997344970703, -28.85525894165039, -26.726518630981445, -24.5977783203125, -22.469039916992188, -20.340299606323242, -18.211559295654297, -16.08281898498535, -13.954079627990723, -11.825340270996094, -9.696599960327148, -7.567859649658203, -5.439120292663574, -3.3103809356689453, -1.1816329956054688, 0.9471068382263184, 3.0758466720581055, 5.204586505889893, 7.33332633972168, 9.462066650390625, 11.590806007385254, 13.719545364379883, 15.848285675048828, 17.977025985717773, 20.10576629638672, 22.23450469970703, 24.363245010375977, 26.491985321044922, 28.620723724365234, 30.74946403503418, 32.878204345703125, 35.00694274902344, 37.135684967041016, 39.26442337036133, 41.393165588378906, 43.52190399169922, 45.65064239501953, 47.779380798339844, 49.90812301635742, 52.036861419677734, 54.16560363769531, 56.294342041015625, 58.42308044433594, 60.551822662353516, 62.68056106567383, 64.8093032836914, 66.93804168701172]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 13.0, 9.0, 11.0, 19.0, 21.0, 24.0, 21.0, 26.0, 38.0, 33.0, 34.0, 49.0, 59.0, 50.0, 45.0, 55.0, 55.0, 57.0, 52.0, 50.0, 30.0, 43.0, 32.0, 33.0, 30.0, 23.0, 15.0, 17.0, 14.0, 11.0, 7.0, 4.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.5113525390625, -11.108642578125, -10.7059326171875, -10.30322265625, -9.9005126953125, -9.497802734375, -9.0950927734375, -8.6923828125, -8.2896728515625, -7.886962890625, -7.4842529296875, -7.08154296875, -6.6788330078125, -6.276123046875, -5.8734130859375, -5.470703125, -5.0679931640625, -4.665283203125, -4.2625732421875, -3.85986328125, -3.4571533203125, -3.054443359375, -2.6517333984375, -2.2490234375, -1.8463134765625, -1.443603515625, -1.0408935546875, -0.63818359375, -0.2354736328125, 0.167236328125, 0.5699462890625, 0.97265625, 1.3753662109375, 1.778076171875, 2.1807861328125, 2.58349609375, 2.9862060546875, 3.388916015625, 3.7916259765625, 4.1943359375, 4.5970458984375, 4.999755859375, 5.4024658203125, 5.80517578125, 6.2078857421875, 6.610595703125, 7.0133056640625, 7.416015625, 7.8187255859375, 8.221435546875, 8.6241455078125, 9.02685546875, 9.4295654296875, 9.832275390625, 10.2349853515625, 10.6376953125, 11.0404052734375, 11.443115234375, 11.8458251953125, 12.24853515625, 12.6512451171875, 13.053955078125, 13.4566650390625, 13.859375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 5.0, 2.0, 9.0, 13.0, 9.0, 21.0, 35.0, 44.0, 61.0, 88.0, 112.0, 196.0, 255.0, 356.0, 510.0, 765.0, 1030.0, 1638.0, 2381.0, 3581.0, 5602.0, 8552.0, 13717.0, 22672.0, 38420.0, 64914.0, 110402.0, 176342.0, 210461.0, 152995.0, 93301.0, 54713.0, 32231.0, 19375.0, 11830.0, 7472.0, 4776.0, 3055.0, 2063.0, 1460.0, 930.0, 678.0, 459.0, 308.0, 235.0, 139.0, 104.0, 72.0, 53.0, 42.0, 20.0, 28.0, 12.0, 7.0, 8.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.673828125, -1.61865234375, -1.5634765625, -1.50830078125, -1.453125, -1.39794921875, -1.3427734375, -1.28759765625, -1.232421875, -1.17724609375, -1.1220703125, -1.06689453125, -1.01171875, -0.95654296875, -0.9013671875, -0.84619140625, -0.791015625, -0.73583984375, -0.6806640625, -0.62548828125, -0.5703125, -0.51513671875, -0.4599609375, -0.40478515625, -0.349609375, -0.29443359375, -0.2392578125, -0.18408203125, -0.12890625, -0.07373046875, -0.0185546875, 0.03662109375, 0.091796875, 0.14697265625, 0.2021484375, 0.25732421875, 0.3125, 0.36767578125, 0.4228515625, 0.47802734375, 0.533203125, 0.58837890625, 0.6435546875, 0.69873046875, 0.75390625, 0.80908203125, 0.8642578125, 0.91943359375, 0.974609375, 1.02978515625, 1.0849609375, 1.14013671875, 1.1953125, 1.25048828125, 1.3056640625, 1.36083984375, 1.416015625, 1.47119140625, 1.5263671875, 1.58154296875, 1.63671875, 1.69189453125, 1.7470703125, 1.80224609375, 1.857421875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 6.0, 3.0, 3.0, 3.0, 9.0, 15.0, 13.0, 7.0, 16.0, 27.0, 24.0, 40.0, 37.0, 32.0, 32.0, 31.0, 42.0, 46.0, 42.0, 52.0, 1073.0, 40.0, 44.0, 39.0, 39.0, 41.0, 27.0, 32.0, 33.0, 35.0, 24.0, 27.0, 20.0, 20.0, 12.0, 10.0, 9.0, 6.0, 10.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.73828125, -6.49591064453125, -6.2535400390625, -6.01116943359375, -5.768798828125, -5.52642822265625, -5.2840576171875, -5.04168701171875, -4.79931640625, -4.55694580078125, -4.3145751953125, -4.07220458984375, -3.829833984375, -3.58746337890625, -3.3450927734375, -3.10272216796875, -2.8603515625, -2.61798095703125, -2.3756103515625, -2.13323974609375, -1.890869140625, -1.64849853515625, -1.4061279296875, -1.16375732421875, -0.92138671875, -0.67901611328125, -0.4366455078125, -0.19427490234375, 0.048095703125, 0.29046630859375, 0.5328369140625, 0.77520751953125, 1.017578125, 1.25994873046875, 1.5023193359375, 1.74468994140625, 1.987060546875, 2.22943115234375, 2.4718017578125, 2.71417236328125, 2.95654296875, 3.19891357421875, 3.4412841796875, 3.68365478515625, 3.926025390625, 4.16839599609375, 4.4107666015625, 4.65313720703125, 4.8955078125, 5.13787841796875, 5.3802490234375, 5.62261962890625, 5.864990234375, 6.10736083984375, 6.3497314453125, 6.59210205078125, 6.83447265625, 7.07684326171875, 7.3192138671875, 7.56158447265625, 7.803955078125, 8.04632568359375, 8.2886962890625, 8.53106689453125, 8.7734375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 6.0, 1.0, 10.0, 23.0, 32.0, 26.0, 61.0, 79.0, 107.0, 194.0, 290.0, 425.0, 637.0, 999.0, 1628.0, 2359.0, 3900.0, 5810.0, 9393.0, 14543.0, 23474.0, 37255.0, 60788.0, 99163.0, 157050.0, 1249343.0, 160806.0, 102220.0, 62955.0, 38138.0, 23789.0, 14874.0, 9695.0, 6097.0, 3931.0, 2508.0, 1634.0, 991.0, 642.0, 423.0, 276.0, 192.0, 124.0, 85.0, 63.0, 29.0, 23.0, 18.0, 11.0, 6.0, 6.0, 5.0, 1.0, 1.0, 0.0, 3.0], "bins": [-0.96484375, -0.936065673828125, -0.90728759765625, -0.878509521484375, -0.8497314453125, -0.820953369140625, -0.79217529296875, -0.763397216796875, -0.734619140625, -0.705841064453125, -0.67706298828125, -0.648284912109375, -0.6195068359375, -0.590728759765625, -0.56195068359375, -0.533172607421875, -0.50439453125, -0.475616455078125, -0.44683837890625, -0.418060302734375, -0.3892822265625, -0.360504150390625, -0.33172607421875, -0.302947998046875, -0.274169921875, -0.245391845703125, -0.21661376953125, -0.187835693359375, -0.1590576171875, -0.130279541015625, -0.10150146484375, -0.072723388671875, -0.0439453125, -0.015167236328125, 0.01361083984375, 0.042388916015625, 0.0711669921875, 0.099945068359375, 0.12872314453125, 0.157501220703125, 0.186279296875, 0.215057373046875, 0.24383544921875, 0.272613525390625, 0.3013916015625, 0.330169677734375, 0.35894775390625, 0.387725830078125, 0.41650390625, 0.445281982421875, 0.47406005859375, 0.502838134765625, 0.5316162109375, 0.560394287109375, 0.58917236328125, 0.617950439453125, 0.646728515625, 0.675506591796875, 0.70428466796875, 0.733062744140625, 0.7618408203125, 0.790618896484375, 0.81939697265625, 0.848175048828125, 0.876953125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 12.0, 7.0, 12.0, 13.0, 7.0, 8.0, 20.0, 19.0, 25.0, 35.0, 44.0, 65.0, 92.0, 116.0, 126.0, 93.0, 85.0, 43.0, 38.0, 31.0, 28.0, 16.0, 9.0, 9.0, 12.0, 7.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.016632080078125, -0.01611614227294922, -0.015600204467773438, -0.015084266662597656, -0.014568328857421875, -0.014052391052246094, -0.013536453247070312, -0.013020515441894531, -0.01250457763671875, -0.011988639831542969, -0.011472702026367188, -0.010956764221191406, -0.010440826416015625, -0.009924888610839844, -0.009408950805664062, -0.008893013000488281, -0.0083770751953125, -0.007861137390136719, -0.0073451995849609375, -0.006829261779785156, -0.006313323974609375, -0.005797386169433594, -0.0052814483642578125, -0.004765510559082031, -0.00424957275390625, -0.0037336349487304688, -0.0032176971435546875, -0.0027017593383789062, -0.002185821533203125, -0.0016698837280273438, -0.0011539459228515625, -0.0006380081176757812, -0.0001220703125, 0.00039386749267578125, 0.0009098052978515625, 0.0014257431030273438, 0.001941680908203125, 0.0024576187133789062, 0.0029735565185546875, 0.0034894943237304688, 0.00400543212890625, 0.004521369934082031, 0.0050373077392578125, 0.005553245544433594, 0.006069183349609375, 0.006585121154785156, 0.0071010589599609375, 0.007616996765136719, 0.0081329345703125, 0.008648872375488281, 0.009164810180664062, 0.009680747985839844, 0.010196685791015625, 0.010712623596191406, 0.011228561401367188, 0.011744499206542969, 0.01226043701171875, 0.012776374816894531, 0.013292312622070312, 0.013808250427246094, 0.014324188232421875, 0.014840126037597656, 0.015356063842773438, 0.01587200164794922, 0.016387939453125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 13.0, 7.0, 10.0, 13.0, 19.0, 20.0, 47.0, 64.0, 64.0, 127.0, 175.0, 302.0, 686.0, 6116.0, 617113.0, 417091.0, 5151.0, 705.0, 275.0, 182.0, 96.0, 62.0, 41.0, 50.0, 23.0, 17.0, 20.0, 19.0, 12.0, 10.0, 5.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.266845703125, -0.2584991455078125, -0.250152587890625, -0.2418060302734375, -0.23345947265625, -0.2251129150390625, -0.216766357421875, -0.2084197998046875, -0.2000732421875, -0.1917266845703125, -0.183380126953125, -0.1750335693359375, -0.16668701171875, -0.1583404541015625, -0.149993896484375, -0.1416473388671875, -0.13330078125, -0.1249542236328125, -0.116607666015625, -0.1082611083984375, -0.09991455078125, -0.0915679931640625, -0.083221435546875, -0.0748748779296875, -0.0665283203125, -0.0581817626953125, -0.049835205078125, -0.0414886474609375, -0.03314208984375, -0.0247955322265625, -0.016448974609375, -0.0081024169921875, 0.000244140625, 0.0085906982421875, 0.016937255859375, 0.0252838134765625, 0.03363037109375, 0.0419769287109375, 0.050323486328125, 0.0586700439453125, 0.0670166015625, 0.0753631591796875, 0.083709716796875, 0.0920562744140625, 0.10040283203125, 0.1087493896484375, 0.117095947265625, 0.1254425048828125, 0.1337890625, 0.1421356201171875, 0.150482177734375, 0.1588287353515625, 0.16717529296875, 0.1755218505859375, 0.183868408203125, 0.1922149658203125, 0.2005615234375, 0.2089080810546875, 0.217254638671875, 0.2256011962890625, 0.23394775390625, 0.2422943115234375, 0.250640869140625, 0.2589874267578125, 0.267333984375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 10.0, 25.0, 26.0, 30.0, 55.0, 85.0, 144.0, 199.0, 134.0, 105.0, 57.0, 43.0, 19.0, 25.0, 11.0, 14.0, 5.0, 4.0, 1.0, 4.0, 4.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01906820386648178, -0.01802540011703968, -0.01698259450495243, -0.01593979075551033, -0.01489698700606823, -0.013854182325303555, -0.01281137764453888, -0.011768573895096779, -0.010725769214332104, -0.009682964533567429, -0.008640160784125328, -0.007597356103360653, -0.006554551888257265, -0.005511747673153877, -0.004468942992389202, -0.0034261387772858143, -0.0023833345621824265, -0.0013405302306637168, -0.00029772589914500713, 0.0007450785487890244, 0.0017878827638924122, 0.0028306869789958, 0.003873491659760475, 0.004916295874863863, 0.005959100089967251, 0.007001904305070639, 0.008044708520174026, 0.009087513200938702, 0.010130317881703377, 0.011173121631145477, 0.012215926311910152, 0.013258730992674828, 0.014301534742116928, 0.015344339422881603, 0.01638714410364628, 0.01742994785308838, 0.01847275160253048, 0.01951555535197258, 0.02055836096405983, 0.02160116471350193, 0.02264396846294403, 0.02368677221238613, 0.02472957782447338, 0.02577238157391548, 0.026815185323357582, 0.027857989072799683, 0.028900794684886932, 0.029943598434329033, 0.030986404046416283, 0.03202920779585838, 0.03307201340794563, 0.034114815294742584, 0.035157620906829834, 0.036200426518917084, 0.037243232131004333, 0.038286034017801285, 0.039328839629888535, 0.040371645241975784, 0.041414447128772736, 0.042457252740859985, 0.043500058352947235, 0.044542860239744186, 0.045585665851831436, 0.046628471463918686, 0.04767127335071564]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 4.0, 5.0, 6.0, 5.0, 5.0, 4.0, 16.0, 23.0, 17.0, 16.0, 28.0, 34.0, 28.0, 34.0, 38.0, 38.0, 39.0, 43.0, 46.0, 43.0, 49.0, 45.0, 50.0, 50.0, 28.0, 32.0, 34.0, 24.0, 26.0, 19.0, 24.0, 29.0, 21.0, 17.0, 15.0, 12.0, 13.0, 9.0, 11.0, 4.0, 6.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.008784055709838867, -0.008507591672241688, -0.008231127634644508, -0.007954663597047329, -0.0076781995594501495, -0.00740173552185297, -0.007125271484255791, -0.006848807446658611, -0.006572343409061432, -0.0062958793714642525, -0.006019415333867073, -0.005742951296269894, -0.005466487258672714, -0.005190023221075535, -0.004913559183478355, -0.004637095145881176, -0.004360631108283997, -0.004084167070686817, -0.0038077030330896378, -0.0035312389954924583, -0.003254774957895279, -0.0029783109202980995, -0.00270184688270092, -0.0024253828451037407, -0.0021489188075065613, -0.0018724547699093819, -0.0015959907323122025, -0.001319526694715023, -0.0010430626571178436, -0.0007665986195206642, -0.0004901345819234848, -0.0002136705443263054, 6.279349327087402e-05, 0.00033925753086805344, 0.0006157215684652328, 0.0008921856060624123, 0.0011686496436595917, 0.001445113681256771, 0.0017215777188539505, 0.00199804175645113, 0.0022745057940483093, 0.0025509698316454887, 0.002827433869242668, 0.0031038979068398476, 0.003380361944437027, 0.0036568259820342064, 0.003933290019631386, 0.004209754057228565, 0.004486218094825745, 0.004762682132422924, 0.0050391461700201035, 0.005315610207617283, 0.005592074245214462, 0.005868538282811642, 0.006145002320408821, 0.0064214663580060005, 0.00669793039560318, 0.006974394433200359, 0.007250858470797539, 0.007527322508394718, 0.007803786545991898, 0.008080250583589077, 0.008356714621186256, 0.008633178658783436, 0.008909642696380615]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 13.0, 9.0, 11.0, 19.0, 21.0, 24.0, 21.0, 26.0, 38.0, 33.0, 34.0, 49.0, 59.0, 50.0, 45.0, 55.0, 55.0, 57.0, 52.0, 50.0, 30.0, 43.0, 32.0, 33.0, 30.0, 23.0, 15.0, 17.0, 14.0, 11.0, 7.0, 4.0, 4.0, 1.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.9140625, -11.5113525390625, -11.108642578125, -10.7059326171875, -10.30322265625, -9.9005126953125, -9.497802734375, -9.0950927734375, -8.6923828125, -8.2896728515625, -7.886962890625, -7.4842529296875, -7.08154296875, -6.6788330078125, -6.276123046875, -5.8734130859375, -5.470703125, -5.0679931640625, -4.665283203125, -4.2625732421875, -3.85986328125, -3.4571533203125, -3.054443359375, -2.6517333984375, -2.2490234375, -1.8463134765625, -1.443603515625, -1.0408935546875, -0.63818359375, -0.2354736328125, 0.167236328125, 0.5699462890625, 0.97265625, 1.3753662109375, 1.778076171875, 2.1807861328125, 2.58349609375, 2.9862060546875, 3.388916015625, 3.7916259765625, 4.1943359375, 4.5970458984375, 4.999755859375, 5.4024658203125, 5.80517578125, 6.2078857421875, 6.610595703125, 7.0133056640625, 7.416015625, 7.8187255859375, 8.221435546875, 8.6241455078125, 9.02685546875, 9.4295654296875, 9.832275390625, 10.2349853515625, 10.6376953125, 11.0404052734375, 11.443115234375, 11.8458251953125, 12.24853515625, 12.6512451171875, 13.053955078125, 13.4566650390625, 13.859375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 4.0, 4.0, 16.0, 8.0, 18.0, 29.0, 22.0, 36.0, 50.0, 72.0, 88.0, 160.0, 196.0, 261.0, 359.0, 527.0, 790.0, 1167.0, 1687.0, 2825.0, 4501.0, 7869.0, 15936.0, 42929.0, 267759.0, 593307.0, 63410.0, 20381.0, 9606.0, 5274.0, 3125.0, 1935.0, 1282.0, 867.0, 583.0, 414.0, 288.0, 194.0, 156.0, 106.0, 78.0, 70.0, 47.0, 37.0, 35.0, 17.0, 8.0, 6.0, 8.0, 5.0, 6.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-18.515625, -17.921142578125, -17.32666015625, -16.732177734375, -16.1376953125, -15.543212890625, -14.94873046875, -14.354248046875, -13.759765625, -13.165283203125, -12.57080078125, -11.976318359375, -11.3818359375, -10.787353515625, -10.19287109375, -9.598388671875, -9.00390625, -8.409423828125, -7.81494140625, -7.220458984375, -6.6259765625, -6.031494140625, -5.43701171875, -4.842529296875, -4.248046875, -3.653564453125, -3.05908203125, -2.464599609375, -1.8701171875, -1.275634765625, -0.68115234375, -0.086669921875, 0.5078125, 1.102294921875, 1.69677734375, 2.291259765625, 2.8857421875, 3.480224609375, 4.07470703125, 4.669189453125, 5.263671875, 5.858154296875, 6.45263671875, 7.047119140625, 7.6416015625, 8.236083984375, 8.83056640625, 9.425048828125, 10.01953125, 10.614013671875, 11.20849609375, 11.802978515625, 12.3974609375, 12.991943359375, 13.58642578125, 14.180908203125, 14.775390625, 15.369873046875, 15.96435546875, 16.558837890625, 17.1533203125, 17.747802734375, 18.34228515625, 18.936767578125, 19.53125]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 1.0, 1.0, 5.0, 0.0, 2.0, 7.0, 2.0, 7.0, 18.0, 9.0, 22.0, 18.0, 18.0, 35.0, 26.0, 31.0, 36.0, 49.0, 49.0, 50.0, 60.0, 113.0, 246.0, 1580.0, 149.0, 86.0, 59.0, 48.0, 43.0, 39.0, 33.0, 27.0, 34.0, 26.0, 26.0, 23.0, 16.0, 14.0, 9.0, 1.0, 10.0, 13.0, 7.0, 2.0, 3.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.84375, -30.63330078125, -29.4228515625, -28.21240234375, -27.001953125, -25.79150390625, -24.5810546875, -23.37060546875, -22.16015625, -20.94970703125, -19.7392578125, -18.52880859375, -17.318359375, -16.10791015625, -14.8974609375, -13.68701171875, -12.4765625, -11.26611328125, -10.0556640625, -8.84521484375, -7.634765625, -6.42431640625, -5.2138671875, -4.00341796875, -2.79296875, -1.58251953125, -0.3720703125, 0.83837890625, 2.048828125, 3.25927734375, 4.4697265625, 5.68017578125, 6.890625, 8.10107421875, 9.3115234375, 10.52197265625, 11.732421875, 12.94287109375, 14.1533203125, 15.36376953125, 16.57421875, 17.78466796875, 18.9951171875, 20.20556640625, 21.416015625, 22.62646484375, 23.8369140625, 25.04736328125, 26.2578125, 27.46826171875, 28.6787109375, 29.88916015625, 31.099609375, 32.31005859375, 33.5205078125, 34.73095703125, 35.94140625, 37.15185546875, 38.3623046875, 39.57275390625, 40.783203125, 41.99365234375, 43.2041015625, 44.41455078125, 45.625]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 5.0, 0.0, 4.0, 5.0, 5.0, 6.0, 12.0, 7.0, 14.0, 22.0, 23.0, 35.0, 48.0, 71.0, 92.0, 145.0, 232.0, 475.0, 2262.0, 41448.0, 3064997.0, 32679.0, 2002.0, 462.0, 222.0, 130.0, 96.0, 56.0, 43.0, 28.0, 14.0, 22.0, 16.0, 8.0, 5.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.9375, -91.4814453125, -88.025390625, -84.5693359375, -81.11328125, -77.6572265625, -74.201171875, -70.7451171875, -67.2890625, -63.8330078125, -60.376953125, -56.9208984375, -53.46484375, -50.0087890625, -46.552734375, -43.0966796875, -39.640625, -36.1845703125, -32.728515625, -29.2724609375, -25.81640625, -22.3603515625, -18.904296875, -15.4482421875, -11.9921875, -8.5361328125, -5.080078125, -1.6240234375, 1.83203125, 5.2880859375, 8.744140625, 12.2001953125, 15.65625, 19.1123046875, 22.568359375, 26.0244140625, 29.48046875, 32.9365234375, 36.392578125, 39.8486328125, 43.3046875, 46.7607421875, 50.216796875, 53.6728515625, 57.12890625, 60.5849609375, 64.041015625, 67.4970703125, 70.953125, 74.4091796875, 77.865234375, 81.3212890625, 84.77734375, 88.2333984375, 91.689453125, 95.1455078125, 98.6015625, 102.0576171875, 105.513671875, 108.9697265625, 112.42578125, 115.8818359375, 119.337890625, 122.7939453125, 126.25]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 50.0, 596.0, 336.0, 30.0, 5.0], "bins": [-778.5198364257812, -765.7190551757812, -752.9182739257812, -740.1174926757812, -727.3167114257812, -714.5159912109375, -701.7152099609375, -688.9144287109375, -676.1136474609375, -663.3128662109375, -650.5120849609375, -637.7113037109375, -624.9105224609375, -612.1097412109375, -599.3089599609375, -586.5082397460938, -573.7073974609375, -560.9066162109375, -548.1058349609375, -535.3050537109375, -522.5042724609375, -509.7035217285156, -496.9027404785156, -484.1019592285156, -471.30120849609375, -458.50042724609375, -445.69964599609375, -432.89886474609375, -420.0981140136719, -407.2973327636719, -394.4965515136719, -381.6957702636719, -368.89501953125, -356.09423828125, -343.29345703125, -330.49267578125, -317.6919250488281, -304.8911437988281, -292.0903625488281, -279.2895812988281, -266.4888000488281, -253.68801879882812, -240.8872528076172, -228.0864715576172, -215.28570556640625, -202.48492431640625, -189.68414306640625, -176.88336181640625, -164.0825958251953, -151.2818145751953, -138.48104858398438, -125.68026733398438, -112.8794937133789, -100.07872009277344, -87.27793884277344, -74.47716522216797, -61.676395416259766, -48.87561798095703, -36.07484436035156, -23.274066925048828, -10.47329330444336, 2.3274803161621094, 15.12826156616211, 27.929035186767578, 40.72980880737305]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 1.0, 5.0, 5.0, 4.0, 6.0, 10.0, 8.0, 12.0, 8.0, 11.0, 12.0, 27.0, 30.0, 26.0, 32.0, 24.0, 26.0, 39.0, 36.0, 34.0, 37.0, 32.0, 35.0, 32.0, 45.0, 46.0, 42.0, 40.0, 45.0, 32.0, 26.0, 29.0, 36.0, 29.0, 23.0, 18.0, 20.0, 21.0, 14.0, 7.0, 10.0, 11.0, 4.0, 7.0, 4.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0], "bins": [-114.74717712402344, -111.5773696899414, -108.4075698852539, -105.23776245117188, -102.06796264648438, -98.89815521240234, -95.72834777832031, -92.55854797363281, -89.38874053955078, -86.21893310546875, -83.04913330078125, -79.87932586669922, -76.70951843261719, -73.53971862792969, -70.36991119384766, -67.20010375976562, -64.03030395507812, -60.86050033569336, -57.690696716308594, -54.52088928222656, -51.3510856628418, -48.18128204345703, -45.011474609375, -41.841670989990234, -38.67186737060547, -35.5020637512207, -32.33226013183594, -29.162452697753906, -25.99264907836914, -22.822845458984375, -19.653039932250977, -16.483234405517578, -13.313438415527344, -10.143633842468262, -6.97382926940918, -3.8040246963500977, -0.6342201232910156, 2.5355844497680664, 5.705389022827148, 8.875194549560547, 12.044998168945312, 15.214802742004395, 18.384607315063477, 21.554412841796875, 24.72421646118164, 27.894020080566406, 31.063825607299805, 34.2336311340332, 37.40343475341797, 40.573238372802734, 43.7430419921875, 46.91284942626953, 50.0826530456543, 53.25245666503906, 56.422264099121094, 59.59206771850586, 62.761871337890625, 65.93167877197266, 69.10147857666016, 72.27128601074219, 75.44108581542969, 78.61089324951172, 81.78070068359375, 84.95050048828125, 88.12030792236328]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 11.0, 10.0, 17.0, 8.0, 28.0, 24.0, 40.0, 26.0, 32.0, 41.0, 47.0, 42.0, 45.0, 56.0, 57.0, 54.0, 49.0, 56.0, 56.0, 44.0, 38.0, 36.0, 32.0, 28.0, 23.0, 18.0, 14.0, 15.0, 13.0, 7.0, 10.0, 6.0, 1.0, 5.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6640625, -12.2269287109375, -11.789794921875, -11.3526611328125, -10.91552734375, -10.4783935546875, -10.041259765625, -9.6041259765625, -9.1669921875, -8.7298583984375, -8.292724609375, -7.8555908203125, -7.41845703125, -6.9813232421875, -6.544189453125, -6.1070556640625, -5.669921875, -5.2327880859375, -4.795654296875, -4.3585205078125, -3.92138671875, -3.4842529296875, -3.047119140625, -2.6099853515625, -2.1728515625, -1.7357177734375, -1.298583984375, -0.8614501953125, -0.42431640625, 0.0128173828125, 0.449951171875, 0.8870849609375, 1.32421875, 1.7613525390625, 2.198486328125, 2.6356201171875, 3.07275390625, 3.5098876953125, 3.947021484375, 4.3841552734375, 4.8212890625, 5.2584228515625, 5.695556640625, 6.1326904296875, 6.56982421875, 7.0069580078125, 7.444091796875, 7.8812255859375, 8.318359375, 8.7554931640625, 9.192626953125, 9.6297607421875, 10.06689453125, 10.5040283203125, 10.941162109375, 11.3782958984375, 11.8154296875, 12.2525634765625, 12.689697265625, 13.1268310546875, 13.56396484375, 14.0010986328125, 14.438232421875, 14.8753662109375, 15.3125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 6.0, 11.0, 10.0, 12.0, 14.0, 26.0, 27.0, 45.0, 84.0, 106.0, 138.0, 271.0, 457.0, 790.0, 1232.0, 2236.0, 4053.0, 7926.0, 19209.0, 66805.0, 492997.0, 2422479.0, 1002359.0, 125705.0, 26307.0, 9931.0, 4850.0, 2567.0, 1361.0, 857.0, 497.0, 285.0, 209.0, 139.0, 94.0, 53.0, 40.0, 32.0, 19.0, 16.0, 6.0, 2.0, 6.0, 12.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.1875, -19.507080078125, -18.82666015625, -18.146240234375, -17.4658203125, -16.785400390625, -16.10498046875, -15.424560546875, -14.744140625, -14.063720703125, -13.38330078125, -12.702880859375, -12.0224609375, -11.342041015625, -10.66162109375, -9.981201171875, -9.30078125, -8.620361328125, -7.93994140625, -7.259521484375, -6.5791015625, -5.898681640625, -5.21826171875, -4.537841796875, -3.857421875, -3.177001953125, -2.49658203125, -1.816162109375, -1.1357421875, -0.455322265625, 0.22509765625, 0.905517578125, 1.5859375, 2.266357421875, 2.94677734375, 3.627197265625, 4.3076171875, 4.988037109375, 5.66845703125, 6.348876953125, 7.029296875, 7.709716796875, 8.39013671875, 9.070556640625, 9.7509765625, 10.431396484375, 11.11181640625, 11.792236328125, 12.47265625, 13.153076171875, 13.83349609375, 14.513916015625, 15.1943359375, 15.874755859375, 16.55517578125, 17.235595703125, 17.916015625, 18.596435546875, 19.27685546875, 19.957275390625, 20.6376953125, 21.318115234375, 21.99853515625, 22.678955078125, 23.359375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 7.0, 3.0, 10.0, 11.0, 7.0, 11.0, 12.0, 17.0, 28.0, 33.0, 60.0, 65.0, 126.0, 201.0, 365.0, 628.0, 830.0, 664.0, 397.0, 208.0, 112.0, 85.0, 70.0, 31.0, 28.0, 16.0, 9.0, 13.0, 9.0, 6.0, 3.0, 3.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.671875, -30.668212890625, -29.66455078125, -28.660888671875, -27.6572265625, -26.653564453125, -25.64990234375, -24.646240234375, -23.642578125, -22.638916015625, -21.63525390625, -20.631591796875, -19.6279296875, -18.624267578125, -17.62060546875, -16.616943359375, -15.61328125, -14.609619140625, -13.60595703125, -12.602294921875, -11.5986328125, -10.594970703125, -9.59130859375, -8.587646484375, -7.583984375, -6.580322265625, -5.57666015625, -4.572998046875, -3.5693359375, -2.565673828125, -1.56201171875, -0.558349609375, 0.4453125, 1.448974609375, 2.45263671875, 3.456298828125, 4.4599609375, 5.463623046875, 6.46728515625, 7.470947265625, 8.474609375, 9.478271484375, 10.48193359375, 11.485595703125, 12.4892578125, 13.492919921875, 14.49658203125, 15.500244140625, 16.50390625, 17.507568359375, 18.51123046875, 19.514892578125, 20.5185546875, 21.522216796875, 22.52587890625, 23.529541015625, 24.533203125, 25.536865234375, 26.54052734375, 27.544189453125, 28.5478515625, 29.551513671875, 30.55517578125, 31.558837890625, 32.5625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 3.0, 4.0, 9.0, 10.0, 13.0, 13.0, 26.0, 26.0, 67.0, 111.0, 238.0, 536.0, 1329.0, 4039.0, 15422.0, 105802.0, 3353093.0, 662955.0, 38524.0, 7965.0, 2447.0, 855.0, 348.0, 180.0, 100.0, 48.0, 34.0, 25.0, 16.0, 13.0, 10.0, 8.0, 6.0, 2.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.34375, -59.52734375, -57.7109375, -55.89453125, -54.078125, -52.26171875, -50.4453125, -48.62890625, -46.8125, -44.99609375, -43.1796875, -41.36328125, -39.546875, -37.73046875, -35.9140625, -34.09765625, -32.28125, -30.46484375, -28.6484375, -26.83203125, -25.015625, -23.19921875, -21.3828125, -19.56640625, -17.75, -15.93359375, -14.1171875, -12.30078125, -10.484375, -8.66796875, -6.8515625, -5.03515625, -3.21875, -1.40234375, 0.4140625, 2.23046875, 4.046875, 5.86328125, 7.6796875, 9.49609375, 11.3125, 13.12890625, 14.9453125, 16.76171875, 18.578125, 20.39453125, 22.2109375, 24.02734375, 25.84375, 27.66015625, 29.4765625, 31.29296875, 33.109375, 34.92578125, 36.7421875, 38.55859375, 40.375, 42.19140625, 44.0078125, 45.82421875, 47.640625, 49.45703125, 51.2734375, 53.08984375, 54.90625]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 6.0, 11.0, 41.0, 115.0, 246.0, 304.0, 173.0, 75.0, 29.0, 6.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-282.99395751953125, -274.4769287109375, -265.95989990234375, -257.4429016113281, -248.92587280273438, -240.40884399414062, -231.89181518554688, -223.37478637695312, -214.85777282714844, -206.3407440185547, -197.82373046875, -189.30670166015625, -180.7896728515625, -172.2726593017578, -163.75563049316406, -155.23861694335938, -146.72158813476562, -138.20455932617188, -129.6875457763672, -121.17051696777344, -112.65349578857422, -104.136474609375, -95.61944580078125, -87.10242462158203, -78.58540344238281, -70.0683822631836, -61.55135726928711, -53.034332275390625, -44.517311096191406, -36.00028991699219, -27.483264923095703, -18.96623992919922, -10.449249267578125, -1.9322261810302734, 6.584796905517578, 15.10181999206543, 23.61884307861328, 32.1358642578125, 40.652889251708984, 49.16991424560547, 57.68693542480469, 66.2039566040039, 74.72097778320312, 83.23800659179688, 91.7550277709961, 100.27204895019531, 108.78907775878906, 117.30609893798828, 125.8231201171875, 134.34014892578125, 142.85716247558594, 151.3741912841797, 159.89120483398438, 168.40823364257812, 176.92526245117188, 185.44229125976562, 193.9593048095703, 202.47633361816406, 210.99334716796875, 219.5103759765625, 228.02740478515625, 236.54441833496094, 245.0614471435547, 253.57846069335938, 262.0954895019531]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 5.0, 7.0, 6.0, 7.0, 5.0, 4.0, 7.0, 14.0, 7.0, 13.0, 17.0, 20.0, 23.0, 26.0, 26.0, 32.0, 26.0, 37.0, 31.0, 35.0, 34.0, 41.0, 52.0, 44.0, 37.0, 47.0, 44.0, 39.0, 42.0, 42.0, 23.0, 30.0, 32.0, 33.0, 16.0, 5.0, 20.0, 17.0, 9.0, 21.0, 9.0, 4.0, 4.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-79.554443359375, -77.22966003417969, -74.9048843383789, -72.5801010131836, -70.25532531738281, -67.9305419921875, -65.60576629638672, -63.280982971191406, -60.95620346069336, -58.63142395019531, -56.306644439697266, -53.98186492919922, -51.657081604003906, -49.332305908203125, -47.00752258300781, -44.682743072509766, -42.35796356201172, -40.03318405151367, -37.708404541015625, -35.38362503051758, -33.05884552001953, -30.73406410217285, -28.409282684326172, -26.084503173828125, -23.759723663330078, -21.43494415283203, -19.110164642333984, -16.785383224487305, -14.460603713989258, -12.135824203491211, -9.811043739318848, -7.486263275146484, -5.161491394042969, -2.8367114067077637, -0.5119314193725586, 1.8128485679626465, 4.137628555297852, 6.462408065795898, 8.787188529968262, 11.111968994140625, 13.436748504638672, 15.761528015136719, 18.086307525634766, 20.411088943481445, 22.735868453979492, 25.06064796447754, 27.38542938232422, 29.710208892822266, 32.03498840332031, 34.35976791381836, 36.684547424316406, 39.00932693481445, 41.3341064453125, 43.65888977050781, 45.98366928100586, 48.308448791503906, 50.63322830200195, 52.9580078125, 55.28278732299805, 57.607566833496094, 59.932350158691406, 62.25712585449219, 64.5819091796875, 66.90669250488281, 69.2314682006836]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 9.0, 19.0, 20.0, 17.0, 20.0, 23.0, 31.0, 36.0, 35.0, 37.0, 44.0, 45.0, 42.0, 52.0, 61.0, 56.0, 61.0, 58.0, 49.0, 50.0, 36.0, 34.0, 43.0, 17.0, 20.0, 13.0, 17.0, 11.0, 17.0, 2.0, 4.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.75, -12.3056640625, -11.861328125, -11.4169921875, -10.97265625, -10.5283203125, -10.083984375, -9.6396484375, -9.1953125, -8.7509765625, -8.306640625, -7.8623046875, -7.41796875, -6.9736328125, -6.529296875, -6.0849609375, -5.640625, -5.1962890625, -4.751953125, -4.3076171875, -3.86328125, -3.4189453125, -2.974609375, -2.5302734375, -2.0859375, -1.6416015625, -1.197265625, -0.7529296875, -0.30859375, 0.1357421875, 0.580078125, 1.0244140625, 1.46875, 1.9130859375, 2.357421875, 2.8017578125, 3.24609375, 3.6904296875, 4.134765625, 4.5791015625, 5.0234375, 5.4677734375, 5.912109375, 6.3564453125, 6.80078125, 7.2451171875, 7.689453125, 8.1337890625, 8.578125, 9.0224609375, 9.466796875, 9.9111328125, 10.35546875, 10.7998046875, 11.244140625, 11.6884765625, 12.1328125, 12.5771484375, 13.021484375, 13.4658203125, 13.91015625, 14.3544921875, 14.798828125, 15.2431640625, 15.6875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 1.0, 5.0, 5.0, 11.0, 21.0, 27.0, 36.0, 67.0, 75.0, 120.0, 191.0, 287.0, 462.0, 710.0, 1199.0, 1862.0, 2986.0, 4878.0, 8149.0, 14378.0, 25935.0, 48907.0, 93298.0, 176578.0, 255657.0, 190361.0, 102589.0, 53490.0, 28122.0, 15476.0, 9092.0, 5079.0, 3182.0, 1942.0, 1211.0, 774.0, 478.0, 304.0, 209.0, 140.0, 71.0, 71.0, 34.0, 27.0, 23.0, 17.0, 8.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21484375, -2.144683837890625, -2.07452392578125, -2.004364013671875, -1.9342041015625, -1.864044189453125, -1.79388427734375, -1.723724365234375, -1.653564453125, -1.583404541015625, -1.51324462890625, -1.443084716796875, -1.3729248046875, -1.302764892578125, -1.23260498046875, -1.162445068359375, -1.09228515625, -1.022125244140625, -0.95196533203125, -0.881805419921875, -0.8116455078125, -0.741485595703125, -0.67132568359375, -0.601165771484375, -0.531005859375, -0.460845947265625, -0.39068603515625, -0.320526123046875, -0.2503662109375, -0.180206298828125, -0.11004638671875, -0.039886474609375, 0.0302734375, 0.100433349609375, 0.17059326171875, 0.240753173828125, 0.3109130859375, 0.381072998046875, 0.45123291015625, 0.521392822265625, 0.591552734375, 0.661712646484375, 0.73187255859375, 0.802032470703125, 0.8721923828125, 0.942352294921875, 1.01251220703125, 1.082672119140625, 1.15283203125, 1.222991943359375, 1.29315185546875, 1.363311767578125, 1.4334716796875, 1.503631591796875, 1.57379150390625, 1.643951416015625, 1.714111328125, 1.784271240234375, 1.85443115234375, 1.924591064453125, 1.9947509765625, 2.064910888671875, 2.13507080078125, 2.205230712890625, 2.275390625]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 2.0, 5.0, 5.0, 3.0, 6.0, 11.0, 10.0, 10.0, 14.0, 16.0, 25.0, 22.0, 17.0, 20.0, 21.0, 34.0, 34.0, 34.0, 37.0, 46.0, 37.0, 31.0, 37.0, 1057.0, 33.0, 36.0, 40.0, 30.0, 37.0, 36.0, 35.0, 32.0, 28.0, 32.0, 20.0, 14.0, 14.0, 14.0, 15.0, 15.0, 16.0, 9.0, 8.0, 5.0, 12.0, 7.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-7.78125, -7.5504150390625, -7.319580078125, -7.0887451171875, -6.85791015625, -6.6270751953125, -6.396240234375, -6.1654052734375, -5.9345703125, -5.7037353515625, -5.472900390625, -5.2420654296875, -5.01123046875, -4.7803955078125, -4.549560546875, -4.3187255859375, -4.087890625, -3.8570556640625, -3.626220703125, -3.3953857421875, -3.16455078125, -2.9337158203125, -2.702880859375, -2.4720458984375, -2.2412109375, -2.0103759765625, -1.779541015625, -1.5487060546875, -1.31787109375, -1.0870361328125, -0.856201171875, -0.6253662109375, -0.39453125, -0.1636962890625, 0.067138671875, 0.2979736328125, 0.52880859375, 0.7596435546875, 0.990478515625, 1.2213134765625, 1.4521484375, 1.6829833984375, 1.913818359375, 2.1446533203125, 2.37548828125, 2.6063232421875, 2.837158203125, 3.0679931640625, 3.298828125, 3.5296630859375, 3.760498046875, 3.9913330078125, 4.22216796875, 4.4530029296875, 4.683837890625, 4.9146728515625, 5.1455078125, 5.3763427734375, 5.607177734375, 5.8380126953125, 6.06884765625, 6.2996826171875, 6.530517578125, 6.7613525390625, 6.9921875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 3.0, 0.0, 4.0, 7.0, 17.0, 14.0, 36.0, 34.0, 61.0, 80.0, 114.0, 148.0, 241.0, 335.0, 455.0, 698.0, 1101.0, 1588.0, 2328.0, 3385.0, 5176.0, 7651.0, 11467.0, 17561.0, 27446.0, 43792.0, 69685.0, 108941.0, 160156.0, 1230615.0, 142440.0, 94194.0, 60133.0, 37522.0, 23748.0, 15164.0, 10030.0, 6684.0, 4731.0, 2963.0, 2078.0, 1350.0, 918.0, 654.0, 409.0, 306.0, 226.0, 143.0, 107.0, 65.0, 44.0, 26.0, 20.0, 11.0, 12.0, 11.0, 9.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.9609375, -0.9312210083007812, -0.9015045166015625, -0.8717880249023438, -0.842071533203125, -0.8123550415039062, -0.7826385498046875, -0.7529220581054688, -0.72320556640625, -0.6934890747070312, -0.6637725830078125, -0.6340560913085938, -0.604339599609375, -0.5746231079101562, -0.5449066162109375, -0.5151901245117188, -0.4854736328125, -0.45575714111328125, -0.4260406494140625, -0.39632415771484375, -0.366607666015625, -0.33689117431640625, -0.3071746826171875, -0.27745819091796875, -0.24774169921875, -0.21802520751953125, -0.1883087158203125, -0.15859222412109375, -0.128875732421875, -0.09915924072265625, -0.0694427490234375, -0.03972625732421875, -0.010009765625, 0.01970672607421875, 0.0494232177734375, 0.07913970947265625, 0.108856201171875, 0.13857269287109375, 0.1682891845703125, 0.19800567626953125, 0.22772216796875, 0.25743865966796875, 0.2871551513671875, 0.31687164306640625, 0.346588134765625, 0.37630462646484375, 0.4060211181640625, 0.43573760986328125, 0.4654541015625, 0.49517059326171875, 0.5248870849609375, 0.5546035766601562, 0.584320068359375, 0.6140365600585938, 0.6437530517578125, 0.6734695434570312, 0.70318603515625, 0.7329025268554688, 0.7626190185546875, 0.7923355102539062, 0.822052001953125, 0.8517684936523438, 0.8814849853515625, 0.9112014770507812, 0.94091796875]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 7.0, 9.0, 14.0, 24.0, 42.0, 70.0, 101.0, 141.0, 175.0, 136.0, 72.0, 53.0, 40.0, 23.0, 15.0, 8.0, 10.0, 9.0, 2.0, 4.0, 0.0, 2.0, 4.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.03997802734375, -0.03890728950500488, -0.037836551666259766, -0.03676581382751465, -0.03569507598876953, -0.034624338150024414, -0.0335536003112793, -0.03248286247253418, -0.03141212463378906, -0.030341386795043945, -0.029270648956298828, -0.02819991111755371, -0.027129173278808594, -0.026058435440063477, -0.02498769760131836, -0.023916959762573242, -0.022846221923828125, -0.021775484085083008, -0.02070474624633789, -0.019634008407592773, -0.018563270568847656, -0.01749253273010254, -0.016421794891357422, -0.015351057052612305, -0.014280319213867188, -0.01320958137512207, -0.012138843536376953, -0.011068105697631836, -0.009997367858886719, -0.008926630020141602, -0.007855892181396484, -0.006785154342651367, -0.00571441650390625, -0.004643678665161133, -0.0035729408264160156, -0.0025022029876708984, -0.0014314651489257812, -0.00036072731018066406, 0.0007100105285644531, 0.0017807483673095703, 0.0028514862060546875, 0.003922224044799805, 0.004992961883544922, 0.006063699722290039, 0.007134437561035156, 0.008205175399780273, 0.00927591323852539, 0.010346651077270508, 0.011417388916015625, 0.012488126754760742, 0.01355886459350586, 0.014629602432250977, 0.015700340270996094, 0.01677107810974121, 0.017841815948486328, 0.018912553787231445, 0.019983291625976562, 0.02105402946472168, 0.022124767303466797, 0.023195505142211914, 0.02426624298095703, 0.02533698081970215, 0.026407718658447266, 0.027478456497192383, 0.0285491943359375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 0.0, 1.0, 5.0, 4.0, 13.0, 19.0, 21.0, 62.0, 94.0, 181.0, 500.0, 7512.0, 1007227.0, 31396.0, 996.0, 266.0, 107.0, 48.0, 23.0, 22.0, 7.0, 8.0, 5.0, 0.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.60400390625, -0.5813446044921875, -0.558685302734375, -0.5360260009765625, -0.51336669921875, -0.4907073974609375, -0.468048095703125, -0.4453887939453125, -0.4227294921875, -0.4000701904296875, -0.377410888671875, -0.3547515869140625, -0.33209228515625, -0.3094329833984375, -0.286773681640625, -0.2641143798828125, -0.241455078125, -0.2187957763671875, -0.196136474609375, -0.1734771728515625, -0.15081787109375, -0.1281585693359375, -0.105499267578125, -0.0828399658203125, -0.0601806640625, -0.0375213623046875, -0.014862060546875, 0.0077972412109375, 0.03045654296875, 0.0531158447265625, 0.075775146484375, 0.0984344482421875, 0.12109375, 0.1437530517578125, 0.166412353515625, 0.1890716552734375, 0.21173095703125, 0.2343902587890625, 0.257049560546875, 0.2797088623046875, 0.3023681640625, 0.3250274658203125, 0.347686767578125, 0.3703460693359375, 0.39300537109375, 0.4156646728515625, 0.438323974609375, 0.4609832763671875, 0.483642578125, 0.5063018798828125, 0.528961181640625, 0.5516204833984375, 0.57427978515625, 0.5969390869140625, 0.619598388671875, 0.6422576904296875, 0.6649169921875, 0.6875762939453125, 0.710235595703125, 0.7328948974609375, 0.75555419921875, 0.7782135009765625, 0.800872802734375, 0.8235321044921875, 0.84619140625]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 8.0, 18.0, 72.0, 292.0, 390.0, 141.0, 51.0, 19.0, 9.0, 7.0, 7.0], "bins": [-0.28634798526763916, -0.2813399136066437, -0.2763318419456482, -0.2713237702846527, -0.2663156986236572, -0.26130759716033936, -0.25629952549934387, -0.2512914538383484, -0.2462833821773529, -0.24127531051635742, -0.23626723885536194, -0.23125915229320526, -0.22625108063220978, -0.2212430089712143, -0.2162349373102188, -0.21122686564922333, -0.20621879398822784, -0.20121072232723236, -0.19620265066623688, -0.1911945641040802, -0.18618649244308472, -0.18117842078208923, -0.17617034912109375, -0.17116227746009827, -0.16615420579910278, -0.1611461341381073, -0.15613806247711182, -0.15112997591495514, -0.14612190425395966, -0.14111383259296417, -0.1361057609319687, -0.1310976892709732, -0.12608958780765533, -0.12108151614665985, -0.11607343703508377, -0.11106536537408829, -0.10605728626251221, -0.10104921460151672, -0.09604114294052124, -0.09103307127952576, -0.08602499961853027, -0.08101692795753479, -0.07600884884595871, -0.07100077718496323, -0.06599269807338715, -0.06098462641239166, -0.05597655475139618, -0.0509684793651104, -0.04596040025353432, -0.040952324867248535, -0.03594425320625305, -0.03093617781996727, -0.025928102433681488, -0.020920027047395706, -0.015911953523755074, -0.010903880000114441, -0.005895804613828659, -0.0008877301588654518, 0.004120344296097755, 0.009128418751060963, 0.01413649320602417, 0.019144568592309952, 0.024152642115950584, 0.029160715639591217, 0.034168791025877]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 6.0, 3.0, 11.0, 4.0, 9.0, 0.0, 8.0, 13.0, 16.0, 18.0, 14.0, 22.0, 17.0, 36.0, 19.0, 32.0, 30.0, 36.0, 44.0, 41.0, 35.0, 43.0, 30.0, 27.0, 43.0, 38.0, 32.0, 30.0, 26.0, 32.0, 30.0, 28.0, 20.0, 34.0, 13.0, 16.0, 28.0, 19.0, 16.0, 16.0, 13.0, 10.0, 14.0, 6.0, 12.0, 2.0, 7.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.014987409114837646, -0.014529501087963581, -0.014071593061089516, -0.01361368503421545, -0.013155777007341385, -0.01269786898046732, -0.012239960953593254, -0.011782052926719189, -0.011324144899845123, -0.010866236872971058, -0.010408328846096992, -0.009950420819222927, -0.009492512792348862, -0.009034604765474796, -0.008576696738600731, -0.008118788711726665, -0.0076608806848526, -0.007202972657978535, -0.006745064631104469, -0.006287156604230404, -0.0058292485773563385, -0.005371340550482273, -0.004913432523608208, -0.004455524496734142, -0.003997616469860077, -0.0035397084429860115, -0.003081800416111946, -0.0026238923892378807, -0.0021659843623638153, -0.00170807633548975, -0.0012501683086156845, -0.0007922602817416191, -0.0003343522548675537, 0.0001235557720065117, 0.0005814637988805771, 0.0010393718257546425, 0.0014972798526287079, 0.0019551878795027733, 0.0024130959063768387, 0.002871003933250904, 0.0033289119601249695, 0.003786819986999035, 0.0042447280138731, 0.004702636040747166, 0.005160544067621231, 0.0056184520944952965, 0.006076360121369362, 0.006534268148243427, 0.006992176175117493, 0.007450084201991558, 0.007907992228865623, 0.008365900255739689, 0.008823808282613754, 0.00928171630948782, 0.009739624336361885, 0.01019753236323595, 0.010655440390110016, 0.011113348416984081, 0.011571256443858147, 0.012029164470732212, 0.012487072497606277, 0.012944980524480343, 0.013402888551354408, 0.013860796578228474, 0.014318704605102539]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 9.0, 9.0, 19.0, 20.0, 17.0, 20.0, 23.0, 31.0, 36.0, 35.0, 37.0, 44.0, 45.0, 42.0, 52.0, 61.0, 56.0, 60.0, 59.0, 49.0, 50.0, 36.0, 34.0, 43.0, 17.0, 20.0, 13.0, 17.0, 11.0, 17.0, 2.0, 4.0, 3.0, 5.0, 1.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.75, -12.3056640625, -11.861328125, -11.4169921875, -10.97265625, -10.5283203125, -10.083984375, -9.6396484375, -9.1953125, -8.7509765625, -8.306640625, -7.8623046875, -7.41796875, -6.9736328125, -6.529296875, -6.0849609375, -5.640625, -5.1962890625, -4.751953125, -4.3076171875, -3.86328125, -3.4189453125, -2.974609375, -2.5302734375, -2.0859375, -1.6416015625, -1.197265625, -0.7529296875, -0.30859375, 0.1357421875, 0.580078125, 1.0244140625, 1.46875, 1.9130859375, 2.357421875, 2.8017578125, 3.24609375, 3.6904296875, 4.134765625, 4.5791015625, 5.0234375, 5.4677734375, 5.912109375, 6.3564453125, 6.80078125, 7.2451171875, 7.689453125, 8.1337890625, 8.578125, 9.0224609375, 9.466796875, 9.9111328125, 10.35546875, 10.7998046875, 11.244140625, 11.6884765625, 12.1328125, 12.5771484375, 13.021484375, 13.4658203125, 13.91015625, 14.3544921875, 14.798828125, 15.2431640625, 15.6875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 8.0, 7.0, 5.0, 14.0, 14.0, 23.0, 30.0, 30.0, 28.0, 45.0, 89.0, 90.0, 158.0, 177.0, 259.0, 393.0, 556.0, 905.0, 1429.0, 2280.0, 3739.0, 7100.0, 15495.0, 51292.0, 309450.0, 538124.0, 76250.0, 20314.0, 8538.0, 4413.0, 2513.0, 1579.0, 957.0, 646.0, 465.0, 312.0, 219.0, 178.0, 109.0, 92.0, 49.0, 49.0, 37.0, 25.0, 18.0, 13.0, 10.0, 4.0, 8.0, 3.0, 5.0, 8.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-16.53125, -16.000244140625, -15.46923828125, -14.938232421875, -14.4072265625, -13.876220703125, -13.34521484375, -12.814208984375, -12.283203125, -11.752197265625, -11.22119140625, -10.690185546875, -10.1591796875, -9.628173828125, -9.09716796875, -8.566162109375, -8.03515625, -7.504150390625, -6.97314453125, -6.442138671875, -5.9111328125, -5.380126953125, -4.84912109375, -4.318115234375, -3.787109375, -3.256103515625, -2.72509765625, -2.194091796875, -1.6630859375, -1.132080078125, -0.60107421875, -0.070068359375, 0.4609375, 0.991943359375, 1.52294921875, 2.053955078125, 2.5849609375, 3.115966796875, 3.64697265625, 4.177978515625, 4.708984375, 5.239990234375, 5.77099609375, 6.302001953125, 6.8330078125, 7.364013671875, 7.89501953125, 8.426025390625, 8.95703125, 9.488037109375, 10.01904296875, 10.550048828125, 11.0810546875, 11.612060546875, 12.14306640625, 12.674072265625, 13.205078125, 13.736083984375, 14.26708984375, 14.798095703125, 15.3291015625, 15.860107421875, 16.39111328125, 16.922119140625, 17.453125]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 5.0, 0.0, 4.0, 6.0, 2.0, 9.0, 8.0, 8.0, 21.0, 10.0, 18.0, 23.0, 31.0, 44.0, 30.0, 32.0, 55.0, 43.0, 70.0, 104.0, 376.0, 1579.0, 135.0, 64.0, 55.0, 41.0, 42.0, 35.0, 31.0, 24.0, 24.0, 22.0, 19.0, 18.0, 19.0, 11.0, 10.0, 1.0, 9.0, 5.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-47.25, -45.8232421875, -44.396484375, -42.9697265625, -41.54296875, -40.1162109375, -38.689453125, -37.2626953125, -35.8359375, -34.4091796875, -32.982421875, -31.5556640625, -30.12890625, -28.7021484375, -27.275390625, -25.8486328125, -24.421875, -22.9951171875, -21.568359375, -20.1416015625, -18.71484375, -17.2880859375, -15.861328125, -14.4345703125, -13.0078125, -11.5810546875, -10.154296875, -8.7275390625, -7.30078125, -5.8740234375, -4.447265625, -3.0205078125, -1.59375, -0.1669921875, 1.259765625, 2.6865234375, 4.11328125, 5.5400390625, 6.966796875, 8.3935546875, 9.8203125, 11.2470703125, 12.673828125, 14.1005859375, 15.52734375, 16.9541015625, 18.380859375, 19.8076171875, 21.234375, 22.6611328125, 24.087890625, 25.5146484375, 26.94140625, 28.3681640625, 29.794921875, 31.2216796875, 32.6484375, 34.0751953125, 35.501953125, 36.9287109375, 38.35546875, 39.7822265625, 41.208984375, 42.6357421875, 44.0625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 6.0, 3.0, 7.0, 5.0, 4.0, 13.0, 12.0, 26.0, 18.0, 36.0, 39.0, 38.0, 66.0, 87.0, 114.0, 179.0, 282.0, 715.0, 2858.0, 45459.0, 3073692.0, 18692.0, 1980.0, 522.0, 275.0, 134.0, 98.0, 102.0, 57.0, 37.0, 30.0, 29.0, 21.0, 16.0, 12.0, 11.0, 7.0, 4.0, 6.0, 2.0, 7.0, 3.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-90.75, -87.662109375, -84.57421875, -81.486328125, -78.3984375, -75.310546875, -72.22265625, -69.134765625, -66.046875, -62.958984375, -59.87109375, -56.783203125, -53.6953125, -50.607421875, -47.51953125, -44.431640625, -41.34375, -38.255859375, -35.16796875, -32.080078125, -28.9921875, -25.904296875, -22.81640625, -19.728515625, -16.640625, -13.552734375, -10.46484375, -7.376953125, -4.2890625, -1.201171875, 1.88671875, 4.974609375, 8.0625, 11.150390625, 14.23828125, 17.326171875, 20.4140625, 23.501953125, 26.58984375, 29.677734375, 32.765625, 35.853515625, 38.94140625, 42.029296875, 45.1171875, 48.205078125, 51.29296875, 54.380859375, 57.46875, 60.556640625, 63.64453125, 66.732421875, 69.8203125, 72.908203125, 75.99609375, 79.083984375, 82.171875, 85.259765625, 88.34765625, 91.435546875, 94.5234375, 97.611328125, 100.69921875, 103.787109375, 106.875]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 178.0, 830.0, 8.0, 1.0, 0.0, 1.0], "bins": [-1408.3238525390625, -1384.528564453125, -1360.7333984375, -1336.9381103515625, -1313.142822265625, -1289.34765625, -1265.5523681640625, -1241.7572021484375, -1217.9619140625, -1194.1666259765625, -1170.3714599609375, -1146.576171875, -1122.781005859375, -1098.9857177734375, -1075.1904296875, -1051.395263671875, -1027.5999755859375, -1003.8047485351562, -980.009521484375, -956.2142333984375, -932.4190063476562, -908.623779296875, -884.8284912109375, -861.0332641601562, -837.238037109375, -813.4428100585938, -789.6475830078125, -765.852294921875, -742.0570678710938, -718.2618408203125, -694.466552734375, -670.6713256835938, -646.8760986328125, -623.0808715820312, -599.28564453125, -575.4903564453125, -551.6951293945312, -527.89990234375, -504.1046447753906, -480.30938720703125, -456.51416015625, -432.71893310546875, -408.9236755371094, -385.12841796875, -361.33319091796875, -337.5379638671875, -313.7427062988281, -289.94744873046875, -266.1522216796875, -242.3569793701172, -218.56173706054688, -194.76649475097656, -170.97125244140625, -147.17601013183594, -123.38076782226562, -99.58552551269531, -75.79027557373047, -51.995033264160156, -28.199790954589844, -4.404548645019531, 19.39069366455078, 43.185935974121094, 66.9811782836914, 90.77642059326172, 114.57166290283203]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 2.0, 9.0, 7.0, 6.0, 9.0, 12.0, 17.0, 14.0, 20.0, 25.0, 22.0, 21.0, 29.0, 31.0, 46.0, 27.0, 43.0, 41.0, 39.0, 31.0, 37.0, 39.0, 44.0, 39.0, 39.0, 33.0, 36.0, 41.0, 27.0, 26.0, 23.0, 24.0, 24.0, 25.0, 19.0, 20.0, 12.0, 5.0, 6.0, 9.0, 5.0, 3.0, 4.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-100.46959686279297, -97.39745330810547, -94.32530975341797, -91.25316619873047, -88.18102264404297, -85.10887908935547, -82.0367431640625, -78.964599609375, -75.8924560546875, -72.8203125, -69.7481689453125, -66.676025390625, -63.6038818359375, -60.53173828125, -57.459598541259766, -54.387454986572266, -51.3153076171875, -48.2431640625, -45.1710205078125, -42.098876953125, -39.0267333984375, -35.95458984375, -32.882450103759766, -29.810306549072266, -26.738162994384766, -23.666019439697266, -20.593875885009766, -17.5217342376709, -14.449590682983398, -11.377447128295898, -8.305305480957031, -5.233161926269531, -2.1610183715820312, 0.9111247062683105, 3.9832677841186523, 7.055410385131836, 10.127553939819336, 13.199697494506836, 16.271839141845703, 19.343982696533203, 22.416126251220703, 25.488269805908203, 28.560413360595703, 31.63255500793457, 34.70469665527344, 37.77684020996094, 40.84898376464844, 43.92112731933594, 46.99327087402344, 50.06541442871094, 53.13755798339844, 56.20970153808594, 59.28184509277344, 62.35398864746094, 65.42613220214844, 68.49827575683594, 71.57041931152344, 74.64256286621094, 77.71470642089844, 80.78684997558594, 83.85899353027344, 86.93113708496094, 90.00328063964844, 93.07542419433594, 96.1475601196289]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 2.0, 3.0, 8.0, 13.0, 18.0, 18.0, 19.0, 22.0, 26.0, 37.0, 36.0, 27.0, 38.0, 30.0, 51.0, 68.0, 39.0, 51.0, 65.0, 68.0, 57.0, 45.0, 42.0, 34.0, 27.0, 40.0, 33.0, 19.0, 9.0, 11.0, 17.0, 13.0, 5.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.8515625, -12.3848876953125, -11.918212890625, -11.4515380859375, -10.98486328125, -10.5181884765625, -10.051513671875, -9.5848388671875, -9.1181640625, -8.6514892578125, -8.184814453125, -7.7181396484375, -7.25146484375, -6.7847900390625, -6.318115234375, -5.8514404296875, -5.384765625, -4.9180908203125, -4.451416015625, -3.9847412109375, -3.51806640625, -3.0513916015625, -2.584716796875, -2.1180419921875, -1.6513671875, -1.1846923828125, -0.718017578125, -0.2513427734375, 0.21533203125, 0.6820068359375, 1.148681640625, 1.6153564453125, 2.08203125, 2.5487060546875, 3.015380859375, 3.4820556640625, 3.94873046875, 4.4154052734375, 4.882080078125, 5.3487548828125, 5.8154296875, 6.2821044921875, 6.748779296875, 7.2154541015625, 7.68212890625, 8.1488037109375, 8.615478515625, 9.0821533203125, 9.548828125, 10.0155029296875, 10.482177734375, 10.9488525390625, 11.41552734375, 11.8822021484375, 12.348876953125, 12.8155517578125, 13.2822265625, 13.7489013671875, 14.215576171875, 14.6822509765625, 15.14892578125, 15.6156005859375, 16.082275390625, 16.5489501953125, 17.015625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 2.0, 2.0, 3.0, 12.0, 20.0, 17.0, 16.0, 16.0, 30.0, 32.0, 51.0, 83.0, 140.0, 449.0, 1182.0, 4153.0, 20147.0, 589019.0, 3496762.0, 70688.0, 8200.0, 2006.0, 640.0, 244.0, 118.0, 67.0, 57.0, 34.0, 23.0, 9.0, 10.0, 17.0, 11.0, 8.0, 6.0, 2.0, 4.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.8125, -43.1064453125, -41.400390625, -39.6943359375, -37.98828125, -36.2822265625, -34.576171875, -32.8701171875, -31.1640625, -29.4580078125, -27.751953125, -26.0458984375, -24.33984375, -22.6337890625, -20.927734375, -19.2216796875, -17.515625, -15.8095703125, -14.103515625, -12.3974609375, -10.69140625, -8.9853515625, -7.279296875, -5.5732421875, -3.8671875, -2.1611328125, -0.455078125, 1.2509765625, 2.95703125, 4.6630859375, 6.369140625, 8.0751953125, 9.78125, 11.4873046875, 13.193359375, 14.8994140625, 16.60546875, 18.3115234375, 20.017578125, 21.7236328125, 23.4296875, 25.1357421875, 26.841796875, 28.5478515625, 30.25390625, 31.9599609375, 33.666015625, 35.3720703125, 37.078125, 38.7841796875, 40.490234375, 42.1962890625, 43.90234375, 45.6083984375, 47.314453125, 49.0205078125, 50.7265625, 52.4326171875, 54.138671875, 55.8447265625, 57.55078125, 59.2568359375, 60.962890625, 62.6689453125, 64.375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 15.0, 5.0, 7.0, 15.0, 19.0, 21.0, 35.0, 69.0, 70.0, 119.0, 224.0, 410.0, 712.0, 886.0, 640.0, 396.0, 156.0, 79.0, 63.0, 44.0, 27.0, 17.0, 20.0, 9.0, 2.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.09375, -34.97705078125, -33.8603515625, -32.74365234375, -31.626953125, -30.51025390625, -29.3935546875, -28.27685546875, -27.16015625, -26.04345703125, -24.9267578125, -23.81005859375, -22.693359375, -21.57666015625, -20.4599609375, -19.34326171875, -18.2265625, -17.10986328125, -15.9931640625, -14.87646484375, -13.759765625, -12.64306640625, -11.5263671875, -10.40966796875, -9.29296875, -8.17626953125, -7.0595703125, -5.94287109375, -4.826171875, -3.70947265625, -2.5927734375, -1.47607421875, -0.359375, 0.75732421875, 1.8740234375, 2.99072265625, 4.107421875, 5.22412109375, 6.3408203125, 7.45751953125, 8.57421875, 9.69091796875, 10.8076171875, 11.92431640625, 13.041015625, 14.15771484375, 15.2744140625, 16.39111328125, 17.5078125, 18.62451171875, 19.7412109375, 20.85791015625, 21.974609375, 23.09130859375, 24.2080078125, 25.32470703125, 26.44140625, 27.55810546875, 28.6748046875, 29.79150390625, 30.908203125, 32.02490234375, 33.1416015625, 34.25830078125, 35.375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 5.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 25.0, 30.0, 44.0, 80.0, 149.0, 338.0, 1073.0, 4737.0, 41737.0, 2965491.0, 1149681.0, 25876.0, 3531.0, 784.0, 287.0, 156.0, 90.0, 45.0, 28.0, 18.0, 23.0, 7.0, 10.0, 11.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.6875, -75.2529296875, -72.818359375, -70.3837890625, -67.94921875, -65.5146484375, -63.080078125, -60.6455078125, -58.2109375, -55.7763671875, -53.341796875, -50.9072265625, -48.47265625, -46.0380859375, -43.603515625, -41.1689453125, -38.734375, -36.2998046875, -33.865234375, -31.4306640625, -28.99609375, -26.5615234375, -24.126953125, -21.6923828125, -19.2578125, -16.8232421875, -14.388671875, -11.9541015625, -9.51953125, -7.0849609375, -4.650390625, -2.2158203125, 0.21875, 2.6533203125, 5.087890625, 7.5224609375, 9.95703125, 12.3916015625, 14.826171875, 17.2607421875, 19.6953125, 22.1298828125, 24.564453125, 26.9990234375, 29.43359375, 31.8681640625, 34.302734375, 36.7373046875, 39.171875, 41.6064453125, 44.041015625, 46.4755859375, 48.91015625, 51.3447265625, 53.779296875, 56.2138671875, 58.6484375, 61.0830078125, 63.517578125, 65.9521484375, 68.38671875, 70.8212890625, 73.255859375, 75.6904296875, 78.125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 9.0, 35.0, 118.0, 250.0, 328.0, 175.0, 62.0, 25.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-311.44061279296875, -302.3659362792969, -293.2912902832031, -284.21661376953125, -275.1419677734375, -266.0672912597656, -256.9926452636719, -247.91796875, -238.84332275390625, -229.76866149902344, -220.69400024414062, -211.6193389892578, -202.544677734375, -193.4700164794922, -184.39535522460938, -175.3206787109375, -166.2460174560547, -157.17135620117188, -148.09669494628906, -139.02203369140625, -129.94737243652344, -120.87271118164062, -111.79804229736328, -102.72338104248047, -93.64871978759766, -84.57405853271484, -75.49939727783203, -66.42472839355469, -57.35007095336914, -48.27540969848633, -39.20074462890625, -30.126083374023438, -21.051422119140625, -11.976759910583496, -2.902097702026367, 6.172565460205078, 15.24722671508789, 24.321887969970703, 33.39655303955078, 42.471214294433594, 51.545875549316406, 60.62053680419922, 69.69519805908203, 78.76986694335938, 87.84452819824219, 96.919189453125, 105.99385070800781, 115.06851196289062, 124.14317321777344, 133.21783447265625, 142.29249572753906, 151.36715698242188, 160.4418182373047, 169.5164794921875, 178.59115600585938, 187.66580200195312, 196.740478515625, 205.8151397705078, 214.88980102539062, 223.96446228027344, 233.03912353515625, 242.11378479003906, 251.18844604492188, 260.26312255859375, 269.3377685546875]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 4.0, 2.0, 3.0, 4.0, 6.0, 7.0, 3.0, 6.0, 16.0, 19.0, 18.0, 15.0, 19.0, 17.0, 24.0, 13.0, 29.0, 23.0, 21.0, 34.0, 33.0, 29.0, 38.0, 38.0, 36.0, 47.0, 33.0, 45.0, 45.0, 40.0, 37.0, 29.0, 26.0, 30.0, 26.0, 14.0, 20.0, 22.0, 25.0, 20.0, 14.0, 15.0, 15.0, 11.0, 8.0, 4.0, 10.0, 3.0, 4.0, 2.0, 5.0, 1.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-65.13229370117188, -62.97682571411133, -60.821353912353516, -58.66588592529297, -56.510414123535156, -54.35494613647461, -52.19947814941406, -50.04400634765625, -47.8885383605957, -45.733070373535156, -43.577598571777344, -41.4221305847168, -39.26666259765625, -37.11119079589844, -34.95572280883789, -32.800254821777344, -30.64478302001953, -28.48931312561035, -26.333843231201172, -24.178375244140625, -22.022905349731445, -19.867435455322266, -17.71196746826172, -15.556497573852539, -13.40102767944336, -11.24555778503418, -9.090088844299316, -6.934619426727295, -4.779150009155273, -2.6236801147460938, -0.46821117401123047, 1.6872577667236328, 3.8427276611328125, 5.998197078704834, 8.153666496276855, 10.309135437011719, 12.464605331420898, 14.620075225830078, 16.775543212890625, 18.931013107299805, 21.086483001708984, 23.241952896118164, 25.397422790527344, 27.55289077758789, 29.70836067199707, 31.86383056640625, 34.0192985534668, 36.174766540527344, 38.330238342285156, 40.4857063293457, 42.641178131103516, 44.79664611816406, 46.952117919921875, 49.10758590698242, 51.26305389404297, 53.41852569580078, 55.57399368286133, 57.729461669921875, 59.88493347167969, 62.040401458740234, 64.19586944580078, 66.3513412475586, 68.5068130493164, 70.66227722167969, 72.8177490234375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 11.0, 16.0, 16.0, 12.0, 23.0, 13.0, 21.0, 24.0, 25.0, 23.0, 36.0, 33.0, 39.0, 43.0, 38.0, 45.0, 51.0, 62.0, 48.0, 48.0, 37.0, 52.0, 43.0, 36.0, 31.0, 30.0, 23.0, 22.0, 25.0, 18.0, 13.0, 4.0, 14.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.617431640625, -10.21142578125, -9.805419921875, -9.3994140625, -8.993408203125, -8.58740234375, -8.181396484375, -7.775390625, -7.369384765625, -6.96337890625, -6.557373046875, -6.1513671875, -5.745361328125, -5.33935546875, -4.933349609375, -4.52734375, -4.121337890625, -3.71533203125, -3.309326171875, -2.9033203125, -2.497314453125, -2.09130859375, -1.685302734375, -1.279296875, -0.873291015625, -0.46728515625, -0.061279296875, 0.3447265625, 0.750732421875, 1.15673828125, 1.562744140625, 1.96875, 2.374755859375, 2.78076171875, 3.186767578125, 3.5927734375, 3.998779296875, 4.40478515625, 4.810791015625, 5.216796875, 5.622802734375, 6.02880859375, 6.434814453125, 6.8408203125, 7.246826171875, 7.65283203125, 8.058837890625, 8.46484375, 8.870849609375, 9.27685546875, 9.682861328125, 10.0888671875, 10.494873046875, 10.90087890625, 11.306884765625, 11.712890625, 12.118896484375, 12.52490234375, 12.930908203125, 13.3369140625, 13.742919921875, 14.14892578125, 14.554931640625, 14.9609375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 2.0, 3.0, 9.0, 15.0, 14.0, 27.0, 34.0, 67.0, 106.0, 145.0, 218.0, 332.0, 500.0, 790.0, 1151.0, 1770.0, 2693.0, 4203.0, 6459.0, 10296.0, 16638.0, 27387.0, 45926.0, 76804.0, 127554.0, 196307.0, 198143.0, 130193.0, 78920.0, 47005.0, 28150.0, 17072.0, 10796.0, 6677.0, 4251.0, 2708.0, 1770.0, 1133.0, 822.0, 483.0, 337.0, 238.0, 143.0, 96.0, 59.0, 42.0, 24.0, 20.0, 8.0, 6.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.984375, -1.9224090576171875, -1.860443115234375, -1.7984771728515625, -1.73651123046875, -1.6745452880859375, -1.612579345703125, -1.5506134033203125, -1.4886474609375, -1.4266815185546875, -1.364715576171875, -1.3027496337890625, -1.24078369140625, -1.1788177490234375, -1.116851806640625, -1.0548858642578125, -0.992919921875, -0.9309539794921875, -0.868988037109375, -0.8070220947265625, -0.74505615234375, -0.6830902099609375, -0.621124267578125, -0.5591583251953125, -0.4971923828125, -0.4352264404296875, -0.373260498046875, -0.3112945556640625, -0.24932861328125, -0.1873626708984375, -0.125396728515625, -0.0634307861328125, -0.00146484375, 0.0605010986328125, 0.122467041015625, 0.1844329833984375, 0.24639892578125, 0.3083648681640625, 0.370330810546875, 0.4322967529296875, 0.4942626953125, 0.5562286376953125, 0.618194580078125, 0.6801605224609375, 0.74212646484375, 0.8040924072265625, 0.866058349609375, 0.9280242919921875, 0.989990234375, 1.0519561767578125, 1.113922119140625, 1.1758880615234375, 1.23785400390625, 1.2998199462890625, 1.361785888671875, 1.4237518310546875, 1.4857177734375, 1.5476837158203125, 1.609649658203125, 1.6716156005859375, 1.73358154296875, 1.7955474853515625, 1.857513427734375, 1.9194793701171875, 1.9814453125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 2.0, 7.0, 5.0, 7.0, 6.0, 7.0, 14.0, 14.0, 12.0, 24.0, 25.0, 27.0, 24.0, 23.0, 28.0, 40.0, 42.0, 40.0, 47.0, 37.0, 35.0, 1067.0, 47.0, 42.0, 37.0, 37.0, 25.0, 33.0, 34.0, 40.0, 36.0, 17.0, 32.0, 21.0, 12.0, 14.0, 14.0, 10.0, 9.0, 5.0, 4.0, 6.0, 9.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.59375, -8.336181640625, -8.07861328125, -7.821044921875, -7.5634765625, -7.305908203125, -7.04833984375, -6.790771484375, -6.533203125, -6.275634765625, -6.01806640625, -5.760498046875, -5.5029296875, -5.245361328125, -4.98779296875, -4.730224609375, -4.47265625, -4.215087890625, -3.95751953125, -3.699951171875, -3.4423828125, -3.184814453125, -2.92724609375, -2.669677734375, -2.412109375, -2.154541015625, -1.89697265625, -1.639404296875, -1.3818359375, -1.124267578125, -0.86669921875, -0.609130859375, -0.3515625, -0.093994140625, 0.16357421875, 0.421142578125, 0.6787109375, 0.936279296875, 1.19384765625, 1.451416015625, 1.708984375, 1.966552734375, 2.22412109375, 2.481689453125, 2.7392578125, 2.996826171875, 3.25439453125, 3.511962890625, 3.76953125, 4.027099609375, 4.28466796875, 4.542236328125, 4.7998046875, 5.057373046875, 5.31494140625, 5.572509765625, 5.830078125, 6.087646484375, 6.34521484375, 6.602783203125, 6.8603515625, 7.117919921875, 7.37548828125, 7.633056640625, 7.890625]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 8.0, 5.0, 5.0, 11.0, 13.0, 30.0, 33.0, 46.0, 73.0, 111.0, 171.0, 225.0, 370.0, 446.0, 802.0, 1308.0, 1978.0, 3112.0, 4941.0, 8122.0, 13218.0, 21679.0, 36798.0, 63178.0, 110043.0, 183275.0, 1268947.0, 156714.0, 91325.0, 52123.0, 30317.0, 18089.0, 10980.0, 6965.0, 4225.0, 2635.0, 1653.0, 1053.0, 668.0, 479.0, 334.0, 195.0, 132.0, 106.0, 64.0, 42.0, 36.0, 25.0, 9.0, 6.0, 11.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-1.189453125, -1.1514892578125, -1.113525390625, -1.0755615234375, -1.03759765625, -0.9996337890625, -0.961669921875, -0.9237060546875, -0.8857421875, -0.8477783203125, -0.809814453125, -0.7718505859375, -0.73388671875, -0.6959228515625, -0.657958984375, -0.6199951171875, -0.58203125, -0.5440673828125, -0.506103515625, -0.4681396484375, -0.43017578125, -0.3922119140625, -0.354248046875, -0.3162841796875, -0.2783203125, -0.2403564453125, -0.202392578125, -0.1644287109375, -0.12646484375, -0.0885009765625, -0.050537109375, -0.0125732421875, 0.025390625, 0.0633544921875, 0.101318359375, 0.1392822265625, 0.17724609375, 0.2152099609375, 0.253173828125, 0.2911376953125, 0.3291015625, 0.3670654296875, 0.405029296875, 0.4429931640625, 0.48095703125, 0.5189208984375, 0.556884765625, 0.5948486328125, 0.6328125, 0.6707763671875, 0.708740234375, 0.7467041015625, 0.78466796875, 0.8226318359375, 0.860595703125, 0.8985595703125, 0.9365234375, 0.9744873046875, 1.012451171875, 1.0504150390625, 1.08837890625, 1.1263427734375, 1.164306640625, 1.2022705078125, 1.240234375]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 5.0, 1.0, 4.0, 1.0, 2.0, 2.0, 11.0, 8.0, 5.0, 17.0, 17.0, 24.0, 34.0, 43.0, 49.0, 73.0, 120.0, 191.0, 128.0, 69.0, 47.0, 43.0, 17.0, 25.0, 15.0, 10.0, 8.0, 7.0, 4.0, 5.0, 2.0, 3.0, 4.0, 3.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.042144775390625, -0.040712833404541016, -0.03928089141845703, -0.03784894943237305, -0.03641700744628906, -0.03498506546020508, -0.033553123474121094, -0.03212118148803711, -0.030689239501953125, -0.02925729751586914, -0.027825355529785156, -0.026393413543701172, -0.024961471557617188, -0.023529529571533203, -0.02209758758544922, -0.020665645599365234, -0.01923370361328125, -0.017801761627197266, -0.01636981964111328, -0.014937877655029297, -0.013505935668945312, -0.012073993682861328, -0.010642051696777344, -0.00921010971069336, -0.007778167724609375, -0.006346225738525391, -0.004914283752441406, -0.003482341766357422, -0.0020503997802734375, -0.0006184577941894531, 0.0008134841918945312, 0.0022454261779785156, 0.0036773681640625, 0.005109310150146484, 0.006541252136230469, 0.007973194122314453, 0.009405136108398438, 0.010837078094482422, 0.012269020080566406, 0.01370096206665039, 0.015132904052734375, 0.01656484603881836, 0.017996788024902344, 0.019428730010986328, 0.020860671997070312, 0.022292613983154297, 0.02372455596923828, 0.025156497955322266, 0.02658843994140625, 0.028020381927490234, 0.02945232391357422, 0.030884265899658203, 0.03231620788574219, 0.03374814987182617, 0.035180091857910156, 0.03661203384399414, 0.038043975830078125, 0.03947591781616211, 0.040907859802246094, 0.04233980178833008, 0.04377174377441406, 0.04520368576049805, 0.04663562774658203, 0.048067569732666016, 0.04949951171875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 3.0, 7.0, 10.0, 9.0, 16.0, 20.0, 41.0, 55.0, 90.0, 182.0, 767.0, 18342.0, 1021624.0, 6430.0, 505.0, 161.0, 81.0, 57.0, 38.0, 29.0, 13.0, 17.0, 5.0, 8.0, 6.0, 3.0, 4.0, 1.0, 3.0, 4.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.05078125, -1.0202255249023438, -0.9896697998046875, -0.9591140747070312, -0.928558349609375, -0.8980026245117188, -0.8674468994140625, -0.8368911743164062, -0.80633544921875, -0.7757797241210938, -0.7452239990234375, -0.7146682739257812, -0.684112548828125, -0.6535568237304688, -0.6230010986328125, -0.5924453735351562, -0.5618896484375, -0.5313339233398438, -0.5007781982421875, -0.47022247314453125, -0.439666748046875, -0.40911102294921875, -0.3785552978515625, -0.34799957275390625, -0.31744384765625, -0.28688812255859375, -0.2563323974609375, -0.22577667236328125, -0.195220947265625, -0.16466522216796875, -0.1341094970703125, -0.10355377197265625, -0.072998046875, -0.04244232177734375, -0.0118865966796875, 0.01866912841796875, 0.049224853515625, 0.07978057861328125, 0.1103363037109375, 0.14089202880859375, 0.17144775390625, 0.20200347900390625, 0.2325592041015625, 0.26311492919921875, 0.293670654296875, 0.32422637939453125, 0.3547821044921875, 0.38533782958984375, 0.4158935546875, 0.44644927978515625, 0.4770050048828125, 0.5075607299804688, 0.538116455078125, 0.5686721801757812, 0.5992279052734375, 0.6297836303710938, 0.66033935546875, 0.6908950805664062, 0.7214508056640625, 0.7520065307617188, 0.782562255859375, 0.8131179809570312, 0.8436737060546875, 0.8742294311523438, 0.90478515625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 25.0, 114.0, 479.0, 285.0, 62.0, 17.0, 15.0, 7.0], "bins": [-0.5228639245033264, -0.5139737129211426, -0.505083441734314, -0.4961932301521301, -0.4873030185699463, -0.47841277718544006, -0.4695225656032562, -0.46063232421875, -0.45174211263656616, -0.44285187125205994, -0.4339616596698761, -0.4250714182853699, -0.41618120670318604, -0.4072909653186798, -0.39840075373649597, -0.38951051235198975, -0.3806202709674835, -0.3717300295829773, -0.36283981800079346, -0.35394957661628723, -0.3450593650341034, -0.33616912364959717, -0.32727891206741333, -0.3183886706829071, -0.3094984292984009, -0.30060818791389465, -0.2917179763317108, -0.2828277349472046, -0.27393752336502075, -0.2650472819805145, -0.2561570703983307, -0.24726682901382446, -0.23837663233280182, -0.2294864058494568, -0.22059617936611176, -0.21170595288276672, -0.2028157114982605, -0.19392549991607666, -0.18503525853157043, -0.1761450320482254, -0.16725480556488037, -0.15836457908153534, -0.1494743525981903, -0.14058412611484528, -0.13169389963150024, -0.12280366569757462, -0.11391343176364899, -0.10502320528030396, -0.09613297879695892, -0.08724275231361389, -0.07835252583026886, -0.06946229189634323, -0.0605720654129982, -0.05168183892965317, -0.04279160872101784, -0.03390137851238251, -0.025011155754327774, -0.016120927408337593, -0.007230699062347412, 0.0016595292836427689, 0.01054975762963295, 0.01943998411297798, 0.028330214321613312, 0.03722044453024864, 0.046110671013593674]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 4.0, 4.0, 4.0, 13.0, 3.0, 13.0, 16.0, 13.0, 21.0, 12.0, 13.0, 24.0, 25.0, 24.0, 34.0, 36.0, 41.0, 39.0, 39.0, 50.0, 40.0, 53.0, 45.0, 35.0, 40.0, 45.0, 42.0, 38.0, 31.0, 38.0, 24.0, 30.0, 11.0, 17.0, 19.0, 16.0, 10.0, 7.0, 12.0, 8.0, 10.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.04622715711593628, -0.044882070273160934, -0.04353698343038559, -0.042191896587610245, -0.0408468097448349, -0.039501722902059555, -0.03815663605928421, -0.036811549216508865, -0.03546646237373352, -0.034121375530958176, -0.03277628868818283, -0.031431201845407486, -0.03008611500263214, -0.028741028159856796, -0.02739594131708145, -0.026050854474306107, -0.02470576763153076, -0.023360680788755417, -0.022015593945980072, -0.020670507103204727, -0.019325420260429382, -0.017980333417654037, -0.016635246574878693, -0.015290159732103348, -0.013945072889328003, -0.012599986046552658, -0.011254899203777313, -0.009909812361001968, -0.008564725518226624, -0.007219638675451279, -0.005874551832675934, -0.004529464989900589, -0.003184378147125244, -0.0018392913043498993, -0.0004942044615745544, 0.0008508823812007904, 0.0021959692239761353, 0.00354105606675148, 0.004886142909526825, 0.00623122975230217, 0.007576316595077515, 0.00892140343785286, 0.010266490280628204, 0.01161157712340355, 0.012956663966178894, 0.014301750808954239, 0.015646837651729584, 0.01699192449450493, 0.018337011337280273, 0.01968209818005562, 0.021027185022830963, 0.022372271865606308, 0.023717358708381653, 0.025062445551156998, 0.026407532393932343, 0.027752619236707687, 0.029097706079483032, 0.030442792922258377, 0.03178787976503372, 0.03313296660780907, 0.03447805345058441, 0.035823140293359756, 0.0371682271361351, 0.038513313978910446, 0.03985840082168579]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 4.0, 1.0, 10.0, 17.0, 16.0, 12.0, 23.0, 13.0, 21.0, 24.0, 24.0, 24.0, 36.0, 33.0, 39.0, 43.0, 38.0, 46.0, 50.0, 62.0, 48.0, 48.0, 37.0, 52.0, 44.0, 35.0, 31.0, 30.0, 23.0, 22.0, 25.0, 18.0, 13.0, 4.0, 14.0, 7.0, 4.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.617431640625, -10.21142578125, -9.805419921875, -9.3994140625, -8.993408203125, -8.58740234375, -8.181396484375, -7.775390625, -7.369384765625, -6.96337890625, -6.557373046875, -6.1513671875, -5.745361328125, -5.33935546875, -4.933349609375, -4.52734375, -4.121337890625, -3.71533203125, -3.309326171875, -2.9033203125, -2.497314453125, -2.09130859375, -1.685302734375, -1.279296875, -0.873291015625, -0.46728515625, -0.061279296875, 0.3447265625, 0.750732421875, 1.15673828125, 1.562744140625, 1.96875, 2.374755859375, 2.78076171875, 3.186767578125, 3.5927734375, 3.998779296875, 4.40478515625, 4.810791015625, 5.216796875, 5.622802734375, 6.02880859375, 6.434814453125, 6.8408203125, 7.246826171875, 7.65283203125, 8.058837890625, 8.46484375, 8.870849609375, 9.27685546875, 9.682861328125, 10.0888671875, 10.494873046875, 10.90087890625, 11.306884765625, 11.712890625, 12.118896484375, 12.52490234375, 12.930908203125, 13.3369140625, 13.742919921875, 14.14892578125, 14.554931640625, 14.9609375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 3.0, 5.0, 7.0, 7.0, 3.0, 6.0, 13.0, 13.0, 15.0, 21.0, 34.0, 71.0, 101.0, 122.0, 199.0, 312.0, 541.0, 927.0, 1461.0, 2658.0, 4800.0, 9231.0, 20126.0, 57004.0, 495301.0, 368560.0, 49167.0, 18292.0, 8753.0, 4603.0, 2566.0, 1442.0, 814.0, 504.0, 316.0, 193.0, 128.0, 70.0, 50.0, 38.0, 21.0, 17.0, 21.0, 10.0, 3.0, 5.0, 3.0, 4.0, 0.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.0625, -23.284912109375, -22.50732421875, -21.729736328125, -20.9521484375, -20.174560546875, -19.39697265625, -18.619384765625, -17.841796875, -17.064208984375, -16.28662109375, -15.509033203125, -14.7314453125, -13.953857421875, -13.17626953125, -12.398681640625, -11.62109375, -10.843505859375, -10.06591796875, -9.288330078125, -8.5107421875, -7.733154296875, -6.95556640625, -6.177978515625, -5.400390625, -4.622802734375, -3.84521484375, -3.067626953125, -2.2900390625, -1.512451171875, -0.73486328125, 0.042724609375, 0.8203125, 1.597900390625, 2.37548828125, 3.153076171875, 3.9306640625, 4.708251953125, 5.48583984375, 6.263427734375, 7.041015625, 7.818603515625, 8.59619140625, 9.373779296875, 10.1513671875, 10.928955078125, 11.70654296875, 12.484130859375, 13.26171875, 14.039306640625, 14.81689453125, 15.594482421875, 16.3720703125, 17.149658203125, 17.92724609375, 18.704833984375, 19.482421875, 20.260009765625, 21.03759765625, 21.815185546875, 22.5927734375, 23.370361328125, 24.14794921875, 24.925537109375, 25.703125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 2.0, 6.0, 9.0, 6.0, 21.0, 14.0, 18.0, 22.0, 31.0, 33.0, 48.0, 34.0, 31.0, 44.0, 61.0, 83.0, 122.0, 310.0, 1512.0, 164.0, 81.0, 55.0, 37.0, 47.0, 38.0, 30.0, 26.0, 21.0, 13.0, 28.0, 20.0, 15.0, 11.0, 15.0, 9.0, 9.0, 4.0, 7.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-42.59375, -41.3095703125, -40.025390625, -38.7412109375, -37.45703125, -36.1728515625, -34.888671875, -33.6044921875, -32.3203125, -31.0361328125, -29.751953125, -28.4677734375, -27.18359375, -25.8994140625, -24.615234375, -23.3310546875, -22.046875, -20.7626953125, -19.478515625, -18.1943359375, -16.91015625, -15.6259765625, -14.341796875, -13.0576171875, -11.7734375, -10.4892578125, -9.205078125, -7.9208984375, -6.63671875, -5.3525390625, -4.068359375, -2.7841796875, -1.5, -0.2158203125, 1.068359375, 2.3525390625, 3.63671875, 4.9208984375, 6.205078125, 7.4892578125, 8.7734375, 10.0576171875, 11.341796875, 12.6259765625, 13.91015625, 15.1943359375, 16.478515625, 17.7626953125, 19.046875, 20.3310546875, 21.615234375, 22.8994140625, 24.18359375, 25.4677734375, 26.751953125, 28.0361328125, 29.3203125, 30.6044921875, 31.888671875, 33.1728515625, 34.45703125, 35.7412109375, 37.025390625, 38.3095703125, 39.59375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 11.0, 12.0, 12.0, 18.0, 12.0, 32.0, 43.0, 41.0, 51.0, 82.0, 83.0, 130.0, 206.0, 363.0, 1502.0, 15700.0, 2848897.0, 269915.0, 6695.0, 878.0, 344.0, 164.0, 123.0, 81.0, 79.0, 54.0, 41.0, 26.0, 34.0, 13.0, 12.0, 11.0, 5.0, 6.0, 5.0, 3.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.5, -84.357421875, -81.21484375, -78.072265625, -74.9296875, -71.787109375, -68.64453125, -65.501953125, -62.359375, -59.216796875, -56.07421875, -52.931640625, -49.7890625, -46.646484375, -43.50390625, -40.361328125, -37.21875, -34.076171875, -30.93359375, -27.791015625, -24.6484375, -21.505859375, -18.36328125, -15.220703125, -12.078125, -8.935546875, -5.79296875, -2.650390625, 0.4921875, 3.634765625, 6.77734375, 9.919921875, 13.0625, 16.205078125, 19.34765625, 22.490234375, 25.6328125, 28.775390625, 31.91796875, 35.060546875, 38.203125, 41.345703125, 44.48828125, 47.630859375, 50.7734375, 53.916015625, 57.05859375, 60.201171875, 63.34375, 66.486328125, 69.62890625, 72.771484375, 75.9140625, 79.056640625, 82.19921875, 85.341796875, 88.484375, 91.626953125, 94.76953125, 97.912109375, 101.0546875, 104.197265625, 107.33984375, 110.482421875, 113.625]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 17.0, 58.0, 238.0, 449.0, 183.0, 44.0, 16.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-293.0624694824219, -285.7979736328125, -278.5334777832031, -271.2690124511719, -264.0045166015625, -256.7400207519531, -249.47552490234375, -242.21102905273438, -234.94654846191406, -227.6820526123047, -220.41757202148438, -213.153076171875, -205.88858032226562, -198.6240997314453, -191.35960388183594, -184.09512329101562, -176.83062744140625, -169.56613159179688, -162.30165100097656, -155.0371551513672, -147.77267456054688, -140.5081787109375, -133.24368286132812, -125.97919464111328, -118.71470642089844, -111.4502182006836, -104.18572998046875, -96.92123413085938, -89.65674591064453, -82.39225769042969, -75.12776184082031, -67.86327362060547, -60.59877014160156, -53.33428192138672, -46.06978988647461, -38.8052978515625, -31.540809631347656, -24.276321411132812, -17.011829376220703, -9.747337341308594, -2.48284912109375, 4.781641006469727, 12.046131134033203, 19.31062126159668, 26.575111389160156, 33.839599609375, 41.10409164428711, 48.36858367919922, 55.63307189941406, 62.897560119628906, 70.16204833984375, 77.42654418945312, 84.69103240966797, 91.95552062988281, 99.22001647949219, 106.48450469970703, 113.74899291992188, 121.01348114013672, 128.27796936035156, 135.54246520996094, 142.80694580078125, 150.07144165039062, 157.3359375, 164.60043334960938, 171.8649139404297]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 5.0, 3.0, 11.0, 10.0, 14.0, 10.0, 10.0, 18.0, 19.0, 31.0, 28.0, 31.0, 26.0, 31.0, 38.0, 37.0, 41.0, 36.0, 50.0, 40.0, 45.0, 42.0, 46.0, 52.0, 45.0, 37.0, 32.0, 33.0, 32.0, 16.0, 9.0, 19.0, 17.0, 10.0, 10.0, 13.0, 5.0, 7.0, 8.0, 6.0, 7.0, 6.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.7728271484375, -100.11311340332031, -96.45339965820312, -92.79368591308594, -89.13397216796875, -85.47425842285156, -81.8145523071289, -78.15483856201172, -74.49512481689453, -70.83541107177734, -67.17569732666016, -63.515987396240234, -59.85627365112305, -56.19655990600586, -52.53684997558594, -48.87713623046875, -45.21742248535156, -41.557708740234375, -37.89799499511719, -34.238285064697266, -30.578571319580078, -26.91885757446289, -23.259145736694336, -19.59943389892578, -15.939720153808594, -12.280007362365723, -8.620294570922852, -4.9605817794799805, -1.3008689880371094, 2.358844757080078, 6.018556594848633, 9.678268432617188, 13.337982177734375, 16.997695922851562, 20.657407760620117, 24.317119598388672, 27.97683334350586, 31.636547088623047, 35.29625701904297, 38.955970764160156, 42.615684509277344, 46.27539825439453, 49.93511199951172, 53.59482192993164, 57.25453567504883, 60.914249420166016, 64.57395935058594, 68.23367309570312, 71.89338684082031, 75.5531005859375, 79.21281433105469, 82.87252807617188, 86.53224182128906, 90.19195556640625, 93.8516616821289, 97.5113754272461, 101.17108917236328, 104.83080291748047, 108.49051666259766, 112.15023040771484, 115.8099365234375, 119.46965026855469, 123.12936401367188, 126.78907775878906, 130.44879150390625]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 4.0, 2.0, 3.0, 6.0, 10.0, 14.0, 16.0, 18.0, 17.0, 26.0, 23.0, 30.0, 28.0, 26.0, 30.0, 44.0, 38.0, 49.0, 54.0, 48.0, 55.0, 51.0, 48.0, 43.0, 46.0, 43.0, 32.0, 34.0, 39.0, 22.0, 21.0, 18.0, 18.0, 5.0, 15.0, 9.0, 6.0, 2.0, 2.0, 4.0, 2.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.671875, -11.224365234375, -10.77685546875, -10.329345703125, -9.8818359375, -9.434326171875, -8.98681640625, -8.539306640625, -8.091796875, -7.644287109375, -7.19677734375, -6.749267578125, -6.3017578125, -5.854248046875, -5.40673828125, -4.959228515625, -4.51171875, -4.064208984375, -3.61669921875, -3.169189453125, -2.7216796875, -2.274169921875, -1.82666015625, -1.379150390625, -0.931640625, -0.484130859375, -0.03662109375, 0.410888671875, 0.8583984375, 1.305908203125, 1.75341796875, 2.200927734375, 2.6484375, 3.095947265625, 3.54345703125, 3.990966796875, 4.4384765625, 4.885986328125, 5.33349609375, 5.781005859375, 6.228515625, 6.676025390625, 7.12353515625, 7.571044921875, 8.0185546875, 8.466064453125, 8.91357421875, 9.361083984375, 9.80859375, 10.256103515625, 10.70361328125, 11.151123046875, 11.5986328125, 12.046142578125, 12.49365234375, 12.941162109375, 13.388671875, 13.836181640625, 14.28369140625, 14.731201171875, 15.1787109375, 15.626220703125, 16.07373046875, 16.521240234375, 16.96875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 1.0, 1.0, 5.0, 0.0, 2.0, 5.0, 9.0, 17.0, 14.0, 17.0, 9.0, 27.0, 21.0, 31.0, 36.0, 37.0, 93.0, 229.0, 781.0, 2750.0, 12495.0, 163052.0, 3651671.0, 343241.0, 15198.0, 3029.0, 845.0, 295.0, 108.0, 69.0, 45.0, 34.0, 21.0, 25.0, 16.0, 16.0, 10.0, 10.0, 7.0, 5.0, 1.0, 5.0, 2.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.9375, -39.3369140625, -37.736328125, -36.1357421875, -34.53515625, -32.9345703125, -31.333984375, -29.7333984375, -28.1328125, -26.5322265625, -24.931640625, -23.3310546875, -21.73046875, -20.1298828125, -18.529296875, -16.9287109375, -15.328125, -13.7275390625, -12.126953125, -10.5263671875, -8.92578125, -7.3251953125, -5.724609375, -4.1240234375, -2.5234375, -0.9228515625, 0.677734375, 2.2783203125, 3.87890625, 5.4794921875, 7.080078125, 8.6806640625, 10.28125, 11.8818359375, 13.482421875, 15.0830078125, 16.68359375, 18.2841796875, 19.884765625, 21.4853515625, 23.0859375, 24.6865234375, 26.287109375, 27.8876953125, 29.48828125, 31.0888671875, 32.689453125, 34.2900390625, 35.890625, 37.4912109375, 39.091796875, 40.6923828125, 42.29296875, 43.8935546875, 45.494140625, 47.0947265625, 48.6953125, 50.2958984375, 51.896484375, 53.4970703125, 55.09765625, 56.6982421875, 58.298828125, 59.8994140625, 61.5]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 2.0, 7.0, 6.0, 4.0, 7.0, 5.0, 14.0, 18.0, 33.0, 29.0, 36.0, 57.0, 102.0, 103.0, 186.0, 270.0, 413.0, 606.0, 661.0, 518.0, 337.0, 194.0, 136.0, 92.0, 48.0, 46.0, 35.0, 30.0, 18.0, 10.0, 14.0, 11.0, 7.0, 4.0, 1.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.375, -22.54541015625, -21.7158203125, -20.88623046875, -20.056640625, -19.22705078125, -18.3974609375, -17.56787109375, -16.73828125, -15.90869140625, -15.0791015625, -14.24951171875, -13.419921875, -12.59033203125, -11.7607421875, -10.93115234375, -10.1015625, -9.27197265625, -8.4423828125, -7.61279296875, -6.783203125, -5.95361328125, -5.1240234375, -4.29443359375, -3.46484375, -2.63525390625, -1.8056640625, -0.97607421875, -0.146484375, 0.68310546875, 1.5126953125, 2.34228515625, 3.171875, 4.00146484375, 4.8310546875, 5.66064453125, 6.490234375, 7.31982421875, 8.1494140625, 8.97900390625, 9.80859375, 10.63818359375, 11.4677734375, 12.29736328125, 13.126953125, 13.95654296875, 14.7861328125, 15.61572265625, 16.4453125, 17.27490234375, 18.1044921875, 18.93408203125, 19.763671875, 20.59326171875, 21.4228515625, 22.25244140625, 23.08203125, 23.91162109375, 24.7412109375, 25.57080078125, 26.400390625, 27.22998046875, 28.0595703125, 28.88916015625, 29.71875]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 10.0, 7.0, 11.0, 15.0, 25.0, 28.0, 35.0, 58.0, 79.0, 119.0, 282.0, 763.0, 3381.0, 37675.0, 3582988.0, 552556.0, 13286.0, 1808.0, 493.0, 228.0, 138.0, 97.0, 41.0, 41.0, 30.0, 21.0, 16.0, 5.0, 8.0, 5.0, 4.0, 6.0, 3.0, 4.0, 1.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-102.0625, -99.212890625, -96.36328125, -93.513671875, -90.6640625, -87.814453125, -84.96484375, -82.115234375, -79.265625, -76.416015625, -73.56640625, -70.716796875, -67.8671875, -65.017578125, -62.16796875, -59.318359375, -56.46875, -53.619140625, -50.76953125, -47.919921875, -45.0703125, -42.220703125, -39.37109375, -36.521484375, -33.671875, -30.822265625, -27.97265625, -25.123046875, -22.2734375, -19.423828125, -16.57421875, -13.724609375, -10.875, -8.025390625, -5.17578125, -2.326171875, 0.5234375, 3.373046875, 6.22265625, 9.072265625, 11.921875, 14.771484375, 17.62109375, 20.470703125, 23.3203125, 26.169921875, 29.01953125, 31.869140625, 34.71875, 37.568359375, 40.41796875, 43.267578125, 46.1171875, 48.966796875, 51.81640625, 54.666015625, 57.515625, 60.365234375, 63.21484375, 66.064453125, 68.9140625, 71.763671875, 74.61328125, 77.462890625, 80.3125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 14.0, 35.0, 244.0, 410.0, 251.0, 51.0, 8.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-554.8233642578125, -541.4363403320312, -528.04931640625, -514.6622314453125, -501.27520751953125, -487.88818359375, -474.50115966796875, -461.1141052246094, -447.72705078125, -434.34002685546875, -420.9529724121094, -407.5659484863281, -394.17889404296875, -380.7918701171875, -367.40484619140625, -354.0177917480469, -340.6307678222656, -327.2437438964844, -313.856689453125, -300.46966552734375, -287.0826110839844, -273.6955871582031, -260.30853271484375, -246.9215087890625, -233.5344696044922, -220.14743041992188, -206.76039123535156, -193.37335205078125, -179.986328125, -166.59927368164062, -153.21224975585938, -139.82521057128906, -126.43820190429688, -113.05116271972656, -99.66412353515625, -86.27709197998047, -72.89005279541016, -59.503013610839844, -46.11598205566406, -32.72894287109375, -19.341903686523438, -5.954866409301758, 7.432170867919922, 20.81920623779297, 34.20624542236328, 47.593284606933594, 60.980316162109375, 74.36735534667969, 87.75439453125, 101.14143371582031, 114.52847290039062, 127.9155044555664, 141.30255126953125, 154.6895751953125, 168.0766143798828, 181.46365356445312, 194.85069274902344, 208.23773193359375, 221.62477111816406, 235.01181030273438, 248.39883422851562, 261.785888671875, 275.17291259765625, 288.5599365234375, 301.9469909667969]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 6.0, 3.0, 6.0, 11.0, 12.0, 10.0, 14.0, 21.0, 17.0, 19.0, 24.0, 32.0, 32.0, 43.0, 37.0, 40.0, 44.0, 39.0, 42.0, 48.0, 46.0, 45.0, 45.0, 42.0, 42.0, 34.0, 28.0, 37.0, 22.0, 31.0, 31.0, 24.0, 16.0, 8.0, 6.0, 11.0, 9.0, 13.0, 3.0, 7.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0], "bins": [-90.00277709960938, -87.25083923339844, -84.49890899658203, -81.7469711303711, -78.99504089355469, -76.24310302734375, -73.49116516113281, -70.73922729492188, -67.98729705810547, -65.23535919189453, -62.483428955078125, -59.73149108886719, -56.979557037353516, -54.227622985839844, -51.475685119628906, -48.723751068115234, -45.97181701660156, -43.21988296508789, -40.46794891357422, -37.71601104736328, -34.96407699584961, -32.21214294433594, -29.460206985473633, -26.708271026611328, -23.956336975097656, -21.204402923583984, -18.45246696472168, -15.700531959533691, -12.948596954345703, -10.196661949157715, -7.444726943969727, -4.692790985107422, -1.94085693359375, 0.8110780715942383, 3.5630130767822266, 6.314948081970215, 9.066883087158203, 11.818818092346191, 14.57075309753418, 17.322689056396484, 20.074623107910156, 22.826557159423828, 25.578493118286133, 28.330429077148438, 31.08236312866211, 33.83429718017578, 36.58623504638672, 39.33816909790039, 42.09010314941406, 44.842037200927734, 47.593971252441406, 50.345909118652344, 53.097843170166016, 55.84977722167969, 58.601715087890625, 61.3536491394043, 64.10558319091797, 66.8575210571289, 69.60945129394531, 72.36138916015625, 75.11332702636719, 77.8652572631836, 80.61719512939453, 83.36912536621094, 86.12106323242188]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 8.0, 7.0, 8.0, 7.0, 14.0, 17.0, 26.0, 21.0, 20.0, 29.0, 22.0, 30.0, 36.0, 48.0, 54.0, 49.0, 53.0, 62.0, 42.0, 37.0, 44.0, 52.0, 46.0, 38.0, 30.0, 44.0, 29.0, 32.0, 22.0, 18.0, 14.0, 10.0, 7.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1875, -11.737060546875, -11.28662109375, -10.836181640625, -10.3857421875, -9.935302734375, -9.48486328125, -9.034423828125, -8.583984375, -8.133544921875, -7.68310546875, -7.232666015625, -6.7822265625, -6.331787109375, -5.88134765625, -5.430908203125, -4.98046875, -4.530029296875, -4.07958984375, -3.629150390625, -3.1787109375, -2.728271484375, -2.27783203125, -1.827392578125, -1.376953125, -0.926513671875, -0.47607421875, -0.025634765625, 0.4248046875, 0.875244140625, 1.32568359375, 1.776123046875, 2.2265625, 2.677001953125, 3.12744140625, 3.577880859375, 4.0283203125, 4.478759765625, 4.92919921875, 5.379638671875, 5.830078125, 6.280517578125, 6.73095703125, 7.181396484375, 7.6318359375, 8.082275390625, 8.53271484375, 8.983154296875, 9.43359375, 9.884033203125, 10.33447265625, 10.784912109375, 11.2353515625, 11.685791015625, 12.13623046875, 12.586669921875, 13.037109375, 13.487548828125, 13.93798828125, 14.388427734375, 14.8388671875, 15.289306640625, 15.73974609375, 16.190185546875, 16.640625]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 4.0, 13.0, 7.0, 12.0, 23.0, 48.0, 54.0, 85.0, 112.0, 214.0, 322.0, 514.0, 764.0, 1300.0, 2190.0, 3781.0, 6592.0, 11624.0, 21431.0, 39385.0, 74952.0, 143035.0, 239643.0, 225743.0, 129665.0, 66680.0, 35449.0, 19510.0, 10676.0, 5913.0, 3527.0, 2059.0, 1212.0, 736.0, 479.0, 253.0, 203.0, 121.0, 74.0, 52.0, 34.0, 19.0, 16.0, 10.0, 10.0, 3.0, 5.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-2.658203125, -2.57745361328125, -2.4967041015625, -2.41595458984375, -2.335205078125, -2.25445556640625, -2.1737060546875, -2.09295654296875, -2.01220703125, -1.93145751953125, -1.8507080078125, -1.76995849609375, -1.689208984375, -1.60845947265625, -1.5277099609375, -1.44696044921875, -1.3662109375, -1.28546142578125, -1.2047119140625, -1.12396240234375, -1.043212890625, -0.96246337890625, -0.8817138671875, -0.80096435546875, -0.72021484375, -0.63946533203125, -0.5587158203125, -0.47796630859375, -0.397216796875, -0.31646728515625, -0.2357177734375, -0.15496826171875, -0.07421875, 0.00653076171875, 0.0872802734375, 0.16802978515625, 0.248779296875, 0.32952880859375, 0.4102783203125, 0.49102783203125, 0.57177734375, 0.65252685546875, 0.7332763671875, 0.81402587890625, 0.894775390625, 0.97552490234375, 1.0562744140625, 1.13702392578125, 1.2177734375, 1.29852294921875, 1.3792724609375, 1.46002197265625, 1.540771484375, 1.62152099609375, 1.7022705078125, 1.78302001953125, 1.86376953125, 1.94451904296875, 2.0252685546875, 2.10601806640625, 2.186767578125, 2.26751708984375, 2.3482666015625, 2.42901611328125, 2.509765625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 4.0, 3.0, 9.0, 4.0, 7.0, 5.0, 16.0, 15.0, 14.0, 11.0, 15.0, 22.0, 30.0, 34.0, 23.0, 31.0, 35.0, 26.0, 34.0, 42.0, 28.0, 42.0, 1070.0, 40.0, 42.0, 40.0, 35.0, 31.0, 42.0, 23.0, 28.0, 26.0, 25.0, 24.0, 20.0, 16.0, 22.0, 21.0, 16.0, 17.0, 13.0, 11.0, 11.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.65625, -7.3990478515625, -7.141845703125, -6.8846435546875, -6.62744140625, -6.3702392578125, -6.113037109375, -5.8558349609375, -5.5986328125, -5.3414306640625, -5.084228515625, -4.8270263671875, -4.56982421875, -4.3126220703125, -4.055419921875, -3.7982177734375, -3.541015625, -3.2838134765625, -3.026611328125, -2.7694091796875, -2.51220703125, -2.2550048828125, -1.997802734375, -1.7406005859375, -1.4833984375, -1.2261962890625, -0.968994140625, -0.7117919921875, -0.45458984375, -0.1973876953125, 0.059814453125, 0.3170166015625, 0.57421875, 0.8314208984375, 1.088623046875, 1.3458251953125, 1.60302734375, 1.8602294921875, 2.117431640625, 2.3746337890625, 2.6318359375, 2.8890380859375, 3.146240234375, 3.4034423828125, 3.66064453125, 3.9178466796875, 4.175048828125, 4.4322509765625, 4.689453125, 4.9466552734375, 5.203857421875, 5.4610595703125, 5.71826171875, 5.9754638671875, 6.232666015625, 6.4898681640625, 6.7470703125, 7.0042724609375, 7.261474609375, 7.5186767578125, 7.77587890625, 8.0330810546875, 8.290283203125, 8.5474853515625, 8.8046875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 9.0, 13.0, 12.0, 30.0, 46.0, 50.0, 76.0, 111.0, 130.0, 221.0, 314.0, 487.0, 702.0, 1028.0, 1432.0, 2110.0, 3094.0, 4664.0, 7057.0, 10803.0, 16575.0, 25582.0, 40351.0, 65532.0, 105350.0, 159400.0, 1238153.0, 149836.0, 97796.0, 60218.0, 37288.0, 23492.0, 14917.0, 9987.0, 6714.0, 4382.0, 2887.0, 1983.0, 1306.0, 890.0, 669.0, 454.0, 289.0, 231.0, 145.0, 96.0, 75.0, 41.0, 33.0, 20.0, 15.0, 17.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0], "bins": [-1.1005859375, -1.0666351318359375, -1.032684326171875, -0.9987335205078125, -0.96478271484375, -0.9308319091796875, -0.896881103515625, -0.8629302978515625, -0.8289794921875, -0.7950286865234375, -0.761077880859375, -0.7271270751953125, -0.69317626953125, -0.6592254638671875, -0.625274658203125, -0.5913238525390625, -0.557373046875, -0.5234222412109375, -0.489471435546875, -0.4555206298828125, -0.42156982421875, -0.3876190185546875, -0.353668212890625, -0.3197174072265625, -0.2857666015625, -0.2518157958984375, -0.217864990234375, -0.1839141845703125, -0.14996337890625, -0.1160125732421875, -0.082061767578125, -0.0481109619140625, -0.01416015625, 0.0197906494140625, 0.053741455078125, 0.0876922607421875, 0.12164306640625, 0.1555938720703125, 0.189544677734375, 0.2234954833984375, 0.2574462890625, 0.2913970947265625, 0.325347900390625, 0.3592987060546875, 0.39324951171875, 0.4272003173828125, 0.461151123046875, 0.4951019287109375, 0.529052734375, 0.5630035400390625, 0.596954345703125, 0.6309051513671875, 0.66485595703125, 0.6988067626953125, 0.732757568359375, 0.7667083740234375, 0.8006591796875, 0.8346099853515625, 0.868560791015625, 0.9025115966796875, 0.93646240234375, 0.9704132080078125, 1.004364013671875, 1.0383148193359375, 1.072265625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 4.0, 13.0, 6.0, 8.0, 12.0, 14.0, 9.0, 15.0, 24.0, 18.0, 31.0, 18.0, 35.0, 33.0, 29.0, 35.0, 34.0, 29.0, 43.0, 63.0, 46.0, 51.0, 38.0, 41.0, 40.0, 33.0, 31.0, 29.0, 32.0, 27.0, 24.0, 24.0, 13.0, 17.0, 16.0, 12.0, 11.0, 14.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.0149078369140625, -0.014421701431274414, -0.013935565948486328, -0.013449430465698242, -0.012963294982910156, -0.01247715950012207, -0.011991024017333984, -0.011504888534545898, -0.011018753051757812, -0.010532617568969727, -0.01004648208618164, -0.009560346603393555, -0.009074211120605469, -0.008588075637817383, -0.008101940155029297, -0.007615804672241211, -0.007129669189453125, -0.006643533706665039, -0.006157398223876953, -0.005671262741088867, -0.005185127258300781, -0.004698991775512695, -0.004212856292724609, -0.0037267208099365234, -0.0032405853271484375, -0.0027544498443603516, -0.0022683143615722656, -0.0017821788787841797, -0.0012960433959960938, -0.0008099079132080078, -0.0003237724304199219, 0.00016236305236816406, 0.00064849853515625, 0.001134634017944336, 0.0016207695007324219, 0.002106904983520508, 0.0025930404663085938, 0.0030791759490966797, 0.0035653114318847656, 0.0040514469146728516, 0.0045375823974609375, 0.0050237178802490234, 0.005509853363037109, 0.005995988845825195, 0.006482124328613281, 0.006968259811401367, 0.007454395294189453, 0.007940530776977539, 0.008426666259765625, 0.008912801742553711, 0.009398937225341797, 0.009885072708129883, 0.010371208190917969, 0.010857343673706055, 0.01134347915649414, 0.011829614639282227, 0.012315750122070312, 0.012801885604858398, 0.013288021087646484, 0.01377415657043457, 0.014260292053222656, 0.014746427536010742, 0.015232563018798828, 0.015718698501586914, 0.016204833984375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 3.0, 12.0, 10.0, 7.0, 15.0, 15.0, 26.0, 28.0, 25.0, 37.0, 51.0, 62.0, 104.0, 151.0, 282.0, 1096.0, 8388.0, 141246.0, 851897.0, 40426.0, 3346.0, 588.0, 215.0, 118.0, 78.0, 62.0, 57.0, 27.0, 26.0, 21.0, 30.0, 20.0, 14.0, 13.0, 7.0, 9.0, 3.0, 6.0, 7.0, 1.0, 7.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.365478515625, -0.3545036315917969, -0.34352874755859375, -0.3325538635253906, -0.3215789794921875, -0.3106040954589844, -0.29962921142578125, -0.2886543273925781, -0.277679443359375, -0.2667045593261719, -0.25572967529296875, -0.24475479125976562, -0.2337799072265625, -0.22280502319335938, -0.21183013916015625, -0.20085525512695312, -0.18988037109375, -0.17890548706054688, -0.16793060302734375, -0.15695571899414062, -0.1459808349609375, -0.13500595092773438, -0.12403106689453125, -0.11305618286132812, -0.102081298828125, -0.09110641479492188, -0.08013153076171875, -0.06915664672851562, -0.0581817626953125, -0.047206878662109375, -0.03623199462890625, -0.025257110595703125, -0.0142822265625, -0.003307342529296875, 0.00766754150390625, 0.018642425537109375, 0.0296173095703125, 0.040592193603515625, 0.05156707763671875, 0.06254196166992188, 0.073516845703125, 0.08449172973632812, 0.09546661376953125, 0.10644149780273438, 0.1174163818359375, 0.12839126586914062, 0.13936614990234375, 0.15034103393554688, 0.16131591796875, 0.17229080200195312, 0.18326568603515625, 0.19424057006835938, 0.2052154541015625, 0.21619033813476562, 0.22716522216796875, 0.23814010620117188, 0.249114990234375, 0.2600898742675781, 0.27106475830078125, 0.2820396423339844, 0.2930145263671875, 0.3039894104003906, 0.31496429443359375, 0.3259391784667969, 0.3369140625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 4.0, 6.0, 6.0, 11.0, 13.0, 25.0, 35.0, 65.0, 92.0, 167.0, 233.0, 127.0, 68.0, 41.0, 35.0, 22.0, 16.0, 7.0, 11.0, 5.0, 7.0, 4.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.11992428451776505, -0.1170882135629654, -0.11425214260816574, -0.11141607165336609, -0.10858000069856644, -0.10574392974376678, -0.10290785878896713, -0.10007178783416748, -0.09723571687936783, -0.09439964592456818, -0.09156357496976852, -0.08872750401496887, -0.08589143306016922, -0.08305536210536957, -0.08021929115056992, -0.07738322019577026, -0.07454714924097061, -0.07171107828617096, -0.06887500733137131, -0.06603893637657166, -0.063202865421772, -0.06036679446697235, -0.0575307235121727, -0.05469465255737305, -0.051858581602573395, -0.04902251064777374, -0.04618643969297409, -0.04335036873817444, -0.040514297783374786, -0.037678226828575134, -0.03484215587377548, -0.03200608491897583, -0.029170017689466476, -0.026333946734666824, -0.023497875779867172, -0.02066180482506752, -0.017825733870267868, -0.014989662915468216, -0.012153591960668564, -0.009317521005868912, -0.00648145005106926, -0.0036453790962696075, -0.0008093081414699554, 0.0020267628133296967, 0.004862833768129349, 0.007698904722929001, 0.010534975677728653, 0.013371046632528305, 0.016207117587327957, 0.01904318854212761, 0.02187925949692726, 0.024715330451726913, 0.027551401406526566, 0.030387472361326218, 0.03322354331612587, 0.03605961427092552, 0.038895685225725174, 0.041731756180524826, 0.04456782713532448, 0.04740389809012413, 0.05023996904492378, 0.053076039999723434, 0.05591211095452309, 0.05874818190932274, 0.06158425286412239]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 3.0, 6.0, 1.0, 10.0, 5.0, 9.0, 10.0, 8.0, 21.0, 21.0, 17.0, 23.0, 24.0, 27.0, 33.0, 29.0, 30.0, 33.0, 47.0, 40.0, 26.0, 40.0, 37.0, 48.0, 46.0, 40.0, 28.0, 37.0, 32.0, 28.0, 26.0, 29.0, 31.0, 25.0, 23.0, 15.0, 11.0, 18.0, 13.0, 9.0, 12.0, 14.0, 10.0, 2.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.012537598609924316, -0.01213921420276165, -0.011740829795598984, -0.011342445388436317, -0.010944060981273651, -0.010545676574110985, -0.010147292166948318, -0.009748907759785652, -0.009350523352622986, -0.00895213894546032, -0.008553754538297653, -0.008155370131134987, -0.0077569857239723206, -0.007358601316809654, -0.006960216909646988, -0.006561832502484322, -0.006163448095321655, -0.005765063688158989, -0.005366679280996323, -0.004968294873833656, -0.00456991046667099, -0.004171526059508324, -0.0037731416523456573, -0.003374757245182991, -0.0029763728380203247, -0.0025779884308576584, -0.002179604023694992, -0.0017812196165323257, -0.0013828352093696594, -0.000984450802206993, -0.0005860663950443268, -0.00018768198788166046, 0.00021070241928100586, 0.0006090868264436722, 0.0010074712336063385, 0.0014058556407690048, 0.0018042400479316711, 0.0022026244550943375, 0.002601008862257004, 0.00299939326941967, 0.0033977776765823364, 0.0037961620837450027, 0.004194546490907669, 0.004592930898070335, 0.004991315305233002, 0.005389699712395668, 0.005788084119558334, 0.006186468526721001, 0.006584852933883667, 0.006983237341046333, 0.007381621748209, 0.007780006155371666, 0.008178390562534332, 0.008576774969696999, 0.008975159376859665, 0.009373543784022331, 0.009771928191184998, 0.010170312598347664, 0.01056869700551033, 0.010967081412672997, 0.011365465819835663, 0.01176385022699833, 0.012162234634160995, 0.012560619041323662, 0.012959003448486328]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 5.0, 7.0, 7.0, 8.0, 7.0, 14.0, 18.0, 28.0, 19.0, 20.0, 28.0, 22.0, 30.0, 38.0, 48.0, 55.0, 47.0, 56.0, 60.0, 43.0, 34.0, 44.0, 53.0, 45.0, 38.0, 33.0, 42.0, 29.0, 31.0, 25.0, 15.0, 17.0, 9.0, 5.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1796875, -11.7291259765625, -11.278564453125, -10.8280029296875, -10.37744140625, -9.9268798828125, -9.476318359375, -9.0257568359375, -8.5751953125, -8.1246337890625, -7.674072265625, -7.2235107421875, -6.77294921875, -6.3223876953125, -5.871826171875, -5.4212646484375, -4.970703125, -4.5201416015625, -4.069580078125, -3.6190185546875, -3.16845703125, -2.7178955078125, -2.267333984375, -1.8167724609375, -1.3662109375, -0.9156494140625, -0.465087890625, -0.0145263671875, 0.43603515625, 0.8865966796875, 1.337158203125, 1.7877197265625, 2.23828125, 2.6888427734375, 3.139404296875, 3.5899658203125, 4.04052734375, 4.4910888671875, 4.941650390625, 5.3922119140625, 5.8427734375, 6.2933349609375, 6.743896484375, 7.1944580078125, 7.64501953125, 8.0955810546875, 8.546142578125, 8.9967041015625, 9.447265625, 9.8978271484375, 10.348388671875, 10.7989501953125, 11.24951171875, 11.7000732421875, 12.150634765625, 12.6011962890625, 13.0517578125, 13.5023193359375, 13.952880859375, 14.4034423828125, 14.85400390625, 15.3045654296875, 15.755126953125, 16.2056884765625, 16.65625]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 8.0, 13.0, 13.0, 30.0, 24.0, 36.0, 55.0, 78.0, 150.0, 224.0, 331.0, 560.0, 954.0, 1488.0, 2520.0, 4442.0, 7916.0, 14818.0, 29212.0, 74887.0, 561929.0, 248244.0, 50378.0, 22709.0, 11940.0, 6427.0, 3624.0, 2236.0, 1235.0, 752.0, 478.0, 307.0, 182.0, 107.0, 83.0, 42.0, 40.0, 36.0, 17.0, 11.0, 4.0, 9.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.265625, -18.640625, -18.015625, -17.390625, -16.765625, -16.140625, -15.515625, -14.890625, -14.265625, -13.640625, -13.015625, -12.390625, -11.765625, -11.140625, -10.515625, -9.890625, -9.265625, -8.640625, -8.015625, -7.390625, -6.765625, -6.140625, -5.515625, -4.890625, -4.265625, -3.640625, -3.015625, -2.390625, -1.765625, -1.140625, -0.515625, 0.109375, 0.734375, 1.359375, 1.984375, 2.609375, 3.234375, 3.859375, 4.484375, 5.109375, 5.734375, 6.359375, 6.984375, 7.609375, 8.234375, 8.859375, 9.484375, 10.109375, 10.734375, 11.359375, 11.984375, 12.609375, 13.234375, 13.859375, 14.484375, 15.109375, 15.734375, 16.359375, 16.984375, 17.609375, 18.234375, 18.859375, 19.484375, 20.109375, 20.734375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 13.0, 14.0, 13.0, 8.0, 18.0, 26.0, 33.0, 34.0, 43.0, 50.0, 49.0, 66.0, 97.0, 236.0, 1721.0, 173.0, 84.0, 71.0, 45.0, 48.0, 37.0, 45.0, 28.0, 17.0, 18.0, 18.0, 8.0, 12.0, 11.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0], "bins": [-63.4375, -61.865234375, -60.29296875, -58.720703125, -57.1484375, -55.576171875, -54.00390625, -52.431640625, -50.859375, -49.287109375, -47.71484375, -46.142578125, -44.5703125, -42.998046875, -41.42578125, -39.853515625, -38.28125, -36.708984375, -35.13671875, -33.564453125, -31.9921875, -30.419921875, -28.84765625, -27.275390625, -25.703125, -24.130859375, -22.55859375, -20.986328125, -19.4140625, -17.841796875, -16.26953125, -14.697265625, -13.125, -11.552734375, -9.98046875, -8.408203125, -6.8359375, -5.263671875, -3.69140625, -2.119140625, -0.546875, 1.025390625, 2.59765625, 4.169921875, 5.7421875, 7.314453125, 8.88671875, 10.458984375, 12.03125, 13.603515625, 15.17578125, 16.748046875, 18.3203125, 19.892578125, 21.46484375, 23.037109375, 24.609375, 26.181640625, 27.75390625, 29.326171875, 30.8984375, 32.470703125, 34.04296875, 35.615234375, 37.1875]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 9.0, 8.0, 14.0, 10.0, 15.0, 26.0, 27.0, 46.0, 41.0, 79.0, 115.0, 158.0, 237.0, 390.0, 1676.0, 29969.0, 3073157.0, 36653.0, 1915.0, 362.0, 246.0, 153.0, 105.0, 72.0, 48.0, 32.0, 34.0, 30.0, 12.0, 11.0, 12.0, 12.0, 10.0, 5.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-121.5, -117.7646484375, -114.029296875, -110.2939453125, -106.55859375, -102.8232421875, -99.087890625, -95.3525390625, -91.6171875, -87.8818359375, -84.146484375, -80.4111328125, -76.67578125, -72.9404296875, -69.205078125, -65.4697265625, -61.734375, -57.9990234375, -54.263671875, -50.5283203125, -46.79296875, -43.0576171875, -39.322265625, -35.5869140625, -31.8515625, -28.1162109375, -24.380859375, -20.6455078125, -16.91015625, -13.1748046875, -9.439453125, -5.7041015625, -1.96875, 1.7666015625, 5.501953125, 9.2373046875, 12.97265625, 16.7080078125, 20.443359375, 24.1787109375, 27.9140625, 31.6494140625, 35.384765625, 39.1201171875, 42.85546875, 46.5908203125, 50.326171875, 54.0615234375, 57.796875, 61.5322265625, 65.267578125, 69.0029296875, 72.73828125, 76.4736328125, 80.208984375, 83.9443359375, 87.6796875, 91.4150390625, 95.150390625, 98.8857421875, 102.62109375, 106.3564453125, 110.091796875, 113.8271484375, 117.5625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 42.0, 611.0, 341.0, 22.0, 2.0], "bins": [-773.5540771484375, -760.8399047851562, -748.125732421875, -735.4114990234375, -722.6973266601562, -709.983154296875, -697.2689819335938, -684.5547485351562, -671.840576171875, -659.1264038085938, -646.4122314453125, -633.697998046875, -620.9838256835938, -608.2696533203125, -595.5554809570312, -582.8412475585938, -570.1270751953125, -557.4129028320312, -544.69873046875, -531.9844970703125, -519.2703247070312, -506.55615234375, -493.8419494628906, -481.1277770996094, -468.4136047363281, -455.6994323730469, -442.9852294921875, -430.27105712890625, -417.5568542480469, -404.8426818847656, -392.12847900390625, -379.414306640625, -366.70013427734375, -353.9859619140625, -341.2717590332031, -328.5575866699219, -315.8433837890625, -303.12921142578125, -290.4150085449219, -277.7008361816406, -264.98663330078125, -252.27244567871094, -239.55825805664062, -226.8440704345703, -214.1298828125, -201.4156951904297, -188.70150756835938, -175.98733520507812, -163.27313232421875, -150.55894470214844, -137.84475708007812, -125.13056945800781, -112.4163818359375, -99.70219421386719, -86.9880142211914, -74.2738265991211, -61.55963897705078, -48.84545135498047, -36.131263732910156, -23.41707992553711, -10.702892303466797, 2.0112953186035156, 14.725479125976562, 27.439666748046875, 40.15385437011719]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 7.0, 2.0, 5.0, 3.0, 6.0, 7.0, 11.0, 7.0, 11.0, 10.0, 13.0, 17.0, 14.0, 22.0, 17.0, 26.0, 25.0, 23.0, 29.0, 28.0, 42.0, 37.0, 35.0, 40.0, 36.0, 42.0, 34.0, 40.0, 29.0, 41.0, 29.0, 27.0, 26.0, 26.0, 35.0, 30.0, 26.0, 24.0, 16.0, 16.0, 15.0, 14.0, 20.0, 12.0, 7.0, 7.0, 5.0, 2.0, 9.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-83.64948272705078, -80.78413391113281, -77.91877746582031, -75.05342102050781, -72.18807220458984, -69.32272338867188, -66.45736694335938, -63.59201431274414, -60.726661682128906, -57.86130905151367, -54.99595642089844, -52.1306037902832, -49.26525115966797, -46.399898529052734, -43.5345458984375, -40.669193267822266, -37.80384063720703, -34.9384880065918, -32.07313537597656, -29.207782745361328, -26.342430114746094, -23.47707748413086, -20.611724853515625, -17.74637222290039, -14.881019592285156, -12.015666961669922, -9.150314331054688, -6.284961700439453, -3.4196090698242188, -0.5542564392089844, 2.31109619140625, 5.176448822021484, 8.041801452636719, 10.907154083251953, 13.772506713867188, 16.637859344482422, 19.503211975097656, 22.36856460571289, 25.233917236328125, 28.09926986694336, 30.964622497558594, 33.82997512817383, 36.69532775878906, 39.5606803894043, 42.42603302001953, 45.291385650634766, 48.15673828125, 51.022090911865234, 53.88744354248047, 56.7527961730957, 59.61814880371094, 62.48350143432617, 65.3488540649414, 68.21420288085938, 71.07955932617188, 73.94491577148438, 76.81026458740234, 79.67561340332031, 82.54096984863281, 85.40632629394531, 88.27167510986328, 91.13702392578125, 94.00238037109375, 96.86773681640625, 99.73308563232422]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 1.0, 7.0, 14.0, 15.0, 16.0, 24.0, 18.0, 15.0, 23.0, 29.0, 33.0, 32.0, 39.0, 53.0, 54.0, 56.0, 48.0, 43.0, 34.0, 46.0, 44.0, 45.0, 40.0, 47.0, 35.0, 31.0, 32.0, 25.0, 19.0, 22.0, 12.0, 10.0, 6.0, 8.0, 3.0, 4.0, 3.0, 2.0, 6.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.421875, -11.953857421875, -11.48583984375, -11.017822265625, -10.5498046875, -10.081787109375, -9.61376953125, -9.145751953125, -8.677734375, -8.209716796875, -7.74169921875, -7.273681640625, -6.8056640625, -6.337646484375, -5.86962890625, -5.401611328125, -4.93359375, -4.465576171875, -3.99755859375, -3.529541015625, -3.0615234375, -2.593505859375, -2.12548828125, -1.657470703125, -1.189453125, -0.721435546875, -0.25341796875, 0.214599609375, 0.6826171875, 1.150634765625, 1.61865234375, 2.086669921875, 2.5546875, 3.022705078125, 3.49072265625, 3.958740234375, 4.4267578125, 4.894775390625, 5.36279296875, 5.830810546875, 6.298828125, 6.766845703125, 7.23486328125, 7.702880859375, 8.1708984375, 8.638916015625, 9.10693359375, 9.574951171875, 10.04296875, 10.510986328125, 10.97900390625, 11.447021484375, 11.9150390625, 12.383056640625, 12.85107421875, 13.319091796875, 13.787109375, 14.255126953125, 14.72314453125, 15.191162109375, 15.6591796875, 16.127197265625, 16.59521484375, 17.063232421875, 17.53125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 8.0, 8.0, 13.0, 11.0, 15.0, 25.0, 37.0, 38.0, 43.0, 51.0, 74.0, 116.0, 146.0, 236.0, 365.0, 762.0, 1624.0, 4371.0, 14934.0, 114533.0, 2306112.0, 1659254.0, 72781.0, 11620.0, 3712.0, 1504.0, 712.0, 354.0, 230.0, 171.0, 91.0, 81.0, 64.0, 51.0, 40.0, 24.0, 23.0, 12.0, 11.0, 8.0, 8.0, 4.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.96875, -31.7880859375, -30.607421875, -29.4267578125, -28.24609375, -27.0654296875, -25.884765625, -24.7041015625, -23.5234375, -22.3427734375, -21.162109375, -19.9814453125, -18.80078125, -17.6201171875, -16.439453125, -15.2587890625, -14.078125, -12.8974609375, -11.716796875, -10.5361328125, -9.35546875, -8.1748046875, -6.994140625, -5.8134765625, -4.6328125, -3.4521484375, -2.271484375, -1.0908203125, 0.08984375, 1.2705078125, 2.451171875, 3.6318359375, 4.8125, 5.9931640625, 7.173828125, 8.3544921875, 9.53515625, 10.7158203125, 11.896484375, 13.0771484375, 14.2578125, 15.4384765625, 16.619140625, 17.7998046875, 18.98046875, 20.1611328125, 21.341796875, 22.5224609375, 23.703125, 24.8837890625, 26.064453125, 27.2451171875, 28.42578125, 29.6064453125, 30.787109375, 31.9677734375, 33.1484375, 34.3291015625, 35.509765625, 36.6904296875, 37.87109375, 39.0517578125, 40.232421875, 41.4130859375, 42.59375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 10.0, 11.0, 21.0, 12.0, 23.0, 23.0, 38.0, 59.0, 83.0, 123.0, 206.0, 362.0, 574.0, 776.0, 699.0, 411.0, 245.0, 141.0, 79.0, 54.0, 41.0, 19.0, 19.0, 19.0, 4.0, 8.0, 4.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.125, -37.112548828125, -36.10009765625, -35.087646484375, -34.0751953125, -33.062744140625, -32.05029296875, -31.037841796875, -30.025390625, -29.012939453125, -28.00048828125, -26.988037109375, -25.9755859375, -24.963134765625, -23.95068359375, -22.938232421875, -21.92578125, -20.913330078125, -19.90087890625, -18.888427734375, -17.8759765625, -16.863525390625, -15.85107421875, -14.838623046875, -13.826171875, -12.813720703125, -11.80126953125, -10.788818359375, -9.7763671875, -8.763916015625, -7.75146484375, -6.739013671875, -5.7265625, -4.714111328125, -3.70166015625, -2.689208984375, -1.6767578125, -0.664306640625, 0.34814453125, 1.360595703125, 2.373046875, 3.385498046875, 4.39794921875, 5.410400390625, 6.4228515625, 7.435302734375, 8.44775390625, 9.460205078125, 10.47265625, 11.485107421875, 12.49755859375, 13.510009765625, 14.5224609375, 15.534912109375, 16.54736328125, 17.559814453125, 18.572265625, 19.584716796875, 20.59716796875, 21.609619140625, 22.6220703125, 23.634521484375, 24.64697265625, 25.659423828125, 26.671875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 11.0, 13.0, 23.0, 24.0, 37.0, 60.0, 127.0, 207.0, 516.0, 2037.0, 29133.0, 3876939.0, 277267.0, 6101.0, 966.0, 310.0, 185.0, 104.0, 63.0, 41.0, 23.0, 22.0, 22.0, 17.0, 11.0, 7.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.0625, -89.5830078125, -86.103515625, -82.6240234375, -79.14453125, -75.6650390625, -72.185546875, -68.7060546875, -65.2265625, -61.7470703125, -58.267578125, -54.7880859375, -51.30859375, -47.8291015625, -44.349609375, -40.8701171875, -37.390625, -33.9111328125, -30.431640625, -26.9521484375, -23.47265625, -19.9931640625, -16.513671875, -13.0341796875, -9.5546875, -6.0751953125, -2.595703125, 0.8837890625, 4.36328125, 7.8427734375, 11.322265625, 14.8017578125, 18.28125, 21.7607421875, 25.240234375, 28.7197265625, 32.19921875, 35.6787109375, 39.158203125, 42.6376953125, 46.1171875, 49.5966796875, 53.076171875, 56.5556640625, 60.03515625, 63.5146484375, 66.994140625, 70.4736328125, 73.953125, 77.4326171875, 80.912109375, 84.3916015625, 87.87109375, 91.3505859375, 94.830078125, 98.3095703125, 101.7890625, 105.2685546875, 108.748046875, 112.2275390625, 115.70703125, 119.1865234375, 122.666015625, 126.1455078125, 129.625]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 7.0, 9.0, 11.0, 26.0, 26.0, 42.0, 51.0, 97.0, 131.0, 130.0, 134.0, 122.0, 90.0, 55.0, 27.0, 19.0, 11.0, 6.0, 7.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-109.36597442626953, -105.58758544921875, -101.80918884277344, -98.03079986572266, -94.25241088867188, -90.47401428222656, -86.69562530517578, -82.917236328125, -79.13883972167969, -75.3604507446289, -71.5820541381836, -67.80366516113281, -64.02527618408203, -60.246883392333984, -56.46849060058594, -52.690101623535156, -48.911712646484375, -45.13331985473633, -41.35493087768555, -37.5765380859375, -33.79814910888672, -30.019756317138672, -26.241363525390625, -22.46297264099121, -18.684581756591797, -14.906190872192383, -11.127799034118652, -7.349407196044922, -3.571016311645508, 0.20737457275390625, 3.985767364501953, 7.764158248901367, 11.54254150390625, 15.320932388305664, 19.099323272705078, 22.877716064453125, 26.65610694885254, 30.434497833251953, 34.212890625, 37.99127960205078, 41.76967239379883, 45.548065185546875, 49.326454162597656, 53.1048469543457, 56.88323974609375, 60.66162872314453, 64.44001770019531, 68.21841430664062, 71.9968032836914, 75.77519226074219, 79.5535888671875, 83.33197784423828, 87.11036682128906, 90.88876342773438, 94.66715240478516, 98.44554138183594, 102.22393798828125, 106.00232696533203, 109.78072357177734, 113.55911254882812, 117.3375015258789, 121.11589050292969, 124.894287109375, 128.6726837158203, 132.45106506347656]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 6.0, 4.0, 8.0, 3.0, 8.0, 8.0, 8.0, 7.0, 18.0, 11.0, 21.0, 13.0, 14.0, 17.0, 20.0, 32.0, 20.0, 29.0, 23.0, 34.0, 36.0, 30.0, 22.0, 26.0, 54.0, 33.0, 42.0, 32.0, 41.0, 34.0, 43.0, 35.0, 34.0, 31.0, 16.0, 20.0, 24.0, 12.0, 19.0, 15.0, 21.0, 13.0, 16.0, 6.0, 9.0, 9.0, 6.0, 6.0, 6.0, 5.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0], "bins": [-60.43287658691406, -58.43415069580078, -56.4354248046875, -54.43669891357422, -52.43797302246094, -50.439247131347656, -48.44052505493164, -46.44179916381836, -44.44307327270508, -42.4443473815918, -40.445621490478516, -38.446895599365234, -36.44817352294922, -34.44944763183594, -32.450721740722656, -30.451995849609375, -28.453269958496094, -26.454544067382812, -24.45581817626953, -22.457094192504883, -20.4583683013916, -18.45964241027832, -16.460918426513672, -14.46219253540039, -12.46346664428711, -10.464740753173828, -8.466015815734863, -6.46729040145874, -4.468564987182617, -2.469839096069336, -0.4711141586303711, 1.5276107788085938, 3.526336669921875, 5.525062084197998, 7.523787498474121, 9.522512435913086, 11.521238327026367, 13.519964218139648, 15.518689155578613, 17.517414093017578, 19.51613998413086, 21.51486587524414, 23.513591766357422, 25.51231575012207, 27.51104164123535, 29.509767532348633, 31.50849151611328, 33.50721740722656, 35.505943298339844, 37.504669189453125, 39.503395080566406, 41.50212097167969, 43.50084686279297, 45.49957275390625, 47.498294830322266, 49.49702072143555, 51.49574661254883, 53.49447250366211, 55.49319839477539, 57.49192428588867, 59.49064636230469, 61.48937225341797, 63.48809814453125, 65.48682403564453, 67.48554992675781]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 10.0, 10.0, 14.0, 5.0, 17.0, 13.0, 21.0, 21.0, 24.0, 27.0, 20.0, 43.0, 48.0, 38.0, 39.0, 56.0, 53.0, 40.0, 45.0, 45.0, 38.0, 49.0, 40.0, 54.0, 33.0, 27.0, 18.0, 29.0, 30.0, 22.0, 14.0, 9.0, 7.0, 8.0, 8.0, 4.0, 3.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6875, -11.25146484375, -10.8154296875, -10.37939453125, -9.943359375, -9.50732421875, -9.0712890625, -8.63525390625, -8.19921875, -7.76318359375, -7.3271484375, -6.89111328125, -6.455078125, -6.01904296875, -5.5830078125, -5.14697265625, -4.7109375, -4.27490234375, -3.8388671875, -3.40283203125, -2.966796875, -2.53076171875, -2.0947265625, -1.65869140625, -1.22265625, -0.78662109375, -0.3505859375, 0.08544921875, 0.521484375, 0.95751953125, 1.3935546875, 1.82958984375, 2.265625, 2.70166015625, 3.1376953125, 3.57373046875, 4.009765625, 4.44580078125, 4.8818359375, 5.31787109375, 5.75390625, 6.18994140625, 6.6259765625, 7.06201171875, 7.498046875, 7.93408203125, 8.3701171875, 8.80615234375, 9.2421875, 9.67822265625, 10.1142578125, 10.55029296875, 10.986328125, 11.42236328125, 11.8583984375, 12.29443359375, 12.73046875, 13.16650390625, 13.6025390625, 14.03857421875, 14.474609375, 14.91064453125, 15.3466796875, 15.78271484375, 16.21875]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 5.0, 3.0, 10.0, 19.0, 26.0, 49.0, 75.0, 92.0, 132.0, 171.0, 299.0, 493.0, 640.0, 937.0, 1372.0, 2167.0, 3135.0, 4590.0, 7086.0, 10737.0, 17119.0, 26723.0, 43078.0, 70233.0, 112308.0, 166685.0, 188950.0, 143878.0, 92453.0, 57101.0, 35027.0, 22179.0, 13916.0, 8992.0, 5876.0, 3910.0, 2576.0, 1839.0, 1218.0, 796.0, 551.0, 346.0, 283.0, 166.0, 97.0, 77.0, 60.0, 24.0, 22.0, 14.0, 6.0, 6.0, 7.0, 3.0, 1.0, 2.0, 3.0], "bins": [-1.9052734375, -1.8480377197265625, -1.790802001953125, -1.7335662841796875, -1.67633056640625, -1.6190948486328125, -1.561859130859375, -1.5046234130859375, -1.4473876953125, -1.3901519775390625, -1.332916259765625, -1.2756805419921875, -1.21844482421875, -1.1612091064453125, -1.103973388671875, -1.0467376708984375, -0.989501953125, -0.9322662353515625, -0.875030517578125, -0.8177947998046875, -0.76055908203125, -0.7033233642578125, -0.646087646484375, -0.5888519287109375, -0.5316162109375, -0.4743804931640625, -0.417144775390625, -0.3599090576171875, -0.30267333984375, -0.2454376220703125, -0.188201904296875, -0.1309661865234375, -0.07373046875, -0.0164947509765625, 0.040740966796875, 0.0979766845703125, 0.15521240234375, 0.2124481201171875, 0.269683837890625, 0.3269195556640625, 0.3841552734375, 0.4413909912109375, 0.498626708984375, 0.5558624267578125, 0.61309814453125, 0.6703338623046875, 0.727569580078125, 0.7848052978515625, 0.842041015625, 0.8992767333984375, 0.956512451171875, 1.0137481689453125, 1.07098388671875, 1.1282196044921875, 1.185455322265625, 1.2426910400390625, 1.2999267578125, 1.3571624755859375, 1.414398193359375, 1.4716339111328125, 1.52886962890625, 1.5861053466796875, 1.643341064453125, 1.7005767822265625, 1.7578125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 5.0, 4.0, 4.0, 8.0, 10.0, 13.0, 9.0, 11.0, 16.0, 26.0, 21.0, 20.0, 24.0, 39.0, 30.0, 29.0, 43.0, 32.0, 33.0, 46.0, 30.0, 1058.0, 45.0, 35.0, 37.0, 41.0, 34.0, 35.0, 33.0, 34.0, 29.0, 26.0, 16.0, 24.0, 21.0, 17.0, 14.0, 11.0, 7.0, 12.0, 10.0, 7.0, 4.0, 3.0, 5.0, 2.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-8.3046875, -8.0377197265625, -7.770751953125, -7.5037841796875, -7.23681640625, -6.9698486328125, -6.702880859375, -6.4359130859375, -6.1689453125, -5.9019775390625, -5.635009765625, -5.3680419921875, -5.10107421875, -4.8341064453125, -4.567138671875, -4.3001708984375, -4.033203125, -3.7662353515625, -3.499267578125, -3.2322998046875, -2.96533203125, -2.6983642578125, -2.431396484375, -2.1644287109375, -1.8974609375, -1.6304931640625, -1.363525390625, -1.0965576171875, -0.82958984375, -0.5626220703125, -0.295654296875, -0.0286865234375, 0.23828125, 0.5052490234375, 0.772216796875, 1.0391845703125, 1.30615234375, 1.5731201171875, 1.840087890625, 2.1070556640625, 2.3740234375, 2.6409912109375, 2.907958984375, 3.1749267578125, 3.44189453125, 3.7088623046875, 3.975830078125, 4.2427978515625, 4.509765625, 4.7767333984375, 5.043701171875, 5.3106689453125, 5.57763671875, 5.8446044921875, 6.111572265625, 6.3785400390625, 6.6455078125, 6.9124755859375, 7.179443359375, 7.4464111328125, 7.71337890625, 7.9803466796875, 8.247314453125, 8.5142822265625, 8.78125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 5.0, 8.0, 9.0, 14.0, 17.0, 38.0, 40.0, 81.0, 105.0, 131.0, 192.0, 294.0, 371.0, 596.0, 830.0, 1189.0, 1800.0, 2516.0, 3639.0, 5251.0, 7811.0, 11670.0, 17986.0, 27895.0, 43752.0, 69432.0, 108478.0, 161616.0, 1226939.0, 142930.0, 93822.0, 59648.0, 37764.0, 23713.0, 15315.0, 10052.0, 6588.0, 4555.0, 3104.0, 2083.0, 1488.0, 1017.0, 722.0, 502.0, 334.0, 232.0, 183.0, 108.0, 91.0, 58.0, 46.0, 32.0, 18.0, 12.0, 9.0, 9.0, 4.0, 1.0, 0.0, 1.0], "bins": [-1.0849609375, -1.0514068603515625, -1.017852783203125, -0.9842987060546875, -0.95074462890625, -0.9171905517578125, -0.883636474609375, -0.8500823974609375, -0.8165283203125, -0.7829742431640625, -0.749420166015625, -0.7158660888671875, -0.68231201171875, -0.6487579345703125, -0.615203857421875, -0.5816497802734375, -0.548095703125, -0.5145416259765625, -0.480987548828125, -0.4474334716796875, -0.41387939453125, -0.3803253173828125, -0.346771240234375, -0.3132171630859375, -0.2796630859375, -0.2461090087890625, -0.212554931640625, -0.1790008544921875, -0.14544677734375, -0.1118927001953125, -0.078338623046875, -0.0447845458984375, -0.01123046875, 0.0223236083984375, 0.055877685546875, 0.0894317626953125, 0.12298583984375, 0.1565399169921875, 0.190093994140625, 0.2236480712890625, 0.2572021484375, 0.2907562255859375, 0.324310302734375, 0.3578643798828125, 0.39141845703125, 0.4249725341796875, 0.458526611328125, 0.4920806884765625, 0.525634765625, 0.5591888427734375, 0.592742919921875, 0.6262969970703125, 0.65985107421875, 0.6934051513671875, 0.726959228515625, 0.7605133056640625, 0.7940673828125, 0.8276214599609375, 0.861175537109375, 0.8947296142578125, 0.92828369140625, 0.9618377685546875, 0.995391845703125, 1.0289459228515625, 1.0625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 5.0, 1.0, 3.0, 4.0, 5.0, 6.0, 5.0, 13.0, 9.0, 13.0, 8.0, 10.0, 17.0, 26.0, 34.0, 46.0, 84.0, 121.0, 201.0, 119.0, 68.0, 54.0, 36.0, 15.0, 15.0, 18.0, 16.0, 8.0, 5.0, 10.0, 4.0, 7.0, 0.0, 6.0, 3.0, 6.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03961181640625, -0.038210391998291016, -0.03680896759033203, -0.03540754318237305, -0.03400611877441406, -0.03260469436645508, -0.031203269958496094, -0.02980184555053711, -0.028400421142578125, -0.02699899673461914, -0.025597572326660156, -0.024196147918701172, -0.022794723510742188, -0.021393299102783203, -0.01999187469482422, -0.018590450286865234, -0.01718902587890625, -0.015787601470947266, -0.014386177062988281, -0.012984752655029297, -0.011583328247070312, -0.010181903839111328, -0.008780479431152344, -0.007379055023193359, -0.005977630615234375, -0.004576206207275391, -0.0031747817993164062, -0.0017733573913574219, -0.0003719329833984375, 0.0010294914245605469, 0.0024309158325195312, 0.0038323402404785156, 0.0052337646484375, 0.006635189056396484, 0.008036613464355469, 0.009438037872314453, 0.010839462280273438, 0.012240886688232422, 0.013642311096191406, 0.01504373550415039, 0.016445159912109375, 0.01784658432006836, 0.019248008728027344, 0.020649433135986328, 0.022050857543945312, 0.023452281951904297, 0.02485370635986328, 0.026255130767822266, 0.02765655517578125, 0.029057979583740234, 0.03045940399169922, 0.0318608283996582, 0.03326225280761719, 0.03466367721557617, 0.036065101623535156, 0.03746652603149414, 0.038867950439453125, 0.04026937484741211, 0.041670799255371094, 0.04307222366333008, 0.04447364807128906, 0.04587507247924805, 0.04727649688720703, 0.048677921295166016, 0.050079345703125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 2.0, 6.0, 5.0, 8.0, 10.0, 11.0, 25.0, 22.0, 30.0, 34.0, 75.0, 135.0, 351.0, 3100.0, 1017358.0, 26285.0, 630.0, 176.0, 87.0, 53.0, 35.0, 18.0, 15.0, 15.0, 11.0, 14.0, 4.0, 6.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.10546875, -1.0745086669921875, -1.043548583984375, -1.0125885009765625, -0.98162841796875, -0.9506683349609375, -0.919708251953125, -0.8887481689453125, -0.8577880859375, -0.8268280029296875, -0.795867919921875, -0.7649078369140625, -0.73394775390625, -0.7029876708984375, -0.672027587890625, -0.6410675048828125, -0.610107421875, -0.5791473388671875, -0.548187255859375, -0.5172271728515625, -0.48626708984375, -0.4553070068359375, -0.424346923828125, -0.3933868408203125, -0.3624267578125, -0.3314666748046875, -0.300506591796875, -0.2695465087890625, -0.23858642578125, -0.2076263427734375, -0.176666259765625, -0.1457061767578125, -0.11474609375, -0.0837860107421875, -0.052825927734375, -0.0218658447265625, 0.00909423828125, 0.0400543212890625, 0.071014404296875, 0.1019744873046875, 0.1329345703125, 0.1638946533203125, 0.194854736328125, 0.2258148193359375, 0.25677490234375, 0.2877349853515625, 0.318695068359375, 0.3496551513671875, 0.380615234375, 0.4115753173828125, 0.442535400390625, 0.4734954833984375, 0.50445556640625, 0.5354156494140625, 0.566375732421875, 0.5973358154296875, 0.6282958984375, 0.6592559814453125, 0.690216064453125, 0.7211761474609375, 0.75213623046875, 0.7830963134765625, 0.814056396484375, 0.8450164794921875, 0.8759765625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 17.0, 49.0, 176.0, 395.0, 242.0, 77.0, 26.0, 16.0, 7.0, 2.0, 4.0, 0.0, 1.0], "bins": [-0.26095834374427795, -0.2561827600002289, -0.2514071464538574, -0.24663156270980835, -0.24185597896575928, -0.2370803952217102, -0.23230479657649994, -0.22752919793128967, -0.2227536141872406, -0.21797803044319153, -0.21320243179798126, -0.208426833152771, -0.20365124940872192, -0.19887566566467285, -0.19410006701946259, -0.18932446837425232, -0.18454888463020325, -0.17977330088615417, -0.1749977022409439, -0.17022210359573364, -0.16544651985168457, -0.1606709361076355, -0.15589533746242523, -0.15111973881721497, -0.1463441550731659, -0.14156857132911682, -0.13679297268390656, -0.1320173740386963, -0.12724179029464722, -0.12246619910001755, -0.11769060790538788, -0.11291501671075821, -0.10813944041728973, -0.10336384922266006, -0.0985882580280304, -0.09381266683340073, -0.08903707563877106, -0.08426148444414139, -0.07948589324951172, -0.07471030205488205, -0.06993471086025238, -0.06515911966562271, -0.06038352847099304, -0.05560793727636337, -0.050832346081733704, -0.046056754887104034, -0.041281163692474365, -0.036505572497844696, -0.03172997757792473, -0.02695438638329506, -0.02217879518866539, -0.01740320399403572, -0.012627612799406052, -0.007852021604776382, -0.0030764304101467133, 0.001699160784482956, 0.006474751979112625, 0.011250343173742294, 0.016025934368371964, 0.020801525563001633, 0.025577116757631302, 0.03035270795226097, 0.03512829914689064, 0.03990389034152031, 0.04467948153614998]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 3.0, 5.0, 3.0, 4.0, 5.0, 3.0, 3.0, 5.0, 12.0, 9.0, 15.0, 20.0, 24.0, 18.0, 15.0, 22.0, 25.0, 36.0, 35.0, 34.0, 29.0, 42.0, 40.0, 36.0, 41.0, 37.0, 40.0, 33.0, 33.0, 41.0, 34.0, 35.0, 23.0, 25.0, 34.0, 32.0, 20.0, 26.0, 23.0, 15.0, 11.0, 6.0, 13.0, 12.0, 8.0, 5.0, 7.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 4.0], "bins": [-0.027714073657989502, -0.026950374245643616, -0.02618667669594288, -0.02542297914624214, -0.024659279733896255, -0.02389558032155037, -0.023131882771849632, -0.022368185222148895, -0.02160448580980301, -0.020840786397457123, -0.020077088847756386, -0.01931339129805565, -0.018549691885709763, -0.017785992473363876, -0.01702229492366314, -0.016258597373962402, -0.015494897961616516, -0.014731199480593204, -0.013967500999569893, -0.013203802518546581, -0.01244010403752327, -0.011676405556499958, -0.010912707075476646, -0.010149008594453335, -0.009385310113430023, -0.008621611632406712, -0.0078579131513834, -0.007094214670360088, -0.006330516189336777, -0.005566817708313465, -0.0048031192272901535, -0.004039420746266842, -0.0032757222652435303, -0.0025120237842202187, -0.001748325303196907, -0.0009846268221735954, -0.0002209283411502838, 0.0005427701398730278, 0.0013064686208963394, 0.002070167101919651, 0.0028338655829429626, 0.0035975640639662743, 0.004361262544989586, 0.0051249610260128975, 0.005888659507036209, 0.006652357988059521, 0.007416056469082832, 0.008179754950106144, 0.008943453431129456, 0.009707151912152767, 0.010470850393176079, 0.01123454887419939, 0.011998247355222702, 0.012761945836246014, 0.013525644317269325, 0.014289342798292637, 0.015053041279315948, 0.015816740691661835, 0.01658043824136257, 0.01734413579106331, 0.018107835203409195, 0.01887153461575508, 0.019635232165455818, 0.020398929715156555, 0.02116262912750244]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 10.0, 10.0, 14.0, 5.0, 17.0, 13.0, 21.0, 21.0, 24.0, 27.0, 20.0, 43.0, 48.0, 38.0, 39.0, 56.0, 53.0, 40.0, 45.0, 45.0, 38.0, 49.0, 40.0, 54.0, 33.0, 27.0, 18.0, 29.0, 30.0, 21.0, 15.0, 9.0, 7.0, 8.0, 8.0, 4.0, 3.0, 8.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.6875, -11.25146484375, -10.8154296875, -10.37939453125, -9.943359375, -9.50732421875, -9.0712890625, -8.63525390625, -8.19921875, -7.76318359375, -7.3271484375, -6.89111328125, -6.455078125, -6.01904296875, -5.5830078125, -5.14697265625, -4.7109375, -4.27490234375, -3.8388671875, -3.40283203125, -2.966796875, -2.53076171875, -2.0947265625, -1.65869140625, -1.22265625, -0.78662109375, -0.3505859375, 0.08544921875, 0.521484375, 0.95751953125, 1.3935546875, 1.82958984375, 2.265625, 2.70166015625, 3.1376953125, 3.57373046875, 4.009765625, 4.44580078125, 4.8818359375, 5.31787109375, 5.75390625, 6.18994140625, 6.6259765625, 7.06201171875, 7.498046875, 7.93408203125, 8.3701171875, 8.80615234375, 9.2421875, 9.67822265625, 10.1142578125, 10.55029296875, 10.986328125, 11.42236328125, 11.8583984375, 12.29443359375, 12.73046875, 13.16650390625, 13.6025390625, 14.03857421875, 14.474609375, 14.91064453125, 15.3466796875, 15.78271484375, 16.21875]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 9.0, 10.0, 19.0, 19.0, 19.0, 41.0, 48.0, 68.0, 108.0, 117.0, 200.0, 267.0, 411.0, 676.0, 1007.0, 1657.0, 2588.0, 4539.0, 8701.0, 22300.0, 117306.0, 720497.0, 124412.0, 22640.0, 8902.0, 4614.0, 2645.0, 1577.0, 1073.0, 692.0, 423.0, 303.0, 194.0, 137.0, 94.0, 67.0, 47.0, 35.0, 28.0, 16.0, 11.0, 7.0, 9.0, 6.0, 7.0, 2.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-17.296875, -16.72998046875, -16.1630859375, -15.59619140625, -15.029296875, -14.46240234375, -13.8955078125, -13.32861328125, -12.76171875, -12.19482421875, -11.6279296875, -11.06103515625, -10.494140625, -9.92724609375, -9.3603515625, -8.79345703125, -8.2265625, -7.65966796875, -7.0927734375, -6.52587890625, -5.958984375, -5.39208984375, -4.8251953125, -4.25830078125, -3.69140625, -3.12451171875, -2.5576171875, -1.99072265625, -1.423828125, -0.85693359375, -0.2900390625, 0.27685546875, 0.84375, 1.41064453125, 1.9775390625, 2.54443359375, 3.111328125, 3.67822265625, 4.2451171875, 4.81201171875, 5.37890625, 5.94580078125, 6.5126953125, 7.07958984375, 7.646484375, 8.21337890625, 8.7802734375, 9.34716796875, 9.9140625, 10.48095703125, 11.0478515625, 11.61474609375, 12.181640625, 12.74853515625, 13.3154296875, 13.88232421875, 14.44921875, 15.01611328125, 15.5830078125, 16.14990234375, 16.716796875, 17.28369140625, 17.8505859375, 18.41748046875, 18.984375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 10.0, 12.0, 16.0, 15.0, 18.0, 25.0, 25.0, 27.0, 46.0, 31.0, 43.0, 40.0, 59.0, 64.0, 91.0, 343.0, 1622.0, 95.0, 58.0, 43.0, 36.0, 33.0, 38.0, 41.0, 36.0, 27.0, 22.0, 15.0, 17.0, 24.0, 9.0, 11.0, 10.0, 12.0, 5.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-39.03125, -37.736328125, -36.44140625, -35.146484375, -33.8515625, -32.556640625, -31.26171875, -29.966796875, -28.671875, -27.376953125, -26.08203125, -24.787109375, -23.4921875, -22.197265625, -20.90234375, -19.607421875, -18.3125, -17.017578125, -15.72265625, -14.427734375, -13.1328125, -11.837890625, -10.54296875, -9.248046875, -7.953125, -6.658203125, -5.36328125, -4.068359375, -2.7734375, -1.478515625, -0.18359375, 1.111328125, 2.40625, 3.701171875, 4.99609375, 6.291015625, 7.5859375, 8.880859375, 10.17578125, 11.470703125, 12.765625, 14.060546875, 15.35546875, 16.650390625, 17.9453125, 19.240234375, 20.53515625, 21.830078125, 23.125, 24.419921875, 25.71484375, 27.009765625, 28.3046875, 29.599609375, 30.89453125, 32.189453125, 33.484375, 34.779296875, 36.07421875, 37.369140625, 38.6640625, 39.958984375, 41.25390625, 42.548828125, 43.84375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 3.0, 6.0, 7.0, 12.0, 10.0, 18.0, 18.0, 23.0, 27.0, 22.0, 44.0, 62.0, 74.0, 116.0, 115.0, 175.0, 330.0, 692.0, 4004.0, 71816.0, 3047326.0, 17492.0, 1845.0, 515.0, 238.0, 160.0, 144.0, 95.0, 62.0, 50.0, 33.0, 29.0, 29.0, 23.0, 17.0, 14.0, 20.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-91.8125, -89.0556640625, -86.298828125, -83.5419921875, -80.78515625, -78.0283203125, -75.271484375, -72.5146484375, -69.7578125, -67.0009765625, -64.244140625, -61.4873046875, -58.73046875, -55.9736328125, -53.216796875, -50.4599609375, -47.703125, -44.9462890625, -42.189453125, -39.4326171875, -36.67578125, -33.9189453125, -31.162109375, -28.4052734375, -25.6484375, -22.8916015625, -20.134765625, -17.3779296875, -14.62109375, -11.8642578125, -9.107421875, -6.3505859375, -3.59375, -0.8369140625, 1.919921875, 4.6767578125, 7.43359375, 10.1904296875, 12.947265625, 15.7041015625, 18.4609375, 21.2177734375, 23.974609375, 26.7314453125, 29.48828125, 32.2451171875, 35.001953125, 37.7587890625, 40.515625, 43.2724609375, 46.029296875, 48.7861328125, 51.54296875, 54.2998046875, 57.056640625, 59.8134765625, 62.5703125, 65.3271484375, 68.083984375, 70.8408203125, 73.59765625, 76.3544921875, 79.111328125, 81.8681640625, 84.625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 8.0, 67.0, 253.0, 414.0, 203.0, 57.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-214.71463012695312, -210.3649139404297, -206.0152130126953, -201.66549682617188, -197.3157958984375, -192.96607971191406, -188.61636352539062, -184.26666259765625, -179.9169464111328, -175.56723022460938, -171.217529296875, -166.86781311035156, -162.5181121826172, -158.16839599609375, -153.81869506835938, -149.46897888183594, -145.1192626953125, -140.76954650878906, -136.4198455810547, -132.07012939453125, -127.72042083740234, -123.37071228027344, -119.02100372314453, -114.67129516601562, -110.32159423828125, -105.97188568115234, -101.62217712402344, -97.2724609375, -92.9227523803711, -88.57304382324219, -84.22333526611328, -79.87362670898438, -75.52389526367188, -71.17418670654297, -66.82447814941406, -62.47476577758789, -58.12505340576172, -53.77534484863281, -49.425636291503906, -45.075927734375, -40.726219177246094, -36.37651062011719, -32.026798248291016, -27.67708969116211, -23.32737922668457, -18.97766876220703, -14.627960205078125, -10.278249740600586, -5.928539276123047, -1.578829288482666, 2.770880699157715, 7.1205902099609375, 11.470300674438477, 15.820011138916016, 20.169719696044922, 24.51943016052246, 28.869140625, 33.218849182128906, 37.56856155395508, 41.918270111083984, 46.267982482910156, 50.61769104003906, 54.96739959716797, 59.317108154296875, 63.66682052612305]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 3.0, 4.0, 11.0, 12.0, 15.0, 13.0, 17.0, 11.0, 19.0, 22.0, 26.0, 26.0, 30.0, 33.0, 34.0, 37.0, 34.0, 29.0, 40.0, 39.0, 44.0, 39.0, 49.0, 39.0, 48.0, 33.0, 27.0, 29.0, 36.0, 32.0, 31.0, 22.0, 14.0, 20.0, 11.0, 9.0, 8.0, 15.0, 8.0, 7.0, 4.0, 5.0, 2.0, 6.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-94.56412506103516, -91.71785736083984, -88.87159729003906, -86.02532958984375, -83.17906951904297, -80.33280181884766, -77.48654174804688, -74.64027404785156, -71.79401397705078, -68.94774627685547, -66.10148620605469, -63.25522232055664, -60.408958435058594, -57.56269454956055, -54.7164306640625, -51.87016296386719, -49.02389907836914, -46.177635192871094, -43.33137130737305, -40.485107421875, -37.63884353637695, -34.792579650878906, -31.946313858032227, -29.10004997253418, -26.253786087036133, -23.407522201538086, -20.56125831604004, -17.71499252319336, -14.868729591369629, -12.022465705871582, -9.176200866699219, -6.329936981201172, -3.483673095703125, -0.637408971786499, 2.208855152130127, 5.055119514465332, 7.901383399963379, 10.747647285461426, 13.593912124633789, 16.440176010131836, 19.286439895629883, 22.13270378112793, 24.978967666625977, 27.825233459472656, 30.671497344970703, 33.51776123046875, 36.3640251159668, 39.210289001464844, 42.05655288696289, 44.90281677246094, 47.749080657958984, 50.59534454345703, 53.44160842895508, 56.287872314453125, 59.13414001464844, 61.98040008544922, 64.82666778564453, 67.67293548583984, 70.51919555664062, 73.36546325683594, 76.21172332763672, 79.05799102783203, 81.90425109863281, 84.75051879882812, 87.5967788696289]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 3.0, 12.0, 12.0, 6.0, 20.0, 11.0, 13.0, 17.0, 10.0, 24.0, 30.0, 30.0, 36.0, 30.0, 49.0, 48.0, 52.0, 44.0, 54.0, 36.0, 39.0, 47.0, 36.0, 38.0, 40.0, 44.0, 46.0, 20.0, 25.0, 23.0, 23.0, 16.0, 15.0, 11.0, 13.0, 2.0, 8.0, 6.0, 4.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0546875, -11.6112060546875, -11.167724609375, -10.7242431640625, -10.28076171875, -9.8372802734375, -9.393798828125, -8.9503173828125, -8.5068359375, -8.0633544921875, -7.619873046875, -7.1763916015625, -6.73291015625, -6.2894287109375, -5.845947265625, -5.4024658203125, -4.958984375, -4.5155029296875, -4.072021484375, -3.6285400390625, -3.18505859375, -2.7415771484375, -2.298095703125, -1.8546142578125, -1.4111328125, -0.9676513671875, -0.524169921875, -0.0806884765625, 0.36279296875, 0.8062744140625, 1.249755859375, 1.6932373046875, 2.13671875, 2.5802001953125, 3.023681640625, 3.4671630859375, 3.91064453125, 4.3541259765625, 4.797607421875, 5.2410888671875, 5.6845703125, 6.1280517578125, 6.571533203125, 7.0150146484375, 7.45849609375, 7.9019775390625, 8.345458984375, 8.7889404296875, 9.232421875, 9.6759033203125, 10.119384765625, 10.5628662109375, 11.00634765625, 11.4498291015625, 11.893310546875, 12.3367919921875, 12.7802734375, 13.2237548828125, 13.667236328125, 14.1107177734375, 14.55419921875, 14.9976806640625, 15.441162109375, 15.8846435546875, 16.328125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 4.0, 3.0, 3.0, 6.0, 16.0, 16.0, 15.0, 26.0, 24.0, 29.0, 24.0, 36.0, 48.0, 53.0, 97.0, 160.0, 286.0, 655.0, 1527.0, 4379.0, 14364.0, 85653.0, 1590128.0, 2326199.0, 144290.0, 17590.0, 4933.0, 1881.0, 803.0, 362.0, 214.0, 114.0, 93.0, 54.0, 39.0, 40.0, 26.0, 19.0, 24.0, 13.0, 11.0, 10.0, 11.0, 5.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.734375, -29.640380859375, -28.54638671875, -27.452392578125, -26.3583984375, -25.264404296875, -24.17041015625, -23.076416015625, -21.982421875, -20.888427734375, -19.79443359375, -18.700439453125, -17.6064453125, -16.512451171875, -15.41845703125, -14.324462890625, -13.23046875, -12.136474609375, -11.04248046875, -9.948486328125, -8.8544921875, -7.760498046875, -6.66650390625, -5.572509765625, -4.478515625, -3.384521484375, -2.29052734375, -1.196533203125, -0.1025390625, 0.991455078125, 2.08544921875, 3.179443359375, 4.2734375, 5.367431640625, 6.46142578125, 7.555419921875, 8.6494140625, 9.743408203125, 10.83740234375, 11.931396484375, 13.025390625, 14.119384765625, 15.21337890625, 16.307373046875, 17.4013671875, 18.495361328125, 19.58935546875, 20.683349609375, 21.77734375, 22.871337890625, 23.96533203125, 25.059326171875, 26.1533203125, 27.247314453125, 28.34130859375, 29.435302734375, 30.529296875, 31.623291015625, 32.71728515625, 33.811279296875, 34.9052734375, 35.999267578125, 37.09326171875, 38.187255859375, 39.28125]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 5.0, 4.0, 3.0, 9.0, 17.0, 13.0, 26.0, 39.0, 46.0, 59.0, 74.0, 130.0, 188.0, 336.0, 539.0, 689.0, 650.0, 483.0, 247.0, 172.0, 90.0, 74.0, 42.0, 34.0, 22.0, 18.0, 15.0, 15.0, 7.0, 10.0, 10.0, 4.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-36.0, -35.071533203125, -34.14306640625, -33.214599609375, -32.2861328125, -31.357666015625, -30.42919921875, -29.500732421875, -28.572265625, -27.643798828125, -26.71533203125, -25.786865234375, -24.8583984375, -23.929931640625, -23.00146484375, -22.072998046875, -21.14453125, -20.216064453125, -19.28759765625, -18.359130859375, -17.4306640625, -16.502197265625, -15.57373046875, -14.645263671875, -13.716796875, -12.788330078125, -11.85986328125, -10.931396484375, -10.0029296875, -9.074462890625, -8.14599609375, -7.217529296875, -6.2890625, -5.360595703125, -4.43212890625, -3.503662109375, -2.5751953125, -1.646728515625, -0.71826171875, 0.210205078125, 1.138671875, 2.067138671875, 2.99560546875, 3.924072265625, 4.8525390625, 5.781005859375, 6.70947265625, 7.637939453125, 8.56640625, 9.494873046875, 10.42333984375, 11.351806640625, 12.2802734375, 13.208740234375, 14.13720703125, 15.065673828125, 15.994140625, 16.922607421875, 17.85107421875, 18.779541015625, 19.7080078125, 20.636474609375, 21.56494140625, 22.493408203125, 23.421875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 3.0, 7.0, 6.0, 13.0, 11.0, 11.0, 14.0, 26.0, 25.0, 40.0, 51.0, 86.0, 152.0, 282.0, 667.0, 7524.0, 2757185.0, 1420938.0, 5918.0, 623.0, 254.0, 142.0, 77.0, 69.0, 45.0, 33.0, 28.0, 12.0, 17.0, 7.0, 3.0, 6.0, 5.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.5, -106.244140625, -101.98828125, -97.732421875, -93.4765625, -89.220703125, -84.96484375, -80.708984375, -76.453125, -72.197265625, -67.94140625, -63.685546875, -59.4296875, -55.173828125, -50.91796875, -46.662109375, -42.40625, -38.150390625, -33.89453125, -29.638671875, -25.3828125, -21.126953125, -16.87109375, -12.615234375, -8.359375, -4.103515625, 0.15234375, 4.408203125, 8.6640625, 12.919921875, 17.17578125, 21.431640625, 25.6875, 29.943359375, 34.19921875, 38.455078125, 42.7109375, 46.966796875, 51.22265625, 55.478515625, 59.734375, 63.990234375, 68.24609375, 72.501953125, 76.7578125, 81.013671875, 85.26953125, 89.525390625, 93.78125, 98.037109375, 102.29296875, 106.548828125, 110.8046875, 115.060546875, 119.31640625, 123.572265625, 127.828125, 132.083984375, 136.33984375, 140.595703125, 144.8515625, 149.107421875, 153.36328125, 157.619140625, 161.875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 9.0, 9.0, 35.0, 55.0, 119.0, 150.0, 181.0, 188.0, 122.0, 63.0, 37.0, 18.0, 15.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-253.97232055664062, -248.7565155029297, -243.54071044921875, -238.32489013671875, -233.1090850830078, -227.89328002929688, -222.67747497558594, -217.461669921875, -212.24586486816406, -207.03005981445312, -201.8142547607422, -196.59844970703125, -191.38262939453125, -186.1668243408203, -180.95101928710938, -175.73521423339844, -170.5194091796875, -165.30360412597656, -160.08779907226562, -154.87197875976562, -149.6561737060547, -144.44036865234375, -139.2245635986328, -134.00875854492188, -128.79293823242188, -123.57713317871094, -118.36132049560547, -113.14551544189453, -107.9297103881836, -102.71389770507812, -97.49809265136719, -92.28228759765625, -87.06649017333984, -81.8506851196289, -76.63487243652344, -71.4190673828125, -66.20326232910156, -60.98745346069336, -55.771644592285156, -50.55583953857422, -45.340030670166016, -40.12422180175781, -34.908416748046875, -29.692607879638672, -24.4768009185791, -19.26099395751953, -14.045185089111328, -8.82938003540039, -3.6135711669921875, 1.602236270904541, 6.8180437088012695, 12.033851623535156, 17.249658584594727, 22.465465545654297, 27.6812744140625, 32.89707946777344, 38.11288833618164, 43.328697204589844, 48.54450225830078, 53.760311126708984, 58.97611999511719, 64.19192504882812, 69.40773010253906, 74.62353515625, 79.83934783935547]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 8.0, 4.0, 8.0, 5.0, 13.0, 8.0, 22.0, 16.0, 24.0, 24.0, 17.0, 29.0, 26.0, 39.0, 27.0, 33.0, 39.0, 43.0, 35.0, 39.0, 48.0, 42.0, 52.0, 38.0, 47.0, 27.0, 44.0, 31.0, 35.0, 32.0, 29.0, 22.0, 17.0, 14.0, 17.0, 12.0, 8.0, 5.0, 9.0, 1.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-84.88372802734375, -82.41515350341797, -79.94657897949219, -77.4780044555664, -75.00942993164062, -72.54084777832031, -70.07227325439453, -67.60369873046875, -65.13512420654297, -62.66654968261719, -60.197975158691406, -57.72939682006836, -55.26082229614258, -52.7922477722168, -50.32366943359375, -47.85509490966797, -45.38652038574219, -42.917945861816406, -40.449371337890625, -37.98079299926758, -35.5122184753418, -33.043643951416016, -30.5750675201416, -28.106491088867188, -25.637916564941406, -23.169342041015625, -20.70076560974121, -18.232189178466797, -15.763614654541016, -13.295039176940918, -10.82646369934082, -8.357887268066406, -5.889320373535156, -3.4207448959350586, -0.9521694183349609, 1.5164060592651367, 3.9849815368652344, 6.453557014465332, 8.92213249206543, 11.390708923339844, 13.859283447265625, 16.327857971191406, 18.79643440246582, 21.265010833740234, 23.733585357666016, 26.202159881591797, 28.67073631286621, 31.139312744140625, 33.607887268066406, 36.07646179199219, 38.54503631591797, 41.013614654541016, 43.4821891784668, 45.95076370239258, 48.419342041015625, 50.887916564941406, 53.35649108886719, 55.82506561279297, 58.29364013671875, 60.7622184753418, 63.23079299926758, 65.69937133789062, 68.1679458618164, 70.63652038574219, 73.10509490966797]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 6.0, 6.0, 7.0, 9.0, 11.0, 10.0, 24.0, 19.0, 23.0, 22.0, 25.0, 28.0, 31.0, 44.0, 51.0, 41.0, 47.0, 57.0, 46.0, 48.0, 69.0, 45.0, 29.0, 34.0, 35.0, 35.0, 38.0, 22.0, 28.0, 25.0, 15.0, 17.0, 13.0, 12.0, 6.0, 10.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6015625, -14.142822265625, -13.68408203125, -13.225341796875, -12.7666015625, -12.307861328125, -11.84912109375, -11.390380859375, -10.931640625, -10.472900390625, -10.01416015625, -9.555419921875, -9.0966796875, -8.637939453125, -8.17919921875, -7.720458984375, -7.26171875, -6.802978515625, -6.34423828125, -5.885498046875, -5.4267578125, -4.968017578125, -4.50927734375, -4.050537109375, -3.591796875, -3.133056640625, -2.67431640625, -2.215576171875, -1.7568359375, -1.298095703125, -0.83935546875, -0.380615234375, 0.078125, 0.536865234375, 0.99560546875, 1.454345703125, 1.9130859375, 2.371826171875, 2.83056640625, 3.289306640625, 3.748046875, 4.206787109375, 4.66552734375, 5.124267578125, 5.5830078125, 6.041748046875, 6.50048828125, 6.959228515625, 7.41796875, 7.876708984375, 8.33544921875, 8.794189453125, 9.2529296875, 9.711669921875, 10.17041015625, 10.629150390625, 11.087890625, 11.546630859375, 12.00537109375, 12.464111328125, 12.9228515625, 13.381591796875, 13.84033203125, 14.299072265625, 14.7578125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 8.0, 7.0, 12.0, 19.0, 24.0, 44.0, 70.0, 98.0, 123.0, 216.0, 332.0, 473.0, 672.0, 1074.0, 1455.0, 2224.0, 3465.0, 5223.0, 7811.0, 12215.0, 19323.0, 30590.0, 51114.0, 84252.0, 135904.0, 192265.0, 181601.0, 121685.0, 74015.0, 45063.0, 27471.0, 17391.0, 11053.0, 7232.0, 4698.0, 3177.0, 2042.0, 1325.0, 945.0, 585.0, 398.0, 292.0, 192.0, 125.0, 88.0, 61.0, 24.0, 32.0, 19.0, 10.0, 10.0, 8.0, 4.0, 1.0, 4.0, 0.0, 0.0, 1.0], "bins": [-1.9482421875, -1.8871307373046875, -1.826019287109375, -1.7649078369140625, -1.70379638671875, -1.6426849365234375, -1.581573486328125, -1.5204620361328125, -1.4593505859375, -1.3982391357421875, -1.337127685546875, -1.2760162353515625, -1.21490478515625, -1.1537933349609375, -1.092681884765625, -1.0315704345703125, -0.970458984375, -0.9093475341796875, -0.848236083984375, -0.7871246337890625, -0.72601318359375, -0.6649017333984375, -0.603790283203125, -0.5426788330078125, -0.4815673828125, -0.4204559326171875, -0.359344482421875, -0.2982330322265625, -0.23712158203125, -0.1760101318359375, -0.114898681640625, -0.0537872314453125, 0.00732421875, 0.0684356689453125, 0.129547119140625, 0.1906585693359375, 0.25177001953125, 0.3128814697265625, 0.373992919921875, 0.4351043701171875, 0.4962158203125, 0.5573272705078125, 0.618438720703125, 0.6795501708984375, 0.74066162109375, 0.8017730712890625, 0.862884521484375, 0.9239959716796875, 0.985107421875, 1.0462188720703125, 1.107330322265625, 1.1684417724609375, 1.22955322265625, 1.2906646728515625, 1.351776123046875, 1.4128875732421875, 1.4739990234375, 1.5351104736328125, 1.596221923828125, 1.6573333740234375, 1.71844482421875, 1.7795562744140625, 1.840667724609375, 1.9017791748046875, 1.962890625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 9.0, 0.0, 8.0, 11.0, 9.0, 7.0, 13.0, 17.0, 17.0, 18.0, 22.0, 19.0, 26.0, 35.0, 37.0, 35.0, 40.0, 44.0, 45.0, 38.0, 44.0, 36.0, 1071.0, 38.0, 35.0, 36.0, 39.0, 48.0, 29.0, 35.0, 28.0, 18.0, 25.0, 19.0, 14.0, 10.0, 10.0, 12.0, 7.0, 9.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59375, -9.2945556640625, -8.995361328125, -8.6961669921875, -8.39697265625, -8.0977783203125, -7.798583984375, -7.4993896484375, -7.2001953125, -6.9010009765625, -6.601806640625, -6.3026123046875, -6.00341796875, -5.7042236328125, -5.405029296875, -5.1058349609375, -4.806640625, -4.5074462890625, -4.208251953125, -3.9090576171875, -3.60986328125, -3.3106689453125, -3.011474609375, -2.7122802734375, -2.4130859375, -2.1138916015625, -1.814697265625, -1.5155029296875, -1.21630859375, -0.9171142578125, -0.617919921875, -0.3187255859375, -0.01953125, 0.2796630859375, 0.578857421875, 0.8780517578125, 1.17724609375, 1.4764404296875, 1.775634765625, 2.0748291015625, 2.3740234375, 2.6732177734375, 2.972412109375, 3.2716064453125, 3.57080078125, 3.8699951171875, 4.169189453125, 4.4683837890625, 4.767578125, 5.0667724609375, 5.365966796875, 5.6651611328125, 5.96435546875, 6.2635498046875, 6.562744140625, 6.8619384765625, 7.1611328125, 7.4603271484375, 7.759521484375, 8.0587158203125, 8.35791015625, 8.6571044921875, 8.956298828125, 9.2554931640625, 9.5546875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 5.0, 0.0, 2.0, 10.0, 7.0, 8.0, 25.0, 32.0, 58.0, 94.0, 167.0, 234.0, 355.0, 610.0, 974.0, 1618.0, 2829.0, 4432.0, 7715.0, 12720.0, 22229.0, 39757.0, 72526.0, 132103.0, 303981.0, 1179624.0, 139069.0, 75917.0, 42087.0, 23710.0, 13843.0, 8228.0, 4789.0, 2908.0, 1719.0, 1061.0, 660.0, 370.0, 258.0, 139.0, 95.0, 58.0, 41.0, 22.0, 24.0, 17.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.390625, -1.3458251953125, -1.301025390625, -1.2562255859375, -1.21142578125, -1.1666259765625, -1.121826171875, -1.0770263671875, -1.0322265625, -0.9874267578125, -0.942626953125, -0.8978271484375, -0.85302734375, -0.8082275390625, -0.763427734375, -0.7186279296875, -0.673828125, -0.6290283203125, -0.584228515625, -0.5394287109375, -0.49462890625, -0.4498291015625, -0.405029296875, -0.3602294921875, -0.3154296875, -0.2706298828125, -0.225830078125, -0.1810302734375, -0.13623046875, -0.0914306640625, -0.046630859375, -0.0018310546875, 0.04296875, 0.0877685546875, 0.132568359375, 0.1773681640625, 0.22216796875, 0.2669677734375, 0.311767578125, 0.3565673828125, 0.4013671875, 0.4461669921875, 0.490966796875, 0.5357666015625, 0.58056640625, 0.6253662109375, 0.670166015625, 0.7149658203125, 0.759765625, 0.8045654296875, 0.849365234375, 0.8941650390625, 0.93896484375, 0.9837646484375, 1.028564453125, 1.0733642578125, 1.1181640625, 1.1629638671875, 1.207763671875, 1.2525634765625, 1.29736328125, 1.3421630859375, 1.386962890625, 1.4317626953125, 1.4765625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 4.0, 3.0, 5.0, 3.0, 4.0, 2.0, 4.0, 4.0, 13.0, 8.0, 12.0, 12.0, 16.0, 11.0, 15.0, 30.0, 36.0, 59.0, 70.0, 94.0, 126.0, 108.0, 92.0, 64.0, 30.0, 25.0, 39.0, 12.0, 17.0, 16.0, 12.0, 13.0, 8.0, 7.0, 3.0, 3.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0269775390625, -0.026132822036743164, -0.025288105010986328, -0.024443387985229492, -0.023598670959472656, -0.02275395393371582, -0.021909236907958984, -0.02106451988220215, -0.020219802856445312, -0.019375085830688477, -0.01853036880493164, -0.017685651779174805, -0.01684093475341797, -0.015996217727661133, -0.015151500701904297, -0.014306783676147461, -0.013462066650390625, -0.012617349624633789, -0.011772632598876953, -0.010927915573120117, -0.010083198547363281, -0.009238481521606445, -0.00839376449584961, -0.0075490474700927734, -0.0067043304443359375, -0.0058596134185791016, -0.005014896392822266, -0.00417017936706543, -0.0033254623413085938, -0.002480745315551758, -0.0016360282897949219, -0.0007913112640380859, 5.340576171875e-05, 0.0008981227874755859, 0.0017428398132324219, 0.002587556838989258, 0.0034322738647460938, 0.00427699089050293, 0.005121707916259766, 0.0059664249420166016, 0.0068111419677734375, 0.0076558589935302734, 0.00850057601928711, 0.009345293045043945, 0.010190010070800781, 0.011034727096557617, 0.011879444122314453, 0.012724161148071289, 0.013568878173828125, 0.014413595199584961, 0.015258312225341797, 0.016103029251098633, 0.01694774627685547, 0.017792463302612305, 0.01863718032836914, 0.019481897354125977, 0.020326614379882812, 0.02117133140563965, 0.022016048431396484, 0.02286076545715332, 0.023705482482910156, 0.024550199508666992, 0.025394916534423828, 0.026239633560180664, 0.0270843505859375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 8.0, 2.0, 5.0, 8.0, 9.0, 17.0, 17.0, 19.0, 29.0, 47.0, 70.0, 73.0, 146.0, 346.0, 2284.0, 605991.0, 436572.0, 2055.0, 334.0, 170.0, 101.0, 51.0, 34.0, 31.0, 18.0, 12.0, 17.0, 12.0, 15.0, 7.0, 8.0, 3.0, 6.0, 2.0, 3.0, 5.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0], "bins": [-0.57421875, -0.5562667846679688, -0.5383148193359375, -0.5203628540039062, -0.502410888671875, -0.48445892333984375, -0.4665069580078125, -0.44855499267578125, -0.43060302734375, -0.41265106201171875, -0.3946990966796875, -0.37674713134765625, -0.358795166015625, -0.34084320068359375, -0.3228912353515625, -0.30493927001953125, -0.2869873046875, -0.26903533935546875, -0.2510833740234375, -0.23313140869140625, -0.215179443359375, -0.19722747802734375, -0.1792755126953125, -0.16132354736328125, -0.14337158203125, -0.12541961669921875, -0.1074676513671875, -0.08951568603515625, -0.071563720703125, -0.05361175537109375, -0.0356597900390625, -0.01770782470703125, 0.000244140625, 0.01819610595703125, 0.0361480712890625, 0.05410003662109375, 0.072052001953125, 0.09000396728515625, 0.1079559326171875, 0.12590789794921875, 0.14385986328125, 0.16181182861328125, 0.1797637939453125, 0.19771575927734375, 0.215667724609375, 0.23361968994140625, 0.2515716552734375, 0.26952362060546875, 0.2874755859375, 0.30542755126953125, 0.3233795166015625, 0.34133148193359375, 0.359283447265625, 0.37723541259765625, 0.3951873779296875, 0.41313934326171875, 0.43109130859375, 0.44904327392578125, 0.4669952392578125, 0.48494720458984375, 0.502899169921875, 0.5208511352539062, 0.5388031005859375, 0.5567550659179688, 0.57470703125]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 15.0, 37.0, 85.0, 289.0, 383.0, 111.0, 54.0, 17.0, 3.0, 6.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09389685094356537, -0.08982937037944794, -0.0857618898153305, -0.08169440180063248, -0.07762692123651505, -0.07355944067239761, -0.06949195265769958, -0.06542447209358215, -0.06135699152946472, -0.05728951096534729, -0.05322202667593956, -0.04915454238653183, -0.0450870618224144, -0.04101958125829697, -0.036952096968889236, -0.032884612679481506, -0.028817132115364075, -0.024749649688601494, -0.020682167261838913, -0.016614684835076332, -0.012547202408313751, -0.00847971998155117, -0.0044122375547885895, -0.0003447551280260086, 0.0037227272987365723, 0.007790209725499153, 0.011857692152261734, 0.015925174579024315, 0.019992657005786896, 0.024060139432549477, 0.028127621859312057, 0.03219510614871979, 0.03626260161399841, 0.040330082178115845, 0.044397566467523575, 0.048465050756931305, 0.05253253132104874, 0.05660001188516617, 0.0606674961745739, 0.06473498046398163, 0.06880246102809906, 0.07286994159221649, 0.07693742215633392, 0.08100491017103195, 0.08507239073514938, 0.08913987129926682, 0.09320735931396484, 0.09727483987808228, 0.10134232044219971, 0.10540980100631714, 0.10947728157043457, 0.1135447695851326, 0.11761225014925003, 0.12167973071336746, 0.1257472187280655, 0.12981469929218292, 0.13388217985630035, 0.13794966042041779, 0.14201714098453522, 0.14608462154865265, 0.15015211701393127, 0.1542195975780487, 0.15828707814216614, 0.16235455870628357, 0.166422039270401]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 7.0, 4.0, 7.0, 7.0, 9.0, 7.0, 5.0, 8.0, 13.0, 16.0, 12.0, 16.0, 23.0, 24.0, 19.0, 24.0, 33.0, 27.0, 19.0, 29.0, 36.0, 46.0, 53.0, 48.0, 31.0, 45.0, 42.0, 36.0, 28.0, 31.0, 29.0, 21.0, 25.0, 26.0, 31.0, 21.0, 28.0, 17.0, 11.0, 14.0, 14.0, 7.0, 17.0, 6.0, 5.0, 5.0, 6.0, 2.0, 6.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 1.0], "bins": [-0.020461082458496094, -0.019826708361506462, -0.01919233426451683, -0.0185579601675272, -0.017923586070537567, -0.017289211973547935, -0.016654837876558304, -0.016020463779568672, -0.01538608968257904, -0.014751715585589409, -0.014117341488599777, -0.013482967391610146, -0.012848593294620514, -0.012214219197630882, -0.01157984510064125, -0.010945471003651619, -0.010311096906661987, -0.009676722809672356, -0.009042348712682724, -0.008407974615693092, -0.007773600518703461, -0.007139226421713829, -0.006504852324724197, -0.005870478227734566, -0.005236104130744934, -0.004601730033755302, -0.003967355936765671, -0.003332981839776039, -0.0026986077427864075, -0.002064233645796776, -0.0014298595488071442, -0.0007954854518175125, -0.00016111135482788086, 0.0004732627421617508, 0.0011076368391513824, 0.001742010936141014, 0.0023763850331306458, 0.0030107591301202774, 0.003645133227109909, 0.004279507324099541, 0.004913881421089172, 0.005548255518078804, 0.006182629615068436, 0.006817003712058067, 0.007451377809047699, 0.00808575190603733, 0.008720126003026962, 0.009354500100016594, 0.009988874197006226, 0.010623248293995857, 0.011257622390985489, 0.01189199648797512, 0.012526370584964752, 0.013160744681954384, 0.013795118778944016, 0.014429492875933647, 0.015063866972923279, 0.01569824106991291, 0.016332615166902542, 0.016966989263892174, 0.017601363360881805, 0.018235737457871437, 0.01887011155486107, 0.0195044856518507, 0.020138859748840332]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 6.0, 6.0, 6.0, 7.0, 9.0, 11.0, 11.0, 23.0, 19.0, 23.0, 22.0, 25.0, 28.0, 31.0, 44.0, 51.0, 41.0, 47.0, 57.0, 46.0, 48.0, 69.0, 45.0, 29.0, 35.0, 34.0, 36.0, 37.0, 22.0, 28.0, 24.0, 16.0, 17.0, 13.0, 12.0, 6.0, 10.0, 3.0, 3.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6015625, -14.142822265625, -13.68408203125, -13.225341796875, -12.7666015625, -12.307861328125, -11.84912109375, -11.390380859375, -10.931640625, -10.472900390625, -10.01416015625, -9.555419921875, -9.0966796875, -8.637939453125, -8.17919921875, -7.720458984375, -7.26171875, -6.802978515625, -6.34423828125, -5.885498046875, -5.4267578125, -4.968017578125, -4.50927734375, -4.050537109375, -3.591796875, -3.133056640625, -2.67431640625, -2.215576171875, -1.7568359375, -1.298095703125, -0.83935546875, -0.380615234375, 0.078125, 0.536865234375, 0.99560546875, 1.454345703125, 1.9130859375, 2.371826171875, 2.83056640625, 3.289306640625, 3.748046875, 4.206787109375, 4.66552734375, 5.124267578125, 5.5830078125, 6.041748046875, 6.50048828125, 6.959228515625, 7.41796875, 7.876708984375, 8.33544921875, 8.794189453125, 9.2529296875, 9.711669921875, 10.17041015625, 10.629150390625, 11.087890625, 11.546630859375, 12.00537109375, 12.464111328125, 12.9228515625, 13.381591796875, 13.84033203125, 14.299072265625, 14.7578125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 7.0, 6.0, 7.0, 21.0, 27.0, 41.0, 59.0, 72.0, 101.0, 133.0, 189.0, 260.0, 344.0, 499.0, 648.0, 858.0, 1183.0, 1641.0, 2365.0, 3407.0, 5235.0, 8035.0, 13841.0, 26391.0, 60084.0, 185242.0, 473087.0, 152171.0, 52511.0, 23526.0, 12828.0, 7644.0, 4792.0, 3186.0, 2234.0, 1553.0, 1146.0, 862.0, 653.0, 444.0, 349.0, 242.0, 165.0, 118.0, 115.0, 74.0, 50.0, 27.0, 32.0, 18.0, 8.0, 8.0, 6.0, 8.0, 3.0, 1.0, 2.0, 2.0], "bins": [-10.4296875, -10.1080322265625, -9.786376953125, -9.4647216796875, -9.14306640625, -8.8214111328125, -8.499755859375, -8.1781005859375, -7.8564453125, -7.5347900390625, -7.213134765625, -6.8914794921875, -6.56982421875, -6.2481689453125, -5.926513671875, -5.6048583984375, -5.283203125, -4.9615478515625, -4.639892578125, -4.3182373046875, -3.99658203125, -3.6749267578125, -3.353271484375, -3.0316162109375, -2.7099609375, -2.3883056640625, -2.066650390625, -1.7449951171875, -1.42333984375, -1.1016845703125, -0.780029296875, -0.4583740234375, -0.13671875, 0.1849365234375, 0.506591796875, 0.8282470703125, 1.14990234375, 1.4715576171875, 1.793212890625, 2.1148681640625, 2.4365234375, 2.7581787109375, 3.079833984375, 3.4014892578125, 3.72314453125, 4.0447998046875, 4.366455078125, 4.6881103515625, 5.009765625, 5.3314208984375, 5.653076171875, 5.9747314453125, 6.29638671875, 6.6180419921875, 6.939697265625, 7.2613525390625, 7.5830078125, 7.9046630859375, 8.226318359375, 8.5479736328125, 8.86962890625, 9.1912841796875, 9.512939453125, 9.8345947265625, 10.15625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 4.0, 4.0, 4.0, 3.0, 4.0, 5.0, 6.0, 10.0, 6.0, 12.0, 10.0, 21.0, 14.0, 20.0, 28.0, 23.0, 37.0, 38.0, 36.0, 52.0, 47.0, 51.0, 75.0, 128.0, 1713.0, 205.0, 80.0, 49.0, 38.0, 47.0, 35.0, 26.0, 26.0, 28.0, 26.0, 31.0, 21.0, 20.0, 21.0, 6.0, 5.0, 15.0, 8.0, 8.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.4375, -35.11865234375, -33.7998046875, -32.48095703125, -31.162109375, -29.84326171875, -28.5244140625, -27.20556640625, -25.88671875, -24.56787109375, -23.2490234375, -21.93017578125, -20.611328125, -19.29248046875, -17.9736328125, -16.65478515625, -15.3359375, -14.01708984375, -12.6982421875, -11.37939453125, -10.060546875, -8.74169921875, -7.4228515625, -6.10400390625, -4.78515625, -3.46630859375, -2.1474609375, -0.82861328125, 0.490234375, 1.80908203125, 3.1279296875, 4.44677734375, 5.765625, 7.08447265625, 8.4033203125, 9.72216796875, 11.041015625, 12.35986328125, 13.6787109375, 14.99755859375, 16.31640625, 17.63525390625, 18.9541015625, 20.27294921875, 21.591796875, 22.91064453125, 24.2294921875, 25.54833984375, 26.8671875, 28.18603515625, 29.5048828125, 30.82373046875, 32.142578125, 33.46142578125, 34.7802734375, 36.09912109375, 37.41796875, 38.73681640625, 40.0556640625, 41.37451171875, 42.693359375, 44.01220703125, 45.3310546875, 46.64990234375, 47.96875]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 1.0, 2.0, 4.0, 3.0, 15.0, 7.0, 12.0, 11.0, 7.0, 24.0, 24.0, 29.0, 34.0, 66.0, 56.0, 70.0, 97.0, 133.0, 161.0, 238.0, 423.0, 1588.0, 23523.0, 3064472.0, 50803.0, 2368.0, 510.0, 257.0, 174.0, 133.0, 102.0, 75.0, 65.0, 57.0, 32.0, 27.0, 32.0, 16.0, 12.0, 12.0, 8.0, 5.0, 6.0, 4.0, 6.0, 3.0, 4.0, 2.0, 1.0, 0.0, 3.0], "bins": [-113.0625, -109.97265625, -106.8828125, -103.79296875, -100.703125, -97.61328125, -94.5234375, -91.43359375, -88.34375, -85.25390625, -82.1640625, -79.07421875, -75.984375, -72.89453125, -69.8046875, -66.71484375, -63.625, -60.53515625, -57.4453125, -54.35546875, -51.265625, -48.17578125, -45.0859375, -41.99609375, -38.90625, -35.81640625, -32.7265625, -29.63671875, -26.546875, -23.45703125, -20.3671875, -17.27734375, -14.1875, -11.09765625, -8.0078125, -4.91796875, -1.828125, 1.26171875, 4.3515625, 7.44140625, 10.53125, 13.62109375, 16.7109375, 19.80078125, 22.890625, 25.98046875, 29.0703125, 32.16015625, 35.25, 38.33984375, 41.4296875, 44.51953125, 47.609375, 50.69921875, 53.7890625, 56.87890625, 59.96875, 63.05859375, 66.1484375, 69.23828125, 72.328125, 75.41796875, 78.5078125, 81.59765625, 84.6875]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 12.0, 260.0, 675.0, 66.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-573.7492065429688, -563.7349243164062, -553.7206420898438, -543.7064208984375, -533.692138671875, -523.6778564453125, -513.66357421875, -503.6492919921875, -493.6350402832031, -483.6207580566406, -473.60650634765625, -463.59222412109375, -453.57794189453125, -443.5636901855469, -433.5494079589844, -423.53515625, -413.5208740234375, -403.506591796875, -393.4923400878906, -383.4780578613281, -373.4637756347656, -363.44952392578125, -353.43524169921875, -343.42095947265625, -333.40667724609375, -323.39239501953125, -313.3781433105469, -303.3638610839844, -293.3495788574219, -283.3353271484375, -273.321044921875, -263.3067626953125, -253.29254150390625, -243.2782745361328, -233.2639923095703, -223.24972534179688, -213.23545837402344, -203.22119140625, -193.2069091796875, -183.19264221191406, -173.17835998535156, -163.16409301757812, -153.14981079101562, -143.1355438232422, -133.12127685546875, -123.10700225830078, -113.09272766113281, -103.07846069335938, -93.0641860961914, -83.04991149902344, -73.03564453125, -63.02136993408203, -53.00709915161133, -42.992828369140625, -32.978553771972656, -22.96428680419922, -12.95001220703125, -2.9357404708862305, 7.078531265258789, 17.092803955078125, 27.107074737548828, 37.12134552001953, 47.1356201171875, 57.14988708496094, 67.1641616821289]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 5.0, 1.0, 3.0, 5.0, 13.0, 8.0, 12.0, 15.0, 13.0, 17.0, 19.0, 18.0, 18.0, 28.0, 31.0, 29.0, 37.0, 32.0, 40.0, 37.0, 37.0, 36.0, 40.0, 27.0, 38.0, 28.0, 28.0, 39.0, 35.0, 36.0, 28.0, 29.0, 35.0, 24.0, 17.0, 25.0, 24.0, 15.0, 9.0, 21.0, 7.0, 8.0, 5.0, 5.0, 5.0, 7.0, 3.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-84.82170104980469, -82.07544708251953, -79.32918548583984, -76.58293151855469, -73.836669921875, -71.09041595458984, -68.34415435791016, -65.597900390625, -62.85163879394531, -60.10538101196289, -57.35912322998047, -54.61286544799805, -51.866607666015625, -49.1203498840332, -46.37409210205078, -43.627838134765625, -40.8815803527832, -38.13532257080078, -35.38906478881836, -32.64280700683594, -29.896549224853516, -27.150291442871094, -24.404035568237305, -21.657777786254883, -18.91152000427246, -16.16526222229004, -13.419004440307617, -10.672747611999512, -7.92648983001709, -5.180232048034668, -2.4339752197265625, 0.3122825622558594, 3.0585403442382812, 5.804798126220703, 8.551055908203125, 11.29731273651123, 14.043570518493652, 16.78982925415039, 19.53608512878418, 22.2823429107666, 25.028600692749023, 27.774858474731445, 30.521116256713867, 33.267372131347656, 36.01362991333008, 38.7598876953125, 41.50614547729492, 44.252403259277344, 46.998661041259766, 49.74491882324219, 52.49117660522461, 55.23743438720703, 57.98369216918945, 60.729949951171875, 63.47620391845703, 66.22246551513672, 68.96871948242188, 71.71497344970703, 74.46123504638672, 77.20748901367188, 79.95375061035156, 82.70000457763672, 85.4462661743164, 88.19252014160156, 90.93878173828125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 11.0, 5.0, 9.0, 8.0, 12.0, 10.0, 20.0, 25.0, 21.0, 23.0, 37.0, 26.0, 32.0, 43.0, 41.0, 34.0, 53.0, 44.0, 54.0, 48.0, 56.0, 43.0, 35.0, 31.0, 29.0, 25.0, 36.0, 29.0, 26.0, 34.0, 17.0, 21.0, 9.0, 13.0, 8.0, 10.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.78125, -14.33056640625, -13.8798828125, -13.42919921875, -12.978515625, -12.52783203125, -12.0771484375, -11.62646484375, -11.17578125, -10.72509765625, -10.2744140625, -9.82373046875, -9.373046875, -8.92236328125, -8.4716796875, -8.02099609375, -7.5703125, -7.11962890625, -6.6689453125, -6.21826171875, -5.767578125, -5.31689453125, -4.8662109375, -4.41552734375, -3.96484375, -3.51416015625, -3.0634765625, -2.61279296875, -2.162109375, -1.71142578125, -1.2607421875, -0.81005859375, -0.359375, 0.09130859375, 0.5419921875, 0.99267578125, 1.443359375, 1.89404296875, 2.3447265625, 2.79541015625, 3.24609375, 3.69677734375, 4.1474609375, 4.59814453125, 5.048828125, 5.49951171875, 5.9501953125, 6.40087890625, 6.8515625, 7.30224609375, 7.7529296875, 8.20361328125, 8.654296875, 9.10498046875, 9.5556640625, 10.00634765625, 10.45703125, 10.90771484375, 11.3583984375, 11.80908203125, 12.259765625, 12.71044921875, 13.1611328125, 13.61181640625, 14.0625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 1.0, 5.0, 6.0, 9.0, 5.0, 11.0, 7.0, 12.0, 20.0, 28.0, 30.0, 31.0, 62.0, 90.0, 175.0, 399.0, 930.0, 2828.0, 9052.0, 40863.0, 616064.0, 3136114.0, 349498.0, 27801.0, 6621.0, 2100.0, 751.0, 296.0, 160.0, 85.0, 62.0, 33.0, 28.0, 25.0, 20.0, 14.0, 12.0, 11.0, 8.0, 3.0, 6.0, 2.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-38.9375, -37.77197265625, -36.6064453125, -35.44091796875, -34.275390625, -33.10986328125, -31.9443359375, -30.77880859375, -29.61328125, -28.44775390625, -27.2822265625, -26.11669921875, -24.951171875, -23.78564453125, -22.6201171875, -21.45458984375, -20.2890625, -19.12353515625, -17.9580078125, -16.79248046875, -15.626953125, -14.46142578125, -13.2958984375, -12.13037109375, -10.96484375, -9.79931640625, -8.6337890625, -7.46826171875, -6.302734375, -5.13720703125, -3.9716796875, -2.80615234375, -1.640625, -0.47509765625, 0.6904296875, 1.85595703125, 3.021484375, 4.18701171875, 5.3525390625, 6.51806640625, 7.68359375, 8.84912109375, 10.0146484375, 11.18017578125, 12.345703125, 13.51123046875, 14.6767578125, 15.84228515625, 17.0078125, 18.17333984375, 19.3388671875, 20.50439453125, 21.669921875, 22.83544921875, 24.0009765625, 25.16650390625, 26.33203125, 27.49755859375, 28.6630859375, 29.82861328125, 30.994140625, 32.15966796875, 33.3251953125, 34.49072265625, 35.65625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 5.0, 9.0, 7.0, 17.0, 28.0, 25.0, 33.0, 51.0, 76.0, 124.0, 192.0, 274.0, 458.0, 725.0, 779.0, 481.0, 288.0, 157.0, 109.0, 73.0, 45.0, 32.0, 19.0, 14.0, 9.0, 8.0, 6.0, 5.0, 7.0, 6.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.953125, -30.9560546875, -29.958984375, -28.9619140625, -27.96484375, -26.9677734375, -25.970703125, -24.9736328125, -23.9765625, -22.9794921875, -21.982421875, -20.9853515625, -19.98828125, -18.9912109375, -17.994140625, -16.9970703125, -16.0, -15.0029296875, -14.005859375, -13.0087890625, -12.01171875, -11.0146484375, -10.017578125, -9.0205078125, -8.0234375, -7.0263671875, -6.029296875, -5.0322265625, -4.03515625, -3.0380859375, -2.041015625, -1.0439453125, -0.046875, 0.9501953125, 1.947265625, 2.9443359375, 3.94140625, 4.9384765625, 5.935546875, 6.9326171875, 7.9296875, 8.9267578125, 9.923828125, 10.9208984375, 11.91796875, 12.9150390625, 13.912109375, 14.9091796875, 15.90625, 16.9033203125, 17.900390625, 18.8974609375, 19.89453125, 20.8916015625, 21.888671875, 22.8857421875, 23.8828125, 24.8798828125, 25.876953125, 26.8740234375, 27.87109375, 28.8681640625, 29.865234375, 30.8623046875, 31.859375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 8.0, 4.0, 4.0, 10.0, 9.0, 10.0, 16.0, 25.0, 42.0, 61.0, 99.0, 166.0, 339.0, 1213.0, 21730.0, 4045399.0, 121289.0, 2711.0, 513.0, 220.0, 153.0, 79.0, 46.0, 37.0, 26.0, 23.0, 13.0, 14.0, 6.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.625, -141.02734375, -136.4296875, -131.83203125, -127.234375, -122.63671875, -118.0390625, -113.44140625, -108.84375, -104.24609375, -99.6484375, -95.05078125, -90.453125, -85.85546875, -81.2578125, -76.66015625, -72.0625, -67.46484375, -62.8671875, -58.26953125, -53.671875, -49.07421875, -44.4765625, -39.87890625, -35.28125, -30.68359375, -26.0859375, -21.48828125, -16.890625, -12.29296875, -7.6953125, -3.09765625, 1.5, 6.09765625, 10.6953125, 15.29296875, 19.890625, 24.48828125, 29.0859375, 33.68359375, 38.28125, 42.87890625, 47.4765625, 52.07421875, 56.671875, 61.26953125, 65.8671875, 70.46484375, 75.0625, 79.66015625, 84.2578125, 88.85546875, 93.453125, 98.05078125, 102.6484375, 107.24609375, 111.84375, 116.44140625, 121.0390625, 125.63671875, 130.234375, 134.83203125, 139.4296875, 144.02734375, 148.625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 4.0, 7.0, 19.0, 33.0, 53.0, 107.0, 161.0, 203.0, 168.0, 119.0, 65.0, 36.0, 21.0, 8.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-190.8119354248047, -185.6131134033203, -180.41429138183594, -175.21548461914062, -170.01666259765625, -164.81784057617188, -159.6190185546875, -154.42019653320312, -149.22137451171875, -144.02255249023438, -138.82373046875, -133.62490844726562, -128.4261016845703, -123.22727966308594, -118.02845764160156, -112.82963562011719, -107.63082122802734, -102.43199920654297, -97.23318481445312, -92.03436279296875, -86.83554077148438, -81.63671875, -76.43790435791016, -71.23908233642578, -66.04026794433594, -60.84144973754883, -55.64262771606445, -50.443809509277344, -45.24498748779297, -40.04616928100586, -34.84735107421875, -29.648529052734375, -24.44970703125, -19.250886917114258, -14.052067756652832, -8.853248596191406, -3.654428482055664, 1.5443916320800781, 6.7432098388671875, 11.942031860351562, 17.140850067138672, 22.339670181274414, 27.538490295410156, 32.737308502197266, 37.936126708984375, 43.13494873046875, 48.33376693725586, 53.532588958740234, 58.731407165527344, 63.93022537231445, 69.12904357910156, 74.32786560058594, 79.52668762207031, 84.72550964355469, 89.92432403564453, 95.1231460571289, 100.32196044921875, 105.52078247070312, 110.71959686279297, 115.91841888427734, 121.11724090576172, 126.31605529785156, 131.51487731933594, 136.7136993408203, 141.9125213623047]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 4.0, 3.0, 9.0, 5.0, 7.0, 6.0, 7.0, 12.0, 17.0, 13.0, 21.0, 21.0, 18.0, 22.0, 30.0, 27.0, 37.0, 19.0, 25.0, 35.0, 35.0, 45.0, 42.0, 58.0, 35.0, 37.0, 35.0, 40.0, 32.0, 41.0, 44.0, 28.0, 22.0, 24.0, 23.0, 25.0, 12.0, 7.0, 12.0, 12.0, 11.0, 8.0, 9.0, 13.0, 2.0, 4.0, 3.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-78.4686279296875, -76.06810760498047, -73.66758728027344, -71.26707458496094, -68.8665542602539, -66.46603393554688, -64.06552124023438, -61.665000915527344, -59.26448059082031, -56.86396026611328, -54.463443756103516, -52.06292724609375, -49.66240692138672, -47.26188659667969, -44.86137008666992, -42.460853576660156, -40.060333251953125, -37.659812927246094, -35.25929641723633, -32.85877990722656, -30.45825958251953, -28.057741165161133, -25.657222747802734, -23.256704330444336, -20.856185913085938, -18.45566749572754, -16.05514907836914, -13.654630661010742, -11.254112243652344, -8.853593826293945, -6.453075408935547, -4.052556991577148, -1.65203857421875, 0.7484798431396484, 3.148998260498047, 5.549516677856445, 7.950035095214844, 10.350553512573242, 12.75107192993164, 15.151590347290039, 17.552108764648438, 19.952627182006836, 22.353145599365234, 24.753664016723633, 27.15418243408203, 29.55470085144043, 31.955219268798828, 34.355735778808594, 36.756256103515625, 39.156776428222656, 41.55729293823242, 43.95780944824219, 46.35832977294922, 48.75885009765625, 51.159366607666016, 53.55988311767578, 55.96040344238281, 58.360923767089844, 60.76144027709961, 63.161956787109375, 65.5624771118164, 67.96299743652344, 70.36351013183594, 72.76403045654297, 75.16455078125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 4.0, 7.0, 4.0, 3.0, 7.0, 6.0, 9.0, 17.0, 11.0, 18.0, 17.0, 17.0, 21.0, 32.0, 28.0, 28.0, 28.0, 35.0, 47.0, 37.0, 41.0, 46.0, 41.0, 46.0, 52.0, 44.0, 36.0, 39.0, 34.0, 28.0, 32.0, 20.0, 29.0, 24.0, 20.0, 15.0, 18.0, 17.0, 14.0, 8.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.9765625, -12.5673828125, -12.158203125, -11.7490234375, -11.33984375, -10.9306640625, -10.521484375, -10.1123046875, -9.703125, -9.2939453125, -8.884765625, -8.4755859375, -8.06640625, -7.6572265625, -7.248046875, -6.8388671875, -6.4296875, -6.0205078125, -5.611328125, -5.2021484375, -4.79296875, -4.3837890625, -3.974609375, -3.5654296875, -3.15625, -2.7470703125, -2.337890625, -1.9287109375, -1.51953125, -1.1103515625, -0.701171875, -0.2919921875, 0.1171875, 0.5263671875, 0.935546875, 1.3447265625, 1.75390625, 2.1630859375, 2.572265625, 2.9814453125, 3.390625, 3.7998046875, 4.208984375, 4.6181640625, 5.02734375, 5.4365234375, 5.845703125, 6.2548828125, 6.6640625, 7.0732421875, 7.482421875, 7.8916015625, 8.30078125, 8.7099609375, 9.119140625, 9.5283203125, 9.9375, 10.3466796875, 10.755859375, 11.1650390625, 11.57421875, 11.9833984375, 12.392578125, 12.8017578125, 13.2109375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 15.0, 17.0, 33.0, 53.0, 77.0, 166.0, 200.0, 349.0, 478.0, 787.0, 1226.0, 2041.0, 3305.0, 5289.0, 8342.0, 13797.0, 22954.0, 39434.0, 68076.0, 119629.0, 194175.0, 217200.0, 146038.0, 84727.0, 48798.0, 28128.0, 16661.0, 9847.0, 6135.0, 3885.0, 2467.0, 1588.0, 948.0, 668.0, 389.0, 224.0, 162.0, 79.0, 73.0, 38.0, 27.0, 12.0, 6.0, 6.0, 4.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.234375, -2.16705322265625, -2.0997314453125, -2.03240966796875, -1.965087890625, -1.89776611328125, -1.8304443359375, -1.76312255859375, -1.69580078125, -1.62847900390625, -1.5611572265625, -1.49383544921875, -1.426513671875, -1.35919189453125, -1.2918701171875, -1.22454833984375, -1.1572265625, -1.08990478515625, -1.0225830078125, -0.95526123046875, -0.887939453125, -0.82061767578125, -0.7532958984375, -0.68597412109375, -0.61865234375, -0.55133056640625, -0.4840087890625, -0.41668701171875, -0.349365234375, -0.28204345703125, -0.2147216796875, -0.14739990234375, -0.080078125, -0.01275634765625, 0.0545654296875, 0.12188720703125, 0.189208984375, 0.25653076171875, 0.3238525390625, 0.39117431640625, 0.45849609375, 0.52581787109375, 0.5931396484375, 0.66046142578125, 0.727783203125, 0.79510498046875, 0.8624267578125, 0.92974853515625, 0.9970703125, 1.06439208984375, 1.1317138671875, 1.19903564453125, 1.266357421875, 1.33367919921875, 1.4010009765625, 1.46832275390625, 1.53564453125, 1.60296630859375, 1.6702880859375, 1.73760986328125, 1.804931640625, 1.87225341796875, 1.9395751953125, 2.00689697265625, 2.07421875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 6.0, 1.0, 4.0, 6.0, 13.0, 13.0, 9.0, 22.0, 22.0, 26.0, 36.0, 30.0, 34.0, 31.0, 43.0, 50.0, 32.0, 42.0, 48.0, 52.0, 1078.0, 44.0, 40.0, 50.0, 35.0, 29.0, 45.0, 40.0, 22.0, 19.0, 16.0, 19.0, 20.0, 14.0, 11.0, 9.0, 6.0, 6.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.390625, -11.065185546875, -10.73974609375, -10.414306640625, -10.0888671875, -9.763427734375, -9.43798828125, -9.112548828125, -8.787109375, -8.461669921875, -8.13623046875, -7.810791015625, -7.4853515625, -7.159912109375, -6.83447265625, -6.509033203125, -6.18359375, -5.858154296875, -5.53271484375, -5.207275390625, -4.8818359375, -4.556396484375, -4.23095703125, -3.905517578125, -3.580078125, -3.254638671875, -2.92919921875, -2.603759765625, -2.2783203125, -1.952880859375, -1.62744140625, -1.302001953125, -0.9765625, -0.651123046875, -0.32568359375, -0.000244140625, 0.3251953125, 0.650634765625, 0.97607421875, 1.301513671875, 1.626953125, 1.952392578125, 2.27783203125, 2.603271484375, 2.9287109375, 3.254150390625, 3.57958984375, 3.905029296875, 4.23046875, 4.555908203125, 4.88134765625, 5.206787109375, 5.5322265625, 5.857666015625, 6.18310546875, 6.508544921875, 6.833984375, 7.159423828125, 7.48486328125, 7.810302734375, 8.1357421875, 8.461181640625, 8.78662109375, 9.112060546875, 9.4375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 8.0, 3.0, 11.0, 11.0, 23.0, 33.0, 48.0, 70.0, 87.0, 152.0, 228.0, 310.0, 500.0, 743.0, 1288.0, 2066.0, 3398.0, 5874.0, 9633.0, 16190.0, 27883.0, 48698.0, 85767.0, 148569.0, 1265239.0, 197673.0, 118913.0, 68412.0, 39405.0, 22666.0, 13288.0, 7808.0, 4615.0, 2735.0, 1700.0, 1089.0, 665.0, 461.0, 284.0, 187.0, 131.0, 72.0, 64.0, 36.0, 36.0, 11.0, 17.0, 10.0, 8.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.322265625, -1.279327392578125, -1.23638916015625, -1.193450927734375, -1.1505126953125, -1.107574462890625, -1.06463623046875, -1.021697998046875, -0.978759765625, -0.935821533203125, -0.89288330078125, -0.849945068359375, -0.8070068359375, -0.764068603515625, -0.72113037109375, -0.678192138671875, -0.63525390625, -0.592315673828125, -0.54937744140625, -0.506439208984375, -0.4635009765625, -0.420562744140625, -0.37762451171875, -0.334686279296875, -0.291748046875, -0.248809814453125, -0.20587158203125, -0.162933349609375, -0.1199951171875, -0.077056884765625, -0.03411865234375, 0.008819580078125, 0.0517578125, 0.094696044921875, 0.13763427734375, 0.180572509765625, 0.2235107421875, 0.266448974609375, 0.30938720703125, 0.352325439453125, 0.395263671875, 0.438201904296875, 0.48114013671875, 0.524078369140625, 0.5670166015625, 0.609954833984375, 0.65289306640625, 0.695831298828125, 0.73876953125, 0.781707763671875, 0.82464599609375, 0.867584228515625, 0.9105224609375, 0.953460693359375, 0.99639892578125, 1.039337158203125, 1.082275390625, 1.125213623046875, 1.16815185546875, 1.211090087890625, 1.2540283203125, 1.296966552734375, 1.33990478515625, 1.382843017578125, 1.42578125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 5.0, 1.0, 4.0, 4.0, 3.0, 11.0, 13.0, 6.0, 12.0, 14.0, 17.0, 26.0, 36.0, 32.0, 48.0, 69.0, 87.0, 122.0, 115.0, 74.0, 60.0, 50.0, 39.0, 33.0, 29.0, 17.0, 14.0, 9.0, 12.0, 15.0, 9.0, 3.0, 3.0, 2.0, 3.0, 1.0, 7.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02679443359375, -0.02590203285217285, -0.025009632110595703, -0.024117231369018555, -0.023224830627441406, -0.022332429885864258, -0.02144002914428711, -0.02054762840270996, -0.019655227661132812, -0.018762826919555664, -0.017870426177978516, -0.016978025436401367, -0.01608562469482422, -0.01519322395324707, -0.014300823211669922, -0.013408422470092773, -0.012516021728515625, -0.011623620986938477, -0.010731220245361328, -0.00983881950378418, -0.008946418762207031, -0.008054018020629883, -0.007161617279052734, -0.006269216537475586, -0.0053768157958984375, -0.004484415054321289, -0.0035920143127441406, -0.002699613571166992, -0.0018072128295898438, -0.0009148120880126953, -2.2411346435546875e-05, 0.0008699893951416016, 0.00176239013671875, 0.0026547908782958984, 0.003547191619873047, 0.004439592361450195, 0.005331993103027344, 0.006224393844604492, 0.007116794586181641, 0.008009195327758789, 0.008901596069335938, 0.009793996810913086, 0.010686397552490234, 0.011578798294067383, 0.012471199035644531, 0.01336359977722168, 0.014256000518798828, 0.015148401260375977, 0.016040802001953125, 0.016933202743530273, 0.017825603485107422, 0.01871800422668457, 0.01961040496826172, 0.020502805709838867, 0.021395206451416016, 0.022287607192993164, 0.023180007934570312, 0.02407240867614746, 0.02496480941772461, 0.025857210159301758, 0.026749610900878906, 0.027642011642456055, 0.028534412384033203, 0.02942681312561035, 0.0303192138671875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 7.0, 2.0, 2.0, 0.0, 7.0, 5.0, 14.0, 13.0, 15.0, 14.0, 17.0, 32.0, 51.0, 66.0, 83.0, 164.0, 354.0, 1210.0, 805891.0, 238863.0, 963.0, 323.0, 152.0, 84.0, 51.0, 47.0, 28.0, 24.0, 16.0, 7.0, 14.0, 13.0, 8.0, 3.0, 5.0, 1.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6494140625, -0.630279541015625, -0.61114501953125, -0.592010498046875, -0.5728759765625, -0.553741455078125, -0.53460693359375, -0.515472412109375, -0.496337890625, -0.477203369140625, -0.45806884765625, -0.438934326171875, -0.4197998046875, -0.400665283203125, -0.38153076171875, -0.362396240234375, -0.34326171875, -0.324127197265625, -0.30499267578125, -0.285858154296875, -0.2667236328125, -0.247589111328125, -0.22845458984375, -0.209320068359375, -0.190185546875, -0.171051025390625, -0.15191650390625, -0.132781982421875, -0.1136474609375, -0.094512939453125, -0.07537841796875, -0.056243896484375, -0.037109375, -0.017974853515625, 0.00115966796875, 0.020294189453125, 0.0394287109375, 0.058563232421875, 0.07769775390625, 0.096832275390625, 0.115966796875, 0.135101318359375, 0.15423583984375, 0.173370361328125, 0.1925048828125, 0.211639404296875, 0.23077392578125, 0.249908447265625, 0.26904296875, 0.288177490234375, 0.30731201171875, 0.326446533203125, 0.3455810546875, 0.364715576171875, 0.38385009765625, 0.402984619140625, 0.422119140625, 0.441253662109375, 0.46038818359375, 0.479522705078125, 0.4986572265625, 0.517791748046875, 0.53692626953125, 0.556060791015625, 0.5751953125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 80.0, 881.0, 47.0, 4.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11109989881515503, -0.09796919673681259, -0.08483849465847015, -0.07170780003070831, -0.05857709422707558, -0.04544639587402344, -0.032315693795681, -0.019184991717338562, -0.006054289638996124, 0.007076411508023739, 0.020207112655043602, 0.03333781287074089, 0.04646851494908333, 0.05959921330213547, 0.0727299153804779, 0.08586061745882034, 0.09899131953716278, 0.11212202161550522, 0.12525272369384766, 0.1383834183216095, 0.15151412785053253, 0.16464482247829437, 0.1777755320072174, 0.19090622663497925, 0.2040369212627411, 0.21716761589050293, 0.23029832541942596, 0.2434290200471878, 0.25655972957611084, 0.2696904242038727, 0.2828211188316345, 0.29595184326171875, 0.3090825378894806, 0.32221323251724243, 0.3353439271450043, 0.3484746515750885, 0.36160534620285034, 0.3747360408306122, 0.387866735458374, 0.40099745988845825, 0.4141281545162201, 0.42725884914398193, 0.4403895437717438, 0.453520268201828, 0.46665096282958984, 0.4797816574573517, 0.4929123520851135, 0.5060430765151978, 0.5191737413406372, 0.5323044657707214, 0.5454351305961609, 0.5585658550262451, 0.5716965198516846, 0.5848272442817688, 0.597957968711853, 0.6110886335372925, 0.6242193579673767, 0.6373500823974609, 0.6504807472229004, 0.6636114716529846, 0.6767421364784241, 0.6898728609085083, 0.7030035853385925, 0.716134250164032, 0.7292649745941162]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 5.0, 4.0, 3.0, 6.0, 4.0, 11.0, 9.0, 16.0, 15.0, 16.0, 19.0, 18.0, 26.0, 30.0, 32.0, 33.0, 31.0, 30.0, 35.0, 37.0, 38.0, 36.0, 42.0, 37.0, 34.0, 28.0, 38.0, 30.0, 42.0, 32.0, 45.0, 24.0, 25.0, 20.0, 24.0, 30.0, 25.0, 19.0, 13.0, 9.0, 6.0, 5.0, 6.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 4.0, 0.0, 2.0], "bins": [-0.03635573387145996, -0.03531833365559578, -0.0342809334397316, -0.033243533223867416, -0.032206133008003235, -0.031168732792139053, -0.030131332576274872, -0.02909393236041069, -0.02805653214454651, -0.027019131928682327, -0.025981731712818146, -0.024944331496953964, -0.023906931281089783, -0.0228695310652256, -0.02183213084936142, -0.020794730633497238, -0.019757330417633057, -0.018719930201768875, -0.017682529985904694, -0.016645129770040512, -0.01560772955417633, -0.014570329338312149, -0.013532929122447968, -0.012495528906583786, -0.011458128690719604, -0.010420728474855423, -0.009383328258991241, -0.00834592804312706, -0.007308527827262878, -0.006271127611398697, -0.005233727395534515, -0.004196327179670334, -0.0031589269638061523, -0.002121526747941971, -0.0010841265320777893, -4.672631621360779e-05, 0.0009906738996505737, 0.0020280741155147552, 0.0030654743313789368, 0.004102874547243118, 0.0051402747631073, 0.006177674978971481, 0.007215075194835663, 0.008252475410699844, 0.009289875626564026, 0.010327275842428207, 0.011364676058292389, 0.01240207627415657, 0.013439476490020752, 0.014476876705884933, 0.015514276921749115, 0.016551677137613297, 0.017589077353477478, 0.01862647756934166, 0.01966387778520584, 0.020701278001070023, 0.021738678216934204, 0.022776078432798386, 0.023813478648662567, 0.02485087886452675, 0.02588827908039093, 0.02692567929625511, 0.027963079512119293, 0.029000479727983475, 0.030037879943847656]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 1.0, 4.0, 7.0, 4.0, 3.0, 7.0, 6.0, 9.0, 17.0, 11.0, 18.0, 17.0, 17.0, 21.0, 32.0, 28.0, 28.0, 28.0, 35.0, 47.0, 36.0, 42.0, 46.0, 40.0, 44.0, 54.0, 45.0, 36.0, 39.0, 34.0, 28.0, 31.0, 20.0, 30.0, 24.0, 20.0, 15.0, 18.0, 17.0, 14.0, 8.0, 4.0, 5.0, 4.0, 5.0, 2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-12.9765625, -12.5675048828125, -12.158447265625, -11.7493896484375, -11.34033203125, -10.9312744140625, -10.522216796875, -10.1131591796875, -9.7041015625, -9.2950439453125, -8.885986328125, -8.4769287109375, -8.06787109375, -7.6588134765625, -7.249755859375, -6.8406982421875, -6.431640625, -6.0225830078125, -5.613525390625, -5.2044677734375, -4.79541015625, -4.3863525390625, -3.977294921875, -3.5682373046875, -3.1591796875, -2.7501220703125, -2.341064453125, -1.9320068359375, -1.52294921875, -1.1138916015625, -0.704833984375, -0.2957763671875, 0.11328125, 0.5223388671875, 0.931396484375, 1.3404541015625, 1.74951171875, 2.1585693359375, 2.567626953125, 2.9766845703125, 3.3857421875, 3.7947998046875, 4.203857421875, 4.6129150390625, 5.02197265625, 5.4310302734375, 5.840087890625, 6.2491455078125, 6.658203125, 7.0672607421875, 7.476318359375, 7.8853759765625, 8.29443359375, 8.7034912109375, 9.112548828125, 9.5216064453125, 9.9306640625, 10.3397216796875, 10.748779296875, 11.1578369140625, 11.56689453125, 11.9759521484375, 12.385009765625, 12.7940673828125, 13.203125]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 6.0, 5.0, 16.0, 16.0, 24.0, 13.0, 27.0, 51.0, 46.0, 88.0, 104.0, 147.0, 187.0, 261.0, 375.0, 551.0, 810.0, 1205.0, 1695.0, 2640.0, 4193.0, 6804.0, 11869.0, 23197.0, 53304.0, 167322.0, 509087.0, 159798.0, 51557.0, 22585.0, 11604.0, 6692.0, 4108.0, 2560.0, 1730.0, 1181.0, 806.0, 565.0, 350.0, 250.0, 202.0, 144.0, 97.0, 85.0, 38.0, 41.0, 36.0, 21.0, 21.0, 12.0, 5.0, 8.0, 5.0, 6.0, 2.0, 4.0, 1.0, 5.0], "bins": [-13.6796875, -13.258544921875, -12.83740234375, -12.416259765625, -11.9951171875, -11.573974609375, -11.15283203125, -10.731689453125, -10.310546875, -9.889404296875, -9.46826171875, -9.047119140625, -8.6259765625, -8.204833984375, -7.78369140625, -7.362548828125, -6.94140625, -6.520263671875, -6.09912109375, -5.677978515625, -5.2568359375, -4.835693359375, -4.41455078125, -3.993408203125, -3.572265625, -3.151123046875, -2.72998046875, -2.308837890625, -1.8876953125, -1.466552734375, -1.04541015625, -0.624267578125, -0.203125, 0.218017578125, 0.63916015625, 1.060302734375, 1.4814453125, 1.902587890625, 2.32373046875, 2.744873046875, 3.166015625, 3.587158203125, 4.00830078125, 4.429443359375, 4.8505859375, 5.271728515625, 5.69287109375, 6.114013671875, 6.53515625, 6.956298828125, 7.37744140625, 7.798583984375, 8.2197265625, 8.640869140625, 9.06201171875, 9.483154296875, 9.904296875, 10.325439453125, 10.74658203125, 11.167724609375, 11.5888671875, 12.010009765625, 12.43115234375, 12.852294921875, 13.2734375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 8.0, 6.0, 3.0, 10.0, 8.0, 6.0, 10.0, 16.0, 22.0, 22.0, 18.0, 24.0, 12.0, 36.0, 32.0, 44.0, 40.0, 43.0, 70.0, 100.0, 206.0, 1619.0, 188.0, 91.0, 63.0, 47.0, 42.0, 34.0, 45.0, 22.0, 27.0, 31.0, 28.0, 12.0, 17.0, 15.0, 9.0, 11.0, 6.0, 3.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-43.03125, -41.81689453125, -40.6025390625, -39.38818359375, -38.173828125, -36.95947265625, -35.7451171875, -34.53076171875, -33.31640625, -32.10205078125, -30.8876953125, -29.67333984375, -28.458984375, -27.24462890625, -26.0302734375, -24.81591796875, -23.6015625, -22.38720703125, -21.1728515625, -19.95849609375, -18.744140625, -17.52978515625, -16.3154296875, -15.10107421875, -13.88671875, -12.67236328125, -11.4580078125, -10.24365234375, -9.029296875, -7.81494140625, -6.6005859375, -5.38623046875, -4.171875, -2.95751953125, -1.7431640625, -0.52880859375, 0.685546875, 1.89990234375, 3.1142578125, 4.32861328125, 5.54296875, 6.75732421875, 7.9716796875, 9.18603515625, 10.400390625, 11.61474609375, 12.8291015625, 14.04345703125, 15.2578125, 16.47216796875, 17.6865234375, 18.90087890625, 20.115234375, 21.32958984375, 22.5439453125, 23.75830078125, 24.97265625, 26.18701171875, 27.4013671875, 28.61572265625, 29.830078125, 31.04443359375, 32.2587890625, 33.47314453125, 34.6875]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 4.0, 1.0, 7.0, 8.0, 9.0, 9.0, 11.0, 23.0, 17.0, 29.0, 45.0, 68.0, 86.0, 117.0, 209.0, 320.0, 717.0, 2810.0, 41517.0, 3064573.0, 30974.0, 2517.0, 704.0, 310.0, 175.0, 106.0, 84.0, 61.0, 47.0, 34.0, 23.0, 21.0, 20.0, 12.0, 11.0, 5.0, 3.0, 4.0, 8.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0], "bins": [-120.9375, -117.52734375, -114.1171875, -110.70703125, -107.296875, -103.88671875, -100.4765625, -97.06640625, -93.65625, -90.24609375, -86.8359375, -83.42578125, -80.015625, -76.60546875, -73.1953125, -69.78515625, -66.375, -62.96484375, -59.5546875, -56.14453125, -52.734375, -49.32421875, -45.9140625, -42.50390625, -39.09375, -35.68359375, -32.2734375, -28.86328125, -25.453125, -22.04296875, -18.6328125, -15.22265625, -11.8125, -8.40234375, -4.9921875, -1.58203125, 1.828125, 5.23828125, 8.6484375, 12.05859375, 15.46875, 18.87890625, 22.2890625, 25.69921875, 29.109375, 32.51953125, 35.9296875, 39.33984375, 42.75, 46.16015625, 49.5703125, 52.98046875, 56.390625, 59.80078125, 63.2109375, 66.62109375, 70.03125, 73.44140625, 76.8515625, 80.26171875, 83.671875, 87.08203125, 90.4921875, 93.90234375, 97.3125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 61.0, 434.0, 452.0, 54.0, 8.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-414.2214660644531, -405.9256896972656, -397.6299133300781, -389.3341369628906, -381.0383605957031, -372.74261474609375, -364.44683837890625, -356.15106201171875, -347.85528564453125, -339.55950927734375, -331.26373291015625, -322.96795654296875, -314.67218017578125, -306.37640380859375, -298.08062744140625, -289.7848815917969, -281.48907470703125, -273.19329833984375, -264.89752197265625, -256.60174560546875, -248.3059844970703, -240.0102081298828, -231.7144317626953, -223.4186553955078, -215.12289428710938, -206.82711791992188, -198.53134155273438, -190.23556518554688, -181.93980407714844, -173.64402770996094, -165.34825134277344, -157.05247497558594, -148.75669860839844, -140.46092224121094, -132.16514587402344, -123.86937713623047, -115.5736083984375, -107.27783203125, -98.9820556640625, -90.686279296875, -82.39051055908203, -74.09473419189453, -65.79896545410156, -57.50318908691406, -49.20741653442383, -40.911643981933594, -32.615867614746094, -24.32009506225586, -16.024322509765625, -7.728549003601074, 0.5672245025634766, 8.862998962402344, 17.158771514892578, 25.454544067382812, 33.75032043457031, 42.04609298706055, 50.34186553955078, 58.637638092041016, 66.93341064453125, 75.22918701171875, 83.52496337890625, 91.82073211669922, 100.11650848388672, 108.41227722167969, 116.70805358886719]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 0.0, 3.0, 3.0, 10.0, 12.0, 12.0, 14.0, 19.0, 13.0, 24.0, 23.0, 35.0, 34.0, 29.0, 35.0, 35.0, 38.0, 37.0, 38.0, 51.0, 45.0, 45.0, 41.0, 42.0, 34.0, 39.0, 40.0, 42.0, 45.0, 29.0, 28.0, 16.0, 25.0, 17.0, 11.0, 16.0, 5.0, 1.0, 2.0, 8.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-105.38029479980469, -102.15509796142578, -98.92989349365234, -95.70469665527344, -92.4794921875, -89.2542953491211, -86.02909851074219, -82.80389404296875, -79.57869720458984, -76.35350036621094, -73.1282958984375, -69.9030990600586, -66.67789459228516, -63.45269775390625, -60.22749710083008, -57.002296447753906, -53.777095794677734, -50.55189514160156, -47.32669448852539, -44.10149383544922, -40.87629699707031, -37.65109634399414, -34.42589569091797, -31.20069694519043, -27.975496292114258, -24.750295639038086, -21.525096893310547, -18.299896240234375, -15.07469654083252, -11.849496841430664, -8.624296188354492, -5.399097442626953, -2.1738967895507812, 1.0513031482696533, 4.276503086090088, 7.501703262329102, 10.726902961730957, 13.952102661132812, 17.177303314208984, 20.402502059936523, 23.627702713012695, 26.852903366088867, 30.078102111816406, 33.30330276489258, 36.52850341796875, 39.753700256347656, 42.978904724121094, 46.2041015625, 49.42930221557617, 52.654502868652344, 55.879703521728516, 59.10490417480469, 62.330101013183594, 65.5552978515625, 68.78050231933594, 72.00569915771484, 75.23090362548828, 78.45610046386719, 81.68130493164062, 84.90650177001953, 88.13170623779297, 91.35690307617188, 94.58210754394531, 97.80730438232422, 101.03250122070312]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 5.0, 2.0, 5.0, 3.0, 8.0, 7.0, 9.0, 13.0, 13.0, 18.0, 21.0, 18.0, 26.0, 30.0, 20.0, 26.0, 38.0, 43.0, 41.0, 39.0, 37.0, 32.0, 40.0, 54.0, 51.0, 40.0, 42.0, 38.0, 27.0, 26.0, 25.0, 29.0, 24.0, 21.0, 29.0, 18.0, 14.0, 17.0, 10.0, 13.0, 6.0, 5.0, 7.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.46875, -13.0440673828125, -12.619384765625, -12.1947021484375, -11.77001953125, -11.3453369140625, -10.920654296875, -10.4959716796875, -10.0712890625, -9.6466064453125, -9.221923828125, -8.7972412109375, -8.37255859375, -7.9478759765625, -7.523193359375, -7.0985107421875, -6.673828125, -6.2491455078125, -5.824462890625, -5.3997802734375, -4.97509765625, -4.5504150390625, -4.125732421875, -3.7010498046875, -3.2763671875, -2.8516845703125, -2.427001953125, -2.0023193359375, -1.57763671875, -1.1529541015625, -0.728271484375, -0.3035888671875, 0.12109375, 0.5457763671875, 0.970458984375, 1.3951416015625, 1.81982421875, 2.2445068359375, 2.669189453125, 3.0938720703125, 3.5185546875, 3.9432373046875, 4.367919921875, 4.7926025390625, 5.21728515625, 5.6419677734375, 6.066650390625, 6.4913330078125, 6.916015625, 7.3406982421875, 7.765380859375, 8.1900634765625, 8.61474609375, 9.0394287109375, 9.464111328125, 9.8887939453125, 10.3134765625, 10.7381591796875, 11.162841796875, 11.5875244140625, 12.01220703125, 12.4368896484375, 12.861572265625, 13.2862548828125, 13.7109375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 4.0, 4.0, 8.0, 8.0, 4.0, 11.0, 7.0, 14.0, 13.0, 26.0, 28.0, 32.0, 37.0, 60.0, 100.0, 225.0, 497.0, 1337.0, 3918.0, 16251.0, 190363.0, 3485395.0, 464503.0, 23695.0, 4881.0, 1574.0, 658.0, 244.0, 112.0, 64.0, 37.0, 23.0, 40.0, 21.0, 14.0, 8.0, 16.0, 11.0, 7.0, 9.0, 7.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.25, -47.69189453125, -46.1337890625, -44.57568359375, -43.017578125, -41.45947265625, -39.9013671875, -38.34326171875, -36.78515625, -35.22705078125, -33.6689453125, -32.11083984375, -30.552734375, -28.99462890625, -27.4365234375, -25.87841796875, -24.3203125, -22.76220703125, -21.2041015625, -19.64599609375, -18.087890625, -16.52978515625, -14.9716796875, -13.41357421875, -11.85546875, -10.29736328125, -8.7392578125, -7.18115234375, -5.623046875, -4.06494140625, -2.5068359375, -0.94873046875, 0.609375, 2.16748046875, 3.7255859375, 5.28369140625, 6.841796875, 8.39990234375, 9.9580078125, 11.51611328125, 13.07421875, 14.63232421875, 16.1904296875, 17.74853515625, 19.306640625, 20.86474609375, 22.4228515625, 23.98095703125, 25.5390625, 27.09716796875, 28.6552734375, 30.21337890625, 31.771484375, 33.32958984375, 34.8876953125, 36.44580078125, 38.00390625, 39.56201171875, 41.1201171875, 42.67822265625, 44.236328125, 45.79443359375, 47.3525390625, 48.91064453125, 50.46875]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 6.0, 6.0, 15.0, 17.0, 28.0, 38.0, 66.0, 117.0, 178.0, 394.0, 850.0, 1050.0, 649.0, 301.0, 143.0, 86.0, 46.0, 37.0, 22.0, 10.0, 7.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.15625, -25.75048828125, -24.3447265625, -22.93896484375, -21.533203125, -20.12744140625, -18.7216796875, -17.31591796875, -15.91015625, -14.50439453125, -13.0986328125, -11.69287109375, -10.287109375, -8.88134765625, -7.4755859375, -6.06982421875, -4.6640625, -3.25830078125, -1.8525390625, -0.44677734375, 0.958984375, 2.36474609375, 3.7705078125, 5.17626953125, 6.58203125, 7.98779296875, 9.3935546875, 10.79931640625, 12.205078125, 13.61083984375, 15.0166015625, 16.42236328125, 17.828125, 19.23388671875, 20.6396484375, 22.04541015625, 23.451171875, 24.85693359375, 26.2626953125, 27.66845703125, 29.07421875, 30.47998046875, 31.8857421875, 33.29150390625, 34.697265625, 36.10302734375, 37.5087890625, 38.91455078125, 40.3203125, 41.72607421875, 43.1318359375, 44.53759765625, 45.943359375, 47.34912109375, 48.7548828125, 50.16064453125, 51.56640625, 52.97216796875, 54.3779296875, 55.78369140625, 57.189453125, 58.59521484375, 60.0009765625, 61.40673828125, 62.8125]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 6.0, 3.0, 11.0, 13.0, 20.0, 32.0, 60.0, 104.0, 249.0, 646.0, 4331.0, 4061637.0, 124892.0, 1441.0, 448.0, 179.0, 90.0, 43.0, 31.0, 15.0, 20.0, 5.0, 7.0, 2.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-329.75, -322.38671875, -315.0234375, -307.66015625, -300.296875, -292.93359375, -285.5703125, -278.20703125, -270.84375, -263.48046875, -256.1171875, -248.75390625, -241.390625, -234.02734375, -226.6640625, -219.30078125, -211.9375, -204.57421875, -197.2109375, -189.84765625, -182.484375, -175.12109375, -167.7578125, -160.39453125, -153.03125, -145.66796875, -138.3046875, -130.94140625, -123.578125, -116.21484375, -108.8515625, -101.48828125, -94.125, -86.76171875, -79.3984375, -72.03515625, -64.671875, -57.30859375, -49.9453125, -42.58203125, -35.21875, -27.85546875, -20.4921875, -13.12890625, -5.765625, 1.59765625, 8.9609375, 16.32421875, 23.6875, 31.05078125, 38.4140625, 45.77734375, 53.140625, 60.50390625, 67.8671875, 75.23046875, 82.59375, 89.95703125, 97.3203125, 104.68359375, 112.046875, 119.41015625, 126.7734375, 134.13671875, 141.5]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 9.0, 40.0, 94.0, 197.0, 285.0, 202.0, 113.0, 38.0, 24.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-355.6307067871094, -347.6522521972656, -339.6737976074219, -331.6953430175781, -323.7169189453125, -315.73846435546875, -307.760009765625, -299.78155517578125, -291.8031005859375, -283.82464599609375, -275.84619140625, -267.86773681640625, -259.8892822265625, -251.9108428955078, -243.93240356445312, -235.95394897460938, -227.97549438476562, -219.99703979492188, -212.01858520507812, -204.04014587402344, -196.0616912841797, -188.08323669433594, -180.10479736328125, -172.1263427734375, -164.14788818359375, -156.16943359375, -148.19097900390625, -140.21253967285156, -132.2340850830078, -124.25563049316406, -116.27718353271484, -108.29873657226562, -100.32029724121094, -92.34184265136719, -84.36339569091797, -76.38494873046875, -68.406494140625, -60.428043365478516, -52.44959259033203, -44.47114181518555, -36.49269104003906, -28.514240264892578, -20.535789489746094, -12.55733871459961, -4.578887939453125, 3.3995628356933594, 11.378013610839844, 19.356464385986328, 27.334915161132812, 35.3133659362793, 43.29181671142578, 51.270267486572266, 59.24871826171875, 67.2271728515625, 75.20561981201172, 83.18406677246094, 91.16252136230469, 99.14097595214844, 107.11942291259766, 115.09786987304688, 123.07632446289062, 131.05477905273438, 139.03323364257812, 147.0116729736328, 154.99012756347656]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 2.0, 5.0, 3.0, 4.0, 5.0, 7.0, 7.0, 5.0, 15.0, 11.0, 11.0, 18.0, 20.0, 11.0, 26.0, 30.0, 32.0, 25.0, 26.0, 29.0, 33.0, 32.0, 39.0, 47.0, 40.0, 37.0, 47.0, 44.0, 48.0, 29.0, 35.0, 40.0, 29.0, 21.0, 33.0, 19.0, 21.0, 17.0, 14.0, 19.0, 11.0, 10.0, 12.0, 10.0, 5.0, 9.0, 7.0, 6.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-78.02896118164062, -75.58889770507812, -73.1488265991211, -70.70875549316406, -68.26869201660156, -65.82862854003906, -63.38855743408203, -60.948490142822266, -58.5084228515625, -56.068355560302734, -53.62828826904297, -51.1882209777832, -48.74815368652344, -46.30808639526367, -43.868019104003906, -41.42795181274414, -38.987884521484375, -36.54781723022461, -34.107749938964844, -31.667682647705078, -29.227615356445312, -26.787548065185547, -24.34748077392578, -21.907413482666016, -19.46734619140625, -17.027278900146484, -14.587211608886719, -12.147144317626953, -9.707077026367188, -7.267009735107422, -4.826942443847656, -2.3868751525878906, 0.053192138671875, 2.4932594299316406, 4.933326721191406, 7.373394012451172, 9.813461303710938, 12.253528594970703, 14.693595886230469, 17.133663177490234, 19.57373046875, 22.013797760009766, 24.45386505126953, 26.893932342529297, 29.333999633789062, 31.774066925048828, 34.214134216308594, 36.65420150756836, 39.094268798828125, 41.53433609008789, 43.974403381347656, 46.41447067260742, 48.85453796386719, 51.29460525512695, 53.73467254638672, 56.174739837646484, 58.61480712890625, 61.054874420166016, 63.49494171142578, 65.93501281738281, 68.37507629394531, 70.81513977050781, 73.25521087646484, 75.69528198242188, 78.13534545898438]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 9.0, 6.0, 4.0, 6.0, 9.0, 15.0, 12.0, 12.0, 20.0, 20.0, 26.0, 24.0, 27.0, 28.0, 41.0, 34.0, 42.0, 43.0, 38.0, 41.0, 52.0, 43.0, 37.0, 37.0, 44.0, 32.0, 27.0, 47.0, 31.0, 27.0, 19.0, 19.0, 15.0, 22.0, 12.0, 11.0, 15.0, 10.0, 6.0, 9.0, 13.0, 0.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.265625, -12.83447265625, -12.4033203125, -11.97216796875, -11.541015625, -11.10986328125, -10.6787109375, -10.24755859375, -9.81640625, -9.38525390625, -8.9541015625, -8.52294921875, -8.091796875, -7.66064453125, -7.2294921875, -6.79833984375, -6.3671875, -5.93603515625, -5.5048828125, -5.07373046875, -4.642578125, -4.21142578125, -3.7802734375, -3.34912109375, -2.91796875, -2.48681640625, -2.0556640625, -1.62451171875, -1.193359375, -0.76220703125, -0.3310546875, 0.10009765625, 0.53125, 0.96240234375, 1.3935546875, 1.82470703125, 2.255859375, 2.68701171875, 3.1181640625, 3.54931640625, 3.98046875, 4.41162109375, 4.8427734375, 5.27392578125, 5.705078125, 6.13623046875, 6.5673828125, 6.99853515625, 7.4296875, 7.86083984375, 8.2919921875, 8.72314453125, 9.154296875, 9.58544921875, 10.0166015625, 10.44775390625, 10.87890625, 11.31005859375, 11.7412109375, 12.17236328125, 12.603515625, 13.03466796875, 13.4658203125, 13.89697265625, 14.328125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 3.0, 7.0, 16.0, 14.0, 16.0, 30.0, 57.0, 47.0, 65.0, 98.0, 115.0, 208.0, 298.0, 419.0, 560.0, 815.0, 1073.0, 1652.0, 2395.0, 3436.0, 5203.0, 7661.0, 11775.0, 18419.0, 29264.0, 47035.0, 77668.0, 123369.0, 175577.0, 181923.0, 133307.0, 83893.0, 52063.0, 31786.0, 19458.0, 12816.0, 8256.0, 5576.0, 3738.0, 2581.0, 1785.0, 1186.0, 824.0, 608.0, 438.0, 310.0, 214.0, 138.0, 104.0, 63.0, 70.0, 48.0, 24.0, 22.0, 19.0, 14.0, 3.0, 4.0, 3.0, 1.0, 1.0], "bins": [-1.9541015625, -1.8932037353515625, -1.832305908203125, -1.7714080810546875, -1.71051025390625, -1.6496124267578125, -1.588714599609375, -1.5278167724609375, -1.4669189453125, -1.4060211181640625, -1.345123291015625, -1.2842254638671875, -1.22332763671875, -1.1624298095703125, -1.101531982421875, -1.0406341552734375, -0.979736328125, -0.9188385009765625, -0.857940673828125, -0.7970428466796875, -0.73614501953125, -0.6752471923828125, -0.614349365234375, -0.5534515380859375, -0.4925537109375, -0.4316558837890625, -0.370758056640625, -0.3098602294921875, -0.24896240234375, -0.1880645751953125, -0.127166748046875, -0.0662689208984375, -0.00537109375, 0.0555267333984375, 0.116424560546875, 0.1773223876953125, 0.23822021484375, 0.2991180419921875, 0.360015869140625, 0.4209136962890625, 0.4818115234375, 0.5427093505859375, 0.603607177734375, 0.6645050048828125, 0.72540283203125, 0.7863006591796875, 0.847198486328125, 0.9080963134765625, 0.968994140625, 1.0298919677734375, 1.090789794921875, 1.1516876220703125, 1.21258544921875, 1.2734832763671875, 1.334381103515625, 1.3952789306640625, 1.4561767578125, 1.5170745849609375, 1.577972412109375, 1.6388702392578125, 1.69976806640625, 1.7606658935546875, 1.821563720703125, 1.8824615478515625, 1.943359375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 4.0, 2.0, 4.0, 5.0, 8.0, 7.0, 7.0, 12.0, 7.0, 9.0, 17.0, 15.0, 15.0, 29.0, 19.0, 17.0, 29.0, 24.0, 35.0, 31.0, 32.0, 34.0, 41.0, 28.0, 32.0, 1074.0, 43.0, 37.0, 37.0, 30.0, 23.0, 38.0, 35.0, 27.0, 21.0, 27.0, 26.0, 18.0, 12.0, 20.0, 15.0, 14.0, 11.0, 11.0, 9.0, 10.0, 6.0, 7.0, 10.0, 3.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.58203125, -7.30828857421875, -7.0345458984375, -6.76080322265625, -6.487060546875, -6.21331787109375, -5.9395751953125, -5.66583251953125, -5.39208984375, -5.11834716796875, -4.8446044921875, -4.57086181640625, -4.297119140625, -4.02337646484375, -3.7496337890625, -3.47589111328125, -3.2021484375, -2.92840576171875, -2.6546630859375, -2.38092041015625, -2.107177734375, -1.83343505859375, -1.5596923828125, -1.28594970703125, -1.01220703125, -0.73846435546875, -0.4647216796875, -0.19097900390625, 0.082763671875, 0.35650634765625, 0.6302490234375, 0.90399169921875, 1.177734375, 1.45147705078125, 1.7252197265625, 1.99896240234375, 2.272705078125, 2.54644775390625, 2.8201904296875, 3.09393310546875, 3.36767578125, 3.64141845703125, 3.9151611328125, 4.18890380859375, 4.462646484375, 4.73638916015625, 5.0101318359375, 5.28387451171875, 5.5576171875, 5.83135986328125, 6.1051025390625, 6.37884521484375, 6.652587890625, 6.92633056640625, 7.2000732421875, 7.47381591796875, 7.74755859375, 8.02130126953125, 8.2950439453125, 8.56878662109375, 8.842529296875, 9.11627197265625, 9.3900146484375, 9.66375732421875, 9.9375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 7.0, 3.0, 4.0, 8.0, 14.0, 14.0, 24.0, 37.0, 58.0, 81.0, 90.0, 144.0, 203.0, 297.0, 420.0, 612.0, 878.0, 1225.0, 1790.0, 2556.0, 3815.0, 5557.0, 7992.0, 12076.0, 17665.0, 26861.0, 40769.0, 62201.0, 95199.0, 141202.0, 1223723.0, 149959.0, 102561.0, 67737.0, 43880.0, 28613.0, 18808.0, 12767.0, 8593.0, 5778.0, 4042.0, 2711.0, 1912.0, 1271.0, 916.0, 619.0, 424.0, 307.0, 219.0, 157.0, 113.0, 67.0, 43.0, 29.0, 23.0, 26.0, 15.0, 12.0, 7.0, 8.0, 1.0, 3.0], "bins": [-1.171875, -1.1359100341796875, -1.099945068359375, -1.0639801025390625, -1.02801513671875, -0.9920501708984375, -0.956085205078125, -0.9201202392578125, -0.8841552734375, -0.8481903076171875, -0.812225341796875, -0.7762603759765625, -0.74029541015625, -0.7043304443359375, -0.668365478515625, -0.6324005126953125, -0.596435546875, -0.5604705810546875, -0.524505615234375, -0.4885406494140625, -0.45257568359375, -0.4166107177734375, -0.380645751953125, -0.3446807861328125, -0.3087158203125, -0.2727508544921875, -0.236785888671875, -0.2008209228515625, -0.16485595703125, -0.1288909912109375, -0.092926025390625, -0.0569610595703125, -0.02099609375, 0.0149688720703125, 0.050933837890625, 0.0868988037109375, 0.12286376953125, 0.1588287353515625, 0.194793701171875, 0.2307586669921875, 0.2667236328125, 0.3026885986328125, 0.338653564453125, 0.3746185302734375, 0.41058349609375, 0.4465484619140625, 0.482513427734375, 0.5184783935546875, 0.554443359375, 0.5904083251953125, 0.626373291015625, 0.6623382568359375, 0.69830322265625, 0.7342681884765625, 0.770233154296875, 0.8061981201171875, 0.8421630859375, 0.8781280517578125, 0.914093017578125, 0.9500579833984375, 0.98602294921875, 1.0219879150390625, 1.057952880859375, 1.0939178466796875, 1.1298828125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 1.0, 4.0, 5.0, 8.0, 2.0, 4.0, 3.0, 4.0, 7.0, 14.0, 22.0, 15.0, 16.0, 26.0, 31.0, 29.0, 31.0, 49.0, 53.0, 69.0, 90.0, 97.0, 72.0, 54.0, 47.0, 39.0, 22.0, 20.0, 19.0, 24.0, 16.0, 15.0, 16.0, 14.0, 16.0, 12.0, 7.0, 6.0, 6.0, 5.0, 5.0, 2.0, 6.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02337646484375, -0.022624969482421875, -0.02187347412109375, -0.021121978759765625, -0.0203704833984375, -0.019618988037109375, -0.01886749267578125, -0.018115997314453125, -0.017364501953125, -0.016613006591796875, -0.01586151123046875, -0.015110015869140625, -0.0143585205078125, -0.013607025146484375, -0.01285552978515625, -0.012104034423828125, -0.0113525390625, -0.010601043701171875, -0.00984954833984375, -0.009098052978515625, -0.0083465576171875, -0.007595062255859375, -0.00684356689453125, -0.006092071533203125, -0.005340576171875, -0.004589080810546875, -0.00383758544921875, -0.003086090087890625, -0.0023345947265625, -0.001583099365234375, -0.00083160400390625, -8.0108642578125e-05, 0.00067138671875, 0.001422882080078125, 0.00217437744140625, 0.002925872802734375, 0.0036773681640625, 0.004428863525390625, 0.00518035888671875, 0.005931854248046875, 0.006683349609375, 0.007434844970703125, 0.00818634033203125, 0.008937835693359375, 0.0096893310546875, 0.010440826416015625, 0.01119232177734375, 0.011943817138671875, 0.0126953125, 0.013446807861328125, 0.01419830322265625, 0.014949798583984375, 0.0157012939453125, 0.016452789306640625, 0.01720428466796875, 0.017955780029296875, 0.018707275390625, 0.019458770751953125, 0.02021026611328125, 0.020961761474609375, 0.0217132568359375, 0.022464752197265625, 0.02321624755859375, 0.023967742919921875, 0.02471923828125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 7.0, 3.0, 5.0, 11.0, 4.0, 10.0, 17.0, 22.0, 20.0, 23.0, 27.0, 35.0, 57.0, 43.0, 70.0, 82.0, 150.0, 313.0, 743.0, 13045.0, 981130.0, 50563.0, 1190.0, 337.0, 204.0, 121.0, 75.0, 66.0, 37.0, 24.0, 29.0, 16.0, 21.0, 10.0, 9.0, 6.0, 4.0, 6.0, 7.0, 4.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.51318359375, -0.49745941162109375, -0.4817352294921875, -0.46601104736328125, -0.450286865234375, -0.43456268310546875, -0.4188385009765625, -0.40311431884765625, -0.38739013671875, -0.37166595458984375, -0.3559417724609375, -0.34021759033203125, -0.324493408203125, -0.30876922607421875, -0.2930450439453125, -0.27732086181640625, -0.2615966796875, -0.24587249755859375, -0.2301483154296875, -0.21442413330078125, -0.198699951171875, -0.18297576904296875, -0.1672515869140625, -0.15152740478515625, -0.13580322265625, -0.12007904052734375, -0.1043548583984375, -0.08863067626953125, -0.072906494140625, -0.05718231201171875, -0.0414581298828125, -0.02573394775390625, -0.010009765625, 0.00571441650390625, 0.0214385986328125, 0.03716278076171875, 0.052886962890625, 0.06861114501953125, 0.0843353271484375, 0.10005950927734375, 0.11578369140625, 0.13150787353515625, 0.1472320556640625, 0.16295623779296875, 0.178680419921875, 0.19440460205078125, 0.2101287841796875, 0.22585296630859375, 0.2415771484375, 0.25730133056640625, 0.2730255126953125, 0.28874969482421875, 0.304473876953125, 0.32019805908203125, 0.3359222412109375, 0.35164642333984375, 0.36737060546875, 0.38309478759765625, 0.3988189697265625, 0.41454315185546875, 0.430267333984375, 0.44599151611328125, 0.4617156982421875, 0.47743988037109375, 0.4931640625]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 74.0, 878.0, 60.0, 5.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1237386167049408, -0.10448823124170303, -0.08523784577846527, -0.06598746031522751, -0.046737074851989746, -0.027486689388751984, -0.008236303925514221, 0.011014074087142944, 0.030264467000961304, 0.049514852464199066, 0.06876523792743683, 0.08801562339067459, 0.10726600885391235, 0.1265164017677307, 0.14576677978038788, 0.16501715779304504, 0.1842675507068634, 0.20351794362068176, 0.22276832163333893, 0.2420186996459961, 0.26126909255981445, 0.2805194854736328, 0.29976987838745117, 0.31902024149894714, 0.3382706344127655, 0.35752102732658386, 0.37677139043807983, 0.3960217833518982, 0.41527217626571655, 0.4345225691795349, 0.45377296209335327, 0.47302332520484924, 0.4922736883163452, 0.5115240812301636, 0.5307744741439819, 0.5500248670578003, 0.5692752599716187, 0.5885255932807922, 0.6077759861946106, 0.627026379108429, 0.6462767720222473, 0.6655271649360657, 0.684777557849884, 0.7040279507637024, 0.723278284072876, 0.7425286769866943, 0.7617790699005127, 0.781029462814331, 0.8002798557281494, 0.8195302486419678, 0.8387806415557861, 0.8580310344696045, 0.8772814273834229, 0.8965317606925964, 0.9157821536064148, 0.9350325465202332, 0.9542829394340515, 0.9735333323478699, 0.9927837252616882, 1.0120340585708618, 1.0312844514846802, 1.0505348443984985, 1.069785237312317, 1.0890356302261353, 1.1082860231399536]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 1.0, 3.0, 8.0, 8.0, 12.0, 10.0, 8.0, 15.0, 15.0, 19.0, 26.0, 25.0, 34.0, 30.0, 34.0, 36.0, 39.0, 50.0, 44.0, 37.0, 43.0, 42.0, 43.0, 39.0, 31.0, 47.0, 40.0, 34.0, 30.0, 30.0, 27.0, 27.0, 23.0, 18.0, 17.0, 10.0, 15.0, 8.0, 7.0, 6.0, 3.0, 4.0, 4.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.05608034133911133, -0.05455788969993591, -0.0530354380607605, -0.051512982696294785, -0.04999053105711937, -0.048468079417943954, -0.04694562405347824, -0.045423172414302826, -0.04390072077512741, -0.042378269135951996, -0.04085581749677658, -0.03933336213231087, -0.03781091049313545, -0.03628845885396004, -0.034766003489494324, -0.03324355185031891, -0.031721100211143494, -0.03019864857196808, -0.028676195070147514, -0.02715374156832695, -0.025631289929151535, -0.02410883828997612, -0.022586384788155556, -0.02106393128633499, -0.019541479647159576, -0.01801902800798416, -0.016496574506163597, -0.014974121935665607, -0.013451669365167618, -0.011929216794669628, -0.010406764224171638, -0.008884311653673649, -0.007361859083175659, -0.0058394065126776695, -0.00431695394217968, -0.00279450137168169, -0.0012720488011837006, 0.0002504037693142891, 0.0017728563398122787, 0.0032953089103102684, 0.004817761480808258, 0.006340214051306248, 0.007862666621804237, 0.009385119192302227, 0.010907571762800217, 0.012430024333298206, 0.013952476903796196, 0.015474929474294186, 0.016997382044792175, 0.01851983368396759, 0.020042287185788155, 0.02156474068760872, 0.023087192326784134, 0.02460964396595955, 0.026132097467780113, 0.027654550969600677, 0.029177002608776093, 0.030699454247951508, 0.03222190588712692, 0.033744361251592636, 0.03526681289076805, 0.036789264529943466, 0.03831171989440918, 0.039834171533584595, 0.04135662317276001]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 9.0, 6.0, 4.0, 6.0, 9.0, 15.0, 12.0, 12.0, 20.0, 20.0, 26.0, 24.0, 27.0, 28.0, 40.0, 35.0, 41.0, 43.0, 39.0, 41.0, 52.0, 42.0, 35.0, 40.0, 44.0, 32.0, 27.0, 47.0, 31.0, 27.0, 19.0, 19.0, 15.0, 22.0, 12.0, 11.0, 15.0, 10.0, 6.0, 8.0, 13.0, 1.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-13.265625, -12.8345947265625, -12.403564453125, -11.9725341796875, -11.54150390625, -11.1104736328125, -10.679443359375, -10.2484130859375, -9.8173828125, -9.3863525390625, -8.955322265625, -8.5242919921875, -8.09326171875, -7.6622314453125, -7.231201171875, -6.8001708984375, -6.369140625, -5.9381103515625, -5.507080078125, -5.0760498046875, -4.64501953125, -4.2139892578125, -3.782958984375, -3.3519287109375, -2.9208984375, -2.4898681640625, -2.058837890625, -1.6278076171875, -1.19677734375, -0.7657470703125, -0.334716796875, 0.0963134765625, 0.52734375, 0.9583740234375, 1.389404296875, 1.8204345703125, 2.25146484375, 2.6824951171875, 3.113525390625, 3.5445556640625, 3.9755859375, 4.4066162109375, 4.837646484375, 5.2686767578125, 5.69970703125, 6.1307373046875, 6.561767578125, 6.9927978515625, 7.423828125, 7.8548583984375, 8.285888671875, 8.7169189453125, 9.14794921875, 9.5789794921875, 10.010009765625, 10.4410400390625, 10.8720703125, 11.3031005859375, 11.734130859375, 12.1651611328125, 12.59619140625, 13.0272216796875, 13.458251953125, 13.8892822265625, 14.3203125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 3.0, 3.0, 3.0, 12.0, 12.0, 9.0, 9.0, 12.0, 24.0, 31.0, 33.0, 59.0, 70.0, 102.0, 151.0, 254.0, 367.0, 629.0, 1105.0, 2096.0, 4636.0, 13537.0, 61674.0, 677438.0, 238463.0, 31887.0, 8535.0, 3418.0, 1650.0, 813.0, 510.0, 331.0, 188.0, 130.0, 86.0, 62.0, 62.0, 35.0, 22.0, 22.0, 15.0, 14.0, 11.0, 14.0, 2.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-22.15625, -21.43701171875, -20.7177734375, -19.99853515625, -19.279296875, -18.56005859375, -17.8408203125, -17.12158203125, -16.40234375, -15.68310546875, -14.9638671875, -14.24462890625, -13.525390625, -12.80615234375, -12.0869140625, -11.36767578125, -10.6484375, -9.92919921875, -9.2099609375, -8.49072265625, -7.771484375, -7.05224609375, -6.3330078125, -5.61376953125, -4.89453125, -4.17529296875, -3.4560546875, -2.73681640625, -2.017578125, -1.29833984375, -0.5791015625, 0.14013671875, 0.859375, 1.57861328125, 2.2978515625, 3.01708984375, 3.736328125, 4.45556640625, 5.1748046875, 5.89404296875, 6.61328125, 7.33251953125, 8.0517578125, 8.77099609375, 9.490234375, 10.20947265625, 10.9287109375, 11.64794921875, 12.3671875, 13.08642578125, 13.8056640625, 14.52490234375, 15.244140625, 15.96337890625, 16.6826171875, 17.40185546875, 18.12109375, 18.84033203125, 19.5595703125, 20.27880859375, 20.998046875, 21.71728515625, 22.4365234375, 23.15576171875, 23.875]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 3.0, 6.0, 14.0, 7.0, 16.0, 20.0, 21.0, 23.0, 18.0, 18.0, 28.0, 33.0, 43.0, 53.0, 54.0, 60.0, 153.0, 1821.0, 167.0, 67.0, 49.0, 49.0, 43.0, 45.0, 39.0, 17.0, 25.0, 23.0, 24.0, 22.0, 20.0, 10.0, 17.0, 10.0, 5.0, 3.0, 6.0, 2.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.625, -39.20166015625, -37.7783203125, -36.35498046875, -34.931640625, -33.50830078125, -32.0849609375, -30.66162109375, -29.23828125, -27.81494140625, -26.3916015625, -24.96826171875, -23.544921875, -22.12158203125, -20.6982421875, -19.27490234375, -17.8515625, -16.42822265625, -15.0048828125, -13.58154296875, -12.158203125, -10.73486328125, -9.3115234375, -7.88818359375, -6.46484375, -5.04150390625, -3.6181640625, -2.19482421875, -0.771484375, 0.65185546875, 2.0751953125, 3.49853515625, 4.921875, 6.34521484375, 7.7685546875, 9.19189453125, 10.615234375, 12.03857421875, 13.4619140625, 14.88525390625, 16.30859375, 17.73193359375, 19.1552734375, 20.57861328125, 22.001953125, 23.42529296875, 24.8486328125, 26.27197265625, 27.6953125, 29.11865234375, 30.5419921875, 31.96533203125, 33.388671875, 34.81201171875, 36.2353515625, 37.65869140625, 39.08203125, 40.50537109375, 41.9287109375, 43.35205078125, 44.775390625, 46.19873046875, 47.6220703125, 49.04541015625, 50.46875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 8.0, 5.0, 8.0, 7.0, 4.0, 15.0, 18.0, 21.0, 28.0, 38.0, 34.0, 42.0, 68.0, 118.0, 202.0, 476.0, 2261.0, 2741268.0, 398352.0, 1824.0, 407.0, 186.0, 84.0, 61.0, 39.0, 24.0, 32.0, 29.0, 16.0, 15.0, 6.0, 6.0, 6.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.75, -138.607421875, -133.46484375, -128.322265625, -123.1796875, -118.037109375, -112.89453125, -107.751953125, -102.609375, -97.466796875, -92.32421875, -87.181640625, -82.0390625, -76.896484375, -71.75390625, -66.611328125, -61.46875, -56.326171875, -51.18359375, -46.041015625, -40.8984375, -35.755859375, -30.61328125, -25.470703125, -20.328125, -15.185546875, -10.04296875, -4.900390625, 0.2421875, 5.384765625, 10.52734375, 15.669921875, 20.8125, 25.955078125, 31.09765625, 36.240234375, 41.3828125, 46.525390625, 51.66796875, 56.810546875, 61.953125, 67.095703125, 72.23828125, 77.380859375, 82.5234375, 87.666015625, 92.80859375, 97.951171875, 103.09375, 108.236328125, 113.37890625, 118.521484375, 123.6640625, 128.806640625, 133.94921875, 139.091796875, 144.234375, 149.376953125, 154.51953125, 159.662109375, 164.8046875, 169.947265625, 175.08984375, 180.232421875, 185.375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 266.0, 726.0, 24.0], "bins": [-812.8474731445312, -799.777587890625, -786.707763671875, -773.6378784179688, -760.5680541992188, -747.4981689453125, -734.4283447265625, -721.3584594726562, -708.28857421875, -695.2186889648438, -682.1488647460938, -669.0789794921875, -656.0091552734375, -642.9392700195312, -629.869384765625, -616.799560546875, -603.729736328125, -590.6598510742188, -577.5900268554688, -564.5201416015625, -551.4503173828125, -538.3804321289062, -525.310546875, -512.24072265625, -499.17083740234375, -486.1009826660156, -473.0311279296875, -459.96124267578125, -446.8913879394531, -433.821533203125, -420.7516784667969, -407.68182373046875, -394.6119384765625, -381.5420837402344, -368.47222900390625, -355.40234375, -342.3324890136719, -329.26263427734375, -316.1927795410156, -303.1229248046875, -290.05303955078125, -276.9831848144531, -263.913330078125, -250.8434600830078, -237.77359008789062, -224.7037353515625, -211.63388061523438, -198.56402587890625, -185.49415588378906, -172.42430114746094, -159.35443115234375, -146.28457641601562, -133.2147216796875, -120.14485168457031, -107.07499694824219, -94.00513458251953, -80.93527221679688, -67.86540985107422, -54.79555130004883, -41.72569274902344, -28.65583038330078, -15.585968017578125, -2.51611328125, 10.553749084472656, 23.62360954284668]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 7.0, 5.0, 4.0, 11.0, 4.0, 8.0, 21.0, 20.0, 19.0, 19.0, 23.0, 21.0, 37.0, 38.0, 31.0, 31.0, 37.0, 40.0, 43.0, 43.0, 36.0, 52.0, 30.0, 41.0, 32.0, 35.0, 29.0, 30.0, 28.0, 19.0, 26.0, 22.0, 25.0, 23.0, 19.0, 13.0, 14.0, 6.0, 12.0, 7.0, 7.0, 9.0, 7.0, 5.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-117.62258911132812, -114.00001525878906, -110.37743377685547, -106.75485229492188, -103.13227844238281, -99.50970458984375, -95.88712310791016, -92.26454162597656, -88.6419677734375, -85.01939392089844, -81.39681243896484, -77.77423095703125, -74.15165710449219, -70.52908325195312, -66.90650177001953, -63.2839241027832, -59.661346435546875, -56.03876876831055, -52.41619110107422, -48.79361343383789, -45.17103576660156, -41.548458099365234, -37.925880432128906, -34.30330276489258, -30.68072509765625, -27.058147430419922, -23.435569763183594, -19.812992095947266, -16.190414428710938, -12.56783676147461, -8.945259094238281, -5.322681427001953, -1.700103759765625, 1.9224739074707031, 5.545051574707031, 9.16762924194336, 12.790206909179688, 16.412784576416016, 20.035362243652344, 23.657939910888672, 27.280517578125, 30.903095245361328, 34.525672912597656, 38.148250579833984, 41.77082824707031, 45.39340591430664, 49.01598358154297, 52.6385612487793, 56.261138916015625, 59.88371658325195, 63.50629425048828, 67.12887573242188, 70.75144958496094, 74.3740234375, 77.9966049194336, 81.61918640136719, 85.24176025390625, 88.86433410644531, 92.4869155883789, 96.1094970703125, 99.73207092285156, 103.35464477539062, 106.97722625732422, 110.59980773925781, 114.22238159179688]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 4.0, 6.0, 4.0, 7.0, 8.0, 14.0, 18.0, 13.0, 20.0, 24.0, 27.0, 26.0, 27.0, 19.0, 48.0, 29.0, 34.0, 50.0, 47.0, 46.0, 42.0, 33.0, 41.0, 40.0, 46.0, 39.0, 36.0, 38.0, 29.0, 24.0, 17.0, 18.0, 23.0, 17.0, 15.0, 11.0, 11.0, 7.0, 2.0, 7.0, 10.0, 7.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-15.265625, -14.7945556640625, -14.323486328125, -13.8524169921875, -13.38134765625, -12.9102783203125, -12.439208984375, -11.9681396484375, -11.4970703125, -11.0260009765625, -10.554931640625, -10.0838623046875, -9.61279296875, -9.1417236328125, -8.670654296875, -8.1995849609375, -7.728515625, -7.2574462890625, -6.786376953125, -6.3153076171875, -5.84423828125, -5.3731689453125, -4.902099609375, -4.4310302734375, -3.9599609375, -3.4888916015625, -3.017822265625, -2.5467529296875, -2.07568359375, -1.6046142578125, -1.133544921875, -0.6624755859375, -0.19140625, 0.2796630859375, 0.750732421875, 1.2218017578125, 1.69287109375, 2.1639404296875, 2.635009765625, 3.1060791015625, 3.5771484375, 4.0482177734375, 4.519287109375, 4.9903564453125, 5.46142578125, 5.9324951171875, 6.403564453125, 6.8746337890625, 7.345703125, 7.8167724609375, 8.287841796875, 8.7589111328125, 9.22998046875, 9.7010498046875, 10.172119140625, 10.6431884765625, 11.1142578125, 11.5853271484375, 12.056396484375, 12.5274658203125, 12.99853515625, 13.4696044921875, 13.940673828125, 14.4117431640625, 14.8828125]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 1.0, 5.0, 5.0, 8.0, 12.0, 26.0, 30.0, 42.0, 45.0, 80.0, 92.0, 120.0, 184.0, 263.0, 375.0, 561.0, 868.0, 1228.0, 2032.0, 3380.0, 5855.0, 10889.0, 22317.0, 59918.0, 198926.0, 727049.0, 1686282.0, 1018639.0, 305334.0, 88247.0, 30476.0, 13331.0, 7002.0, 3998.0, 2329.0, 1437.0, 938.0, 554.0, 445.0, 286.0, 197.0, 135.0, 92.0, 80.0, 34.0, 40.0, 31.0, 16.0, 19.0, 15.0, 10.0, 8.0, 2.0, 2.0, 2.0, 0.0, 1.0], "bins": [-18.40625, -17.859375, -17.3125, -16.765625, -16.21875, -15.671875, -15.125, -14.578125, -14.03125, -13.484375, -12.9375, -12.390625, -11.84375, -11.296875, -10.75, -10.203125, -9.65625, -9.109375, -8.5625, -8.015625, -7.46875, -6.921875, -6.375, -5.828125, -5.28125, -4.734375, -4.1875, -3.640625, -3.09375, -2.546875, -2.0, -1.453125, -0.90625, -0.359375, 0.1875, 0.734375, 1.28125, 1.828125, 2.375, 2.921875, 3.46875, 4.015625, 4.5625, 5.109375, 5.65625, 6.203125, 6.75, 7.296875, 7.84375, 8.390625, 8.9375, 9.484375, 10.03125, 10.578125, 11.125, 11.671875, 12.21875, 12.765625, 13.3125, 13.859375, 14.40625, 14.953125, 15.5, 16.046875, 16.59375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 2.0, 9.0, 12.0, 9.0, 14.0, 18.0, 19.0, 22.0, 30.0, 36.0, 65.0, 64.0, 105.0, 126.0, 235.0, 317.0, 526.0, 670.0, 565.0, 436.0, 247.0, 161.0, 131.0, 74.0, 52.0, 32.0, 26.0, 14.0, 13.0, 9.0, 10.0, 11.0, 3.0, 2.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-30.765625, -29.825927734375, -28.88623046875, -27.946533203125, -27.0068359375, -26.067138671875, -25.12744140625, -24.187744140625, -23.248046875, -22.308349609375, -21.36865234375, -20.428955078125, -19.4892578125, -18.549560546875, -17.60986328125, -16.670166015625, -15.73046875, -14.790771484375, -13.85107421875, -12.911376953125, -11.9716796875, -11.031982421875, -10.09228515625, -9.152587890625, -8.212890625, -7.273193359375, -6.33349609375, -5.393798828125, -4.4541015625, -3.514404296875, -2.57470703125, -1.635009765625, -0.6953125, 0.244384765625, 1.18408203125, 2.123779296875, 3.0634765625, 4.003173828125, 4.94287109375, 5.882568359375, 6.822265625, 7.761962890625, 8.70166015625, 9.641357421875, 10.5810546875, 11.520751953125, 12.46044921875, 13.400146484375, 14.33984375, 15.279541015625, 16.21923828125, 17.158935546875, 18.0986328125, 19.038330078125, 19.97802734375, 20.917724609375, 21.857421875, 22.797119140625, 23.73681640625, 24.676513671875, 25.6162109375, 26.555908203125, 27.49560546875, 28.435302734375, 29.375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 4.0, 7.0, 11.0, 9.0, 16.0, 17.0, 26.0, 42.0, 61.0, 110.0, 199.0, 405.0, 1106.0, 6001.0, 112583.0, 3969315.0, 96469.0, 5717.0, 1116.0, 443.0, 206.0, 113.0, 73.0, 61.0, 39.0, 29.0, 23.0, 21.0, 14.0, 11.0, 11.0, 3.0, 7.0, 6.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-113.625, -110.126953125, -106.62890625, -103.130859375, -99.6328125, -96.134765625, -92.63671875, -89.138671875, -85.640625, -82.142578125, -78.64453125, -75.146484375, -71.6484375, -68.150390625, -64.65234375, -61.154296875, -57.65625, -54.158203125, -50.66015625, -47.162109375, -43.6640625, -40.166015625, -36.66796875, -33.169921875, -29.671875, -26.173828125, -22.67578125, -19.177734375, -15.6796875, -12.181640625, -8.68359375, -5.185546875, -1.6875, 1.810546875, 5.30859375, 8.806640625, 12.3046875, 15.802734375, 19.30078125, 22.798828125, 26.296875, 29.794921875, 33.29296875, 36.791015625, 40.2890625, 43.787109375, 47.28515625, 50.783203125, 54.28125, 57.779296875, 61.27734375, 64.775390625, 68.2734375, 71.771484375, 75.26953125, 78.767578125, 82.265625, 85.763671875, 89.26171875, 92.759765625, 96.2578125, 99.755859375, 103.25390625, 106.751953125, 110.25]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 26.0, 433.0, 523.0, 29.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1150.5728759765625, -1125.6065673828125, -1100.640380859375, -1075.674072265625, -1050.707763671875, -1025.7415771484375, -1000.7752685546875, -975.8089599609375, -950.8427124023438, -925.87646484375, -900.91015625, -875.9439086914062, -850.9776611328125, -826.0113525390625, -801.0451049804688, -776.078857421875, -751.112548828125, -726.1463012695312, -701.1799926757812, -676.2137451171875, -651.2474365234375, -626.2811889648438, -601.31494140625, -576.3486328125, -551.3823852539062, -526.4161376953125, -501.4498291015625, -476.48358154296875, -451.5173034667969, -426.551025390625, -401.58477783203125, -376.6184997558594, -351.65228271484375, -326.6860046386719, -301.7197265625, -276.75347900390625, -251.78720092773438, -226.8209228515625, -201.8546600341797, -176.88839721679688, -151.922119140625, -126.95584869384766, -101.98957824707031, -77.02330780029297, -52.057037353515625, -27.09076690673828, -2.1244964599609375, 22.841766357421875, 47.80804443359375, 72.7743148803711, 97.74058532714844, 122.70685577392578, 147.67312622070312, 172.639404296875, 197.6056671142578, 222.57192993164062, 247.5382080078125, 272.5044860839844, 297.47076416015625, 322.43701171875, 347.4032897949219, 372.36956787109375, 397.3358154296875, 422.3020935058594, 447.26837158203125]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 7.0, 9.0, 11.0, 15.0, 17.0, 18.0, 9.0, 24.0, 29.0, 32.0, 25.0, 37.0, 46.0, 36.0, 47.0, 60.0, 53.0, 53.0, 58.0, 48.0, 49.0, 42.0, 49.0, 37.0, 29.0, 24.0, 28.0, 21.0, 16.0, 18.0, 21.0, 7.0, 11.0, 1.0, 4.0, 4.0, 6.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-98.77984619140625, -95.31404113769531, -91.8482437133789, -88.38243865966797, -84.91664123535156, -81.45083618164062, -77.98503112792969, -74.51922607421875, -71.05342864990234, -67.5876235961914, -64.121826171875, -60.65602111816406, -57.19021987915039, -53.72441864013672, -50.25861358642578, -46.79281234741211, -43.32701110839844, -39.861209869384766, -36.395408630371094, -32.929603576660156, -29.463802337646484, -25.998001098632812, -22.532197952270508, -19.066394805908203, -15.600593566894531, -12.134791374206543, -8.668989181518555, -5.203186988830566, -1.7373847961425781, 1.7284164428710938, 5.194219589233398, 8.660022735595703, 12.125823974609375, 15.591626167297363, 19.05742835998535, 22.523231506347656, 25.989032745361328, 29.454833984375, 32.92063903808594, 36.38644027709961, 39.85224151611328, 43.31804275512695, 46.783843994140625, 50.24964904785156, 53.715450286865234, 57.181251525878906, 60.647056579589844, 64.11285400390625, 67.57865905761719, 71.04446411132812, 74.51026153564453, 77.97606658935547, 81.44186401367188, 84.90766906738281, 88.37347412109375, 91.83927917480469, 95.3050765991211, 98.77088165283203, 102.23667907714844, 105.70248413085938, 109.16828918457031, 112.63408660888672, 116.09989166259766, 119.56568908691406, 123.031494140625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 4.0, 7.0, 10.0, 13.0, 17.0, 12.0, 11.0, 22.0, 20.0, 24.0, 36.0, 35.0, 31.0, 54.0, 44.0, 55.0, 50.0, 53.0, 55.0, 52.0, 32.0, 32.0, 51.0, 41.0, 35.0, 22.0, 29.0, 24.0, 30.0, 19.0, 13.0, 16.0, 11.0, 5.0, 5.0, 8.0, 4.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2109375, -13.7037353515625, -13.196533203125, -12.6893310546875, -12.18212890625, -11.6749267578125, -11.167724609375, -10.6605224609375, -10.1533203125, -9.6461181640625, -9.138916015625, -8.6317138671875, -8.12451171875, -7.6173095703125, -7.110107421875, -6.6029052734375, -6.095703125, -5.5885009765625, -5.081298828125, -4.5740966796875, -4.06689453125, -3.5596923828125, -3.052490234375, -2.5452880859375, -2.0380859375, -1.5308837890625, -1.023681640625, -0.5164794921875, -0.00927734375, 0.4979248046875, 1.005126953125, 1.5123291015625, 2.01953125, 2.5267333984375, 3.033935546875, 3.5411376953125, 4.04833984375, 4.5555419921875, 5.062744140625, 5.5699462890625, 6.0771484375, 6.5843505859375, 7.091552734375, 7.5987548828125, 8.10595703125, 8.6131591796875, 9.120361328125, 9.6275634765625, 10.134765625, 10.6419677734375, 11.149169921875, 11.6563720703125, 12.16357421875, 12.6707763671875, 13.177978515625, 13.6851806640625, 14.1923828125, 14.6995849609375, 15.206787109375, 15.7139892578125, 16.22119140625, 16.7283935546875, 17.235595703125, 17.7427978515625, 18.25]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 5.0, 6.0, 11.0, 14.0, 23.0, 27.0, 43.0, 55.0, 107.0, 169.0, 265.0, 406.0, 616.0, 851.0, 1424.0, 2191.0, 3434.0, 5567.0, 8972.0, 14853.0, 24761.0, 41263.0, 69968.0, 117109.0, 186663.0, 209607.0, 144082.0, 86403.0, 51134.0, 30630.0, 18339.0, 11171.0, 6719.0, 4169.0, 2611.0, 1720.0, 1111.0, 707.0, 482.0, 323.0, 210.0, 115.0, 86.0, 51.0, 35.0, 23.0, 8.0, 11.0, 4.0, 9.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1484375, -2.07958984375, -2.0107421875, -1.94189453125, -1.873046875, -1.80419921875, -1.7353515625, -1.66650390625, -1.59765625, -1.52880859375, -1.4599609375, -1.39111328125, -1.322265625, -1.25341796875, -1.1845703125, -1.11572265625, -1.046875, -0.97802734375, -0.9091796875, -0.84033203125, -0.771484375, -0.70263671875, -0.6337890625, -0.56494140625, -0.49609375, -0.42724609375, -0.3583984375, -0.28955078125, -0.220703125, -0.15185546875, -0.0830078125, -0.01416015625, 0.0546875, 0.12353515625, 0.1923828125, 0.26123046875, 0.330078125, 0.39892578125, 0.4677734375, 0.53662109375, 0.60546875, 0.67431640625, 0.7431640625, 0.81201171875, 0.880859375, 0.94970703125, 1.0185546875, 1.08740234375, 1.15625, 1.22509765625, 1.2939453125, 1.36279296875, 1.431640625, 1.50048828125, 1.5693359375, 1.63818359375, 1.70703125, 1.77587890625, 1.8447265625, 1.91357421875, 1.982421875, 2.05126953125, 2.1201171875, 2.18896484375, 2.2578125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 10.0, 12.0, 5.0, 14.0, 11.0, 13.0, 12.0, 23.0, 20.0, 25.0, 31.0, 33.0, 33.0, 30.0, 26.0, 35.0, 41.0, 36.0, 39.0, 1054.0, 53.0, 43.0, 48.0, 28.0, 42.0, 35.0, 23.0, 33.0, 31.0, 24.0, 18.0, 20.0, 14.0, 17.0, 17.0, 13.0, 3.0, 8.0, 13.0, 5.0, 6.0, 5.0, 7.0, 6.0, 3.0, 3.0, 0.0, 0.0, 1.0], "bins": [-9.921875, -9.634765625, -9.34765625, -9.060546875, -8.7734375, -8.486328125, -8.19921875, -7.912109375, -7.625, -7.337890625, -7.05078125, -6.763671875, -6.4765625, -6.189453125, -5.90234375, -5.615234375, -5.328125, -5.041015625, -4.75390625, -4.466796875, -4.1796875, -3.892578125, -3.60546875, -3.318359375, -3.03125, -2.744140625, -2.45703125, -2.169921875, -1.8828125, -1.595703125, -1.30859375, -1.021484375, -0.734375, -0.447265625, -0.16015625, 0.126953125, 0.4140625, 0.701171875, 0.98828125, 1.275390625, 1.5625, 1.849609375, 2.13671875, 2.423828125, 2.7109375, 2.998046875, 3.28515625, 3.572265625, 3.859375, 4.146484375, 4.43359375, 4.720703125, 5.0078125, 5.294921875, 5.58203125, 5.869140625, 6.15625, 6.443359375, 6.73046875, 7.017578125, 7.3046875, 7.591796875, 7.87890625, 8.166015625, 8.453125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 5.0, 12.0, 7.0, 19.0, 20.0, 23.0, 43.0, 67.0, 81.0, 105.0, 208.0, 266.0, 409.0, 554.0, 882.0, 1328.0, 1923.0, 3022.0, 4393.0, 6857.0, 10556.0, 16352.0, 26342.0, 42460.0, 69051.0, 110669.0, 167418.0, 1239147.0, 145560.0, 93444.0, 57842.0, 35542.0, 22284.0, 13977.0, 8907.0, 5825.0, 3834.0, 2489.0, 1668.0, 1128.0, 776.0, 497.0, 363.0, 247.0, 158.0, 132.0, 81.0, 56.0, 35.0, 23.0, 22.0, 10.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-1.2548828125, -1.214813232421875, -1.17474365234375, -1.134674072265625, -1.0946044921875, -1.054534912109375, -1.01446533203125, -0.974395751953125, -0.934326171875, -0.894256591796875, -0.85418701171875, -0.814117431640625, -0.7740478515625, -0.733978271484375, -0.69390869140625, -0.653839111328125, -0.61376953125, -0.573699951171875, -0.53363037109375, -0.493560791015625, -0.4534912109375, -0.413421630859375, -0.37335205078125, -0.333282470703125, -0.293212890625, -0.253143310546875, -0.21307373046875, -0.173004150390625, -0.1329345703125, -0.092864990234375, -0.05279541015625, -0.012725830078125, 0.02734375, 0.067413330078125, 0.10748291015625, 0.147552490234375, 0.1876220703125, 0.227691650390625, 0.26776123046875, 0.307830810546875, 0.347900390625, 0.387969970703125, 0.42803955078125, 0.468109130859375, 0.5081787109375, 0.548248291015625, 0.58831787109375, 0.628387451171875, 0.66845703125, 0.708526611328125, 0.74859619140625, 0.788665771484375, 0.8287353515625, 0.868804931640625, 0.90887451171875, 0.948944091796875, 0.989013671875, 1.029083251953125, 1.06915283203125, 1.109222412109375, 1.1492919921875, 1.189361572265625, 1.22943115234375, 1.269500732421875, 1.3095703125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 5.0, 2.0, 9.0, 10.0, 6.0, 11.0, 5.0, 8.0, 9.0, 20.0, 16.0, 33.0, 41.0, 47.0, 68.0, 80.0, 91.0, 132.0, 85.0, 64.0, 56.0, 48.0, 25.0, 27.0, 26.0, 13.0, 19.0, 7.0, 6.0, 5.0, 6.0, 3.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.044281005859375, -0.043055057525634766, -0.04182910919189453, -0.0406031608581543, -0.03937721252441406, -0.03815126419067383, -0.036925315856933594, -0.03569936752319336, -0.034473419189453125, -0.03324747085571289, -0.032021522521972656, -0.030795574188232422, -0.029569625854492188, -0.028343677520751953, -0.02711772918701172, -0.025891780853271484, -0.02466583251953125, -0.023439884185791016, -0.02221393585205078, -0.020987987518310547, -0.019762039184570312, -0.018536090850830078, -0.017310142517089844, -0.01608419418334961, -0.014858245849609375, -0.01363229751586914, -0.012406349182128906, -0.011180400848388672, -0.009954452514648438, -0.008728504180908203, -0.007502555847167969, -0.006276607513427734, -0.0050506591796875, -0.0038247108459472656, -0.0025987625122070312, -0.0013728141784667969, -0.0001468658447265625, 0.0010790824890136719, 0.0023050308227539062, 0.0035309791564941406, 0.004756927490234375, 0.005982875823974609, 0.007208824157714844, 0.008434772491455078, 0.009660720825195312, 0.010886669158935547, 0.012112617492675781, 0.013338565826416016, 0.01456451416015625, 0.015790462493896484, 0.01701641082763672, 0.018242359161376953, 0.019468307495117188, 0.020694255828857422, 0.021920204162597656, 0.02314615249633789, 0.024372100830078125, 0.02559804916381836, 0.026823997497558594, 0.028049945831298828, 0.029275894165039062, 0.030501842498779297, 0.03172779083251953, 0.032953739166259766, 0.0341796875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 6.0, 2.0, 9.0, 6.0, 15.0, 9.0, 26.0, 23.0, 32.0, 52.0, 87.0, 131.0, 208.0, 437.0, 3663.0, 1036305.0, 6359.0, 521.0, 242.0, 127.0, 77.0, 42.0, 40.0, 23.0, 19.0, 14.0, 18.0, 12.0, 15.0, 8.0, 5.0, 4.0, 2.0, 5.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7490234375, -0.7218399047851562, -0.6946563720703125, -0.6674728393554688, -0.640289306640625, -0.6131057739257812, -0.5859222412109375, -0.5587387084960938, -0.53155517578125, -0.5043716430664062, -0.4771881103515625, -0.45000457763671875, -0.422821044921875, -0.39563751220703125, -0.3684539794921875, -0.34127044677734375, -0.3140869140625, -0.28690338134765625, -0.2597198486328125, -0.23253631591796875, -0.205352783203125, -0.17816925048828125, -0.1509857177734375, -0.12380218505859375, -0.09661865234375, -0.06943511962890625, -0.0422515869140625, -0.01506805419921875, 0.012115478515625, 0.03929901123046875, 0.0664825439453125, 0.09366607666015625, 0.120849609375, 0.14803314208984375, 0.1752166748046875, 0.20240020751953125, 0.229583740234375, 0.25676727294921875, 0.2839508056640625, 0.31113433837890625, 0.33831787109375, 0.36550140380859375, 0.3926849365234375, 0.41986846923828125, 0.447052001953125, 0.47423553466796875, 0.5014190673828125, 0.5286026000976562, 0.5557861328125, 0.5829696655273438, 0.6101531982421875, 0.6373367309570312, 0.664520263671875, 0.6917037963867188, 0.7188873291015625, 0.7460708618164062, 0.77325439453125, 0.8004379272460938, 0.8276214599609375, 0.8548049926757812, 0.881988525390625, 0.9091720581054688, 0.9363555908203125, 0.9635391235351562, 0.99072265625]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 36.0, 960.0, 21.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1442357897758484, -0.11770550906658173, -0.09117522090673447, -0.06464493274688721, -0.038114652037620544, -0.011584371328353882, 0.014945924282073975, 0.04147620499134064, 0.0680064857006073, 0.09453676640987396, 0.12106705456972122, 0.14759734272956848, 0.17412762343883514, 0.2006579041481018, 0.22718819975852966, 0.2537184953689575, 0.280248761177063, 0.30677905678749084, 0.3333093225955963, 0.35983961820602417, 0.38636988401412964, 0.4129001796245575, 0.43943047523498535, 0.4659607410430908, 0.4924910366535187, 0.5190213322639465, 0.545551598072052, 0.5720819234848022, 0.5986121892929077, 0.6251424551010132, 0.6516727209091187, 0.6782030463218689, 0.7047333717346191, 0.7312636375427246, 0.7577939629554749, 0.7843242287635803, 0.8108544945716858, 0.837384819984436, 0.8639150857925415, 0.890445351600647, 0.9169756174087524, 0.9435058832168579, 0.9700362086296082, 0.9965664744377136, 1.0230967998504639, 1.0496270656585693, 1.0761573314666748, 1.1026875972747803, 1.1292178630828857, 1.1557481288909912, 1.1822783946990967, 1.2088086605072021, 1.2353390455245972, 1.2618693113327026, 1.288399577140808, 1.3149298429489136, 1.3414602279663086, 1.367990493774414, 1.3945207595825195, 1.421051025390625, 1.44758141040802, 1.4741116762161255, 1.500641942024231, 1.5271722078323364, 1.553702473640442]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 5.0, 0.0, 2.0, 2.0, 10.0, 11.0, 12.0, 17.0, 22.0, 26.0, 24.0, 24.0, 39.0, 38.0, 26.0, 41.0, 37.0, 41.0, 54.0, 36.0, 41.0, 38.0, 40.0, 49.0, 29.0, 41.0, 35.0, 31.0, 30.0, 38.0, 31.0, 20.0, 23.0, 16.0, 15.0, 13.0, 10.0, 13.0, 6.0, 9.0, 3.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.07374215126037598, -0.07173891365528107, -0.06973568350076675, -0.06773245334625244, -0.06572921574115753, -0.06372597813606262, -0.06172274798154831, -0.0597195141017437, -0.05771628022193909, -0.055713046342134476, -0.053709812462329865, -0.05170657858252525, -0.04970334470272064, -0.04770011082291603, -0.04569687694311142, -0.04369364306330681, -0.0416904091835022, -0.039687175303697586, -0.037683941423892975, -0.035680707544088364, -0.03367747366428375, -0.03167423978447914, -0.02967100590467453, -0.02766777202486992, -0.025664538145065308, -0.023661304265260696, -0.021658070385456085, -0.019654836505651474, -0.017651602625846863, -0.01564836874604225, -0.01364513486623764, -0.01164190098643303, -0.009638667106628418, -0.007635433226823807, -0.0056321993470191956, -0.0036289654672145844, -0.0016257315874099731, 0.00037750229239463806, 0.0023807361721992493, 0.0043839700520038605, 0.006387203931808472, 0.008390437811613083, 0.010393671691417694, 0.012396905571222305, 0.014400139451026917, 0.016403373330831528, 0.01840660721063614, 0.02040984109044075, 0.02241307497024536, 0.024416308850049973, 0.026419542729854584, 0.028422776609659195, 0.030426010489463806, 0.03242924436926842, 0.03443247824907303, 0.03643571212887764, 0.03843894600868225, 0.04044217988848686, 0.04244541376829147, 0.044448647648096085, 0.046451881527900696, 0.04845511540770531, 0.05045834928750992, 0.05246158316731453, 0.05446481704711914]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 5.0, 2.0, 5.0, 4.0, 7.0, 11.0, 12.0, 17.0, 12.0, 11.0, 22.0, 20.0, 26.0, 34.0, 35.0, 32.0, 54.0, 44.0, 54.0, 50.0, 54.0, 54.0, 52.0, 32.0, 33.0, 50.0, 41.0, 35.0, 23.0, 28.0, 24.0, 30.0, 21.0, 11.0, 16.0, 11.0, 5.0, 5.0, 8.0, 4.0, 4.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.203125, -13.696044921875, -13.18896484375, -12.681884765625, -12.1748046875, -11.667724609375, -11.16064453125, -10.653564453125, -10.146484375, -9.639404296875, -9.13232421875, -8.625244140625, -8.1181640625, -7.611083984375, -7.10400390625, -6.596923828125, -6.08984375, -5.582763671875, -5.07568359375, -4.568603515625, -4.0615234375, -3.554443359375, -3.04736328125, -2.540283203125, -2.033203125, -1.526123046875, -1.01904296875, -0.511962890625, -0.0048828125, 0.502197265625, 1.00927734375, 1.516357421875, 2.0234375, 2.530517578125, 3.03759765625, 3.544677734375, 4.0517578125, 4.558837890625, 5.06591796875, 5.572998046875, 6.080078125, 6.587158203125, 7.09423828125, 7.601318359375, 8.1083984375, 8.615478515625, 9.12255859375, 9.629638671875, 10.13671875, 10.643798828125, 11.15087890625, 11.657958984375, 12.1650390625, 12.672119140625, 13.17919921875, 13.686279296875, 14.193359375, 14.700439453125, 15.20751953125, 15.714599609375, 16.2216796875, 16.728759765625, 17.23583984375, 17.742919921875, 18.25]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 5.0, 5.0, 12.0, 12.0, 25.0, 21.0, 36.0, 65.0, 93.0, 136.0, 150.0, 263.0, 387.0, 631.0, 857.0, 1378.0, 2014.0, 3358.0, 5242.0, 9191.0, 17222.0, 38868.0, 122026.0, 549409.0, 195396.0, 52274.0, 21456.0, 10897.0, 6284.0, 3846.0, 2411.0, 1492.0, 1047.0, 704.0, 468.0, 275.0, 186.0, 121.0, 99.0, 59.0, 45.0, 35.0, 14.0, 21.0, 7.0, 7.0, 2.0, 7.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-18.46875, -17.88525390625, -17.3017578125, -16.71826171875, -16.134765625, -15.55126953125, -14.9677734375, -14.38427734375, -13.80078125, -13.21728515625, -12.6337890625, -12.05029296875, -11.466796875, -10.88330078125, -10.2998046875, -9.71630859375, -9.1328125, -8.54931640625, -7.9658203125, -7.38232421875, -6.798828125, -6.21533203125, -5.6318359375, -5.04833984375, -4.46484375, -3.88134765625, -3.2978515625, -2.71435546875, -2.130859375, -1.54736328125, -0.9638671875, -0.38037109375, 0.203125, 0.78662109375, 1.3701171875, 1.95361328125, 2.537109375, 3.12060546875, 3.7041015625, 4.28759765625, 4.87109375, 5.45458984375, 6.0380859375, 6.62158203125, 7.205078125, 7.78857421875, 8.3720703125, 8.95556640625, 9.5390625, 10.12255859375, 10.7060546875, 11.28955078125, 11.873046875, 12.45654296875, 13.0400390625, 13.62353515625, 14.20703125, 14.79052734375, 15.3740234375, 15.95751953125, 16.541015625, 17.12451171875, 17.7080078125, 18.29150390625, 18.875]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 0.0, 5.0, 6.0, 13.0, 6.0, 7.0, 13.0, 11.0, 23.0, 28.0, 17.0, 31.0, 37.0, 29.0, 40.0, 34.0, 42.0, 58.0, 69.0, 212.0, 1696.0, 185.0, 71.0, 49.0, 40.0, 35.0, 35.0, 32.0, 22.0, 30.0, 23.0, 28.0, 20.0, 13.0, 9.0, 19.0, 13.0, 13.0, 5.0, 7.0, 7.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-47.25, -45.87841796875, -44.5068359375, -43.13525390625, -41.763671875, -40.39208984375, -39.0205078125, -37.64892578125, -36.27734375, -34.90576171875, -33.5341796875, -32.16259765625, -30.791015625, -29.41943359375, -28.0478515625, -26.67626953125, -25.3046875, -23.93310546875, -22.5615234375, -21.18994140625, -19.818359375, -18.44677734375, -17.0751953125, -15.70361328125, -14.33203125, -12.96044921875, -11.5888671875, -10.21728515625, -8.845703125, -7.47412109375, -6.1025390625, -4.73095703125, -3.359375, -1.98779296875, -0.6162109375, 0.75537109375, 2.126953125, 3.49853515625, 4.8701171875, 6.24169921875, 7.61328125, 8.98486328125, 10.3564453125, 11.72802734375, 13.099609375, 14.47119140625, 15.8427734375, 17.21435546875, 18.5859375, 19.95751953125, 21.3291015625, 22.70068359375, 24.072265625, 25.44384765625, 26.8154296875, 28.18701171875, 29.55859375, 30.93017578125, 32.3017578125, 33.67333984375, 35.044921875, 36.41650390625, 37.7880859375, 39.15966796875, 40.53125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 1.0, 4.0, 2.0, 5.0, 4.0, 4.0, 8.0, 6.0, 13.0, 16.0, 27.0, 19.0, 29.0, 37.0, 61.0, 62.0, 97.0, 127.0, 197.0, 465.0, 1394.0, 7735.0, 103960.0, 2984984.0, 39871.0, 4650.0, 1029.0, 302.0, 166.0, 116.0, 86.0, 52.0, 46.0, 28.0, 20.0, 22.0, 19.0, 11.0, 10.0, 3.0, 5.0, 6.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-91.0625, -88.412109375, -85.76171875, -83.111328125, -80.4609375, -77.810546875, -75.16015625, -72.509765625, -69.859375, -67.208984375, -64.55859375, -61.908203125, -59.2578125, -56.607421875, -53.95703125, -51.306640625, -48.65625, -46.005859375, -43.35546875, -40.705078125, -38.0546875, -35.404296875, -32.75390625, -30.103515625, -27.453125, -24.802734375, -22.15234375, -19.501953125, -16.8515625, -14.201171875, -11.55078125, -8.900390625, -6.25, -3.599609375, -0.94921875, 1.701171875, 4.3515625, 7.001953125, 9.65234375, 12.302734375, 14.953125, 17.603515625, 20.25390625, 22.904296875, 25.5546875, 28.205078125, 30.85546875, 33.505859375, 36.15625, 38.806640625, 41.45703125, 44.107421875, 46.7578125, 49.408203125, 52.05859375, 54.708984375, 57.359375, 60.009765625, 62.66015625, 65.310546875, 67.9609375, 70.611328125, 73.26171875, 75.912109375, 78.5625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 15.0, 21.0, 64.0, 147.0, 206.0, 223.0, 177.0, 89.0, 36.0, 13.0, 8.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.734901428222656, -44.575138092041016, -41.41537857055664, -38.255615234375, -35.095855712890625, -31.936092376708984, -28.776329040527344, -25.616567611694336, -22.456806182861328, -19.29704475402832, -16.137283325195312, -12.977519989013672, -9.817758560180664, -6.657997131347656, -3.4982337951660156, -0.3384723663330078, 2.8212890625, 5.981050968170166, 9.140812873840332, 12.300575256347656, 15.460336685180664, 18.620098114013672, 21.779861450195312, 24.93962287902832, 28.099384307861328, 31.259145736694336, 34.418907165527344, 37.578670501708984, 40.738433837890625, 43.898193359375, 47.05795669555664, 50.21772003173828, 53.377471923828125, 56.537235260009766, 59.69699478149414, 62.85675811767578, 66.01651763916016, 69.17628479003906, 72.33604431152344, 75.49580383300781, 78.65556335449219, 81.81532287597656, 84.97509002685547, 88.13484954833984, 91.29460906982422, 94.45437622070312, 97.6141357421875, 100.77389526367188, 103.93366241455078, 107.09342193603516, 110.25318908691406, 113.41294860839844, 116.57270812988281, 119.73246765136719, 122.8922348022461, 126.05199432373047, 129.21176147460938, 132.37152099609375, 135.53128051757812, 138.6910400390625, 141.85081481933594, 145.0105743408203, 148.1703338623047, 151.33009338378906, 154.48985290527344]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 3.0, 3.0, 3.0, 8.0, 7.0, 7.0, 13.0, 19.0, 9.0, 16.0, 14.0, 26.0, 32.0, 26.0, 28.0, 32.0, 42.0, 40.0, 29.0, 57.0, 36.0, 46.0, 33.0, 39.0, 51.0, 36.0, 42.0, 40.0, 32.0, 21.0, 26.0, 24.0, 18.0, 24.0, 16.0, 15.0, 9.0, 15.0, 14.0, 14.0, 9.0, 5.0, 7.0, 8.0, 4.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-112.84426879882812, -109.51905822753906, -106.19384765625, -102.86863708496094, -99.5434341430664, -96.21822357177734, -92.89301300048828, -89.56780242919922, -86.24259185791016, -82.9173812866211, -79.59217071533203, -76.2669677734375, -72.94175720214844, -69.61654663085938, -66.29133605957031, -62.96612548828125, -59.64091873168945, -56.31570816040039, -52.990501403808594, -49.66529083251953, -46.34008026123047, -43.014869689941406, -39.68966293334961, -36.36445236206055, -33.03924560546875, -29.71403694152832, -26.388826370239258, -23.063617706298828, -19.738407135009766, -16.413198471069336, -13.087989807128906, -9.762779235839844, -6.437568664550781, -3.1123592853546143, 0.21285009384155273, 3.5380592346191406, 6.863268852233887, 10.188478469848633, 13.513687133789062, 16.838897705078125, 20.164106369018555, 23.489315032958984, 26.814525604248047, 30.139734268188477, 33.464942932128906, 36.79015350341797, 40.11536407470703, 43.440574645996094, 46.76578140258789, 50.09099197387695, 53.41619873046875, 56.74140930175781, 60.066619873046875, 63.39183044433594, 66.717041015625, 70.04225158691406, 73.3674545288086, 76.69266510009766, 80.01787567138672, 83.34307861328125, 86.66828918457031, 89.99349975585938, 93.31871032714844, 96.6439208984375, 99.96913146972656]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 4.0, 2.0, 3.0, 1.0, 4.0, 4.0, 7.0, 11.0, 8.0, 14.0, 15.0, 14.0, 9.0, 9.0, 18.0, 28.0, 24.0, 34.0, 25.0, 35.0, 52.0, 52.0, 41.0, 43.0, 56.0, 53.0, 48.0, 36.0, 42.0, 37.0, 29.0, 43.0, 28.0, 34.0, 18.0, 17.0, 16.0, 25.0, 14.0, 12.0, 5.0, 14.0, 2.0, 5.0, 9.0, 7.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.4140625, -12.9180908203125, -12.422119140625, -11.9261474609375, -11.43017578125, -10.9342041015625, -10.438232421875, -9.9422607421875, -9.4462890625, -8.9503173828125, -8.454345703125, -7.9583740234375, -7.46240234375, -6.9664306640625, -6.470458984375, -5.9744873046875, -5.478515625, -4.9825439453125, -4.486572265625, -3.9906005859375, -3.49462890625, -2.9986572265625, -2.502685546875, -2.0067138671875, -1.5107421875, -1.0147705078125, -0.518798828125, -0.0228271484375, 0.47314453125, 0.9691162109375, 1.465087890625, 1.9610595703125, 2.45703125, 2.9530029296875, 3.448974609375, 3.9449462890625, 4.44091796875, 4.9368896484375, 5.432861328125, 5.9288330078125, 6.4248046875, 6.9207763671875, 7.416748046875, 7.9127197265625, 8.40869140625, 8.9046630859375, 9.400634765625, 9.8966064453125, 10.392578125, 10.8885498046875, 11.384521484375, 11.8804931640625, 12.37646484375, 12.8724365234375, 13.368408203125, 13.8643798828125, 14.3603515625, 14.8563232421875, 15.352294921875, 15.8482666015625, 16.34423828125, 16.8402099609375, 17.336181640625, 17.8321533203125, 18.328125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 6.0, 4.0, 3.0, 4.0, 6.0, 9.0, 12.0, 28.0, 22.0, 27.0, 53.0, 36.0, 69.0, 109.0, 125.0, 191.0, 267.0, 426.0, 621.0, 1023.0, 1844.0, 3525.0, 6804.0, 15238.0, 42193.0, 205703.0, 1542045.0, 2007388.0, 281362.0, 50585.0, 17529.0, 7731.0, 3885.0, 2101.0, 1175.0, 672.0, 440.0, 293.0, 184.0, 131.0, 98.0, 71.0, 58.0, 51.0, 34.0, 24.0, 23.0, 22.0, 13.0, 6.0, 7.0, 4.0, 7.0, 1.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0], "bins": [-26.875, -26.01025390625, -25.1455078125, -24.28076171875, -23.416015625, -22.55126953125, -21.6865234375, -20.82177734375, -19.95703125, -19.09228515625, -18.2275390625, -17.36279296875, -16.498046875, -15.63330078125, -14.7685546875, -13.90380859375, -13.0390625, -12.17431640625, -11.3095703125, -10.44482421875, -9.580078125, -8.71533203125, -7.8505859375, -6.98583984375, -6.12109375, -5.25634765625, -4.3916015625, -3.52685546875, -2.662109375, -1.79736328125, -0.9326171875, -0.06787109375, 0.796875, 1.66162109375, 2.5263671875, 3.39111328125, 4.255859375, 5.12060546875, 5.9853515625, 6.85009765625, 7.71484375, 8.57958984375, 9.4443359375, 10.30908203125, 11.173828125, 12.03857421875, 12.9033203125, 13.76806640625, 14.6328125, 15.49755859375, 16.3623046875, 17.22705078125, 18.091796875, 18.95654296875, 19.8212890625, 20.68603515625, 21.55078125, 22.41552734375, 23.2802734375, 24.14501953125, 25.009765625, 25.87451171875, 26.7392578125, 27.60400390625, 28.46875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 3.0, 5.0, 10.0, 19.0, 24.0, 21.0, 24.0, 46.0, 78.0, 91.0, 164.0, 255.0, 516.0, 803.0, 784.0, 495.0, 282.0, 149.0, 81.0, 64.0, 53.0, 31.0, 21.0, 16.0, 10.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.8125, -41.58837890625, -40.3642578125, -39.14013671875, -37.916015625, -36.69189453125, -35.4677734375, -34.24365234375, -33.01953125, -31.79541015625, -30.5712890625, -29.34716796875, -28.123046875, -26.89892578125, -25.6748046875, -24.45068359375, -23.2265625, -22.00244140625, -20.7783203125, -19.55419921875, -18.330078125, -17.10595703125, -15.8818359375, -14.65771484375, -13.43359375, -12.20947265625, -10.9853515625, -9.76123046875, -8.537109375, -7.31298828125, -6.0888671875, -4.86474609375, -3.640625, -2.41650390625, -1.1923828125, 0.03173828125, 1.255859375, 2.47998046875, 3.7041015625, 4.92822265625, 6.15234375, 7.37646484375, 8.6005859375, 9.82470703125, 11.048828125, 12.27294921875, 13.4970703125, 14.72119140625, 15.9453125, 17.16943359375, 18.3935546875, 19.61767578125, 20.841796875, 22.06591796875, 23.2900390625, 24.51416015625, 25.73828125, 26.96240234375, 28.1865234375, 29.41064453125, 30.634765625, 31.85888671875, 33.0830078125, 34.30712890625, 35.53125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 4.0, 5.0, 5.0, 8.0, 11.0, 13.0, 24.0, 54.0, 72.0, 108.0, 207.0, 498.0, 1584.0, 8216.0, 174524.0, 3943099.0, 58996.0, 4922.0, 1049.0, 410.0, 172.0, 106.0, 54.0, 33.0, 35.0, 26.0, 13.0, 13.0, 6.0, 6.0, 0.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-125.375, -121.24609375, -117.1171875, -112.98828125, -108.859375, -104.73046875, -100.6015625, -96.47265625, -92.34375, -88.21484375, -84.0859375, -79.95703125, -75.828125, -71.69921875, -67.5703125, -63.44140625, -59.3125, -55.18359375, -51.0546875, -46.92578125, -42.796875, -38.66796875, -34.5390625, -30.41015625, -26.28125, -22.15234375, -18.0234375, -13.89453125, -9.765625, -5.63671875, -1.5078125, 2.62109375, 6.75, 10.87890625, 15.0078125, 19.13671875, 23.265625, 27.39453125, 31.5234375, 35.65234375, 39.78125, 43.91015625, 48.0390625, 52.16796875, 56.296875, 60.42578125, 64.5546875, 68.68359375, 72.8125, 76.94140625, 81.0703125, 85.19921875, 89.328125, 93.45703125, 97.5859375, 101.71484375, 105.84375, 109.97265625, 114.1015625, 118.23046875, 122.359375, 126.48828125, 130.6171875, 134.74609375, 138.875]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 9.0, 12.0, 27.0, 71.0, 159.0, 267.0, 257.0, 126.0, 50.0, 18.0, 11.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-254.55860900878906, -246.32427978515625, -238.08995056152344, -229.85562133789062, -221.6212921142578, -213.386962890625, -205.15261840820312, -196.91830444335938, -188.6839599609375, -180.4496307373047, -172.21530151367188, -163.98097229003906, -155.74664306640625, -147.51231384277344, -139.27798461914062, -131.04364013671875, -122.809326171875, -114.57499694824219, -106.34066772460938, -98.10633850097656, -89.87200927734375, -81.63768005371094, -73.4033432006836, -65.16901397705078, -56.93468475341797, -48.700355529785156, -40.466026306152344, -32.231693267822266, -23.997364044189453, -15.76303482055664, -7.5287017822265625, 0.70562744140625, 8.93994140625, 17.174270629882812, 25.408601760864258, 33.6429328918457, 41.877262115478516, 50.11159133911133, 58.345924377441406, 66.58025360107422, 74.81458282470703, 83.04891204833984, 91.28324127197266, 99.517578125, 107.75190734863281, 115.98623657226562, 124.22056579589844, 132.45489501953125, 140.68922424316406, 148.92355346679688, 157.1578826904297, 165.3922119140625, 173.6265411376953, 181.86087036132812, 190.09521484375, 198.32952880859375, 206.56387329101562, 214.79820251464844, 223.03253173828125, 231.26686096191406, 239.50119018554688, 247.7355194091797, 255.9698486328125, 264.2041931152344, 272.4385070800781]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 5.0, 5.0, 10.0, 11.0, 16.0, 17.0, 21.0, 23.0, 13.0, 23.0, 16.0, 24.0, 24.0, 27.0, 29.0, 35.0, 32.0, 27.0, 48.0, 28.0, 27.0, 45.0, 41.0, 29.0, 37.0, 45.0, 30.0, 35.0, 24.0, 24.0, 22.0, 32.0, 22.0, 16.0, 19.0, 12.0, 12.0, 15.0, 8.0, 16.0, 10.0, 7.0, 7.0, 6.0, 11.0, 5.0, 2.0, 1.0, 2.0, 3.0, 2.0], "bins": [-86.99964141845703, -84.47054290771484, -81.94145202636719, -79.412353515625, -76.88325500488281, -74.35415649414062, -71.82505798339844, -69.29596710205078, -66.7668685913086, -64.2377700805664, -61.708675384521484, -59.17958068847656, -56.650482177734375, -54.12138366699219, -51.592288970947266, -49.063194274902344, -46.534095764160156, -44.00499725341797, -41.47590255737305, -38.946807861328125, -36.41770935058594, -33.88861083984375, -31.359516143798828, -28.830419540405273, -26.30132293701172, -23.772226333618164, -21.24312973022461, -18.714033126831055, -16.1849365234375, -13.655839920043945, -11.12674331665039, -8.597646713256836, -6.06854248046875, -3.5394458770751953, -1.0103492736816406, 1.518747329711914, 4.047843933105469, 6.576940536499023, 9.106037139892578, 11.635133743286133, 14.164230346679688, 16.693326950073242, 19.222423553466797, 21.75152015686035, 24.280616760253906, 26.80971336364746, 29.338809967041016, 31.86790657043457, 34.397003173828125, 36.92610168457031, 39.455196380615234, 41.984291076660156, 44.513389587402344, 47.04248809814453, 49.57158279418945, 52.100677490234375, 54.62977600097656, 57.15887451171875, 59.68796920776367, 62.217063903808594, 64.74616241455078, 67.27526092529297, 69.80435180664062, 72.33345031738281, 74.862548828125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 9.0, 12.0, 14.0, 9.0, 14.0, 16.0, 17.0, 17.0, 17.0, 27.0, 20.0, 37.0, 31.0, 40.0, 35.0, 41.0, 47.0, 38.0, 49.0, 52.0, 42.0, 39.0, 40.0, 40.0, 31.0, 24.0, 37.0, 19.0, 34.0, 18.0, 19.0, 11.0, 17.0, 16.0, 8.0, 16.0, 9.0, 8.0, 9.0, 6.0, 3.0, 2.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5078125, -14.0147705078125, -13.521728515625, -13.0286865234375, -12.53564453125, -12.0426025390625, -11.549560546875, -11.0565185546875, -10.5634765625, -10.0704345703125, -9.577392578125, -9.0843505859375, -8.59130859375, -8.0982666015625, -7.605224609375, -7.1121826171875, -6.619140625, -6.1260986328125, -5.633056640625, -5.1400146484375, -4.64697265625, -4.1539306640625, -3.660888671875, -3.1678466796875, -2.6748046875, -2.1817626953125, -1.688720703125, -1.1956787109375, -0.70263671875, -0.2095947265625, 0.283447265625, 0.7764892578125, 1.26953125, 1.7625732421875, 2.255615234375, 2.7486572265625, 3.24169921875, 3.7347412109375, 4.227783203125, 4.7208251953125, 5.2138671875, 5.7069091796875, 6.199951171875, 6.6929931640625, 7.18603515625, 7.6790771484375, 8.172119140625, 8.6651611328125, 9.158203125, 9.6512451171875, 10.144287109375, 10.6373291015625, 11.13037109375, 11.6234130859375, 12.116455078125, 12.6094970703125, 13.1025390625, 13.5955810546875, 14.088623046875, 14.5816650390625, 15.07470703125, 15.5677490234375, 16.060791015625, 16.5538330078125, 17.046875]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 8.0, 5.0, 14.0, 20.0, 23.0, 50.0, 51.0, 86.0, 125.0, 203.0, 262.0, 422.0, 604.0, 828.0, 1233.0, 1849.0, 2826.0, 4154.0, 6204.0, 9636.0, 14995.0, 23201.0, 36201.0, 58353.0, 94616.0, 148274.0, 192784.0, 163235.0, 106790.0, 65888.0, 41187.0, 26008.0, 16504.0, 10861.0, 6946.0, 4666.0, 3014.0, 2103.0, 1384.0, 1022.0, 606.0, 432.0, 309.0, 172.0, 142.0, 80.0, 56.0, 61.0, 30.0, 14.0, 17.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.0693359375, -2.00390625, -1.9384765625, -1.873046875, -1.8076171875, -1.7421875, -1.6767578125, -1.611328125, -1.5458984375, -1.48046875, -1.4150390625, -1.349609375, -1.2841796875, -1.21875, -1.1533203125, -1.087890625, -1.0224609375, -0.95703125, -0.8916015625, -0.826171875, -0.7607421875, -0.6953125, -0.6298828125, -0.564453125, -0.4990234375, -0.43359375, -0.3681640625, -0.302734375, -0.2373046875, -0.171875, -0.1064453125, -0.041015625, 0.0244140625, 0.08984375, 0.1552734375, 0.220703125, 0.2861328125, 0.3515625, 0.4169921875, 0.482421875, 0.5478515625, 0.61328125, 0.6787109375, 0.744140625, 0.8095703125, 0.875, 0.9404296875, 1.005859375, 1.0712890625, 1.13671875, 1.2021484375, 1.267578125, 1.3330078125, 1.3984375, 1.4638671875, 1.529296875, 1.5947265625, 1.66015625, 1.7255859375, 1.791015625, 1.8564453125, 1.921875, 1.9873046875, 2.052734375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 7.0, 8.0, 5.0, 10.0, 4.0, 14.0, 6.0, 11.0, 14.0, 16.0, 15.0, 23.0, 21.0, 23.0, 25.0, 24.0, 24.0, 32.0, 28.0, 51.0, 39.0, 23.0, 43.0, 1060.0, 31.0, 36.0, 31.0, 44.0, 37.0, 31.0, 37.0, 25.0, 31.0, 28.0, 15.0, 17.0, 25.0, 15.0, 16.0, 16.0, 15.0, 12.0, 11.0, 4.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.0234375, -8.7313232421875, -8.439208984375, -8.1470947265625, -7.85498046875, -7.5628662109375, -7.270751953125, -6.9786376953125, -6.6865234375, -6.3944091796875, -6.102294921875, -5.8101806640625, -5.51806640625, -5.2259521484375, -4.933837890625, -4.6417236328125, -4.349609375, -4.0574951171875, -3.765380859375, -3.4732666015625, -3.18115234375, -2.8890380859375, -2.596923828125, -2.3048095703125, -2.0126953125, -1.7205810546875, -1.428466796875, -1.1363525390625, -0.84423828125, -0.5521240234375, -0.260009765625, 0.0321044921875, 0.32421875, 0.6163330078125, 0.908447265625, 1.2005615234375, 1.49267578125, 1.7847900390625, 2.076904296875, 2.3690185546875, 2.6611328125, 2.9532470703125, 3.245361328125, 3.5374755859375, 3.82958984375, 4.1217041015625, 4.413818359375, 4.7059326171875, 4.998046875, 5.2901611328125, 5.582275390625, 5.8743896484375, 6.16650390625, 6.4586181640625, 6.750732421875, 7.0428466796875, 7.3349609375, 7.6270751953125, 7.919189453125, 8.2113037109375, 8.50341796875, 8.7955322265625, 9.087646484375, 9.3797607421875, 9.671875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 6.0, 4.0, 11.0, 7.0, 35.0, 26.0, 47.0, 65.0, 79.0, 125.0, 194.0, 257.0, 341.0, 512.0, 766.0, 1109.0, 1701.0, 2423.0, 3504.0, 4994.0, 7766.0, 11535.0, 17569.0, 27266.0, 42950.0, 69358.0, 110358.0, 167745.0, 1229901.0, 142878.0, 92214.0, 56904.0, 36257.0, 22877.0, 14894.0, 9735.0, 6592.0, 4550.0, 3045.0, 1979.0, 1421.0, 974.0, 662.0, 436.0, 342.0, 207.0, 158.0, 124.0, 71.0, 53.0, 34.0, 28.0, 19.0, 10.0, 9.0, 6.0, 2.0, 2.0, 3.0, 3.0], "bins": [-1.33984375, -1.298370361328125, -1.25689697265625, -1.215423583984375, -1.1739501953125, -1.132476806640625, -1.09100341796875, -1.049530029296875, -1.008056640625, -0.966583251953125, -0.92510986328125, -0.883636474609375, -0.8421630859375, -0.800689697265625, -0.75921630859375, -0.717742919921875, -0.67626953125, -0.634796142578125, -0.59332275390625, -0.551849365234375, -0.5103759765625, -0.468902587890625, -0.42742919921875, -0.385955810546875, -0.344482421875, -0.303009033203125, -0.26153564453125, -0.220062255859375, -0.1785888671875, -0.137115478515625, -0.09564208984375, -0.054168701171875, -0.0126953125, 0.028778076171875, 0.07025146484375, 0.111724853515625, 0.1531982421875, 0.194671630859375, 0.23614501953125, 0.277618408203125, 0.319091796875, 0.360565185546875, 0.40203857421875, 0.443511962890625, 0.4849853515625, 0.526458740234375, 0.56793212890625, 0.609405517578125, 0.65087890625, 0.692352294921875, 0.73382568359375, 0.775299072265625, 0.8167724609375, 0.858245849609375, 0.89971923828125, 0.941192626953125, 0.982666015625, 1.024139404296875, 1.06561279296875, 1.107086181640625, 1.1485595703125, 1.190032958984375, 1.23150634765625, 1.272979736328125, 1.314453125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 7.0, 2.0, 1.0, 6.0, 8.0, 7.0, 4.0, 6.0, 9.0, 2.0, 12.0, 11.0, 16.0, 20.0, 17.0, 31.0, 32.0, 33.0, 39.0, 53.0, 78.0, 125.0, 97.0, 79.0, 62.0, 44.0, 38.0, 34.0, 19.0, 21.0, 17.0, 18.0, 12.0, 9.0, 9.0, 11.0, 3.0, 2.0, 4.0, 6.0, 4.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.033294677734375, -0.03213977813720703, -0.030984878540039062, -0.029829978942871094, -0.028675079345703125, -0.027520179748535156, -0.026365280151367188, -0.02521038055419922, -0.02405548095703125, -0.02290058135986328, -0.021745681762695312, -0.020590782165527344, -0.019435882568359375, -0.018280982971191406, -0.017126083374023438, -0.01597118377685547, -0.0148162841796875, -0.013661384582519531, -0.012506484985351562, -0.011351585388183594, -0.010196685791015625, -0.009041786193847656, -0.007886886596679688, -0.006731986999511719, -0.00557708740234375, -0.004422187805175781, -0.0032672882080078125, -0.0021123886108398438, -0.000957489013671875, 0.00019741058349609375, 0.0013523101806640625, 0.0025072097778320312, 0.003662109375, 0.004817008972167969, 0.0059719085693359375, 0.007126808166503906, 0.008281707763671875, 0.009436607360839844, 0.010591506958007812, 0.011746406555175781, 0.01290130615234375, 0.014056205749511719, 0.015211105346679688, 0.016366004943847656, 0.017520904541015625, 0.018675804138183594, 0.019830703735351562, 0.02098560333251953, 0.0221405029296875, 0.02329540252685547, 0.024450302124023438, 0.025605201721191406, 0.026760101318359375, 0.027915000915527344, 0.029069900512695312, 0.03022480010986328, 0.03137969970703125, 0.03253459930419922, 0.03368949890136719, 0.034844398498535156, 0.035999298095703125, 0.037154197692871094, 0.03830909729003906, 0.03946399688720703, 0.040618896484375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 5.0, 6.0, 4.0, 2.0, 6.0, 13.0, 11.0, 11.0, 24.0, 24.0, 33.0, 34.0, 53.0, 82.0, 111.0, 168.0, 328.0, 819.0, 80248.0, 964046.0, 1478.0, 348.0, 228.0, 132.0, 81.0, 63.0, 32.0, 27.0, 29.0, 21.0, 18.0, 9.0, 15.0, 10.0, 9.0, 6.0, 10.0, 4.0, 2.0, 2.0, 7.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.87255859375, -0.8477325439453125, -0.822906494140625, -0.7980804443359375, -0.77325439453125, -0.7484283447265625, -0.723602294921875, -0.6987762451171875, -0.6739501953125, -0.6491241455078125, -0.624298095703125, -0.5994720458984375, -0.57464599609375, -0.5498199462890625, -0.524993896484375, -0.5001678466796875, -0.475341796875, -0.4505157470703125, -0.425689697265625, -0.4008636474609375, -0.37603759765625, -0.3512115478515625, -0.326385498046875, -0.3015594482421875, -0.2767333984375, -0.2519073486328125, -0.227081298828125, -0.2022552490234375, -0.17742919921875, -0.1526031494140625, -0.127777099609375, -0.1029510498046875, -0.078125, -0.0532989501953125, -0.028472900390625, -0.0036468505859375, 0.02117919921875, 0.0460052490234375, 0.070831298828125, 0.0956573486328125, 0.1204833984375, 0.1453094482421875, 0.170135498046875, 0.1949615478515625, 0.21978759765625, 0.2446136474609375, 0.269439697265625, 0.2942657470703125, 0.319091796875, 0.3439178466796875, 0.368743896484375, 0.3935699462890625, 0.41839599609375, 0.4432220458984375, 0.468048095703125, 0.4928741455078125, 0.5177001953125, 0.5425262451171875, 0.567352294921875, 0.5921783447265625, 0.61700439453125, 0.6418304443359375, 0.666656494140625, 0.6914825439453125, 0.71630859375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 79.0, 928.0, 9.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2220216691493988, -0.19803713262081146, -0.17405261099338531, -0.15006807446479797, -0.12608355283737183, -0.10209901630878448, -0.07811447978019714, -0.054129958152770996, -0.030145421624183655, -0.006160890683531761, 0.017823640257120132, 0.041808173060417175, 0.06579270213842392, 0.08977723121643066, 0.113761767745018, 0.13774628937244415, 0.1617308259010315, 0.18571536242961884, 0.20969988405704498, 0.23368442058563232, 0.25766894221305847, 0.2816534638404846, 0.30563801527023315, 0.3296225368976593, 0.35360705852508545, 0.3775915801525116, 0.40157613158226013, 0.4255606532096863, 0.4495451748371124, 0.4735296964645386, 0.4975142478942871, 0.5214987993240356, 0.5454832911491394, 0.5694678425788879, 0.5934523344039917, 0.6174368858337402, 0.6414214372634888, 0.6654059290885925, 0.6893904805183411, 0.7133749723434448, 0.7373595237731934, 0.7613440752029419, 0.7853285670280457, 0.8093131184577942, 0.8332976698875427, 0.8572821617126465, 0.881266713142395, 0.9052512645721436, 0.9292358160018921, 0.9532203674316406, 0.9772048592567444, 1.0011894702911377, 1.0251739025115967, 1.0491584539413452, 1.0731430053710938, 1.0971275568008423, 1.1211119890213013, 1.1450965404510498, 1.1690810918807983, 1.1930656433105469, 1.2170500755310059, 1.2410346269607544, 1.265019178390503, 1.2890037298202515, 1.31298828125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 5.0, 9.0, 4.0, 8.0, 11.0, 17.0, 19.0, 21.0, 19.0, 35.0, 34.0, 26.0, 41.0, 30.0, 42.0, 46.0, 45.0, 52.0, 40.0, 49.0, 44.0, 46.0, 45.0, 28.0, 51.0, 24.0, 28.0, 22.0, 28.0, 30.0, 13.0, 14.0, 14.0, 10.0, 14.0, 6.0, 7.0, 6.0, 7.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06216925382614136, -0.06041756272315979, -0.05866587162017822, -0.05691417679190636, -0.05516248568892479, -0.05341079458594322, -0.051659099757671356, -0.04990740865468979, -0.04815571755170822, -0.046404026448726654, -0.04465233534574509, -0.04290064051747322, -0.04114894941449165, -0.039397258311510086, -0.03764556348323822, -0.03589387238025665, -0.034142181277275085, -0.03239049017429352, -0.0306387972086668, -0.028887104243040085, -0.027135413140058517, -0.02538372203707695, -0.023632029071450233, -0.021880336105823517, -0.02012864500284195, -0.018376953899860382, -0.016625260934233665, -0.014873568899929523, -0.013121876865625381, -0.01137018483132124, -0.009618492797017097, -0.007866800762712955, -0.0061151087284088135, -0.0043634166941046715, -0.0026117246598005295, -0.0008600326254963875, 0.0008916594088077545, 0.0026433514431118965, 0.0043950434774160385, 0.0061467355117201805, 0.007898427546024323, 0.009650119580328465, 0.011401811614632607, 0.013153503648936749, 0.01490519568324089, 0.016656886786222458, 0.018408579751849174, 0.02016027271747589, 0.02191196382045746, 0.023663654923439026, 0.025415347889065742, 0.02716704085469246, 0.028918731957674026, 0.030670423060655594, 0.03242211788892746, 0.03417380899190903, 0.035925500094890594, 0.03767719119787216, 0.03942888230085373, 0.041180577129125595, 0.04293226823210716, 0.04468395933508873, 0.046435654163360596, 0.04818734526634216, 0.04993903636932373]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 4.0, 9.0, 12.0, 14.0, 9.0, 14.0, 16.0, 17.0, 17.0, 16.0, 28.0, 20.0, 35.0, 33.0, 40.0, 34.0, 42.0, 47.0, 38.0, 49.0, 52.0, 42.0, 39.0, 40.0, 40.0, 31.0, 24.0, 37.0, 19.0, 34.0, 17.0, 20.0, 11.0, 17.0, 16.0, 8.0, 16.0, 9.0, 8.0, 9.0, 6.0, 3.0, 2.0, 8.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5078125, -14.0147705078125, -13.521728515625, -13.0286865234375, -12.53564453125, -12.0426025390625, -11.549560546875, -11.0565185546875, -10.5634765625, -10.0704345703125, -9.577392578125, -9.0843505859375, -8.59130859375, -8.0982666015625, -7.605224609375, -7.1121826171875, -6.619140625, -6.1260986328125, -5.633056640625, -5.1400146484375, -4.64697265625, -4.1539306640625, -3.660888671875, -3.1678466796875, -2.6748046875, -2.1817626953125, -1.688720703125, -1.1956787109375, -0.70263671875, -0.2095947265625, 0.283447265625, 0.7764892578125, 1.26953125, 1.7625732421875, 2.255615234375, 2.7486572265625, 3.24169921875, 3.7347412109375, 4.227783203125, 4.7208251953125, 5.2138671875, 5.7069091796875, 6.199951171875, 6.6929931640625, 7.18603515625, 7.6790771484375, 8.172119140625, 8.6651611328125, 9.158203125, 9.6512451171875, 10.144287109375, 10.6373291015625, 11.13037109375, 11.6234130859375, 12.116455078125, 12.6094970703125, 13.1025390625, 13.5955810546875, 14.088623046875, 14.5816650390625, 15.07470703125, 15.5677490234375, 16.060791015625, 16.5538330078125, 17.046875]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 3.0, 8.0, 10.0, 14.0, 26.0, 32.0, 37.0, 40.0, 43.0, 80.0, 103.0, 135.0, 189.0, 300.0, 495.0, 753.0, 1101.0, 1767.0, 3100.0, 6164.0, 15083.0, 79838.0, 829055.0, 80390.0, 15412.0, 6122.0, 3116.0, 1783.0, 1132.0, 722.0, 453.0, 306.0, 221.0, 151.0, 81.0, 67.0, 38.0, 38.0, 33.0, 31.0, 16.0, 15.0, 17.0, 5.0, 6.0, 7.0, 7.0, 6.0, 4.0, 2.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-28.328125, -27.367919921875, -26.40771484375, -25.447509765625, -24.4873046875, -23.527099609375, -22.56689453125, -21.606689453125, -20.646484375, -19.686279296875, -18.72607421875, -17.765869140625, -16.8056640625, -15.845458984375, -14.88525390625, -13.925048828125, -12.96484375, -12.004638671875, -11.04443359375, -10.084228515625, -9.1240234375, -8.163818359375, -7.20361328125, -6.243408203125, -5.283203125, -4.322998046875, -3.36279296875, -2.402587890625, -1.4423828125, -0.482177734375, 0.47802734375, 1.438232421875, 2.3984375, 3.358642578125, 4.31884765625, 5.279052734375, 6.2392578125, 7.199462890625, 8.15966796875, 9.119873046875, 10.080078125, 11.040283203125, 12.00048828125, 12.960693359375, 13.9208984375, 14.881103515625, 15.84130859375, 16.801513671875, 17.76171875, 18.721923828125, 19.68212890625, 20.642333984375, 21.6025390625, 22.562744140625, 23.52294921875, 24.483154296875, 25.443359375, 26.403564453125, 27.36376953125, 28.323974609375, 29.2841796875, 30.244384765625, 31.20458984375, 32.164794921875, 33.125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 6.0, 7.0, 6.0, 8.0, 12.0, 15.0, 15.0, 14.0, 20.0, 24.0, 22.0, 35.0, 37.0, 51.0, 39.0, 52.0, 50.0, 97.0, 510.0, 1571.0, 84.0, 36.0, 55.0, 45.0, 43.0, 31.0, 35.0, 19.0, 16.0, 16.0, 11.0, 12.0, 9.0, 7.0, 15.0, 7.0, 5.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-60.0, -58.33349609375, -56.6669921875, -55.00048828125, -53.333984375, -51.66748046875, -50.0009765625, -48.33447265625, -46.66796875, -45.00146484375, -43.3349609375, -41.66845703125, -40.001953125, -38.33544921875, -36.6689453125, -35.00244140625, -33.3359375, -31.66943359375, -30.0029296875, -28.33642578125, -26.669921875, -25.00341796875, -23.3369140625, -21.67041015625, -20.00390625, -18.33740234375, -16.6708984375, -15.00439453125, -13.337890625, -11.67138671875, -10.0048828125, -8.33837890625, -6.671875, -5.00537109375, -3.3388671875, -1.67236328125, -0.005859375, 1.66064453125, 3.3271484375, 4.99365234375, 6.66015625, 8.32666015625, 9.9931640625, 11.65966796875, 13.326171875, 14.99267578125, 16.6591796875, 18.32568359375, 19.9921875, 21.65869140625, 23.3251953125, 24.99169921875, 26.658203125, 28.32470703125, 29.9912109375, 31.65771484375, 33.32421875, 34.99072265625, 36.6572265625, 38.32373046875, 39.990234375, 41.65673828125, 43.3232421875, 44.98974609375, 46.65625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 6.0, 7.0, 5.0, 5.0, 15.0, 7.0, 12.0, 17.0, 15.0, 15.0, 19.0, 32.0, 52.0, 58.0, 83.0, 119.0, 272.0, 905.0, 6549.0, 2945620.0, 186451.0, 4103.0, 622.0, 231.0, 124.0, 87.0, 50.0, 49.0, 40.0, 26.0, 22.0, 14.0, 19.0, 13.0, 9.0, 10.0, 5.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-105.25, -101.4765625, -97.703125, -93.9296875, -90.15625, -86.3828125, -82.609375, -78.8359375, -75.0625, -71.2890625, -67.515625, -63.7421875, -59.96875, -56.1953125, -52.421875, -48.6484375, -44.875, -41.1015625, -37.328125, -33.5546875, -29.78125, -26.0078125, -22.234375, -18.4609375, -14.6875, -10.9140625, -7.140625, -3.3671875, 0.40625, 4.1796875, 7.953125, 11.7265625, 15.5, 19.2734375, 23.046875, 26.8203125, 30.59375, 34.3671875, 38.140625, 41.9140625, 45.6875, 49.4609375, 53.234375, 57.0078125, 60.78125, 64.5546875, 68.328125, 72.1015625, 75.875, 79.6484375, 83.421875, 87.1953125, 90.96875, 94.7421875, 98.515625, 102.2890625, 106.0625, 109.8359375, 113.609375, 117.3828125, 121.15625, 124.9296875, 128.703125, 132.4765625, 136.25]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 40.0, 214.0, 478.0, 220.0, 48.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.16341781616211, -35.44236373901367, -30.721309661865234, -26.000255584716797, -21.27920150756836, -16.558147430419922, -11.837093353271484, -7.116039276123047, -2.3949851989746094, 2.326068878173828, 7.047122955322266, 11.768177032470703, 16.48923110961914, 21.210285186767578, 25.931339263916016, 30.652393341064453, 35.37344741821289, 40.09450149536133, 44.815555572509766, 49.5366096496582, 54.25766372680664, 58.97871780395508, 63.699771881103516, 68.42082214355469, 73.14187622070312, 77.86293029785156, 82.583984375, 87.30503845214844, 92.02609252929688, 96.74714660644531, 101.46820068359375, 106.18925476074219, 110.91030883789062, 115.63136291503906, 120.3524169921875, 125.07347106933594, 129.79452514648438, 134.5155792236328, 139.23663330078125, 143.9576873779297, 148.67874145507812, 153.39979553222656, 158.120849609375, 162.84190368652344, 167.56295776367188, 172.2840118408203, 177.00506591796875, 181.7261199951172, 186.44717407226562, 191.16822814941406, 195.8892822265625, 200.61033630371094, 205.33139038085938, 210.0524444580078, 214.77349853515625, 219.4945526123047, 224.21560668945312, 228.93666076660156, 233.65771484375, 238.37876892089844, 243.09982299804688, 247.8208770751953, 252.54193115234375, 257.26300048828125, 261.9840393066406]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 4.0, 8.0, 5.0, 9.0, 14.0, 13.0, 16.0, 18.0, 25.0, 13.0, 23.0, 21.0, 31.0, 33.0, 29.0, 26.0, 43.0, 42.0, 33.0, 28.0, 29.0, 39.0, 36.0, 42.0, 48.0, 33.0, 32.0, 31.0, 33.0, 30.0, 25.0, 31.0, 31.0, 20.0, 24.0, 16.0, 18.0, 9.0, 5.0, 7.0, 9.0, 4.0, 2.0, 3.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-109.09172821044922, -105.55287170410156, -102.01400756835938, -98.47515106201172, -94.93629455566406, -91.3974380493164, -87.85858154296875, -84.31971740722656, -80.7808609008789, -77.24200439453125, -73.70314025878906, -70.1642837524414, -66.62542724609375, -63.086570739746094, -59.54771041870117, -56.00885009765625, -52.469993591308594, -48.93113708496094, -45.392276763916016, -41.853416442871094, -38.31455993652344, -34.77570343017578, -31.23684310913086, -27.69798469543457, -24.15912628173828, -20.620267868041992, -17.081409454345703, -13.542551040649414, -10.003692626953125, -6.464834213256836, -2.925975799560547, 0.6128826141357422, 4.1517486572265625, 7.690607070922852, 11.22946548461914, 14.76832389831543, 18.30718231201172, 21.846040725708008, 25.384899139404297, 28.923757553100586, 32.462615966796875, 36.00147247314453, 39.54033279418945, 43.079193115234375, 46.61804962158203, 50.15690612792969, 53.69576644897461, 57.23462677001953, 60.77348327636719, 64.31233978271484, 67.8511962890625, 71.39006042480469, 74.92891693115234, 78.4677734375, 82.00663757324219, 85.54549407958984, 89.0843505859375, 92.62320709228516, 96.16206359863281, 99.700927734375, 103.23978424072266, 106.77864074707031, 110.3175048828125, 113.85636138916016, 117.39521789550781]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 6.0, 9.0, 5.0, 16.0, 12.0, 18.0, 15.0, 15.0, 22.0, 15.0, 27.0, 24.0, 34.0, 35.0, 32.0, 42.0, 46.0, 46.0, 49.0, 47.0, 40.0, 46.0, 41.0, 41.0, 39.0, 30.0, 32.0, 22.0, 26.0, 21.0, 26.0, 17.0, 18.0, 11.0, 14.0, 11.0, 15.0, 6.0, 10.0, 3.0, 7.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9609375, -15.4285888671875, -14.896240234375, -14.3638916015625, -13.83154296875, -13.2991943359375, -12.766845703125, -12.2344970703125, -11.7021484375, -11.1697998046875, -10.637451171875, -10.1051025390625, -9.57275390625, -9.0404052734375, -8.508056640625, -7.9757080078125, -7.443359375, -6.9110107421875, -6.378662109375, -5.8463134765625, -5.31396484375, -4.7816162109375, -4.249267578125, -3.7169189453125, -3.1845703125, -2.6522216796875, -2.119873046875, -1.5875244140625, -1.05517578125, -0.5228271484375, 0.009521484375, 0.5418701171875, 1.07421875, 1.6065673828125, 2.138916015625, 2.6712646484375, 3.20361328125, 3.7359619140625, 4.268310546875, 4.8006591796875, 5.3330078125, 5.8653564453125, 6.397705078125, 6.9300537109375, 7.46240234375, 7.9947509765625, 8.527099609375, 9.0594482421875, 9.591796875, 10.1241455078125, 10.656494140625, 11.1888427734375, 11.72119140625, 12.2535400390625, 12.785888671875, 13.3182373046875, 13.8505859375, 14.3829345703125, 14.915283203125, 15.4476318359375, 15.97998046875, 16.5123291015625, 17.044677734375, 17.5770263671875, 18.109375]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 15.0, 3.0, 12.0, 19.0, 17.0, 30.0, 35.0, 55.0, 95.0, 154.0, 253.0, 528.0, 1022.0, 2143.0, 4781.0, 11839.0, 38206.0, 233782.0, 1949356.0, 1712486.0, 187415.0, 32706.0, 10530.0, 4500.0, 2028.0, 958.0, 551.0, 283.0, 149.0, 88.0, 70.0, 42.0, 36.0, 22.0, 13.0, 10.0, 11.0, 4.0, 7.0, 6.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-35.0, -33.93798828125, -32.8759765625, -31.81396484375, -30.751953125, -29.68994140625, -28.6279296875, -27.56591796875, -26.50390625, -25.44189453125, -24.3798828125, -23.31787109375, -22.255859375, -21.19384765625, -20.1318359375, -19.06982421875, -18.0078125, -16.94580078125, -15.8837890625, -14.82177734375, -13.759765625, -12.69775390625, -11.6357421875, -10.57373046875, -9.51171875, -8.44970703125, -7.3876953125, -6.32568359375, -5.263671875, -4.20166015625, -3.1396484375, -2.07763671875, -1.015625, 0.04638671875, 1.1083984375, 2.17041015625, 3.232421875, 4.29443359375, 5.3564453125, 6.41845703125, 7.48046875, 8.54248046875, 9.6044921875, 10.66650390625, 11.728515625, 12.79052734375, 13.8525390625, 14.91455078125, 15.9765625, 17.03857421875, 18.1005859375, 19.16259765625, 20.224609375, 21.28662109375, 22.3486328125, 23.41064453125, 24.47265625, 25.53466796875, 26.5966796875, 27.65869140625, 28.720703125, 29.78271484375, 30.8447265625, 31.90673828125, 32.96875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 12.0, 9.0, 12.0, 17.0, 32.0, 38.0, 48.0, 79.0, 113.0, 157.0, 325.0, 598.0, 763.0, 699.0, 470.0, 257.0, 138.0, 85.0, 57.0, 40.0, 36.0, 18.0, 19.0, 16.0, 3.0, 8.0, 4.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-51.625, -50.41845703125, -49.2119140625, -48.00537109375, -46.798828125, -45.59228515625, -44.3857421875, -43.17919921875, -41.97265625, -40.76611328125, -39.5595703125, -38.35302734375, -37.146484375, -35.93994140625, -34.7333984375, -33.52685546875, -32.3203125, -31.11376953125, -29.9072265625, -28.70068359375, -27.494140625, -26.28759765625, -25.0810546875, -23.87451171875, -22.66796875, -21.46142578125, -20.2548828125, -19.04833984375, -17.841796875, -16.63525390625, -15.4287109375, -14.22216796875, -13.015625, -11.80908203125, -10.6025390625, -9.39599609375, -8.189453125, -6.98291015625, -5.7763671875, -4.56982421875, -3.36328125, -2.15673828125, -0.9501953125, 0.25634765625, 1.462890625, 2.66943359375, 3.8759765625, 5.08251953125, 6.2890625, 7.49560546875, 8.7021484375, 9.90869140625, 11.115234375, 12.32177734375, 13.5283203125, 14.73486328125, 15.94140625, 17.14794921875, 18.3544921875, 19.56103515625, 20.767578125, 21.97412109375, 23.1806640625, 24.38720703125, 25.59375]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 3.0, 10.0, 4.0, 9.0, 17.0, 37.0, 39.0, 78.0, 98.0, 163.0, 321.0, 825.0, 2465.0, 12273.0, 139031.0, 3772167.0, 244627.0, 17226.0, 3008.0, 936.0, 391.0, 212.0, 115.0, 83.0, 40.0, 35.0, 17.0, 20.0, 14.0, 5.0, 2.0, 2.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.6875, -61.6904296875, -58.693359375, -55.6962890625, -52.69921875, -49.7021484375, -46.705078125, -43.7080078125, -40.7109375, -37.7138671875, -34.716796875, -31.7197265625, -28.72265625, -25.7255859375, -22.728515625, -19.7314453125, -16.734375, -13.7373046875, -10.740234375, -7.7431640625, -4.74609375, -1.7490234375, 1.248046875, 4.2451171875, 7.2421875, 10.2392578125, 13.236328125, 16.2333984375, 19.23046875, 22.2275390625, 25.224609375, 28.2216796875, 31.21875, 34.2158203125, 37.212890625, 40.2099609375, 43.20703125, 46.2041015625, 49.201171875, 52.1982421875, 55.1953125, 58.1923828125, 61.189453125, 64.1865234375, 67.18359375, 70.1806640625, 73.177734375, 76.1748046875, 79.171875, 82.1689453125, 85.166015625, 88.1630859375, 91.16015625, 94.1572265625, 97.154296875, 100.1513671875, 103.1484375, 106.1455078125, 109.142578125, 112.1396484375, 115.13671875, 118.1337890625, 121.130859375, 124.1279296875, 127.125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 23.0, 55.0, 182.0, 317.0, 260.0, 118.0, 43.0, 8.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.6817626953125, -96.8416519165039, -87.00153350830078, -77.16142272949219, -67.32130432128906, -57.48119354248047, -47.641082763671875, -37.80096435546875, -27.960853576660156, -18.120738983154297, -8.28062629699707, 1.5594863891601562, 11.399600982666016, 21.239715576171875, 31.07982635498047, 40.919944763183594, 50.76005554199219, 60.60017013549805, 70.4402847290039, 80.2803955078125, 90.12051391601562, 99.96062469482422, 109.80073547363281, 119.64085388183594, 129.48095703125, 139.32107543945312, 149.1611785888672, 159.0012969970703, 168.84141540527344, 178.6815185546875, 188.52163696289062, 198.36175537109375, 208.20187377929688, 218.0419921875, 227.88209533691406, 237.7222137451172, 247.5623321533203, 257.4024353027344, 267.2425537109375, 277.0826721191406, 286.92279052734375, 296.7629089355469, 306.60302734375, 316.443115234375, 326.2832336425781, 336.12335205078125, 345.9634704589844, 355.8035888671875, 365.6436767578125, 375.4837951660156, 385.32391357421875, 395.16400146484375, 405.0041198730469, 414.84423828125, 424.6843566894531, 434.52447509765625, 444.3645935058594, 454.2047119140625, 464.0448303222656, 473.88494873046875, 483.72503662109375, 493.5651550292969, 503.4052734375, 513.245361328125, 523.0855102539062]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 5.0, 3.0, 3.0, 4.0, 4.0, 8.0, 11.0, 5.0, 15.0, 7.0, 19.0, 14.0, 28.0, 22.0, 28.0, 25.0, 28.0, 24.0, 26.0, 31.0, 44.0, 34.0, 30.0, 38.0, 55.0, 40.0, 43.0, 34.0, 38.0, 44.0, 26.0, 42.0, 20.0, 23.0, 25.0, 24.0, 17.0, 16.0, 14.0, 22.0, 12.0, 12.0, 5.0, 9.0, 10.0, 5.0, 5.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-90.29818725585938, -87.43455505371094, -84.5709228515625, -81.70728302001953, -78.8436508178711, -75.98001861572266, -73.11637878417969, -70.25274658203125, -67.38911437988281, -64.52548217773438, -61.66184616088867, -58.79821014404297, -55.93457794189453, -53.070945739746094, -50.20730972290039, -47.34367370605469, -44.48004150390625, -41.61640930175781, -38.75277328491211, -35.889137268066406, -33.02550506591797, -30.1618709564209, -27.298236846923828, -24.434602737426758, -21.570968627929688, -18.707334518432617, -15.843700408935547, -12.980066299438477, -10.116432189941406, -7.252798080444336, -4.389163970947266, -1.5255298614501953, 1.338104248046875, 4.201738357543945, 7.065372467041016, 9.929006576538086, 12.792640686035156, 15.656274795532227, 18.519908905029297, 21.383543014526367, 24.247177124023438, 27.110811233520508, 29.974445343017578, 32.83808135986328, 35.70171356201172, 38.565345764160156, 41.42898178100586, 44.29261779785156, 47.15625, 50.01988220214844, 52.88351821899414, 55.747154235839844, 58.61078643798828, 61.47441864013672, 64.33805847167969, 67.20169067382812, 70.06532287597656, 72.928955078125, 75.79258728027344, 78.6562271118164, 81.51985931396484, 84.38349151611328, 87.24713134765625, 90.11076354980469, 92.97439575195312]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 6.0, 7.0, 6.0, 8.0, 14.0, 7.0, 14.0, 17.0, 19.0, 20.0, 28.0, 31.0, 33.0, 37.0, 46.0, 31.0, 33.0, 37.0, 44.0, 57.0, 48.0, 40.0, 41.0, 41.0, 44.0, 48.0, 27.0, 32.0, 26.0, 26.0, 24.0, 19.0, 21.0, 12.0, 15.0, 12.0, 11.0, 6.0, 7.0, 10.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.71875, -16.1484375, -15.578125, -15.0078125, -14.4375, -13.8671875, -13.296875, -12.7265625, -12.15625, -11.5859375, -11.015625, -10.4453125, -9.875, -9.3046875, -8.734375, -8.1640625, -7.59375, -7.0234375, -6.453125, -5.8828125, -5.3125, -4.7421875, -4.171875, -3.6015625, -3.03125, -2.4609375, -1.890625, -1.3203125, -0.75, -0.1796875, 0.390625, 0.9609375, 1.53125, 2.1015625, 2.671875, 3.2421875, 3.8125, 4.3828125, 4.953125, 5.5234375, 6.09375, 6.6640625, 7.234375, 7.8046875, 8.375, 8.9453125, 9.515625, 10.0859375, 10.65625, 11.2265625, 11.796875, 12.3671875, 12.9375, 13.5078125, 14.078125, 14.6484375, 15.21875, 15.7890625, 16.359375, 16.9296875, 17.5, 18.0703125, 18.640625, 19.2109375, 19.78125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 4.0, 10.0, 17.0, 30.0, 28.0, 42.0, 61.0, 91.0, 141.0, 231.0, 335.0, 544.0, 802.0, 1172.0, 2024.0, 3120.0, 4852.0, 7819.0, 12196.0, 19614.0, 31750.0, 52371.0, 86873.0, 138996.0, 197384.0, 180678.0, 118911.0, 72402.0, 44045.0, 26704.0, 16876.0, 10341.0, 6469.0, 4198.0, 2723.0, 1637.0, 1081.0, 704.0, 419.0, 265.0, 178.0, 147.0, 89.0, 69.0, 29.0, 28.0, 17.0, 11.0, 8.0, 8.0, 7.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-2.291015625, -2.221221923828125, -2.15142822265625, -2.081634521484375, -2.0118408203125, -1.942047119140625, -1.87225341796875, -1.802459716796875, -1.732666015625, -1.662872314453125, -1.59307861328125, -1.523284912109375, -1.4534912109375, -1.383697509765625, -1.31390380859375, -1.244110107421875, -1.17431640625, -1.104522705078125, -1.03472900390625, -0.964935302734375, -0.8951416015625, -0.825347900390625, -0.75555419921875, -0.685760498046875, -0.615966796875, -0.546173095703125, -0.47637939453125, -0.406585693359375, -0.3367919921875, -0.266998291015625, -0.19720458984375, -0.127410888671875, -0.0576171875, 0.012176513671875, 0.08197021484375, 0.151763916015625, 0.2215576171875, 0.291351318359375, 0.36114501953125, 0.430938720703125, 0.500732421875, 0.570526123046875, 0.64031982421875, 0.710113525390625, 0.7799072265625, 0.849700927734375, 0.91949462890625, 0.989288330078125, 1.05908203125, 1.128875732421875, 1.19866943359375, 1.268463134765625, 1.3382568359375, 1.408050537109375, 1.47784423828125, 1.547637939453125, 1.617431640625, 1.687225341796875, 1.75701904296875, 1.826812744140625, 1.8966064453125, 1.966400146484375, 2.03619384765625, 2.105987548828125, 2.17578125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 3.0, 0.0, 4.0, 4.0, 5.0, 11.0, 7.0, 9.0, 9.0, 16.0, 16.0, 19.0, 20.0, 40.0, 15.0, 32.0, 42.0, 32.0, 32.0, 39.0, 36.0, 29.0, 36.0, 48.0, 1057.0, 45.0, 38.0, 36.0, 34.0, 37.0, 25.0, 32.0, 20.0, 28.0, 18.0, 26.0, 13.0, 20.0, 23.0, 12.0, 10.0, 10.0, 12.0, 6.0, 0.0, 3.0, 4.0, 2.0, 3.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-10.4921875, -10.1650390625, -9.837890625, -9.5107421875, -9.18359375, -8.8564453125, -8.529296875, -8.2021484375, -7.875, -7.5478515625, -7.220703125, -6.8935546875, -6.56640625, -6.2392578125, -5.912109375, -5.5849609375, -5.2578125, -4.9306640625, -4.603515625, -4.2763671875, -3.94921875, -3.6220703125, -3.294921875, -2.9677734375, -2.640625, -2.3134765625, -1.986328125, -1.6591796875, -1.33203125, -1.0048828125, -0.677734375, -0.3505859375, -0.0234375, 0.3037109375, 0.630859375, 0.9580078125, 1.28515625, 1.6123046875, 1.939453125, 2.2666015625, 2.59375, 2.9208984375, 3.248046875, 3.5751953125, 3.90234375, 4.2294921875, 4.556640625, 4.8837890625, 5.2109375, 5.5380859375, 5.865234375, 6.1923828125, 6.51953125, 6.8466796875, 7.173828125, 7.5009765625, 7.828125, 8.1552734375, 8.482421875, 8.8095703125, 9.13671875, 9.4638671875, 9.791015625, 10.1181640625, 10.4453125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 5.0, 6.0, 5.0, 10.0, 9.0, 19.0, 25.0, 35.0, 65.0, 104.0, 133.0, 197.0, 283.0, 388.0, 595.0, 900.0, 1344.0, 2110.0, 3088.0, 4718.0, 7200.0, 11483.0, 18208.0, 29490.0, 49203.0, 82090.0, 136959.0, 1219943.0, 216907.0, 122380.0, 73075.0, 43764.0, 26457.0, 16543.0, 10285.0, 6614.0, 4220.0, 2754.0, 1826.0, 1224.0, 812.0, 569.0, 327.0, 256.0, 156.0, 111.0, 74.0, 52.0, 30.0, 33.0, 25.0, 19.0, 6.0, 4.0, 7.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.5751953125, -1.5272979736328125, -1.479400634765625, -1.4315032958984375, -1.38360595703125, -1.3357086181640625, -1.287811279296875, -1.2399139404296875, -1.1920166015625, -1.1441192626953125, -1.096221923828125, -1.0483245849609375, -1.00042724609375, -0.9525299072265625, -0.904632568359375, -0.8567352294921875, -0.808837890625, -0.7609405517578125, -0.713043212890625, -0.6651458740234375, -0.61724853515625, -0.5693511962890625, -0.521453857421875, -0.4735565185546875, -0.4256591796875, -0.3777618408203125, -0.329864501953125, -0.2819671630859375, -0.23406982421875, -0.1861724853515625, -0.138275146484375, -0.0903778076171875, -0.04248046875, 0.0054168701171875, 0.053314208984375, 0.1012115478515625, 0.14910888671875, 0.1970062255859375, 0.244903564453125, 0.2928009033203125, 0.3406982421875, 0.3885955810546875, 0.436492919921875, 0.4843902587890625, 0.53228759765625, 0.5801849365234375, 0.628082275390625, 0.6759796142578125, 0.723876953125, 0.7717742919921875, 0.819671630859375, 0.8675689697265625, 0.91546630859375, 0.9633636474609375, 1.011260986328125, 1.0591583251953125, 1.1070556640625, 1.1549530029296875, 1.202850341796875, 1.2507476806640625, 1.29864501953125, 1.3465423583984375, 1.394439697265625, 1.4423370361328125, 1.490234375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 6.0, 2.0, 6.0, 3.0, 7.0, 11.0, 14.0, 11.0, 18.0, 22.0, 36.0, 50.0, 47.0, 82.0, 95.0, 105.0, 105.0, 84.0, 58.0, 53.0, 41.0, 32.0, 31.0, 21.0, 12.0, 8.0, 7.0, 7.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.0380859375, -0.03703045845031738, -0.035974979400634766, -0.03491950035095215, -0.03386402130126953, -0.032808542251586914, -0.0317530632019043, -0.03069758415222168, -0.029642105102539062, -0.028586626052856445, -0.027531147003173828, -0.02647566795349121, -0.025420188903808594, -0.024364709854125977, -0.02330923080444336, -0.022253751754760742, -0.021198272705078125, -0.020142793655395508, -0.01908731460571289, -0.018031835556030273, -0.016976356506347656, -0.01592087745666504, -0.014865398406982422, -0.013809919357299805, -0.012754440307617188, -0.01169896125793457, -0.010643482208251953, -0.009588003158569336, -0.008532524108886719, -0.0074770450592041016, -0.006421566009521484, -0.005366086959838867, -0.00431060791015625, -0.003255128860473633, -0.0021996498107910156, -0.0011441707611083984, -8.869171142578125e-05, 0.0009667873382568359, 0.002022266387939453, 0.0030777454376220703, 0.0041332244873046875, 0.005188703536987305, 0.006244182586669922, 0.007299661636352539, 0.008355140686035156, 0.009410619735717773, 0.01046609878540039, 0.011521577835083008, 0.012577056884765625, 0.013632535934448242, 0.01468801498413086, 0.015743494033813477, 0.016798973083496094, 0.01785445213317871, 0.018909931182861328, 0.019965410232543945, 0.021020889282226562, 0.02207636833190918, 0.023131847381591797, 0.024187326431274414, 0.02524280548095703, 0.02629828453063965, 0.027353763580322266, 0.028409242630004883, 0.0294647216796875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 1.0, 3.0, 8.0, 3.0, 3.0, 15.0, 9.0, 13.0, 22.0, 23.0, 34.0, 52.0, 64.0, 111.0, 143.0, 299.0, 988.0, 683170.0, 361801.0, 913.0, 318.0, 174.0, 108.0, 73.0, 48.0, 40.0, 24.0, 21.0, 18.0, 14.0, 3.0, 8.0, 3.0, 10.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.61865234375, -0.5965423583984375, -0.574432373046875, -0.5523223876953125, -0.53021240234375, -0.5081024169921875, -0.485992431640625, -0.4638824462890625, -0.4417724609375, -0.4196624755859375, -0.397552490234375, -0.3754425048828125, -0.35333251953125, -0.3312225341796875, -0.309112548828125, -0.2870025634765625, -0.264892578125, -0.2427825927734375, -0.220672607421875, -0.1985626220703125, -0.17645263671875, -0.1543426513671875, -0.132232666015625, -0.1101226806640625, -0.0880126953125, -0.0659027099609375, -0.043792724609375, -0.0216827392578125, 0.00042724609375, 0.0225372314453125, 0.044647216796875, 0.0667572021484375, 0.0888671875, 0.1109771728515625, 0.133087158203125, 0.1551971435546875, 0.17730712890625, 0.1994171142578125, 0.221527099609375, 0.2436370849609375, 0.2657470703125, 0.2878570556640625, 0.309967041015625, 0.3320770263671875, 0.35418701171875, 0.3762969970703125, 0.398406982421875, 0.4205169677734375, 0.442626953125, 0.4647369384765625, 0.486846923828125, 0.5089569091796875, 0.53106689453125, 0.5531768798828125, 0.575286865234375, 0.5973968505859375, 0.6195068359375, 0.6416168212890625, 0.663726806640625, 0.6858367919921875, 0.70794677734375, 0.7300567626953125, 0.752166748046875, 0.7742767333984375, 0.79638671875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 13.0, 998.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2344381958246231, -0.21398285031318665, -0.19352751970291138, -0.17307217419147491, -0.15261682868003845, -0.13216149806976318, -0.11170615255832672, -0.09125082194805145, -0.07079547643661499, -0.050340138375759125, -0.02988479658961296, -0.009429454803466797, 0.011025883257389069, 0.031481221318244934, 0.051936566829681396, 0.07239189743995667, 0.09284724295139313, 0.11330258101224899, 0.13375791907310486, 0.15421326458454132, 0.17466861009597778, 0.19512394070625305, 0.21557928621768951, 0.23603461682796478, 0.25648996233940125, 0.2769452929496765, 0.29740065336227417, 0.31785598397254944, 0.3383113145828247, 0.35876667499542236, 0.37922200560569763, 0.3996773362159729, 0.42013269662857056, 0.4405880272388458, 0.4610433876514435, 0.48149871826171875, 0.5019540786743164, 0.5224093794822693, 0.5428647398948669, 0.5633200407028198, 0.5837754011154175, 0.6042307615280151, 0.624686062335968, 0.6451414227485657, 0.6655967831611633, 0.6860520839691162, 0.7065074443817139, 0.7269628047943115, 0.7474181652069092, 0.7678735256195068, 0.7883288264274597, 0.8087841868400574, 0.829239547252655, 0.8496948480606079, 0.8701502084732056, 0.8906055688858032, 0.9110608696937561, 0.9315162301063538, 0.9519715309143066, 0.9724268913269043, 0.992882251739502, 1.0133376121520996, 1.0337929725646973, 1.0542482137680054, 1.074703574180603]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 4.0, 4.0, 9.0, 5.0, 10.0, 9.0, 13.0, 18.0, 17.0, 41.0, 26.0, 33.0, 38.0, 43.0, 43.0, 46.0, 49.0, 48.0, 53.0, 63.0, 54.0, 49.0, 48.0, 41.0, 32.0, 41.0, 25.0, 28.0, 21.0, 17.0, 15.0, 19.0, 14.0, 8.0, 9.0, 9.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.05061835050582886, -0.049346547573804855, -0.04807474464178085, -0.04680294543504715, -0.04553114250302315, -0.044259339570999146, -0.04298754036426544, -0.04171573743224144, -0.04044393450021744, -0.039172131568193436, -0.037900328636169434, -0.03662852942943573, -0.03535672649741173, -0.034084923565387726, -0.03281312435865402, -0.03154132142663002, -0.030269518494606018, -0.028997715562582016, -0.027725914493203163, -0.02645411342382431, -0.025182310491800308, -0.023910507559776306, -0.022638706490397453, -0.0213669054210186, -0.0200951024889946, -0.018823299556970596, -0.017551498487591743, -0.01627969741821289, -0.015007894486188889, -0.013736092485487461, -0.012464290484786034, -0.011192488484084606, -0.009920686483383179, -0.008648884482681751, -0.007377082481980324, -0.006105280481278896, -0.004833478480577469, -0.0035616764798760414, -0.002289874479174614, -0.0010180724784731865, 0.00025372952222824097, 0.0015255315229296684, 0.002797333523631096, 0.004069135524332523, 0.005340937525033951, 0.006612739525735378, 0.007884541526436806, 0.009156343527138233, 0.01042814552783966, 0.011699947528541088, 0.012971749529242516, 0.014243551529943943, 0.01551535353064537, 0.016787156462669373, 0.018058957532048225, 0.019330758601427078, 0.02060256153345108, 0.021874364465475082, 0.023146165534853935, 0.024417966604232788, 0.02568976953625679, 0.026961572468280792, 0.028233373537659645, 0.029505174607038498, 0.0307769775390625]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 6.0, 7.0, 6.0, 8.0, 14.0, 7.0, 14.0, 17.0, 19.0, 20.0, 28.0, 31.0, 33.0, 37.0, 46.0, 31.0, 33.0, 38.0, 43.0, 57.0, 49.0, 39.0, 41.0, 41.0, 44.0, 48.0, 27.0, 32.0, 26.0, 26.0, 24.0, 19.0, 21.0, 12.0, 15.0, 12.0, 11.0, 6.0, 7.0, 10.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.71875, -16.1484375, -15.578125, -15.0078125, -14.4375, -13.8671875, -13.296875, -12.7265625, -12.15625, -11.5859375, -11.015625, -10.4453125, -9.875, -9.3046875, -8.734375, -8.1640625, -7.59375, -7.0234375, -6.453125, -5.8828125, -5.3125, -4.7421875, -4.171875, -3.6015625, -3.03125, -2.4609375, -1.890625, -1.3203125, -0.75, -0.1796875, 0.390625, 0.9609375, 1.53125, 2.1015625, 2.671875, 3.2421875, 3.8125, 4.3828125, 4.953125, 5.5234375, 6.09375, 6.6640625, 7.234375, 7.8046875, 8.375, 8.9453125, 9.515625, 10.0859375, 10.65625, 11.2265625, 11.796875, 12.3671875, 12.9375, 13.5078125, 14.078125, 14.6484375, 15.21875, 15.7890625, 16.359375, 16.9296875, 17.5, 18.0703125, 18.640625, 19.2109375, 19.78125]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 7.0, 2.0, 9.0, 17.0, 12.0, 24.0, 32.0, 28.0, 35.0, 62.0, 83.0, 107.0, 176.0, 233.0, 351.0, 534.0, 903.0, 1591.0, 3207.0, 7541.0, 20627.0, 116183.0, 825612.0, 46312.0, 13477.0, 5560.0, 2500.0, 1220.0, 697.0, 420.0, 267.0, 189.0, 138.0, 105.0, 78.0, 55.0, 44.0, 37.0, 23.0, 16.0, 19.0, 15.0, 6.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-38.875, -37.54833984375, -36.2216796875, -34.89501953125, -33.568359375, -32.24169921875, -30.9150390625, -29.58837890625, -28.26171875, -26.93505859375, -25.6083984375, -24.28173828125, -22.955078125, -21.62841796875, -20.3017578125, -18.97509765625, -17.6484375, -16.32177734375, -14.9951171875, -13.66845703125, -12.341796875, -11.01513671875, -9.6884765625, -8.36181640625, -7.03515625, -5.70849609375, -4.3818359375, -3.05517578125, -1.728515625, -0.40185546875, 0.9248046875, 2.25146484375, 3.578125, 4.90478515625, 6.2314453125, 7.55810546875, 8.884765625, 10.21142578125, 11.5380859375, 12.86474609375, 14.19140625, 15.51806640625, 16.8447265625, 18.17138671875, 19.498046875, 20.82470703125, 22.1513671875, 23.47802734375, 24.8046875, 26.13134765625, 27.4580078125, 28.78466796875, 30.111328125, 31.43798828125, 32.7646484375, 34.09130859375, 35.41796875, 36.74462890625, 38.0712890625, 39.39794921875, 40.724609375, 42.05126953125, 43.3779296875, 44.70458984375, 46.03125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 7.0, 6.0, 7.0, 12.0, 11.0, 23.0, 18.0, 16.0, 18.0, 17.0, 22.0, 35.0, 43.0, 49.0, 45.0, 41.0, 60.0, 75.0, 130.0, 1702.0, 192.0, 88.0, 60.0, 37.0, 50.0, 42.0, 36.0, 22.0, 33.0, 26.0, 21.0, 14.0, 17.0, 17.0, 15.0, 7.0, 7.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.9375, -44.4375, -42.9375, -41.4375, -39.9375, -38.4375, -36.9375, -35.4375, -33.9375, -32.4375, -30.9375, -29.4375, -27.9375, -26.4375, -24.9375, -23.4375, -21.9375, -20.4375, -18.9375, -17.4375, -15.9375, -14.4375, -12.9375, -11.4375, -9.9375, -8.4375, -6.9375, -5.4375, -3.9375, -2.4375, -0.9375, 0.5625, 2.0625, 3.5625, 5.0625, 6.5625, 8.0625, 9.5625, 11.0625, 12.5625, 14.0625, 15.5625, 17.0625, 18.5625, 20.0625, 21.5625, 23.0625, 24.5625, 26.0625, 27.5625, 29.0625, 30.5625, 32.0625, 33.5625, 35.0625, 36.5625, 38.0625, 39.5625, 41.0625, 42.5625, 44.0625, 45.5625, 47.0625, 48.5625, 50.0625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 7.0, 7.0, 9.0, 13.0, 19.0, 18.0, 19.0, 32.0, 29.0, 43.0, 31.0, 52.0, 70.0, 136.0, 206.0, 468.0, 2515.0, 38791.0, 3073519.0, 26538.0, 2064.0, 440.0, 170.0, 109.0, 79.0, 67.0, 42.0, 27.0, 22.0, 20.0, 23.0, 23.0, 23.0, 13.0, 15.0, 5.0, 8.0, 5.0, 4.0, 2.0, 9.0, 2.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-126.375, -122.5966796875, -118.818359375, -115.0400390625, -111.26171875, -107.4833984375, -103.705078125, -99.9267578125, -96.1484375, -92.3701171875, -88.591796875, -84.8134765625, -81.03515625, -77.2568359375, -73.478515625, -69.7001953125, -65.921875, -62.1435546875, -58.365234375, -54.5869140625, -50.80859375, -47.0302734375, -43.251953125, -39.4736328125, -35.6953125, -31.9169921875, -28.138671875, -24.3603515625, -20.58203125, -16.8037109375, -13.025390625, -9.2470703125, -5.46875, -1.6904296875, 2.087890625, 5.8662109375, 9.64453125, 13.4228515625, 17.201171875, 20.9794921875, 24.7578125, 28.5361328125, 32.314453125, 36.0927734375, 39.87109375, 43.6494140625, 47.427734375, 51.2060546875, 54.984375, 58.7626953125, 62.541015625, 66.3193359375, 70.09765625, 73.8759765625, 77.654296875, 81.4326171875, 85.2109375, 88.9892578125, 92.767578125, 96.5458984375, 100.32421875, 104.1025390625, 107.880859375, 111.6591796875, 115.4375]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 11.0, 38.0, 91.0, 259.0, 325.0, 190.0, 63.0, 26.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-186.94204711914062, -183.37054443359375, -179.79905700683594, -176.22755432128906, -172.65606689453125, -169.08456420898438, -165.5130615234375, -161.9415740966797, -158.3700714111328, -154.79856872558594, -151.22708129882812, -147.65557861328125, -144.08407592773438, -140.51258850097656, -136.9410858154297, -133.36959838867188, -129.798095703125, -126.22660064697266, -122.65510559082031, -119.08360290527344, -115.5121078491211, -111.94061279296875, -108.36911010742188, -104.79761505126953, -101.22611999511719, -97.65462493896484, -94.0831298828125, -90.51162719726562, -86.94013214111328, -83.36863708496094, -79.79713439941406, -76.22563934326172, -72.65414428710938, -69.08264923095703, -65.51115417480469, -61.93965148925781, -58.36815643310547, -54.796661376953125, -51.225162506103516, -47.653663635253906, -44.08216857910156, -40.51067352294922, -36.93917465209961, -33.36767578125, -29.796180725097656, -26.22468376159668, -22.653186798095703, -19.081689834594727, -15.51019287109375, -11.938695907592773, -8.367198944091797, -4.79570198059082, -1.2242050170898438, 2.347291946411133, 5.918788909912109, 9.490285873413086, 13.061782836914062, 16.63327980041504, 20.204776763916016, 23.776273727416992, 27.34777069091797, 30.919267654418945, 34.49076461791992, 38.06226348876953, 41.633758544921875]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 6.0, 11.0, 7.0, 7.0, 17.0, 19.0, 18.0, 21.0, 24.0, 38.0, 30.0, 26.0, 31.0, 40.0, 35.0, 41.0, 37.0, 51.0, 48.0, 43.0, 43.0, 42.0, 43.0, 47.0, 32.0, 33.0, 43.0, 25.0, 25.0, 18.0, 22.0, 12.0, 21.0, 12.0, 14.0, 6.0, 5.0, 5.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-121.14675903320312, -117.2154312133789, -113.28410339355469, -109.35276794433594, -105.42144012451172, -101.4901123046875, -97.55877685546875, -93.62744903564453, -89.69612121582031, -85.7647933959961, -81.83346557617188, -77.90213012695312, -73.9708023071289, -70.03947448730469, -66.10813903808594, -62.17681121826172, -58.2454833984375, -54.31415557861328, -50.3828239440918, -46.45149230957031, -42.520164489746094, -38.588836669921875, -34.65750503540039, -30.72617530822754, -26.794845581054688, -22.863515853881836, -18.932186126708984, -15.000856399536133, -11.069526672363281, -7.13819694519043, -3.206867218017578, 0.7244625091552734, 4.655792236328125, 8.587121963500977, 12.518451690673828, 16.44978141784668, 20.38111114501953, 24.312440872192383, 28.243770599365234, 32.17510223388672, 36.10643005371094, 40.037757873535156, 43.96908950805664, 47.900421142578125, 51.831748962402344, 55.76307678222656, 59.69440841674805, 63.62574005126953, 67.55706787109375, 71.48839569091797, 75.41972351074219, 79.35105895996094, 83.28238677978516, 87.21371459960938, 91.14505004882812, 95.07637786865234, 99.00770568847656, 102.93903350830078, 106.870361328125, 110.80169677734375, 114.73302459716797, 118.66435241699219, 122.59568786621094, 126.52701568603516, 130.45834350585938]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 5.0, 6.0, 3.0, 8.0, 8.0, 8.0, 9.0, 21.0, 14.0, 25.0, 28.0, 26.0, 24.0, 49.0, 36.0, 23.0, 36.0, 51.0, 33.0, 38.0, 51.0, 45.0, 39.0, 34.0, 56.0, 45.0, 28.0, 38.0, 28.0, 24.0, 20.0, 25.0, 26.0, 18.0, 18.0, 13.0, 15.0, 7.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.515625, -15.947021484375, -15.37841796875, -14.809814453125, -14.2412109375, -13.672607421875, -13.10400390625, -12.535400390625, -11.966796875, -11.398193359375, -10.82958984375, -10.260986328125, -9.6923828125, -9.123779296875, -8.55517578125, -7.986572265625, -7.41796875, -6.849365234375, -6.28076171875, -5.712158203125, -5.1435546875, -4.574951171875, -4.00634765625, -3.437744140625, -2.869140625, -2.300537109375, -1.73193359375, -1.163330078125, -0.5947265625, -0.026123046875, 0.54248046875, 1.111083984375, 1.6796875, 2.248291015625, 2.81689453125, 3.385498046875, 3.9541015625, 4.522705078125, 5.09130859375, 5.659912109375, 6.228515625, 6.797119140625, 7.36572265625, 7.934326171875, 8.5029296875, 9.071533203125, 9.64013671875, 10.208740234375, 10.77734375, 11.345947265625, 11.91455078125, 12.483154296875, 13.0517578125, 13.620361328125, 14.18896484375, 14.757568359375, 15.326171875, 15.894775390625, 16.46337890625, 17.031982421875, 17.6005859375, 18.169189453125, 18.73779296875, 19.306396484375, 19.875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 6.0, 5.0, 9.0, 17.0, 10.0, 11.0, 31.0, 35.0, 42.0, 79.0, 106.0, 162.0, 234.0, 284.0, 481.0, 720.0, 1070.0, 1714.0, 2772.0, 4913.0, 9476.0, 19690.0, 51195.0, 219985.0, 1248779.0, 2039224.0, 453061.0, 84242.0, 27476.0, 12640.0, 6294.0, 3630.0, 2088.0, 1219.0, 781.0, 545.0, 347.0, 269.0, 187.0, 119.0, 107.0, 58.0, 41.0, 35.0, 26.0, 18.0, 21.0, 10.0, 6.0, 2.0, 5.0, 6.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-26.28125, -25.43896484375, -24.5966796875, -23.75439453125, -22.912109375, -22.06982421875, -21.2275390625, -20.38525390625, -19.54296875, -18.70068359375, -17.8583984375, -17.01611328125, -16.173828125, -15.33154296875, -14.4892578125, -13.64697265625, -12.8046875, -11.96240234375, -11.1201171875, -10.27783203125, -9.435546875, -8.59326171875, -7.7509765625, -6.90869140625, -6.06640625, -5.22412109375, -4.3818359375, -3.53955078125, -2.697265625, -1.85498046875, -1.0126953125, -0.17041015625, 0.671875, 1.51416015625, 2.3564453125, 3.19873046875, 4.041015625, 4.88330078125, 5.7255859375, 6.56787109375, 7.41015625, 8.25244140625, 9.0947265625, 9.93701171875, 10.779296875, 11.62158203125, 12.4638671875, 13.30615234375, 14.1484375, 14.99072265625, 15.8330078125, 16.67529296875, 17.517578125, 18.35986328125, 19.2021484375, 20.04443359375, 20.88671875, 21.72900390625, 22.5712890625, 23.41357421875, 24.255859375, 25.09814453125, 25.9404296875, 26.78271484375, 27.625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 6.0, 15.0, 13.0, 19.0, 27.0, 43.0, 74.0, 109.0, 214.0, 370.0, 688.0, 916.0, 625.0, 353.0, 212.0, 116.0, 72.0, 53.0, 32.0, 27.0, 19.0, 19.0, 7.0, 12.0, 8.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.59375, -41.28271484375, -39.9716796875, -38.66064453125, -37.349609375, -36.03857421875, -34.7275390625, -33.41650390625, -32.10546875, -30.79443359375, -29.4833984375, -28.17236328125, -26.861328125, -25.55029296875, -24.2392578125, -22.92822265625, -21.6171875, -20.30615234375, -18.9951171875, -17.68408203125, -16.373046875, -15.06201171875, -13.7509765625, -12.43994140625, -11.12890625, -9.81787109375, -8.5068359375, -7.19580078125, -5.884765625, -4.57373046875, -3.2626953125, -1.95166015625, -0.640625, 0.67041015625, 1.9814453125, 3.29248046875, 4.603515625, 5.91455078125, 7.2255859375, 8.53662109375, 9.84765625, 11.15869140625, 12.4697265625, 13.78076171875, 15.091796875, 16.40283203125, 17.7138671875, 19.02490234375, 20.3359375, 21.64697265625, 22.9580078125, 24.26904296875, 25.580078125, 26.89111328125, 28.2021484375, 29.51318359375, 30.82421875, 32.13525390625, 33.4462890625, 34.75732421875, 36.068359375, 37.37939453125, 38.6904296875, 40.00146484375, 41.3125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 7.0, 2.0, 8.0, 7.0, 13.0, 10.0, 18.0, 39.0, 41.0, 76.0, 122.0, 258.0, 539.0, 1556.0, 5682.0, 37895.0, 2050940.0, 2050177.0, 38406.0, 5870.0, 1538.0, 538.0, 248.0, 116.0, 66.0, 44.0, 23.0, 18.0, 10.0, 5.0, 3.0, 1.0, 4.0, 5.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-105.625, -102.32421875, -99.0234375, -95.72265625, -92.421875, -89.12109375, -85.8203125, -82.51953125, -79.21875, -75.91796875, -72.6171875, -69.31640625, -66.015625, -62.71484375, -59.4140625, -56.11328125, -52.8125, -49.51171875, -46.2109375, -42.91015625, -39.609375, -36.30859375, -33.0078125, -29.70703125, -26.40625, -23.10546875, -19.8046875, -16.50390625, -13.203125, -9.90234375, -6.6015625, -3.30078125, 0.0, 3.30078125, 6.6015625, 9.90234375, 13.203125, 16.50390625, 19.8046875, 23.10546875, 26.40625, 29.70703125, 33.0078125, 36.30859375, 39.609375, 42.91015625, 46.2109375, 49.51171875, 52.8125, 56.11328125, 59.4140625, 62.71484375, 66.015625, 69.31640625, 72.6171875, 75.91796875, 79.21875, 82.51953125, 85.8203125, 89.12109375, 92.421875, 95.72265625, 99.0234375, 102.32421875, 105.625]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 9.0, 15.0, 40.0, 88.0, 175.0, 251.0, 206.0, 110.0, 58.0, 29.0, 16.0, 9.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-219.80262756347656, -212.37191772460938, -204.9412078857422, -197.510498046875, -190.0797882080078, -182.64907836914062, -175.21836853027344, -167.78765869140625, -160.35694885253906, -152.92623901367188, -145.4955291748047, -138.0648193359375, -130.6341094970703, -123.20339965820312, -115.77268981933594, -108.34197998046875, -100.91127014160156, -93.48056030273438, -86.04985046386719, -78.619140625, -71.18843078613281, -63.757720947265625, -56.32701110839844, -48.89630126953125, -41.46559143066406, -34.034881591796875, -26.604171752929688, -19.1734619140625, -11.742752075195312, -4.312042236328125, 3.1186676025390625, 10.54937744140625, 17.980087280273438, 25.410797119140625, 32.84150695800781, 40.272216796875, 47.70292663574219, 55.133636474609375, 62.56434631347656, 69.99505615234375, 77.42576599121094, 84.85647583007812, 92.28718566894531, 99.7178955078125, 107.14860534667969, 114.57931518554688, 122.01002502441406, 129.44073486328125, 136.87144470214844, 144.30215454101562, 151.7328643798828, 159.16357421875, 166.5942840576172, 174.02499389648438, 181.45570373535156, 188.88641357421875, 196.31712341308594, 203.74783325195312, 211.1785430908203, 218.6092529296875, 226.0399627685547, 233.47067260742188, 240.90138244628906, 248.33209228515625, 255.76280212402344]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 5.0, 3.0, 9.0, 8.0, 4.0, 7.0, 13.0, 11.0, 15.0, 16.0, 24.0, 19.0, 31.0, 31.0, 27.0, 40.0, 32.0, 40.0, 36.0, 33.0, 44.0, 36.0, 41.0, 40.0, 45.0, 49.0, 38.0, 39.0, 33.0, 31.0, 20.0, 25.0, 25.0, 24.0, 19.0, 15.0, 14.0, 10.0, 6.0, 13.0, 12.0, 6.0, 6.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-112.84909057617188, -109.6712875366211, -106.49348449707031, -103.31568908691406, -100.13788604736328, -96.9600830078125, -93.78228759765625, -90.60448455810547, -87.42668151855469, -84.2488784790039, -81.07107543945312, -77.89328002929688, -74.7154769897461, -71.53767395019531, -68.35987854003906, -65.18207550048828, -62.0042724609375, -58.82646942138672, -55.6486701965332, -52.47087097167969, -49.293067932128906, -46.115264892578125, -42.93746566772461, -39.759666442871094, -36.58186340332031, -33.40406036376953, -30.226261138916016, -27.048460006713867, -23.87065887451172, -20.69285774230957, -17.515056610107422, -14.337255477905273, -11.159446716308594, -7.981645584106445, -4.803844451904297, -1.6260433197021484, 1.5517578125, 4.729558944702148, 7.907360076904297, 11.085161209106445, 14.262962341308594, 17.440763473510742, 20.61856460571289, 23.79636573791504, 26.974166870117188, 30.151968002319336, 33.329769134521484, 36.507568359375, 39.68537139892578, 42.86317443847656, 46.04097366333008, 49.218772888183594, 52.396575927734375, 55.574378967285156, 58.75217819213867, 61.92997741699219, 65.10778045654297, 68.28558349609375, 71.46337890625, 74.64118194580078, 77.81898498535156, 80.99678802490234, 84.17459106445312, 87.35238647460938, 90.53018951416016]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 12.0, 10.0, 19.0, 17.0, 21.0, 20.0, 21.0, 24.0, 29.0, 40.0, 34.0, 53.0, 49.0, 54.0, 42.0, 41.0, 52.0, 32.0, 45.0, 44.0, 40.0, 33.0, 35.0, 44.0, 26.0, 28.0, 16.0, 14.0, 16.0, 12.0, 16.0, 12.0, 9.0, 8.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.5146484375, -16.888671875, -16.2626953125, -15.63671875, -15.0107421875, -14.384765625, -13.7587890625, -13.1328125, -12.5068359375, -11.880859375, -11.2548828125, -10.62890625, -10.0029296875, -9.376953125, -8.7509765625, -8.125, -7.4990234375, -6.873046875, -6.2470703125, -5.62109375, -4.9951171875, -4.369140625, -3.7431640625, -3.1171875, -2.4912109375, -1.865234375, -1.2392578125, -0.61328125, 0.0126953125, 0.638671875, 1.2646484375, 1.890625, 2.5166015625, 3.142578125, 3.7685546875, 4.39453125, 5.0205078125, 5.646484375, 6.2724609375, 6.8984375, 7.5244140625, 8.150390625, 8.7763671875, 9.40234375, 10.0283203125, 10.654296875, 11.2802734375, 11.90625, 12.5322265625, 13.158203125, 13.7841796875, 14.41015625, 15.0361328125, 15.662109375, 16.2880859375, 16.9140625, 17.5400390625, 18.166015625, 18.7919921875, 19.41796875, 20.0439453125, 20.669921875, 21.2958984375, 21.921875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 4.0, 13.0, 23.0, 33.0, 37.0, 61.0, 86.0, 134.0, 209.0, 282.0, 451.0, 667.0, 1016.0, 1445.0, 2141.0, 3124.0, 4751.0, 7268.0, 10926.0, 16641.0, 25959.0, 41367.0, 66914.0, 107649.0, 164079.0, 192996.0, 147133.0, 92905.0, 57577.0, 35951.0, 22978.0, 14579.0, 9526.0, 6507.0, 4233.0, 2873.0, 1950.0, 1353.0, 824.0, 596.0, 432.0, 266.0, 206.0, 122.0, 85.0, 64.0, 38.0, 32.0, 23.0, 11.0, 6.0, 6.0, 1.0, 0.0, 1.0, 2.0], "bins": [-2.21484375, -2.1484375, -2.08203125, -2.015625, -1.94921875, -1.8828125, -1.81640625, -1.75, -1.68359375, -1.6171875, -1.55078125, -1.484375, -1.41796875, -1.3515625, -1.28515625, -1.21875, -1.15234375, -1.0859375, -1.01953125, -0.953125, -0.88671875, -0.8203125, -0.75390625, -0.6875, -0.62109375, -0.5546875, -0.48828125, -0.421875, -0.35546875, -0.2890625, -0.22265625, -0.15625, -0.08984375, -0.0234375, 0.04296875, 0.109375, 0.17578125, 0.2421875, 0.30859375, 0.375, 0.44140625, 0.5078125, 0.57421875, 0.640625, 0.70703125, 0.7734375, 0.83984375, 0.90625, 0.97265625, 1.0390625, 1.10546875, 1.171875, 1.23828125, 1.3046875, 1.37109375, 1.4375, 1.50390625, 1.5703125, 1.63671875, 1.703125, 1.76953125, 1.8359375, 1.90234375, 1.96875, 2.03515625]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 7.0, 3.0, 15.0, 12.0, 13.0, 12.0, 28.0, 20.0, 22.0, 30.0, 27.0, 28.0, 33.0, 42.0, 35.0, 48.0, 37.0, 40.0, 1076.0, 43.0, 43.0, 42.0, 45.0, 38.0, 34.0, 38.0, 32.0, 30.0, 26.0, 18.0, 21.0, 25.0, 11.0, 12.0, 10.0, 9.0, 4.0, 2.0, 5.0, 6.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.37158203125, -11.9697265625, -11.56787109375, -11.166015625, -10.76416015625, -10.3623046875, -9.96044921875, -9.55859375, -9.15673828125, -8.7548828125, -8.35302734375, -7.951171875, -7.54931640625, -7.1474609375, -6.74560546875, -6.34375, -5.94189453125, -5.5400390625, -5.13818359375, -4.736328125, -4.33447265625, -3.9326171875, -3.53076171875, -3.12890625, -2.72705078125, -2.3251953125, -1.92333984375, -1.521484375, -1.11962890625, -0.7177734375, -0.31591796875, 0.0859375, 0.48779296875, 0.8896484375, 1.29150390625, 1.693359375, 2.09521484375, 2.4970703125, 2.89892578125, 3.30078125, 3.70263671875, 4.1044921875, 4.50634765625, 4.908203125, 5.31005859375, 5.7119140625, 6.11376953125, 6.515625, 6.91748046875, 7.3193359375, 7.72119140625, 8.123046875, 8.52490234375, 8.9267578125, 9.32861328125, 9.73046875, 10.13232421875, 10.5341796875, 10.93603515625, 11.337890625, 11.73974609375, 12.1416015625, 12.54345703125, 12.9453125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 17.0, 11.0, 20.0, 27.0, 49.0, 67.0, 97.0, 150.0, 223.0, 327.0, 529.0, 724.0, 1158.0, 1787.0, 2723.0, 4545.0, 6907.0, 11304.0, 18385.0, 30085.0, 50352.0, 84460.0, 137591.0, 1224226.0, 206976.0, 123975.0, 74994.0, 44669.0, 26678.0, 16498.0, 10034.0, 6381.0, 3922.0, 2506.0, 1662.0, 986.0, 702.0, 433.0, 311.0, 197.0, 114.0, 101.0, 71.0, 53.0, 34.0, 18.0, 16.0, 9.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-1.58203125, -1.5308074951171875, -1.479583740234375, -1.4283599853515625, -1.37713623046875, -1.3259124755859375, -1.274688720703125, -1.2234649658203125, -1.1722412109375, -1.1210174560546875, -1.069793701171875, -1.0185699462890625, -0.96734619140625, -0.9161224365234375, -0.864898681640625, -0.8136749267578125, -0.762451171875, -0.7112274169921875, -0.660003662109375, -0.6087799072265625, -0.55755615234375, -0.5063323974609375, -0.455108642578125, -0.4038848876953125, -0.3526611328125, -0.3014373779296875, -0.250213623046875, -0.1989898681640625, -0.14776611328125, -0.0965423583984375, -0.045318603515625, 0.0059051513671875, 0.05712890625, 0.1083526611328125, 0.159576416015625, 0.2108001708984375, 0.26202392578125, 0.3132476806640625, 0.364471435546875, 0.4156951904296875, 0.4669189453125, 0.5181427001953125, 0.569366455078125, 0.6205902099609375, 0.67181396484375, 0.7230377197265625, 0.774261474609375, 0.8254852294921875, 0.876708984375, 0.9279327392578125, 0.979156494140625, 1.0303802490234375, 1.08160400390625, 1.1328277587890625, 1.184051513671875, 1.2352752685546875, 1.2864990234375, 1.3377227783203125, 1.388946533203125, 1.4401702880859375, 1.49139404296875, 1.5426177978515625, 1.593841552734375, 1.6450653076171875, 1.6962890625]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 8.0, 6.0, 3.0, 3.0, 4.0, 8.0, 7.0, 7.0, 11.0, 16.0, 18.0, 22.0, 23.0, 11.0, 33.0, 22.0, 36.0, 37.0, 39.0, 71.0, 48.0, 39.0, 48.0, 47.0, 57.0, 37.0, 39.0, 41.0, 37.0, 35.0, 30.0, 29.0, 27.0, 20.0, 9.0, 19.0, 5.0, 10.0, 12.0, 7.0, 9.0, 5.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0], "bins": [-0.0205841064453125, -0.01998114585876465, -0.019378185272216797, -0.018775224685668945, -0.018172264099121094, -0.017569303512573242, -0.01696634292602539, -0.01636338233947754, -0.015760421752929688, -0.015157461166381836, -0.014554500579833984, -0.013951539993286133, -0.013348579406738281, -0.01274561882019043, -0.012142658233642578, -0.011539697647094727, -0.010936737060546875, -0.010333776473999023, -0.009730815887451172, -0.00912785530090332, -0.008524894714355469, -0.007921934127807617, -0.007318973541259766, -0.006716012954711914, -0.0061130523681640625, -0.005510091781616211, -0.004907131195068359, -0.004304170608520508, -0.0037012100219726562, -0.0030982494354248047, -0.002495288848876953, -0.0018923282623291016, -0.00128936767578125, -0.0006864070892333984, -8.344650268554688e-05, 0.0005195140838623047, 0.0011224746704101562, 0.0017254352569580078, 0.0023283958435058594, 0.002931356430053711, 0.0035343170166015625, 0.004137277603149414, 0.004740238189697266, 0.005343198776245117, 0.005946159362792969, 0.00654911994934082, 0.007152080535888672, 0.0077550411224365234, 0.008358001708984375, 0.008960962295532227, 0.009563922882080078, 0.01016688346862793, 0.010769844055175781, 0.011372804641723633, 0.011975765228271484, 0.012578725814819336, 0.013181686401367188, 0.013784646987915039, 0.01438760757446289, 0.014990568161010742, 0.015593528747558594, 0.016196489334106445, 0.016799449920654297, 0.01740241050720215, 0.01800537109375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 3.0, 4.0, 11.0, 9.0, 10.0, 13.0, 11.0, 17.0, 20.0, 22.0, 34.0, 30.0, 45.0, 62.0, 73.0, 95.0, 127.0, 144.0, 248.0, 362.0, 724.0, 6963.0, 1015027.0, 22288.0, 897.0, 407.0, 229.0, 160.0, 101.0, 70.0, 68.0, 59.0, 39.0, 33.0, 27.0, 25.0, 13.0, 10.0, 16.0, 11.0, 10.0, 7.0, 4.0, 4.0, 5.0, 8.0, 3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.36572265625, -0.3537712097167969, -0.34181976318359375, -0.3298683166503906, -0.3179168701171875, -0.3059654235839844, -0.29401397705078125, -0.2820625305175781, -0.270111083984375, -0.2581596374511719, -0.24620819091796875, -0.23425674438476562, -0.2223052978515625, -0.21035385131835938, -0.19840240478515625, -0.18645095825195312, -0.17449951171875, -0.16254806518554688, -0.15059661865234375, -0.13864517211914062, -0.1266937255859375, -0.11474227905273438, -0.10279083251953125, -0.09083938598632812, -0.078887939453125, -0.06693649291992188, -0.05498504638671875, -0.043033599853515625, -0.0310821533203125, -0.019130706787109375, -0.00717926025390625, 0.004772186279296875, 0.0167236328125, 0.028675079345703125, 0.04062652587890625, 0.052577972412109375, 0.0645294189453125, 0.07648086547851562, 0.08843231201171875, 0.10038375854492188, 0.112335205078125, 0.12428665161132812, 0.13623809814453125, 0.14818954467773438, 0.1601409912109375, 0.17209243774414062, 0.18404388427734375, 0.19599533081054688, 0.20794677734375, 0.21989822387695312, 0.23184967041015625, 0.24380111694335938, 0.2557525634765625, 0.2677040100097656, 0.27965545654296875, 0.2916069030761719, 0.303558349609375, 0.3155097961425781, 0.32746124267578125, 0.3394126892089844, 0.3513641357421875, 0.3633155822753906, 0.37526702880859375, 0.3872184753417969, 0.399169921875]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 989.0, 23.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3351563811302185, -0.3203372359275818, -0.30551812052726746, -0.29069897532463074, -0.275879830121994, -0.2610607147216797, -0.24624156951904297, -0.23142242431640625, -0.21660329401493073, -0.2017841637134552, -0.18696501851081848, -0.17214588820934296, -0.15732675790786743, -0.1425076127052307, -0.1276884824037552, -0.11286934465169907, -0.09805020689964294, -0.08323106914758682, -0.0684119313955307, -0.053592801094055176, -0.038773663341999054, -0.023954525589942932, -0.009135395288467407, 0.005683742463588715, 0.020502880215644836, 0.03532201796770096, 0.05014115199446678, 0.0649602860212326, 0.07977942377328873, 0.09459856152534485, 0.10941769182682037, 0.1242368295788765, 0.13905596733093262, 0.15387509763240814, 0.16869424283504486, 0.18351337313652039, 0.1983325183391571, 0.21315164864063263, 0.22797077894210815, 0.24278992414474487, 0.2576090693473816, 0.2724282145500183, 0.28724732995033264, 0.30206647515296936, 0.3168856203556061, 0.3317047357559204, 0.34652388095855713, 0.36134302616119385, 0.3761621415615082, 0.3909812867641449, 0.40580040216445923, 0.42061954736709595, 0.43543869256973267, 0.4502578377723694, 0.4650769531726837, 0.47989609837532043, 0.49471521377563477, 0.5095343589782715, 0.5243535041809082, 0.5391726493835449, 0.5539917349815369, 0.5688108801841736, 0.5836300253868103, 0.598449170589447, 0.6132683157920837]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 1.0, 8.0, 6.0, 9.0, 10.0, 16.0, 10.0, 14.0, 15.0, 18.0, 20.0, 24.0, 36.0, 40.0, 33.0, 44.0, 38.0, 31.0, 44.0, 46.0, 28.0, 37.0, 48.0, 27.0, 54.0, 37.0, 33.0, 36.0, 37.0, 34.0, 26.0, 24.0, 22.0, 19.0, 13.0, 14.0, 15.0, 9.0, 10.0, 6.0, 5.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.029133617877960205, -0.028279069811105728, -0.0274245236068964, -0.026569977402687073, -0.025715429335832596, -0.02486088126897812, -0.02400633506476879, -0.023151788860559464, -0.022297240793704987, -0.02144269272685051, -0.020588146522641182, -0.019733600318431854, -0.018879052251577377, -0.0180245041847229, -0.017169957980513573, -0.016315411776304245, -0.015460863709449768, -0.014606316573917866, -0.013751769438385963, -0.012897222302854061, -0.012042675167322159, -0.011188128031790257, -0.010333580896258354, -0.009479033760726452, -0.00862448662519455, -0.007769939489662647, -0.006915392354130745, -0.006060845218598843, -0.00520629808306694, -0.004351750947535038, -0.0034972038120031357, -0.0026426566764712334, -0.001788109540939331, -0.0009335624054074287, -7.901526987552643e-05, 0.0007755318656563759, 0.0016300790011882782, 0.0024846261367201805, 0.003339173272252083, 0.004193720407783985, 0.0050482675433158875, 0.00590281467884779, 0.006757361814379692, 0.007611908949911594, 0.008466456085443497, 0.009321003220975399, 0.010175550356507301, 0.011030097492039204, 0.011884644627571106, 0.012739191763103008, 0.01359373889863491, 0.014448286034166813, 0.015302833169698715, 0.016157381236553192, 0.01701192744076252, 0.017866473644971848, 0.018721021711826324, 0.0195755697786808, 0.02043011598289013, 0.021284662187099457, 0.022139210253953934, 0.02299375832080841, 0.02384830452501774, 0.024702850729227066, 0.025557398796081543]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 11.0, 11.0, 19.0, 17.0, 21.0, 19.0, 22.0, 24.0, 29.0, 40.0, 34.0, 53.0, 49.0, 54.0, 42.0, 41.0, 52.0, 32.0, 46.0, 44.0, 39.0, 33.0, 35.0, 44.0, 26.0, 28.0, 16.0, 14.0, 16.0, 12.0, 16.0, 12.0, 9.0, 8.0, 8.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.140625, -17.5146484375, -16.888671875, -16.2626953125, -15.63671875, -15.0107421875, -14.384765625, -13.7587890625, -13.1328125, -12.5068359375, -11.880859375, -11.2548828125, -10.62890625, -10.0029296875, -9.376953125, -8.7509765625, -8.125, -7.4990234375, -6.873046875, -6.2470703125, -5.62109375, -4.9951171875, -4.369140625, -3.7431640625, -3.1171875, -2.4912109375, -1.865234375, -1.2392578125, -0.61328125, 0.0126953125, 0.638671875, 1.2646484375, 1.890625, 2.5166015625, 3.142578125, 3.7685546875, 4.39453125, 5.0205078125, 5.646484375, 6.2724609375, 6.8984375, 7.5244140625, 8.150390625, 8.7763671875, 9.40234375, 10.0283203125, 10.654296875, 11.2802734375, 11.90625, 12.5322265625, 13.158203125, 13.7841796875, 14.41015625, 15.0361328125, 15.662109375, 16.2880859375, 16.9140625, 17.5400390625, 18.166015625, 18.7919921875, 19.41796875, 20.0439453125, 20.669921875, 21.2958984375, 21.921875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 0.0, 2.0, 2.0, 7.0, 10.0, 8.0, 10.0, 18.0, 29.0, 37.0, 62.0, 74.0, 96.0, 142.0, 212.0, 310.0, 462.0, 704.0, 1092.0, 1891.0, 3137.0, 5899.0, 11618.0, 25956.0, 75306.0, 351236.0, 427334.0, 86200.0, 29051.0, 12481.0, 6336.0, 3372.0, 2041.0, 1186.0, 651.0, 501.0, 338.0, 211.0, 157.0, 130.0, 69.0, 55.0, 42.0, 26.0, 20.0, 10.0, 7.0, 9.0, 5.0, 5.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.0, -26.15771484375, -25.3154296875, -24.47314453125, -23.630859375, -22.78857421875, -21.9462890625, -21.10400390625, -20.26171875, -19.41943359375, -18.5771484375, -17.73486328125, -16.892578125, -16.05029296875, -15.2080078125, -14.36572265625, -13.5234375, -12.68115234375, -11.8388671875, -10.99658203125, -10.154296875, -9.31201171875, -8.4697265625, -7.62744140625, -6.78515625, -5.94287109375, -5.1005859375, -4.25830078125, -3.416015625, -2.57373046875, -1.7314453125, -0.88916015625, -0.046875, 0.79541015625, 1.6376953125, 2.47998046875, 3.322265625, 4.16455078125, 5.0068359375, 5.84912109375, 6.69140625, 7.53369140625, 8.3759765625, 9.21826171875, 10.060546875, 10.90283203125, 11.7451171875, 12.58740234375, 13.4296875, 14.27197265625, 15.1142578125, 15.95654296875, 16.798828125, 17.64111328125, 18.4833984375, 19.32568359375, 20.16796875, 21.01025390625, 21.8525390625, 22.69482421875, 23.537109375, 24.37939453125, 25.2216796875, 26.06396484375, 26.90625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 3.0, 10.0, 9.0, 10.0, 16.0, 13.0, 16.0, 9.0, 22.0, 29.0, 26.0, 30.0, 47.0, 35.0, 46.0, 65.0, 63.0, 93.0, 278.0, 1560.0, 143.0, 92.0, 68.0, 44.0, 45.0, 39.0, 27.0, 34.0, 27.0, 27.0, 24.0, 12.0, 14.0, 17.0, 9.0, 10.0, 4.0, 5.0, 2.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-48.03125, -46.4931640625, -44.955078125, -43.4169921875, -41.87890625, -40.3408203125, -38.802734375, -37.2646484375, -35.7265625, -34.1884765625, -32.650390625, -31.1123046875, -29.57421875, -28.0361328125, -26.498046875, -24.9599609375, -23.421875, -21.8837890625, -20.345703125, -18.8076171875, -17.26953125, -15.7314453125, -14.193359375, -12.6552734375, -11.1171875, -9.5791015625, -8.041015625, -6.5029296875, -4.96484375, -3.4267578125, -1.888671875, -0.3505859375, 1.1875, 2.7255859375, 4.263671875, 5.8017578125, 7.33984375, 8.8779296875, 10.416015625, 11.9541015625, 13.4921875, 15.0302734375, 16.568359375, 18.1064453125, 19.64453125, 21.1826171875, 22.720703125, 24.2587890625, 25.796875, 27.3349609375, 28.873046875, 30.4111328125, 31.94921875, 33.4873046875, 35.025390625, 36.5634765625, 38.1015625, 39.6396484375, 41.177734375, 42.7158203125, 44.25390625, 45.7919921875, 47.330078125, 48.8681640625, 50.40625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 5.0, 6.0, 13.0, 20.0, 14.0, 26.0, 42.0, 63.0, 85.0, 141.0, 272.0, 799.0, 4174.0, 49132.0, 2977227.0, 105410.0, 6443.0, 1021.0, 327.0, 162.0, 108.0, 76.0, 40.0, 27.0, 24.0, 19.0, 14.0, 4.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-107.3125, -104.119140625, -100.92578125, -97.732421875, -94.5390625, -91.345703125, -88.15234375, -84.958984375, -81.765625, -78.572265625, -75.37890625, -72.185546875, -68.9921875, -65.798828125, -62.60546875, -59.412109375, -56.21875, -53.025390625, -49.83203125, -46.638671875, -43.4453125, -40.251953125, -37.05859375, -33.865234375, -30.671875, -27.478515625, -24.28515625, -21.091796875, -17.8984375, -14.705078125, -11.51171875, -8.318359375, -5.125, -1.931640625, 1.26171875, 4.455078125, 7.6484375, 10.841796875, 14.03515625, 17.228515625, 20.421875, 23.615234375, 26.80859375, 30.001953125, 33.1953125, 36.388671875, 39.58203125, 42.775390625, 45.96875, 49.162109375, 52.35546875, 55.548828125, 58.7421875, 61.935546875, 65.12890625, 68.322265625, 71.515625, 74.708984375, 77.90234375, 81.095703125, 84.2890625, 87.482421875, 90.67578125, 93.869140625, 97.0625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 115.0, 725.0, 161.0, 11.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-331.76318359375, -318.2472229003906, -304.7312927246094, -291.21533203125, -277.69940185546875, -264.1834411621094, -250.66748046875, -237.1515350341797, -223.63558959960938, -210.11964416503906, -196.60369873046875, -183.08773803710938, -169.57179260253906, -156.05584716796875, -142.53988647460938, -129.02394104003906, -115.50799560546875, -101.99205017089844, -88.4760971069336, -74.96014404296875, -61.44419860839844, -47.928253173828125, -34.41230010986328, -20.896347045898438, -7.380401611328125, 6.135547637939453, 19.65149688720703, 33.16744613647461, 46.68339538574219, 60.1993408203125, 73.71529388427734, 87.23124694824219, 100.7471923828125, 114.26313781738281, 127.77909088134766, 141.2950439453125, 154.8109893798828, 168.32693481445312, 181.8428955078125, 195.3588409423828, 208.87478637695312, 222.39073181152344, 235.90667724609375, 249.42263793945312, 262.9385986328125, 276.45452880859375, 289.9704895019531, 303.4864501953125, 317.00238037109375, 330.5183410644531, 344.0342712402344, 357.55023193359375, 371.066162109375, 384.5821228027344, 398.09808349609375, 411.614013671875, 425.1299743652344, 438.64593505859375, 452.161865234375, 465.6778259277344, 479.19378662109375, 492.709716796875, 506.2256774902344, 519.7416381835938, 533.257568359375]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 7.0, 5.0, 7.0, 9.0, 11.0, 13.0, 18.0, 27.0, 24.0, 27.0, 34.0, 28.0, 42.0, 36.0, 43.0, 49.0, 42.0, 55.0, 41.0, 52.0, 51.0, 39.0, 48.0, 39.0, 31.0, 31.0, 24.0, 27.0, 15.0, 22.0, 19.0, 20.0, 18.0, 12.0, 11.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-123.12319946289062, -119.35442352294922, -115.58563995361328, -111.81686401367188, -108.04808807373047, -104.27931213378906, -100.51052856445312, -96.74175262451172, -92.97297668457031, -89.2042007446289, -85.43541717529297, -81.66664123535156, -77.89786529541016, -74.12908935546875, -70.36030578613281, -66.5915298461914, -62.82274627685547, -59.0539665222168, -55.28519058227539, -51.51641082763672, -47.74763488769531, -43.97885513305664, -40.21007537841797, -36.44129943847656, -32.67251968383789, -28.90374183654785, -25.134963989257812, -21.36618423461914, -17.5974063873291, -13.828628540039062, -10.05984878540039, -6.291070938110352, -2.5222930908203125, 1.2464852333068848, 5.015263557434082, 8.784042358398438, 12.552820205688477, 16.321598052978516, 20.090377807617188, 23.859155654907227, 27.627933502197266, 31.396711349487305, 35.165489196777344, 38.934268951416016, 42.70304870605469, 46.471824645996094, 50.240604400634766, 54.00938415527344, 57.778160095214844, 61.546939849853516, 65.31571960449219, 69.0844955444336, 72.853271484375, 76.62205505371094, 80.39083099365234, 84.15960693359375, 87.92839050292969, 91.6971664428711, 95.46595001220703, 99.23472595214844, 103.00350189208984, 106.77227783203125, 110.54106140136719, 114.3098373413086, 118.07861328125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 4.0, 11.0, 6.0, 8.0, 14.0, 10.0, 17.0, 27.0, 26.0, 25.0, 29.0, 45.0, 36.0, 36.0, 62.0, 53.0, 53.0, 56.0, 43.0, 55.0, 32.0, 39.0, 44.0, 46.0, 34.0, 37.0, 30.0, 17.0, 22.0, 16.0, 21.0, 14.0, 15.0, 7.0, 6.0, 5.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -21.153564453125, -20.44775390625, -19.741943359375, -19.0361328125, -18.330322265625, -17.62451171875, -16.918701171875, -16.212890625, -15.507080078125, -14.80126953125, -14.095458984375, -13.3896484375, -12.683837890625, -11.97802734375, -11.272216796875, -10.56640625, -9.860595703125, -9.15478515625, -8.448974609375, -7.7431640625, -7.037353515625, -6.33154296875, -5.625732421875, -4.919921875, -4.214111328125, -3.50830078125, -2.802490234375, -2.0966796875, -1.390869140625, -0.68505859375, 0.020751953125, 0.7265625, 1.432373046875, 2.13818359375, 2.843994140625, 3.5498046875, 4.255615234375, 4.96142578125, 5.667236328125, 6.373046875, 7.078857421875, 7.78466796875, 8.490478515625, 9.1962890625, 9.902099609375, 10.60791015625, 11.313720703125, 12.01953125, 12.725341796875, 13.43115234375, 14.136962890625, 14.8427734375, 15.548583984375, 16.25439453125, 16.960205078125, 17.666015625, 18.371826171875, 19.07763671875, 19.783447265625, 20.4892578125, 21.195068359375, 21.90087890625, 22.606689453125, 23.3125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 6.0, 5.0, 6.0, 7.0, 17.0, 16.0, 25.0, 26.0, 46.0, 66.0, 105.0, 150.0, 203.0, 272.0, 345.0, 534.0, 787.0, 1279.0, 2093.0, 3497.0, 6446.0, 13314.0, 31647.0, 107435.0, 603633.0, 2287241.0, 905489.0, 153450.0, 40799.0, 16120.0, 7860.0, 4225.0, 2511.0, 1553.0, 896.0, 632.0, 418.0, 310.0, 219.0, 170.0, 115.0, 86.0, 77.0, 47.0, 32.0, 19.0, 17.0, 15.0, 10.0, 8.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0], "bins": [-27.6875, -26.783203125, -25.87890625, -24.974609375, -24.0703125, -23.166015625, -22.26171875, -21.357421875, -20.453125, -19.548828125, -18.64453125, -17.740234375, -16.8359375, -15.931640625, -15.02734375, -14.123046875, -13.21875, -12.314453125, -11.41015625, -10.505859375, -9.6015625, -8.697265625, -7.79296875, -6.888671875, -5.984375, -5.080078125, -4.17578125, -3.271484375, -2.3671875, -1.462890625, -0.55859375, 0.345703125, 1.25, 2.154296875, 3.05859375, 3.962890625, 4.8671875, 5.771484375, 6.67578125, 7.580078125, 8.484375, 9.388671875, 10.29296875, 11.197265625, 12.1015625, 13.005859375, 13.91015625, 14.814453125, 15.71875, 16.623046875, 17.52734375, 18.431640625, 19.3359375, 20.240234375, 21.14453125, 22.048828125, 22.953125, 23.857421875, 24.76171875, 25.666015625, 26.5703125, 27.474609375, 28.37890625, 29.283203125, 30.1875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 20.0, 17.0, 44.0, 52.0, 82.0, 121.0, 208.0, 468.0, 996.0, 986.0, 518.0, 207.0, 122.0, 63.0, 45.0, 28.0, 22.0, 13.0, 18.0, 10.0, 3.0, 5.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.21875, -43.603515625, -41.98828125, -40.373046875, -38.7578125, -37.142578125, -35.52734375, -33.912109375, -32.296875, -30.681640625, -29.06640625, -27.451171875, -25.8359375, -24.220703125, -22.60546875, -20.990234375, -19.375, -17.759765625, -16.14453125, -14.529296875, -12.9140625, -11.298828125, -9.68359375, -8.068359375, -6.453125, -4.837890625, -3.22265625, -1.607421875, 0.0078125, 1.623046875, 3.23828125, 4.853515625, 6.46875, 8.083984375, 9.69921875, 11.314453125, 12.9296875, 14.544921875, 16.16015625, 17.775390625, 19.390625, 21.005859375, 22.62109375, 24.236328125, 25.8515625, 27.466796875, 29.08203125, 30.697265625, 32.3125, 33.927734375, 35.54296875, 37.158203125, 38.7734375, 40.388671875, 42.00390625, 43.619140625, 45.234375, 46.849609375, 48.46484375, 50.080078125, 51.6953125, 53.310546875, 54.92578125, 56.541015625, 58.15625]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 5.0, 3.0, 3.0, 1.0, 5.0, 3.0, 10.0, 14.0, 22.0, 41.0, 68.0, 93.0, 146.0, 241.0, 466.0, 767.0, 1497.0, 3620.0, 10690.0, 43793.0, 358778.0, 3494957.0, 229714.0, 34190.0, 8818.0, 3142.0, 1410.0, 743.0, 399.0, 255.0, 148.0, 79.0, 59.0, 34.0, 20.0, 12.0, 13.0, 8.0, 5.0, 5.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-76.4375, -74.216796875, -71.99609375, -69.775390625, -67.5546875, -65.333984375, -63.11328125, -60.892578125, -58.671875, -56.451171875, -54.23046875, -52.009765625, -49.7890625, -47.568359375, -45.34765625, -43.126953125, -40.90625, -38.685546875, -36.46484375, -34.244140625, -32.0234375, -29.802734375, -27.58203125, -25.361328125, -23.140625, -20.919921875, -18.69921875, -16.478515625, -14.2578125, -12.037109375, -9.81640625, -7.595703125, -5.375, -3.154296875, -0.93359375, 1.287109375, 3.5078125, 5.728515625, 7.94921875, 10.169921875, 12.390625, 14.611328125, 16.83203125, 19.052734375, 21.2734375, 23.494140625, 25.71484375, 27.935546875, 30.15625, 32.376953125, 34.59765625, 36.818359375, 39.0390625, 41.259765625, 43.48046875, 45.701171875, 47.921875, 50.142578125, 52.36328125, 54.583984375, 56.8046875, 59.025390625, 61.24609375, 63.466796875, 65.6875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 6.0, 24.0, 21.0, 75.0, 131.0, 199.0, 206.0, 147.0, 89.0, 57.0, 26.0, 14.0, 6.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-214.29751586914062, -207.6337127685547, -200.9698944091797, -194.30609130859375, -187.64227294921875, -180.9784698486328, -174.31466674804688, -167.65084838867188, -160.98704528808594, -154.3232421875, -147.659423828125, -140.99562072753906, -134.33181762695312, -127.66799926757812, -121.00419616699219, -114.34038543701172, -107.67657470703125, -101.01276397705078, -94.34895324707031, -87.68515014648438, -81.0213394165039, -74.35752868652344, -67.6937255859375, -61.02991485595703, -54.36610412597656, -47.702293395996094, -41.03848648071289, -34.37467956542969, -27.71086883544922, -21.04705810546875, -14.383251190185547, -7.719444274902344, -1.0556182861328125, 5.608190536499023, 12.27199935913086, 18.935808181762695, 25.59961700439453, 32.263427734375, 38.9272346496582, 45.591041564941406, 52.254852294921875, 58.918663024902344, 65.58247375488281, 72.24627685546875, 78.91008758544922, 85.57389831542969, 92.23770141601562, 98.9015121459961, 105.56532287597656, 112.22913360595703, 118.8929443359375, 125.55674743652344, 132.22055053710938, 138.88436889648438, 145.5481719970703, 152.21197509765625, 158.87579345703125, 165.5395965576172, 172.2034149169922, 178.86721801757812, 185.53103637695312, 192.19483947753906, 198.858642578125, 205.5224609375, 212.18626403808594]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 2.0, 2.0, 5.0, 5.0, 3.0, 9.0, 7.0, 10.0, 10.0, 18.0, 10.0, 15.0, 24.0, 24.0, 22.0, 27.0, 39.0, 28.0, 39.0, 26.0, 29.0, 36.0, 37.0, 49.0, 51.0, 38.0, 38.0, 43.0, 50.0, 32.0, 35.0, 40.0, 28.0, 34.0, 34.0, 21.0, 21.0, 16.0, 8.0, 7.0, 8.0, 8.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-104.46060180664062, -101.18244171142578, -97.90428161621094, -94.6261215209961, -91.34796142578125, -88.0698013305664, -84.79164123535156, -81.51348114013672, -78.23532104492188, -74.95716094970703, -71.67900085449219, -68.40084075927734, -65.1226806640625, -61.844520568847656, -58.56636047363281, -55.28820037841797, -52.01003646850586, -48.731876373291016, -45.45371627807617, -42.17555618286133, -38.897396087646484, -35.619232177734375, -32.34107208251953, -29.06291389465332, -25.784753799438477, -22.506593704223633, -19.22843360900879, -15.950272560119629, -12.672112464904785, -9.393951416015625, -6.115791320800781, -2.8376312255859375, 0.44052886962890625, 3.718689203262329, 6.996849536895752, 10.275010108947754, 13.553170204162598, 16.831331253051758, 20.1094913482666, 23.387651443481445, 26.66581153869629, 29.943971633911133, 33.22213363647461, 36.50029373168945, 39.7784538269043, 43.05661392211914, 46.334774017333984, 49.61293411254883, 52.89109420776367, 56.169254302978516, 59.44741439819336, 62.7255744934082, 66.00373840332031, 69.28189849853516, 72.56005859375, 75.83821868896484, 79.11637878417969, 82.39453887939453, 85.67269897460938, 88.95085906982422, 92.22901916503906, 95.5071792602539, 98.78533935546875, 102.0634994506836, 105.34165954589844]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 7.0, 6.0, 4.0, 4.0, 13.0, 10.0, 15.0, 16.0, 19.0, 18.0, 22.0, 24.0, 30.0, 32.0, 32.0, 25.0, 53.0, 25.0, 45.0, 54.0, 40.0, 38.0, 50.0, 38.0, 52.0, 40.0, 41.0, 42.0, 21.0, 26.0, 22.0, 31.0, 20.0, 19.0, 14.0, 10.0, 8.0, 7.0, 3.0, 3.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-20.9375, -20.236572265625, -19.53564453125, -18.834716796875, -18.1337890625, -17.432861328125, -16.73193359375, -16.031005859375, -15.330078125, -14.629150390625, -13.92822265625, -13.227294921875, -12.5263671875, -11.825439453125, -11.12451171875, -10.423583984375, -9.72265625, -9.021728515625, -8.32080078125, -7.619873046875, -6.9189453125, -6.218017578125, -5.51708984375, -4.816162109375, -4.115234375, -3.414306640625, -2.71337890625, -2.012451171875, -1.3115234375, -0.610595703125, 0.09033203125, 0.791259765625, 1.4921875, 2.193115234375, 2.89404296875, 3.594970703125, 4.2958984375, 4.996826171875, 5.69775390625, 6.398681640625, 7.099609375, 7.800537109375, 8.50146484375, 9.202392578125, 9.9033203125, 10.604248046875, 11.30517578125, 12.006103515625, 12.70703125, 13.407958984375, 14.10888671875, 14.809814453125, 15.5107421875, 16.211669921875, 16.91259765625, 17.613525390625, 18.314453125, 19.015380859375, 19.71630859375, 20.417236328125, 21.1181640625, 21.819091796875, 22.52001953125, 23.220947265625, 23.921875]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 6.0, 7.0, 5.0, 10.0, 13.0, 25.0, 41.0, 49.0, 61.0, 97.0, 190.0, 274.0, 340.0, 506.0, 836.0, 1252.0, 1825.0, 2913.0, 4340.0, 6270.0, 10008.0, 15681.0, 25039.0, 40556.0, 67727.0, 112451.0, 174691.0, 200655.0, 146583.0, 90524.0, 54958.0, 32948.0, 20469.0, 12800.0, 8411.0, 5434.0, 3520.0, 2280.0, 1631.0, 1025.0, 712.0, 464.0, 322.0, 206.0, 125.0, 89.0, 63.0, 56.0, 29.0, 17.0, 13.0, 7.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.48828125, -2.40875244140625, -2.3292236328125, -2.24969482421875, -2.170166015625, -2.09063720703125, -2.0111083984375, -1.93157958984375, -1.85205078125, -1.77252197265625, -1.6929931640625, -1.61346435546875, -1.533935546875, -1.45440673828125, -1.3748779296875, -1.29534912109375, -1.2158203125, -1.13629150390625, -1.0567626953125, -0.97723388671875, -0.897705078125, -0.81817626953125, -0.7386474609375, -0.65911865234375, -0.57958984375, -0.50006103515625, -0.4205322265625, -0.34100341796875, -0.261474609375, -0.18194580078125, -0.1024169921875, -0.02288818359375, 0.056640625, 0.13616943359375, 0.2156982421875, 0.29522705078125, 0.374755859375, 0.45428466796875, 0.5338134765625, 0.61334228515625, 0.69287109375, 0.77239990234375, 0.8519287109375, 0.93145751953125, 1.010986328125, 1.09051513671875, 1.1700439453125, 1.24957275390625, 1.3291015625, 1.40863037109375, 1.4881591796875, 1.56768798828125, 1.647216796875, 1.72674560546875, 1.8062744140625, 1.88580322265625, 1.96533203125, 2.04486083984375, 2.1243896484375, 2.20391845703125, 2.283447265625, 2.36297607421875, 2.4425048828125, 2.52203369140625, 2.6015625]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 7.0, 9.0, 5.0, 11.0, 16.0, 17.0, 19.0, 26.0, 20.0, 21.0, 28.0, 33.0, 35.0, 35.0, 42.0, 39.0, 37.0, 44.0, 1069.0, 39.0, 40.0, 39.0, 34.0, 54.0, 38.0, 32.0, 33.0, 23.0, 24.0, 25.0, 23.0, 26.0, 15.0, 16.0, 7.0, 10.0, 8.0, 6.0, 1.0, 1.0, 4.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0], "bins": [-15.6796875, -15.243408203125, -14.80712890625, -14.370849609375, -13.9345703125, -13.498291015625, -13.06201171875, -12.625732421875, -12.189453125, -11.753173828125, -11.31689453125, -10.880615234375, -10.4443359375, -10.008056640625, -9.57177734375, -9.135498046875, -8.69921875, -8.262939453125, -7.82666015625, -7.390380859375, -6.9541015625, -6.517822265625, -6.08154296875, -5.645263671875, -5.208984375, -4.772705078125, -4.33642578125, -3.900146484375, -3.4638671875, -3.027587890625, -2.59130859375, -2.155029296875, -1.71875, -1.282470703125, -0.84619140625, -0.409912109375, 0.0263671875, 0.462646484375, 0.89892578125, 1.335205078125, 1.771484375, 2.207763671875, 2.64404296875, 3.080322265625, 3.5166015625, 3.952880859375, 4.38916015625, 4.825439453125, 5.26171875, 5.697998046875, 6.13427734375, 6.570556640625, 7.0068359375, 7.443115234375, 7.87939453125, 8.315673828125, 8.751953125, 9.188232421875, 9.62451171875, 10.060791015625, 10.4970703125, 10.933349609375, 11.36962890625, 11.805908203125, 12.2421875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 4.0, 4.0, 6.0, 6.0, 15.0, 10.0, 25.0, 53.0, 66.0, 85.0, 145.0, 222.0, 303.0, 428.0, 681.0, 1170.0, 1748.0, 2721.0, 4139.0, 6607.0, 10521.0, 17066.0, 27920.0, 46225.0, 78657.0, 129320.0, 521333.0, 916471.0, 131318.0, 78736.0, 46602.0, 28170.0, 17147.0, 10744.0, 6566.0, 4303.0, 2633.0, 1643.0, 1144.0, 779.0, 477.0, 327.0, 206.0, 108.0, 104.0, 50.0, 36.0, 42.0, 21.0, 14.0, 6.0, 9.0, 6.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.8212890625, -1.7625579833984375, -1.703826904296875, -1.6450958251953125, -1.58636474609375, -1.5276336669921875, -1.468902587890625, -1.4101715087890625, -1.3514404296875, -1.2927093505859375, -1.233978271484375, -1.1752471923828125, -1.11651611328125, -1.0577850341796875, -0.999053955078125, -0.9403228759765625, -0.881591796875, -0.8228607177734375, -0.764129638671875, -0.7053985595703125, -0.64666748046875, -0.5879364013671875, -0.529205322265625, -0.4704742431640625, -0.4117431640625, -0.3530120849609375, -0.294281005859375, -0.2355499267578125, -0.17681884765625, -0.1180877685546875, -0.059356689453125, -0.0006256103515625, 0.05810546875, 0.1168365478515625, 0.175567626953125, 0.2342987060546875, 0.29302978515625, 0.3517608642578125, 0.410491943359375, 0.4692230224609375, 0.5279541015625, 0.5866851806640625, 0.645416259765625, 0.7041473388671875, 0.76287841796875, 0.8216094970703125, 0.880340576171875, 0.9390716552734375, 0.997802734375, 1.0565338134765625, 1.115264892578125, 1.1739959716796875, 1.23272705078125, 1.2914581298828125, 1.350189208984375, 1.4089202880859375, 1.4676513671875, 1.5263824462890625, 1.585113525390625, 1.6438446044921875, 1.70257568359375, 1.7613067626953125, 1.820037841796875, 1.8787689208984375, 1.9375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 5.0, 10.0, 3.0, 11.0, 15.0, 11.0, 27.0, 27.0, 39.0, 49.0, 63.0, 93.0, 120.0, 128.0, 110.0, 66.0, 49.0, 39.0, 33.0, 17.0, 14.0, 7.0, 15.0, 10.0, 9.0, 8.0, 4.0, 3.0, 1.0, 4.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.049713134765625, -0.04811239242553711, -0.04651165008544922, -0.04491090774536133, -0.04331016540527344, -0.04170942306518555, -0.040108680725097656, -0.038507938385009766, -0.036907196044921875, -0.035306453704833984, -0.033705711364746094, -0.0321049690246582, -0.030504226684570312, -0.028903484344482422, -0.02730274200439453, -0.02570199966430664, -0.02410125732421875, -0.02250051498413086, -0.02089977264404297, -0.019299030303955078, -0.017698287963867188, -0.016097545623779297, -0.014496803283691406, -0.012896060943603516, -0.011295318603515625, -0.009694576263427734, -0.008093833923339844, -0.006493091583251953, -0.0048923492431640625, -0.003291606903076172, -0.0016908645629882812, -9.012222290039062e-05, 0.0015106201171875, 0.0031113624572753906, 0.004712104797363281, 0.006312847137451172, 0.007913589477539062, 0.009514331817626953, 0.011115074157714844, 0.012715816497802734, 0.014316558837890625, 0.015917301177978516, 0.017518043518066406, 0.019118785858154297, 0.020719528198242188, 0.022320270538330078, 0.02392101287841797, 0.02552175521850586, 0.02712249755859375, 0.02872323989868164, 0.03032398223876953, 0.03192472457885742, 0.03352546691894531, 0.0351262092590332, 0.036726951599121094, 0.038327693939208984, 0.039928436279296875, 0.041529178619384766, 0.043129920959472656, 0.04473066329956055, 0.04633140563964844, 0.04793214797973633, 0.04953289031982422, 0.05113363265991211, 0.052734375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 1.0, 4.0, 7.0, 5.0, 4.0, 10.0, 12.0, 10.0, 20.0, 26.0, 29.0, 31.0, 49.0, 79.0, 115.0, 203.0, 343.0, 1079.0, 972386.0, 72522.0, 795.0, 289.0, 177.0, 100.0, 75.0, 46.0, 33.0, 21.0, 24.0, 12.0, 11.0, 7.0, 3.0, 4.0, 5.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0283203125, -0.9970626831054688, -0.9658050537109375, -0.9345474243164062, -0.903289794921875, -0.8720321655273438, -0.8407745361328125, -0.8095169067382812, -0.77825927734375, -0.7470016479492188, -0.7157440185546875, -0.6844863891601562, -0.653228759765625, -0.6219711303710938, -0.5907135009765625, -0.5594558715820312, -0.5281982421875, -0.49694061279296875, -0.4656829833984375, -0.43442535400390625, -0.403167724609375, -0.37191009521484375, -0.3406524658203125, -0.30939483642578125, -0.27813720703125, -0.24687957763671875, -0.2156219482421875, -0.18436431884765625, -0.153106689453125, -0.12184906005859375, -0.0905914306640625, -0.05933380126953125, -0.028076171875, 0.00318145751953125, 0.0344390869140625, 0.06569671630859375, 0.096954345703125, 0.12821197509765625, 0.1594696044921875, 0.19072723388671875, 0.22198486328125, 0.25324249267578125, 0.2845001220703125, 0.31575775146484375, 0.347015380859375, 0.37827301025390625, 0.4095306396484375, 0.44078826904296875, 0.4720458984375, 0.5033035278320312, 0.5345611572265625, 0.5658187866210938, 0.597076416015625, 0.6283340454101562, 0.6595916748046875, 0.6908493041992188, 0.72210693359375, 0.7533645629882812, 0.7846221923828125, 0.8158798217773438, 0.847137451171875, 0.8783950805664062, 0.9096527099609375, 0.9409103393554688, 0.97216796875]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1004.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.24563029408454895, -0.2198905050754547, -0.19415071606636047, -0.16841092705726624, -0.142671138048172, -0.11693136394023895, -0.09119157493114471, -0.06545178592205048, -0.03971199691295624, -0.013972209766507149, 0.01176757737994194, 0.03750736266374588, 0.06324715167284012, 0.08898693323135376, 0.114726722240448, 0.14046651124954224, 0.16620630025863647, 0.1919460892677307, 0.21768587827682495, 0.2434256672859192, 0.2691654562950134, 0.29490524530410767, 0.3206450343132019, 0.34638482332229614, 0.3721246123313904, 0.3978644013404846, 0.42360419034957886, 0.4493439793586731, 0.47508376836776733, 0.5008235573768616, 0.5265633463859558, 0.55230313539505, 0.5780429244041443, 0.6037827134132385, 0.6295225024223328, 0.655262291431427, 0.6810020804405212, 0.7067418694496155, 0.7324816584587097, 0.758221447467804, 0.7839612364768982, 0.8097010254859924, 0.8354408144950867, 0.8611806035041809, 0.8869203925132751, 0.9126601815223694, 0.9383999705314636, 0.9641397595405579, 0.9898794889450073, 1.0156192779541016, 1.0413590669631958, 1.06709885597229, 1.0928386449813843, 1.1185784339904785, 1.1443182229995728, 1.170058012008667, 1.1957978010177612, 1.2215375900268555, 1.2472773790359497, 1.273017168045044, 1.2987569570541382, 1.3244967460632324, 1.3502365350723267, 1.375976324081421, 1.4017161130905151]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 6.0, 6.0, 20.0, 19.0, 23.0, 18.0, 20.0, 28.0, 46.0, 43.0, 39.0, 56.0, 56.0, 50.0, 44.0, 38.0, 44.0, 51.0, 54.0, 45.0, 53.0, 38.0, 32.0, 37.0, 35.0, 24.0, 18.0, 15.0, 17.0, 6.0, 9.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06911146640777588, -0.06712162494659424, -0.0651317909359932, -0.06314194947481155, -0.06115211173892021, -0.05916227400302887, -0.05717243254184723, -0.05518259480595589, -0.053192757070064545, -0.0512029193341732, -0.04921308159828186, -0.04722324013710022, -0.04523340240120888, -0.043243564665317535, -0.041253723204135895, -0.03926388546824455, -0.03727404773235321, -0.03528420999646187, -0.033294372260570526, -0.031304530799388885, -0.029314693063497543, -0.0273248553276062, -0.02533501572906971, -0.02334517613053322, -0.021355338394641876, -0.019365500658750534, -0.017375661060214043, -0.015385822393000126, -0.013395983725786209, -0.011406145058572292, -0.009416306391358376, -0.007426467724144459, -0.005436629056930542, -0.003446790389716625, -0.0014569517225027084, 0.0005328869447112083, 0.002522725611925125, 0.004512564279139042, 0.006502402946352959, 0.008492241613566875, 0.010482080280780792, 0.012471918947994709, 0.014461757615208626, 0.016451597213745117, 0.01844143494963646, 0.0204312726855278, 0.022421112284064293, 0.024410951882600784, 0.026400789618492126, 0.02839062735438347, 0.03038046695291996, 0.03237030655145645, 0.034360144287347794, 0.036349982023239136, 0.038339823484420776, 0.04032966122031212, 0.04231949895620346, 0.0443093366920948, 0.046299174427986145, 0.048289015889167786, 0.05027885362505913, 0.05226869136095047, 0.05425853282213211, 0.05624837055802345, 0.058238208293914795]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 5.0, 8.0, 5.0, 4.0, 4.0, 13.0, 10.0, 15.0, 16.0, 19.0, 18.0, 22.0, 24.0, 30.0, 33.0, 31.0, 25.0, 53.0, 25.0, 45.0, 54.0, 40.0, 38.0, 50.0, 38.0, 52.0, 40.0, 41.0, 42.0, 21.0, 26.0, 22.0, 31.0, 20.0, 19.0, 15.0, 9.0, 8.0, 7.0, 3.0, 3.0, 8.0, 4.0, 3.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-20.9375, -20.236572265625, -19.53564453125, -18.834716796875, -18.1337890625, -17.432861328125, -16.73193359375, -16.031005859375, -15.330078125, -14.629150390625, -13.92822265625, -13.227294921875, -12.5263671875, -11.825439453125, -11.12451171875, -10.423583984375, -9.72265625, -9.021728515625, -8.32080078125, -7.619873046875, -6.9189453125, -6.218017578125, -5.51708984375, -4.816162109375, -4.115234375, -3.414306640625, -2.71337890625, -2.012451171875, -1.3115234375, -0.610595703125, 0.09033203125, 0.791259765625, 1.4921875, 2.193115234375, 2.89404296875, 3.594970703125, 4.2958984375, 4.996826171875, 5.69775390625, 6.398681640625, 7.099609375, 7.800537109375, 8.50146484375, 9.202392578125, 9.9033203125, 10.604248046875, 11.30517578125, 12.006103515625, 12.70703125, 13.407958984375, 14.10888671875, 14.809814453125, 15.5107421875, 16.211669921875, 16.91259765625, 17.613525390625, 18.314453125, 19.015380859375, 19.71630859375, 20.417236328125, 21.1181640625, 21.819091796875, 22.52001953125, 23.220947265625, 23.921875]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 13.0, 15.0, 26.0, 30.0, 55.0, 98.0, 122.0, 188.0, 314.0, 549.0, 930.0, 1758.0, 3366.0, 7133.0, 15800.0, 41939.0, 146871.0, 570768.0, 177394.0, 47736.0, 17530.0, 7736.0, 3657.0, 1891.0, 1055.0, 590.0, 339.0, 204.0, 136.0, 95.0, 56.0, 35.0, 27.0, 17.0, 8.0, 14.0, 10.0, 2.0, 5.0, 5.0, 4.0, 2.0, 4.0, 0.0, 4.0, 0.0, 1.0], "bins": [-39.875, -38.72119140625, -37.5673828125, -36.41357421875, -35.259765625, -34.10595703125, -32.9521484375, -31.79833984375, -30.64453125, -29.49072265625, -28.3369140625, -27.18310546875, -26.029296875, -24.87548828125, -23.7216796875, -22.56787109375, -21.4140625, -20.26025390625, -19.1064453125, -17.95263671875, -16.798828125, -15.64501953125, -14.4912109375, -13.33740234375, -12.18359375, -11.02978515625, -9.8759765625, -8.72216796875, -7.568359375, -6.41455078125, -5.2607421875, -4.10693359375, -2.953125, -1.79931640625, -0.6455078125, 0.50830078125, 1.662109375, 2.81591796875, 3.9697265625, 5.12353515625, 6.27734375, 7.43115234375, 8.5849609375, 9.73876953125, 10.892578125, 12.04638671875, 13.2001953125, 14.35400390625, 15.5078125, 16.66162109375, 17.8154296875, 18.96923828125, 20.123046875, 21.27685546875, 22.4306640625, 23.58447265625, 24.73828125, 25.89208984375, 27.0458984375, 28.19970703125, 29.353515625, 30.50732421875, 31.6611328125, 32.81494140625, 33.96875]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 7.0, 4.0, 5.0, 7.0, 12.0, 10.0, 18.0, 24.0, 26.0, 33.0, 39.0, 38.0, 42.0, 61.0, 75.0, 118.0, 249.0, 1599.0, 193.0, 102.0, 89.0, 51.0, 48.0, 34.0, 36.0, 25.0, 25.0, 23.0, 15.0, 15.0, 6.0, 10.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.0, -71.6357421875, -69.271484375, -66.9072265625, -64.54296875, -62.1787109375, -59.814453125, -57.4501953125, -55.0859375, -52.7216796875, -50.357421875, -47.9931640625, -45.62890625, -43.2646484375, -40.900390625, -38.5361328125, -36.171875, -33.8076171875, -31.443359375, -29.0791015625, -26.71484375, -24.3505859375, -21.986328125, -19.6220703125, -17.2578125, -14.8935546875, -12.529296875, -10.1650390625, -7.80078125, -5.4365234375, -3.072265625, -0.7080078125, 1.65625, 4.0205078125, 6.384765625, 8.7490234375, 11.11328125, 13.4775390625, 15.841796875, 18.2060546875, 20.5703125, 22.9345703125, 25.298828125, 27.6630859375, 30.02734375, 32.3916015625, 34.755859375, 37.1201171875, 39.484375, 41.8486328125, 44.212890625, 46.5771484375, 48.94140625, 51.3056640625, 53.669921875, 56.0341796875, 58.3984375, 60.7626953125, 63.126953125, 65.4912109375, 67.85546875, 70.2197265625, 72.583984375, 74.9482421875, 77.3125]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 3.0, 3.0, 6.0, 5.0, 12.0, 16.0, 10.0, 22.0, 19.0, 29.0, 48.0, 65.0, 103.0, 151.0, 259.0, 606.0, 2298.0, 22131.0, 2664812.0, 440912.0, 11646.0, 1455.0, 460.0, 235.0, 115.0, 80.0, 53.0, 40.0, 31.0, 20.0, 10.0, 13.0, 14.0, 6.0, 6.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.4375, -95.5947265625, -91.751953125, -87.9091796875, -84.06640625, -80.2236328125, -76.380859375, -72.5380859375, -68.6953125, -64.8525390625, -61.009765625, -57.1669921875, -53.32421875, -49.4814453125, -45.638671875, -41.7958984375, -37.953125, -34.1103515625, -30.267578125, -26.4248046875, -22.58203125, -18.7392578125, -14.896484375, -11.0537109375, -7.2109375, -3.3681640625, 0.474609375, 4.3173828125, 8.16015625, 12.0029296875, 15.845703125, 19.6884765625, 23.53125, 27.3740234375, 31.216796875, 35.0595703125, 38.90234375, 42.7451171875, 46.587890625, 50.4306640625, 54.2734375, 58.1162109375, 61.958984375, 65.8017578125, 69.64453125, 73.4873046875, 77.330078125, 81.1728515625, 85.015625, 88.8583984375, 92.701171875, 96.5439453125, 100.38671875, 104.2294921875, 108.072265625, 111.9150390625, 115.7578125, 119.6005859375, 123.443359375, 127.2861328125, 131.12890625, 134.9716796875, 138.814453125, 142.6572265625, 146.5]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 18.0, 104.0, 368.0, 348.0, 135.0, 32.0, 4.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.8460693359375, -102.3260726928711, -93.80607604980469, -85.28608703613281, -76.7660903930664, -68.24609375, -59.72610092163086, -51.20610809326172, -42.68611145019531, -34.166114807128906, -25.646121978759766, -17.126127243041992, -8.606132507324219, -0.0861358642578125, 8.433856964111328, 16.95384979248047, 25.473846435546875, 33.99384307861328, 42.51383590698242, 51.03382873535156, 59.55382537841797, 68.07382202148438, 76.59381103515625, 85.11380767822266, 93.63380432128906, 102.15380096435547, 110.67379760742188, 119.19378662109375, 127.71378326416016, 136.23377990722656, 144.75376892089844, 153.27377319335938, 161.79376220703125, 170.31375122070312, 178.83375549316406, 187.35374450683594, 195.87374877929688, 204.39373779296875, 212.91372680664062, 221.4337158203125, 229.95372009277344, 238.4737091064453, 246.99371337890625, 255.51370239257812, 264.03369140625, 272.5537109375, 281.0736999511719, 289.59368896484375, 298.1136779785156, 306.6336669921875, 315.1536560058594, 323.6736755371094, 332.19366455078125, 340.7136535644531, 349.233642578125, 357.7536315917969, 366.27362060546875, 374.7936096191406, 383.3135986328125, 391.8336181640625, 400.3536071777344, 408.87359619140625, 417.3935852050781, 425.91357421875, 434.43359375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 4.0, 1.0, 9.0, 4.0, 7.0, 9.0, 7.0, 10.0, 12.0, 13.0, 22.0, 26.0, 15.0, 21.0, 30.0, 26.0, 34.0, 33.0, 35.0, 44.0, 27.0, 43.0, 41.0, 33.0, 38.0, 33.0, 43.0, 37.0, 38.0, 42.0, 29.0, 20.0, 34.0, 24.0, 29.0, 20.0, 17.0, 13.0, 10.0, 19.0, 13.0, 4.0, 11.0, 6.0, 10.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-115.88993835449219, -112.15206909179688, -108.41419219970703, -104.67632293701172, -100.93844604492188, -97.20057678222656, -93.46270751953125, -89.7248306274414, -85.98695373535156, -82.24908447265625, -78.5112075805664, -74.7733383178711, -71.03546142578125, -67.29759216308594, -63.55971908569336, -59.82184600830078, -56.08397674560547, -52.34610366821289, -48.60823059082031, -44.870361328125, -41.132484436035156, -37.394615173339844, -33.656742095947266, -29.918869018554688, -26.18099594116211, -22.44312286376953, -18.705249786376953, -14.967378616333008, -11.22950553894043, -7.491632461547852, -3.7537612915039062, -0.015888214111328125, 3.7219924926757812, 7.459865093231201, 11.197737693786621, 14.935609817504883, 18.67348289489746, 22.41135597229004, 26.149227142333984, 29.887100219726562, 33.62497329711914, 37.36284637451172, 41.1007194519043, 44.838592529296875, 48.57646179199219, 52.31433868408203, 56.052207946777344, 59.79008102416992, 63.5279541015625, 67.26582336425781, 71.00370025634766, 74.74156951904297, 78.47944641113281, 82.21731567382812, 85.95518493652344, 89.69306182861328, 93.43093872070312, 97.16880798339844, 100.90668487548828, 104.6445541381836, 108.38243103027344, 112.12030029296875, 115.85816955566406, 119.5960464477539, 123.33391571044922]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 1.0, 1.0, 3.0, 12.0, 8.0, 7.0, 11.0, 14.0, 13.0, 10.0, 12.0, 16.0, 15.0, 21.0, 21.0, 28.0, 28.0, 31.0, 34.0, 40.0, 38.0, 37.0, 47.0, 29.0, 36.0, 34.0, 39.0, 53.0, 44.0, 40.0, 42.0, 34.0, 19.0, 40.0, 23.0, 23.0, 19.0, 13.0, 17.0, 8.0, 10.0, 4.0, 6.0, 5.0, 5.0, 4.0, 4.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-21.265625, -20.583251953125, -19.90087890625, -19.218505859375, -18.5361328125, -17.853759765625, -17.17138671875, -16.489013671875, -15.806640625, -15.124267578125, -14.44189453125, -13.759521484375, -13.0771484375, -12.394775390625, -11.71240234375, -11.030029296875, -10.34765625, -9.665283203125, -8.98291015625, -8.300537109375, -7.6181640625, -6.935791015625, -6.25341796875, -5.571044921875, -4.888671875, -4.206298828125, -3.52392578125, -2.841552734375, -2.1591796875, -1.476806640625, -0.79443359375, -0.112060546875, 0.5703125, 1.252685546875, 1.93505859375, 2.617431640625, 3.2998046875, 3.982177734375, 4.66455078125, 5.346923828125, 6.029296875, 6.711669921875, 7.39404296875, 8.076416015625, 8.7587890625, 9.441162109375, 10.12353515625, 10.805908203125, 11.48828125, 12.170654296875, 12.85302734375, 13.535400390625, 14.2177734375, 14.900146484375, 15.58251953125, 16.264892578125, 16.947265625, 17.629638671875, 18.31201171875, 18.994384765625, 19.6767578125, 20.359130859375, 21.04150390625, 21.723876953125, 22.40625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 6.0, 8.0, 12.0, 11.0, 18.0, 24.0, 29.0, 21.0, 46.0, 60.0, 65.0, 92.0, 104.0, 179.0, 228.0, 476.0, 1445.0, 7704.0, 901076.0, 3267048.0, 12320.0, 1781.0, 537.0, 247.0, 201.0, 115.0, 92.0, 64.0, 71.0, 32.0, 31.0, 23.0, 18.0, 16.0, 21.0, 16.0, 5.0, 7.0, 6.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-175.875, -170.716796875, -165.55859375, -160.400390625, -155.2421875, -150.083984375, -144.92578125, -139.767578125, -134.609375, -129.451171875, -124.29296875, -119.134765625, -113.9765625, -108.818359375, -103.66015625, -98.501953125, -93.34375, -88.185546875, -83.02734375, -77.869140625, -72.7109375, -67.552734375, -62.39453125, -57.236328125, -52.078125, -46.919921875, -41.76171875, -36.603515625, -31.4453125, -26.287109375, -21.12890625, -15.970703125, -10.8125, -5.654296875, -0.49609375, 4.662109375, 9.8203125, 14.978515625, 20.13671875, 25.294921875, 30.453125, 35.611328125, 40.76953125, 45.927734375, 51.0859375, 56.244140625, 61.40234375, 66.560546875, 71.71875, 76.876953125, 82.03515625, 87.193359375, 92.3515625, 97.509765625, 102.66796875, 107.826171875, 112.984375, 118.142578125, 123.30078125, 128.458984375, 133.6171875, 138.775390625, 143.93359375, 149.091796875, 154.25]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 2.0, 2.0, 12.0, 8.0, 12.0, 14.0, 22.0, 31.0, 51.0, 66.0, 66.0, 136.0, 228.0, 445.0, 1056.0, 974.0, 457.0, 209.0, 100.0, 63.0, 31.0, 18.0, 24.0, 12.0, 15.0, 3.0, 0.0, 3.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.78125, -44.07861328125, -42.3759765625, -40.67333984375, -38.970703125, -37.26806640625, -35.5654296875, -33.86279296875, -32.16015625, -30.45751953125, -28.7548828125, -27.05224609375, -25.349609375, -23.64697265625, -21.9443359375, -20.24169921875, -18.5390625, -16.83642578125, -15.1337890625, -13.43115234375, -11.728515625, -10.02587890625, -8.3232421875, -6.62060546875, -4.91796875, -3.21533203125, -1.5126953125, 0.18994140625, 1.892578125, 3.59521484375, 5.2978515625, 7.00048828125, 8.703125, 10.40576171875, 12.1083984375, 13.81103515625, 15.513671875, 17.21630859375, 18.9189453125, 20.62158203125, 22.32421875, 24.02685546875, 25.7294921875, 27.43212890625, 29.134765625, 30.83740234375, 32.5400390625, 34.24267578125, 35.9453125, 37.64794921875, 39.3505859375, 41.05322265625, 42.755859375, 44.45849609375, 46.1611328125, 47.86376953125, 49.56640625, 51.26904296875, 52.9716796875, 54.67431640625, 56.376953125, 58.07958984375, 59.7822265625, 61.48486328125, 63.1875]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 1.0, 3.0, 4.0, 3.0, 7.0, 15.0, 10.0, 24.0, 27.0, 34.0, 42.0, 90.0, 125.0, 250.0, 467.0, 999.0, 2883.0, 10719.0, 67212.0, 3232503.0, 831108.0, 36656.0, 7045.0, 2133.0, 851.0, 437.0, 219.0, 133.0, 86.0, 61.0, 35.0, 29.0, 19.0, 17.0, 11.0, 8.0, 9.0, 4.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-83.9375, -80.8134765625, -77.689453125, -74.5654296875, -71.44140625, -68.3173828125, -65.193359375, -62.0693359375, -58.9453125, -55.8212890625, -52.697265625, -49.5732421875, -46.44921875, -43.3251953125, -40.201171875, -37.0771484375, -33.953125, -30.8291015625, -27.705078125, -24.5810546875, -21.45703125, -18.3330078125, -15.208984375, -12.0849609375, -8.9609375, -5.8369140625, -2.712890625, 0.4111328125, 3.53515625, 6.6591796875, 9.783203125, 12.9072265625, 16.03125, 19.1552734375, 22.279296875, 25.4033203125, 28.52734375, 31.6513671875, 34.775390625, 37.8994140625, 41.0234375, 44.1474609375, 47.271484375, 50.3955078125, 53.51953125, 56.6435546875, 59.767578125, 62.8916015625, 66.015625, 69.1396484375, 72.263671875, 75.3876953125, 78.51171875, 81.6357421875, 84.759765625, 87.8837890625, 91.0078125, 94.1318359375, 97.255859375, 100.3798828125, 103.50390625, 106.6279296875, 109.751953125, 112.8759765625, 116.0]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 11.0, 41.0, 217.0, 495.0, 192.0, 45.0, 10.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-288.56854248046875, -271.14715576171875, -253.72573852539062, -236.30433654785156, -218.8829345703125, -201.46153259277344, -184.04013061523438, -166.6187286376953, -149.19732666015625, -131.7759246826172, -114.35452270507812, -96.93312072753906, -79.51171875, -62.09031677246094, -44.668914794921875, -27.247512817382812, -9.82611083984375, 7.5952911376953125, 25.016693115234375, 42.43809509277344, 59.8594970703125, 77.28089904785156, 94.70230102539062, 112.12370300292969, 129.54510498046875, 146.9665069580078, 164.38790893554688, 181.80931091308594, 199.230712890625, 216.65211486816406, 234.07351684570312, 251.4949188232422, 268.9163818359375, 286.3377685546875, 303.7591857910156, 321.18060302734375, 338.60198974609375, 356.02337646484375, 373.4447937011719, 390.8662109375, 408.28759765625, 425.708984375, 443.1304016113281, 460.55181884765625, 477.97320556640625, 495.39459228515625, 512.8160400390625, 530.2374267578125, 547.6588134765625, 565.0802001953125, 582.5015869140625, 599.9230346679688, 617.3444213867188, 634.7658081054688, 652.187255859375, 669.608642578125, 687.030029296875, 704.451416015625, 721.872802734375, 739.2942504882812, 756.7156372070312, 774.1370239257812, 791.5584716796875, 808.9798583984375, 826.4012451171875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 4.0, 0.0, 0.0, 2.0, 1.0, 10.0, 3.0, 10.0, 11.0, 16.0, 12.0, 15.0, 15.0, 13.0, 23.0, 22.0, 34.0, 35.0, 29.0, 35.0, 39.0, 44.0, 33.0, 35.0, 36.0, 40.0, 35.0, 37.0, 64.0, 44.0, 34.0, 32.0, 28.0, 42.0, 28.0, 18.0, 21.0, 21.0, 12.0, 10.0, 9.0, 16.0, 7.0, 13.0, 6.0, 2.0, 5.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-118.70956420898438, -114.91063690185547, -111.11170959472656, -107.31278228759766, -103.51385498046875, -99.71492767333984, -95.91600036621094, -92.11707305908203, -88.31814575195312, -84.51921844482422, -80.72029113769531, -76.9213638305664, -73.1224365234375, -69.3235092163086, -65.52458190917969, -61.72565460205078, -57.926727294921875, -54.12779998779297, -50.32887268066406, -46.529945373535156, -42.73101806640625, -38.932090759277344, -35.13316345214844, -31.33423614501953, -27.535308837890625, -23.73638153076172, -19.937454223632812, -16.138526916503906, -12.339599609375, -8.540672302246094, -4.7417449951171875, -0.9428176879882812, 2.856109619140625, 6.655036926269531, 10.453964233398438, 14.252891540527344, 18.05181884765625, 21.850746154785156, 25.649673461914062, 29.44860076904297, 33.247528076171875, 37.04645538330078, 40.84538269042969, 44.644309997558594, 48.4432373046875, 52.242164611816406, 56.04109191894531, 59.84001922607422, 63.638946533203125, 67.43787384033203, 71.23680114746094, 75.03572845458984, 78.83465576171875, 82.63358306884766, 86.43251037597656, 90.23143768310547, 94.03036499023438, 97.82929229736328, 101.62821960449219, 105.4271469116211, 109.22607421875, 113.0250015258789, 116.82392883300781, 120.62285614013672, 124.42178344726562]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 6.0, 6.0, 13.0, 12.0, 12.0, 10.0, 15.0, 13.0, 23.0, 18.0, 25.0, 21.0, 26.0, 26.0, 27.0, 34.0, 32.0, 32.0, 40.0, 33.0, 38.0, 37.0, 46.0, 37.0, 36.0, 36.0, 48.0, 30.0, 39.0, 23.0, 22.0, 28.0, 32.0, 21.0, 21.0, 20.0, 14.0, 13.0, 10.0, 11.0, 7.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.265625, -21.560791015625, -20.85595703125, -20.151123046875, -19.4462890625, -18.741455078125, -18.03662109375, -17.331787109375, -16.626953125, -15.922119140625, -15.21728515625, -14.512451171875, -13.8076171875, -13.102783203125, -12.39794921875, -11.693115234375, -10.98828125, -10.283447265625, -9.57861328125, -8.873779296875, -8.1689453125, -7.464111328125, -6.75927734375, -6.054443359375, -5.349609375, -4.644775390625, -3.93994140625, -3.235107421875, -2.5302734375, -1.825439453125, -1.12060546875, -0.415771484375, 0.2890625, 0.993896484375, 1.69873046875, 2.403564453125, 3.1083984375, 3.813232421875, 4.51806640625, 5.222900390625, 5.927734375, 6.632568359375, 7.33740234375, 8.042236328125, 8.7470703125, 9.451904296875, 10.15673828125, 10.861572265625, 11.56640625, 12.271240234375, 12.97607421875, 13.680908203125, 14.3857421875, 15.090576171875, 15.79541015625, 16.500244140625, 17.205078125, 17.909912109375, 18.61474609375, 19.319580078125, 20.0244140625, 20.729248046875, 21.43408203125, 22.138916015625, 22.84375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 11.0, 17.0, 16.0, 41.0, 56.0, 95.0, 110.0, 166.0, 278.0, 407.0, 578.0, 824.0, 1185.0, 1679.0, 2396.0, 3631.0, 5273.0, 8049.0, 11903.0, 18730.0, 29201.0, 46435.0, 74572.0, 118374.0, 179513.0, 189826.0, 130229.0, 81713.0, 50739.0, 31750.0, 20693.0, 13172.0, 8622.0, 5779.0, 3951.0, 2743.0, 1820.0, 1226.0, 875.0, 572.0, 443.0, 282.0, 199.0, 155.0, 81.0, 43.0, 41.0, 25.0, 16.0, 10.0, 6.0, 6.0, 4.0, 3.0, 1.0, 1.0], "bins": [-2.701171875, -2.61956787109375, -2.5379638671875, -2.45635986328125, -2.374755859375, -2.29315185546875, -2.2115478515625, -2.12994384765625, -2.04833984375, -1.96673583984375, -1.8851318359375, -1.80352783203125, -1.721923828125, -1.64031982421875, -1.5587158203125, -1.47711181640625, -1.3955078125, -1.31390380859375, -1.2322998046875, -1.15069580078125, -1.069091796875, -0.98748779296875, -0.9058837890625, -0.82427978515625, -0.74267578125, -0.66107177734375, -0.5794677734375, -0.49786376953125, -0.416259765625, -0.33465576171875, -0.2530517578125, -0.17144775390625, -0.08984375, -0.00823974609375, 0.0733642578125, 0.15496826171875, 0.236572265625, 0.31817626953125, 0.3997802734375, 0.48138427734375, 0.56298828125, 0.64459228515625, 0.7261962890625, 0.80780029296875, 0.889404296875, 0.97100830078125, 1.0526123046875, 1.13421630859375, 1.2158203125, 1.29742431640625, 1.3790283203125, 1.46063232421875, 1.542236328125, 1.62384033203125, 1.7054443359375, 1.78704833984375, 1.86865234375, 1.95025634765625, 2.0318603515625, 2.11346435546875, 2.195068359375, 2.27667236328125, 2.3582763671875, 2.43988037109375, 2.521484375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 7.0, 2.0, 3.0, 7.0, 9.0, 10.0, 12.0, 18.0, 15.0, 18.0, 21.0, 22.0, 34.0, 17.0, 26.0, 36.0, 35.0, 36.0, 35.0, 30.0, 43.0, 56.0, 1059.0, 43.0, 45.0, 49.0, 21.0, 33.0, 34.0, 27.0, 33.0, 22.0, 24.0, 22.0, 21.0, 18.0, 15.0, 11.0, 8.0, 19.0, 11.0, 5.0, 4.0, 5.0, 6.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0], "bins": [-15.328125, -14.875244140625, -14.42236328125, -13.969482421875, -13.5166015625, -13.063720703125, -12.61083984375, -12.157958984375, -11.705078125, -11.252197265625, -10.79931640625, -10.346435546875, -9.8935546875, -9.440673828125, -8.98779296875, -8.534912109375, -8.08203125, -7.629150390625, -7.17626953125, -6.723388671875, -6.2705078125, -5.817626953125, -5.36474609375, -4.911865234375, -4.458984375, -4.006103515625, -3.55322265625, -3.100341796875, -2.6474609375, -2.194580078125, -1.74169921875, -1.288818359375, -0.8359375, -0.383056640625, 0.06982421875, 0.522705078125, 0.9755859375, 1.428466796875, 1.88134765625, 2.334228515625, 2.787109375, 3.239990234375, 3.69287109375, 4.145751953125, 4.5986328125, 5.051513671875, 5.50439453125, 5.957275390625, 6.41015625, 6.863037109375, 7.31591796875, 7.768798828125, 8.2216796875, 8.674560546875, 9.12744140625, 9.580322265625, 10.033203125, 10.486083984375, 10.93896484375, 11.391845703125, 11.8447265625, 12.297607421875, 12.75048828125, 13.203369140625, 13.65625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 3.0, 6.0, 16.0, 10.0, 22.0, 34.0, 53.0, 77.0, 135.0, 188.0, 277.0, 407.0, 598.0, 988.0, 1469.0, 2124.0, 3474.0, 5430.0, 8150.0, 13151.0, 21253.0, 35339.0, 59454.0, 102178.0, 173012.0, 1268764.0, 161428.0, 95120.0, 56042.0, 33496.0, 19994.0, 12447.0, 7715.0, 4991.0, 3232.0, 2102.0, 1311.0, 898.0, 571.0, 406.0, 252.0, 170.0, 100.0, 89.0, 50.0, 35.0, 25.0, 17.0, 12.0, 7.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.189453125, -2.1219482421875, -2.054443359375, -1.9869384765625, -1.91943359375, -1.8519287109375, -1.784423828125, -1.7169189453125, -1.6494140625, -1.5819091796875, -1.514404296875, -1.4468994140625, -1.37939453125, -1.3118896484375, -1.244384765625, -1.1768798828125, -1.109375, -1.0418701171875, -0.974365234375, -0.9068603515625, -0.83935546875, -0.7718505859375, -0.704345703125, -0.6368408203125, -0.5693359375, -0.5018310546875, -0.434326171875, -0.3668212890625, -0.29931640625, -0.2318115234375, -0.164306640625, -0.0968017578125, -0.029296875, 0.0382080078125, 0.105712890625, 0.1732177734375, 0.24072265625, 0.3082275390625, 0.375732421875, 0.4432373046875, 0.5107421875, 0.5782470703125, 0.645751953125, 0.7132568359375, 0.78076171875, 0.8482666015625, 0.915771484375, 0.9832763671875, 1.05078125, 1.1182861328125, 1.185791015625, 1.2532958984375, 1.32080078125, 1.3883056640625, 1.455810546875, 1.5233154296875, 1.5908203125, 1.6583251953125, 1.725830078125, 1.7933349609375, 1.86083984375, 1.9283447265625, 1.995849609375, 2.0633544921875, 2.130859375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 6.0, 6.0, 4.0, 6.0, 7.0, 16.0, 9.0, 20.0, 29.0, 29.0, 51.0, 52.0, 75.0, 80.0, 98.0, 82.0, 77.0, 70.0, 66.0, 58.0, 32.0, 33.0, 24.0, 15.0, 9.0, 12.0, 5.0, 11.0, 7.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.035552978515625, -0.03436851501464844, -0.033184051513671875, -0.03199958801269531, -0.03081512451171875, -0.029630661010742188, -0.028446197509765625, -0.027261734008789062, -0.0260772705078125, -0.024892807006835938, -0.023708343505859375, -0.022523880004882812, -0.02133941650390625, -0.020154953002929688, -0.018970489501953125, -0.017786026000976562, -0.0166015625, -0.015417098999023438, -0.014232635498046875, -0.013048171997070312, -0.01186370849609375, -0.010679244995117188, -0.009494781494140625, -0.008310317993164062, -0.0071258544921875, -0.0059413909912109375, -0.004756927490234375, -0.0035724639892578125, -0.00238800048828125, -0.0012035369873046875, -1.9073486328125e-05, 0.0011653900146484375, 0.002349853515625, 0.0035343170166015625, 0.004718780517578125, 0.0059032440185546875, 0.00708770751953125, 0.008272171020507812, 0.009456634521484375, 0.010641098022460938, 0.0118255615234375, 0.013010025024414062, 0.014194488525390625, 0.015378952026367188, 0.01656341552734375, 0.017747879028320312, 0.018932342529296875, 0.020116806030273438, 0.02130126953125, 0.022485733032226562, 0.023670196533203125, 0.024854660034179688, 0.02603912353515625, 0.027223587036132812, 0.028408050537109375, 0.029592514038085938, 0.0307769775390625, 0.03196144104003906, 0.033145904541015625, 0.03433036804199219, 0.03551483154296875, 0.03669929504394531, 0.037883758544921875, 0.03906822204589844, 0.040252685546875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 4.0, 3.0, 8.0, 10.0, 15.0, 16.0, 24.0, 28.0, 50.0, 58.0, 94.0, 124.0, 234.0, 371.0, 1316.0, 786954.0, 257188.0, 1096.0, 355.0, 208.0, 124.0, 53.0, 57.0, 32.0, 27.0, 23.0, 14.0, 16.0, 13.0, 9.0, 5.0, 9.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.796875, -0.773406982421875, -0.74993896484375, -0.726470947265625, -0.7030029296875, -0.679534912109375, -0.65606689453125, -0.632598876953125, -0.609130859375, -0.585662841796875, -0.56219482421875, -0.538726806640625, -0.5152587890625, -0.491790771484375, -0.46832275390625, -0.444854736328125, -0.42138671875, -0.397918701171875, -0.37445068359375, -0.350982666015625, -0.3275146484375, -0.304046630859375, -0.28057861328125, -0.257110595703125, -0.233642578125, -0.210174560546875, -0.18670654296875, -0.163238525390625, -0.1397705078125, -0.116302490234375, -0.09283447265625, -0.069366455078125, -0.0458984375, -0.022430419921875, 0.00103759765625, 0.024505615234375, 0.0479736328125, 0.071441650390625, 0.09490966796875, 0.118377685546875, 0.141845703125, 0.165313720703125, 0.18878173828125, 0.212249755859375, 0.2357177734375, 0.259185791015625, 0.28265380859375, 0.306121826171875, 0.32958984375, 0.353057861328125, 0.37652587890625, 0.399993896484375, 0.4234619140625, 0.446929931640625, 0.47039794921875, 0.493865966796875, 0.517333984375, 0.540802001953125, 0.56427001953125, 0.587738037109375, 0.6112060546875, 0.634674072265625, 0.65814208984375, 0.681610107421875, 0.705078125]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 20.0, 988.0, 7.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1338716298341751, -0.11262015253305435, -0.0913686752319336, -0.07011719793081284, -0.04886572062969208, -0.02761424332857132, -0.0063627660274505615, 0.014888718724250793, 0.036140188574790955, 0.05739166587591171, 0.07864314317703247, 0.09989462047815323, 0.12114609777927399, 0.14239758253097534, 0.1636490523815155, 0.18490053713321686, 0.20615200698375702, 0.22740349173545837, 0.24865496158599854, 0.2699064314365387, 0.29115790128707886, 0.3124094009399414, 0.33366087079048157, 0.35491234064102173, 0.3761638402938843, 0.39741531014442444, 0.4186667799949646, 0.43991827964782715, 0.4611697494983673, 0.48242121934890747, 0.50367271900177, 0.5249241590499878, 0.5461755990982056, 0.5674270987510681, 0.5886785387992859, 0.6099300384521484, 0.6311814785003662, 0.6524329781532288, 0.6736844778060913, 0.6949359178543091, 0.7161874175071716, 0.7374389171600342, 0.758690357208252, 0.7799418568611145, 0.801193356513977, 0.8224447965621948, 0.8436962962150574, 0.8649477958679199, 0.8861992359161377, 0.9074507355690002, 0.928702175617218, 0.9499536752700806, 0.9712051153182983, 0.9924566149711609, 1.0137081146240234, 1.0349595546722412, 1.056210994720459, 1.0774624347686768, 1.098713994026184, 1.1199654340744019, 1.1412168741226196, 1.162468433380127, 1.1837198734283447, 1.2049713134765625, 1.2262228727340698]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 9.0, 6.0, 8.0, 9.0, 16.0, 13.0, 17.0, 33.0, 33.0, 33.0, 38.0, 50.0, 44.0, 50.0, 59.0, 52.0, 69.0, 55.0, 67.0, 56.0, 41.0, 48.0, 54.0, 32.0, 25.0, 26.0, 8.0, 14.0, 17.0, 6.0, 6.0, 2.0, 1.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05988478660583496, -0.058346085250377655, -0.05680738389492035, -0.055268678814172745, -0.05372997745871544, -0.05219127610325813, -0.05065257102251053, -0.04911386966705322, -0.04757516831159592, -0.04603646695613861, -0.044497765600681305, -0.0429590605199337, -0.041420359164476395, -0.03988165780901909, -0.038342952728271484, -0.03680425137281418, -0.03526555001735687, -0.03372684866189957, -0.03218814730644226, -0.030649442225694656, -0.02911074087023735, -0.027572039514780045, -0.02603333629667759, -0.024494633078575134, -0.02295593172311783, -0.021417230367660522, -0.019878527149558067, -0.018339823931455612, -0.016801122575998306, -0.015262420289218426, -0.013723718002438545, -0.012185015715658665, -0.010646313428878784, -0.009107611142098904, -0.007568908855319023, -0.006030206568539143, -0.004491504281759262, -0.0029528019949793816, -0.001414099708199501, 0.00012460257858037949, 0.00166330486536026, 0.0032020071521401405, 0.004740709438920021, 0.006279411725699902, 0.007818114012479782, 0.009356816299259663, 0.010895518586039543, 0.012434220872819424, 0.013972923159599304, 0.015511625446379185, 0.017050327733159065, 0.01858903095126152, 0.020127732306718826, 0.021666433662176132, 0.023205136880278587, 0.024743840098381042, 0.02628254145383835, 0.027821242809295654, 0.02935994602739811, 0.030898649245500565, 0.03243735060095787, 0.033976051956415176, 0.03551475703716278, 0.03705345839262009, 0.03859215974807739]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 6.0, 6.0, 13.0, 12.0, 12.0, 8.0, 17.0, 13.0, 22.0, 19.0, 25.0, 21.0, 25.0, 27.0, 26.0, 35.0, 31.0, 32.0, 40.0, 34.0, 38.0, 37.0, 46.0, 37.0, 35.0, 37.0, 48.0, 30.0, 39.0, 22.0, 23.0, 28.0, 31.0, 22.0, 21.0, 20.0, 14.0, 13.0, 10.0, 11.0, 7.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-22.28125, -21.576171875, -20.87109375, -20.166015625, -19.4609375, -18.755859375, -18.05078125, -17.345703125, -16.640625, -15.935546875, -15.23046875, -14.525390625, -13.8203125, -13.115234375, -12.41015625, -11.705078125, -11.0, -10.294921875, -9.58984375, -8.884765625, -8.1796875, -7.474609375, -6.76953125, -6.064453125, -5.359375, -4.654296875, -3.94921875, -3.244140625, -2.5390625, -1.833984375, -1.12890625, -0.423828125, 0.28125, 0.986328125, 1.69140625, 2.396484375, 3.1015625, 3.806640625, 4.51171875, 5.216796875, 5.921875, 6.626953125, 7.33203125, 8.037109375, 8.7421875, 9.447265625, 10.15234375, 10.857421875, 11.5625, 12.267578125, 12.97265625, 13.677734375, 14.3828125, 15.087890625, 15.79296875, 16.498046875, 17.203125, 17.908203125, 18.61328125, 19.318359375, 20.0234375, 20.728515625, 21.43359375, 22.138671875, 22.84375]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 6.0, 8.0, 13.0, 18.0, 32.0, 34.0, 63.0, 71.0, 95.0, 138.0, 178.0, 238.0, 378.0, 473.0, 649.0, 950.0, 1332.0, 2228.0, 3814.0, 7418.0, 16654.0, 45688.0, 166016.0, 524844.0, 189389.0, 50948.0, 17912.0, 7821.0, 3921.0, 2322.0, 1434.0, 951.0, 694.0, 553.0, 343.0, 258.0, 191.0, 130.0, 94.0, 69.0, 47.0, 44.0, 21.0, 24.0, 15.0, 13.0, 7.0, 4.0, 4.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0], "bins": [-34.625, -33.56103515625, -32.4970703125, -31.43310546875, -30.369140625, -29.30517578125, -28.2412109375, -27.17724609375, -26.11328125, -25.04931640625, -23.9853515625, -22.92138671875, -21.857421875, -20.79345703125, -19.7294921875, -18.66552734375, -17.6015625, -16.53759765625, -15.4736328125, -14.40966796875, -13.345703125, -12.28173828125, -11.2177734375, -10.15380859375, -9.08984375, -8.02587890625, -6.9619140625, -5.89794921875, -4.833984375, -3.77001953125, -2.7060546875, -1.64208984375, -0.578125, 0.48583984375, 1.5498046875, 2.61376953125, 3.677734375, 4.74169921875, 5.8056640625, 6.86962890625, 7.93359375, 8.99755859375, 10.0615234375, 11.12548828125, 12.189453125, 13.25341796875, 14.3173828125, 15.38134765625, 16.4453125, 17.50927734375, 18.5732421875, 19.63720703125, 20.701171875, 21.76513671875, 22.8291015625, 23.89306640625, 24.95703125, 26.02099609375, 27.0849609375, 28.14892578125, 29.212890625, 30.27685546875, 31.3408203125, 32.40478515625, 33.46875]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 5.0, 11.0, 16.0, 13.0, 24.0, 34.0, 44.0, 34.0, 38.0, 48.0, 60.0, 94.0, 155.0, 1440.0, 439.0, 135.0, 67.0, 43.0, 51.0, 54.0, 44.0, 37.0, 23.0, 21.0, 22.0, 18.0, 12.0, 8.0, 11.0, 4.0, 6.0, 6.0, 6.0, 1.0, 1.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-80.1875, -77.95556640625, -75.7236328125, -73.49169921875, -71.259765625, -69.02783203125, -66.7958984375, -64.56396484375, -62.33203125, -60.10009765625, -57.8681640625, -55.63623046875, -53.404296875, -51.17236328125, -48.9404296875, -46.70849609375, -44.4765625, -42.24462890625, -40.0126953125, -37.78076171875, -35.548828125, -33.31689453125, -31.0849609375, -28.85302734375, -26.62109375, -24.38916015625, -22.1572265625, -19.92529296875, -17.693359375, -15.46142578125, -13.2294921875, -10.99755859375, -8.765625, -6.53369140625, -4.3017578125, -2.06982421875, 0.162109375, 2.39404296875, 4.6259765625, 6.85791015625, 9.08984375, 11.32177734375, 13.5537109375, 15.78564453125, 18.017578125, 20.24951171875, 22.4814453125, 24.71337890625, 26.9453125, 29.17724609375, 31.4091796875, 33.64111328125, 35.873046875, 38.10498046875, 40.3369140625, 42.56884765625, 44.80078125, 47.03271484375, 49.2646484375, 51.49658203125, 53.728515625, 55.96044921875, 58.1923828125, 60.42431640625, 62.65625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 9.0, 3.0, 5.0, 12.0, 15.0, 10.0, 12.0, 25.0, 18.0, 24.0, 39.0, 42.0, 51.0, 101.0, 165.0, 348.0, 753.0, 2456.0, 2819244.0, 319246.0, 1688.0, 652.0, 310.0, 150.0, 99.0, 57.0, 25.0, 23.0, 23.0, 21.0, 17.0, 13.0, 14.0, 8.0, 3.0, 3.0, 6.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-226.75, -219.646484375, -212.54296875, -205.439453125, -198.3359375, -191.232421875, -184.12890625, -177.025390625, -169.921875, -162.818359375, -155.71484375, -148.611328125, -141.5078125, -134.404296875, -127.30078125, -120.197265625, -113.09375, -105.990234375, -98.88671875, -91.783203125, -84.6796875, -77.576171875, -70.47265625, -63.369140625, -56.265625, -49.162109375, -42.05859375, -34.955078125, -27.8515625, -20.748046875, -13.64453125, -6.541015625, 0.5625, 7.666015625, 14.76953125, 21.873046875, 28.9765625, 36.080078125, 43.18359375, 50.287109375, 57.390625, 64.494140625, 71.59765625, 78.701171875, 85.8046875, 92.908203125, 100.01171875, 107.115234375, 114.21875, 121.322265625, 128.42578125, 135.529296875, 142.6328125, 149.736328125, 156.83984375, 163.943359375, 171.046875, 178.150390625, 185.25390625, 192.357421875, 199.4609375, 206.564453125, 213.66796875, 220.771484375, 227.875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 6.0, 301.0, 658.0, 46.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-402.95916748046875, -380.8097839355469, -358.660400390625, -336.5110168457031, -314.36163330078125, -292.2122497558594, -270.0628662109375, -247.91348266601562, -225.76409912109375, -203.61471557617188, -181.46533203125, -159.31594848632812, -137.16656494140625, -115.01718139648438, -92.8677978515625, -70.71841430664062, -48.56903076171875, -26.419647216796875, -4.270263671875, 17.879119873046875, 40.02850341796875, 62.177886962890625, 84.3272705078125, 106.47665405273438, 128.62603759765625, 150.77542114257812, 172.9248046875, 195.07418823242188, 217.22357177734375, 239.37295532226562, 261.5223388671875, 283.6717224121094, 305.821044921875, 327.9704284667969, 350.11981201171875, 372.2691955566406, 394.4185791015625, 416.5679626464844, 438.71734619140625, 460.8667297363281, 483.01611328125, 505.1654968261719, 527.3148803710938, 549.4642333984375, 571.6136474609375, 593.7630615234375, 615.9124145507812, 638.061767578125, 660.211181640625, 682.360595703125, 704.5099487304688, 726.6593017578125, 748.8087158203125, 770.9581298828125, 793.1074829101562, 815.2568359375, 837.40625, 859.5556640625, 881.7050170898438, 903.8543701171875, 926.0037841796875, 948.1531982421875, 970.3025512695312, 992.451904296875, 1014.601318359375]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 6.0, 6.0, 7.0, 3.0, 7.0, 8.0, 12.0, 8.0, 19.0, 14.0, 23.0, 15.0, 30.0, 19.0, 19.0, 33.0, 30.0, 33.0, 31.0, 26.0, 52.0, 52.0, 44.0, 50.0, 35.0, 41.0, 41.0, 33.0, 25.0, 30.0, 31.0, 42.0, 24.0, 23.0, 22.0, 13.0, 11.0, 15.0, 17.0, 9.0, 8.0, 8.0, 6.0, 10.0, 4.0, 2.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0], "bins": [-162.3834991455078, -157.62156677246094, -152.85963439941406, -148.09771728515625, -143.33578491210938, -138.5738525390625, -133.81192016601562, -129.04998779296875, -124.2880630493164, -119.52613067626953, -114.76420593261719, -110.00227355957031, -105.24034118652344, -100.4784164428711, -95.71648406982422, -90.95455932617188, -86.192626953125, -81.43069458007812, -76.66876983642578, -71.9068374633789, -67.14491271972656, -62.38298034667969, -57.62104797363281, -52.8591194152832, -48.097190856933594, -43.335262298583984, -38.573333740234375, -33.8114013671875, -29.04947280883789, -24.28754425048828, -19.52561378479004, -14.763683319091797, -10.001739501953125, -5.239809989929199, -0.47788047790527344, 4.284049034118652, 9.045978546142578, 13.807907104492188, 18.56983757019043, 23.331768035888672, 28.09369659423828, 32.85562515258789, 37.6175537109375, 42.379486083984375, 47.141414642333984, 51.903343200683594, 56.66527557373047, 61.42720413208008, 66.18913269042969, 70.95106506347656, 75.7129898071289, 80.47492218017578, 85.23684692382812, 89.998779296875, 94.76071166992188, 99.52264404296875, 104.2845687866211, 109.04650115966797, 113.80842590332031, 118.57035827636719, 123.33229064941406, 128.09420776367188, 132.85614013671875, 137.61807250976562, 142.3800048828125]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 6.0, 9.0, 2.0, 10.0, 4.0, 10.0, 26.0, 15.0, 11.0, 23.0, 24.0, 26.0, 28.0, 23.0, 22.0, 30.0, 31.0, 44.0, 43.0, 41.0, 32.0, 39.0, 49.0, 56.0, 32.0, 34.0, 45.0, 39.0, 34.0, 28.0, 21.0, 21.0, 29.0, 26.0, 16.0, 13.0, 14.0, 18.0, 8.0, 10.0, 5.0, 3.0, 4.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.40625, -22.642578125, -21.87890625, -21.115234375, -20.3515625, -19.587890625, -18.82421875, -18.060546875, -17.296875, -16.533203125, -15.76953125, -15.005859375, -14.2421875, -13.478515625, -12.71484375, -11.951171875, -11.1875, -10.423828125, -9.66015625, -8.896484375, -8.1328125, -7.369140625, -6.60546875, -5.841796875, -5.078125, -4.314453125, -3.55078125, -2.787109375, -2.0234375, -1.259765625, -0.49609375, 0.267578125, 1.03125, 1.794921875, 2.55859375, 3.322265625, 4.0859375, 4.849609375, 5.61328125, 6.376953125, 7.140625, 7.904296875, 8.66796875, 9.431640625, 10.1953125, 10.958984375, 11.72265625, 12.486328125, 13.25, 14.013671875, 14.77734375, 15.541015625, 16.3046875, 17.068359375, 17.83203125, 18.595703125, 19.359375, 20.123046875, 20.88671875, 21.650390625, 22.4140625, 23.177734375, 23.94140625, 24.705078125, 25.46875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 13.0, 15.0, 18.0, 15.0, 22.0, 29.0, 39.0, 56.0, 79.0, 115.0, 168.0, 326.0, 643.0, 1287.0, 3469.0, 12100.0, 128479.0, 2906846.0, 1091452.0, 38132.0, 6688.0, 2154.0, 915.0, 456.0, 260.0, 141.0, 87.0, 74.0, 48.0, 23.0, 30.0, 14.0, 19.0, 7.0, 5.0, 9.0, 11.0, 5.0, 8.0, 4.0, 1.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.3125, -68.1015625, -65.890625, -63.6796875, -61.46875, -59.2578125, -57.046875, -54.8359375, -52.625, -50.4140625, -48.203125, -45.9921875, -43.78125, -41.5703125, -39.359375, -37.1484375, -34.9375, -32.7265625, -30.515625, -28.3046875, -26.09375, -23.8828125, -21.671875, -19.4609375, -17.25, -15.0390625, -12.828125, -10.6171875, -8.40625, -6.1953125, -3.984375, -1.7734375, 0.4375, 2.6484375, 4.859375, 7.0703125, 9.28125, 11.4921875, 13.703125, 15.9140625, 18.125, 20.3359375, 22.546875, 24.7578125, 26.96875, 29.1796875, 31.390625, 33.6015625, 35.8125, 38.0234375, 40.234375, 42.4453125, 44.65625, 46.8671875, 49.078125, 51.2890625, 53.5, 55.7109375, 57.921875, 60.1328125, 62.34375, 64.5546875, 66.765625, 68.9765625, 71.1875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 11.0, 8.0, 15.0, 4.0, 16.0, 13.0, 32.0, 31.0, 52.0, 89.0, 109.0, 136.0, 234.0, 371.0, 596.0, 843.0, 577.0, 302.0, 203.0, 132.0, 76.0, 65.0, 51.0, 36.0, 14.0, 16.0, 14.0, 9.0, 6.0, 6.0, 3.0, 4.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.4375, -46.84130859375, -45.2451171875, -43.64892578125, -42.052734375, -40.45654296875, -38.8603515625, -37.26416015625, -35.66796875, -34.07177734375, -32.4755859375, -30.87939453125, -29.283203125, -27.68701171875, -26.0908203125, -24.49462890625, -22.8984375, -21.30224609375, -19.7060546875, -18.10986328125, -16.513671875, -14.91748046875, -13.3212890625, -11.72509765625, -10.12890625, -8.53271484375, -6.9365234375, -5.34033203125, -3.744140625, -2.14794921875, -0.5517578125, 1.04443359375, 2.640625, 4.23681640625, 5.8330078125, 7.42919921875, 9.025390625, 10.62158203125, 12.2177734375, 13.81396484375, 15.41015625, 17.00634765625, 18.6025390625, 20.19873046875, 21.794921875, 23.39111328125, 24.9873046875, 26.58349609375, 28.1796875, 29.77587890625, 31.3720703125, 32.96826171875, 34.564453125, 36.16064453125, 37.7568359375, 39.35302734375, 40.94921875, 42.54541015625, 44.1416015625, 45.73779296875, 47.333984375, 48.93017578125, 50.5263671875, 52.12255859375, 53.71875]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 2.0, 2.0, 7.0, 8.0, 8.0, 28.0, 41.0, 50.0, 96.0, 165.0, 283.0, 577.0, 1238.0, 3744.0, 14077.0, 78855.0, 1727784.0, 2257335.0, 88468.0, 14866.0, 3870.0, 1405.0, 613.0, 305.0, 181.0, 97.0, 50.0, 40.0, 24.0, 16.0, 14.0, 13.0, 14.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-82.875, -80.439453125, -78.00390625, -75.568359375, -73.1328125, -70.697265625, -68.26171875, -65.826171875, -63.390625, -60.955078125, -58.51953125, -56.083984375, -53.6484375, -51.212890625, -48.77734375, -46.341796875, -43.90625, -41.470703125, -39.03515625, -36.599609375, -34.1640625, -31.728515625, -29.29296875, -26.857421875, -24.421875, -21.986328125, -19.55078125, -17.115234375, -14.6796875, -12.244140625, -9.80859375, -7.373046875, -4.9375, -2.501953125, -0.06640625, 2.369140625, 4.8046875, 7.240234375, 9.67578125, 12.111328125, 14.546875, 16.982421875, 19.41796875, 21.853515625, 24.2890625, 26.724609375, 29.16015625, 31.595703125, 34.03125, 36.466796875, 38.90234375, 41.337890625, 43.7734375, 46.208984375, 48.64453125, 51.080078125, 53.515625, 55.951171875, 58.38671875, 60.822265625, 63.2578125, 65.693359375, 68.12890625, 70.564453125, 73.0]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 115.0, 720.0, 172.0, 9.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-832.3998413085938, -793.9087524414062, -755.4176025390625, -716.926513671875, -678.4354248046875, -639.9442749023438, -601.4531860351562, -562.9620361328125, -524.470947265625, -485.9798278808594, -447.48870849609375, -408.99761962890625, -370.5065002441406, -332.015380859375, -293.5242919921875, -255.03317260742188, -216.54205322265625, -178.05093383789062, -139.55982971191406, -101.06871795654297, -62.577606201171875, -24.08648681640625, 14.404617309570312, 52.895721435546875, 91.3868408203125, 129.87796020507812, 168.3690643310547, 206.86016845703125, 245.35128784179688, 283.8424072265625, 322.33349609375, 360.8246154785156, 399.3157958984375, 437.8069152832031, 476.29803466796875, 514.7891235351562, 553.2802734375, 591.7713623046875, 630.262451171875, 668.7535400390625, 707.2446899414062, 745.7357788085938, 784.2269287109375, 822.718017578125, 861.2091064453125, 899.7002563476562, 938.1913452148438, 976.6824951171875, 1015.173583984375, 1053.6646728515625, 1092.15576171875, 1130.64697265625, 1169.1380615234375, 1207.629150390625, 1246.1202392578125, 1284.611328125, 1323.1025390625, 1361.5936279296875, 1400.084716796875, 1438.575927734375, 1477.0670166015625, 1515.55810546875, 1554.0491943359375, 1592.540283203125, 1631.0313720703125]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 6.0, 9.0, 7.0, 12.0, 10.0, 14.0, 16.0, 11.0, 25.0, 20.0, 17.0, 27.0, 22.0, 35.0, 31.0, 35.0, 33.0, 41.0, 34.0, 31.0, 44.0, 28.0, 36.0, 32.0, 33.0, 40.0, 34.0, 34.0, 36.0, 21.0, 22.0, 25.0, 26.0, 15.0, 20.0, 18.0, 12.0, 9.0, 10.0, 17.0, 6.0, 11.0, 12.0, 3.0, 2.0, 3.0, 4.0, 4.0, 1.0, 6.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-126.62420654296875, -122.42036437988281, -118.2165298461914, -114.0126953125, -109.80885314941406, -105.60501098632812, -101.40117645263672, -97.19734191894531, -92.99349975585938, -88.78965759277344, -84.58582305908203, -80.38198852539062, -76.17814636230469, -71.97430419921875, -67.77046966552734, -63.56663131713867, -59.36279296875, -55.15895462036133, -50.955116271972656, -46.751277923583984, -42.54743957519531, -38.34360122680664, -34.13976287841797, -29.935924530029297, -25.732086181640625, -21.528247833251953, -17.32440948486328, -13.12057113647461, -8.916732788085938, -4.712894439697266, -0.5090560913085938, 3.694782257080078, 7.8986358642578125, 12.102474212646484, 16.306312561035156, 20.510150909423828, 24.7139892578125, 28.917827606201172, 33.121665954589844, 37.325504302978516, 41.52934265136719, 45.73318099975586, 49.93701934814453, 54.1408576965332, 58.344696044921875, 62.54853439331055, 66.75237274169922, 70.95620727539062, 75.16004943847656, 79.3638916015625, 83.5677261352539, 87.77156066894531, 91.97540283203125, 96.17924499511719, 100.3830795288086, 104.5869140625, 108.79075622558594, 112.99459838867188, 117.19843292236328, 121.40226745605469, 125.60610961914062, 129.80995178222656, 134.0137939453125, 138.21762084960938, 142.4214630126953]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 5.0, 6.0, 7.0, 9.0, 16.0, 13.0, 15.0, 15.0, 22.0, 19.0, 25.0, 19.0, 21.0, 34.0, 32.0, 33.0, 30.0, 39.0, 41.0, 54.0, 35.0, 39.0, 44.0, 44.0, 37.0, 35.0, 33.0, 29.0, 32.0, 35.0, 32.0, 33.0, 25.0, 20.0, 16.0, 11.0, 11.0, 7.0, 9.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.0, -19.35693359375, -18.7138671875, -18.07080078125, -17.427734375, -16.78466796875, -16.1416015625, -15.49853515625, -14.85546875, -14.21240234375, -13.5693359375, -12.92626953125, -12.283203125, -11.64013671875, -10.9970703125, -10.35400390625, -9.7109375, -9.06787109375, -8.4248046875, -7.78173828125, -7.138671875, -6.49560546875, -5.8525390625, -5.20947265625, -4.56640625, -3.92333984375, -3.2802734375, -2.63720703125, -1.994140625, -1.35107421875, -0.7080078125, -0.06494140625, 0.578125, 1.22119140625, 1.8642578125, 2.50732421875, 3.150390625, 3.79345703125, 4.4365234375, 5.07958984375, 5.72265625, 6.36572265625, 7.0087890625, 7.65185546875, 8.294921875, 8.93798828125, 9.5810546875, 10.22412109375, 10.8671875, 11.51025390625, 12.1533203125, 12.79638671875, 13.439453125, 14.08251953125, 14.7255859375, 15.36865234375, 16.01171875, 16.65478515625, 17.2978515625, 17.94091796875, 18.583984375, 19.22705078125, 19.8701171875, 20.51318359375, 21.15625]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 8.0, 22.0, 22.0, 32.0, 50.0, 70.0, 109.0, 144.0, 242.0, 335.0, 438.0, 685.0, 1037.0, 1438.0, 2212.0, 3209.0, 4899.0, 7257.0, 11003.0, 16737.0, 25778.0, 39571.0, 62919.0, 103372.0, 168697.0, 208070.0, 146137.0, 88896.0, 54096.0, 34811.0, 22528.0, 14566.0, 9684.0, 6433.0, 4187.0, 2879.0, 1942.0, 1267.0, 893.0, 594.0, 434.0, 271.0, 177.0, 135.0, 86.0, 57.0, 47.0, 31.0, 23.0, 13.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.099609375, -2.032623291015625, -1.96563720703125, -1.898651123046875, -1.8316650390625, -1.764678955078125, -1.69769287109375, -1.630706787109375, -1.563720703125, -1.496734619140625, -1.42974853515625, -1.362762451171875, -1.2957763671875, -1.228790283203125, -1.16180419921875, -1.094818115234375, -1.02783203125, -0.960845947265625, -0.89385986328125, -0.826873779296875, -0.7598876953125, -0.692901611328125, -0.62591552734375, -0.558929443359375, -0.491943359375, -0.424957275390625, -0.35797119140625, -0.290985107421875, -0.2239990234375, -0.157012939453125, -0.09002685546875, -0.023040771484375, 0.0439453125, 0.110931396484375, 0.17791748046875, 0.244903564453125, 0.3118896484375, 0.378875732421875, 0.44586181640625, 0.512847900390625, 0.579833984375, 0.646820068359375, 0.71380615234375, 0.780792236328125, 0.8477783203125, 0.914764404296875, 0.98175048828125, 1.048736572265625, 1.11572265625, 1.182708740234375, 1.24969482421875, 1.316680908203125, 1.3836669921875, 1.450653076171875, 1.51763916015625, 1.584625244140625, 1.651611328125, 1.718597412109375, 1.78558349609375, 1.852569580078125, 1.9195556640625, 1.986541748046875, 2.05352783203125, 2.120513916015625, 2.1875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 9.0, 8.0, 8.0, 4.0, 12.0, 16.0, 18.0, 16.0, 15.0, 17.0, 26.0, 19.0, 22.0, 29.0, 29.0, 32.0, 37.0, 43.0, 32.0, 54.0, 28.0, 40.0, 1057.0, 31.0, 31.0, 30.0, 40.0, 37.0, 22.0, 28.0, 36.0, 31.0, 28.0, 21.0, 23.0, 12.0, 13.0, 12.0, 14.0, 8.0, 12.0, 7.0, 5.0, 3.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-12.8203125, -12.4345703125, -12.048828125, -11.6630859375, -11.27734375, -10.8916015625, -10.505859375, -10.1201171875, -9.734375, -9.3486328125, -8.962890625, -8.5771484375, -8.19140625, -7.8056640625, -7.419921875, -7.0341796875, -6.6484375, -6.2626953125, -5.876953125, -5.4912109375, -5.10546875, -4.7197265625, -4.333984375, -3.9482421875, -3.5625, -3.1767578125, -2.791015625, -2.4052734375, -2.01953125, -1.6337890625, -1.248046875, -0.8623046875, -0.4765625, -0.0908203125, 0.294921875, 0.6806640625, 1.06640625, 1.4521484375, 1.837890625, 2.2236328125, 2.609375, 2.9951171875, 3.380859375, 3.7666015625, 4.15234375, 4.5380859375, 4.923828125, 5.3095703125, 5.6953125, 6.0810546875, 6.466796875, 6.8525390625, 7.23828125, 7.6240234375, 8.009765625, 8.3955078125, 8.78125, 9.1669921875, 9.552734375, 9.9384765625, 10.32421875, 10.7099609375, 11.095703125, 11.4814453125, 11.8671875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 7.0, 6.0, 8.0, 10.0, 25.0, 19.0, 29.0, 39.0, 61.0, 87.0, 136.0, 181.0, 261.0, 399.0, 541.0, 806.0, 1190.0, 1760.0, 2568.0, 3943.0, 5682.0, 8706.0, 13217.0, 19997.0, 31518.0, 49226.0, 79602.0, 129428.0, 1179691.0, 238239.0, 121475.0, 74839.0, 46486.0, 29399.0, 19227.0, 12714.0, 8394.0, 5483.0, 3719.0, 2565.0, 1754.0, 1139.0, 796.0, 533.0, 396.0, 223.0, 189.0, 131.0, 98.0, 61.0, 53.0, 30.0, 23.0, 10.0, 10.0, 4.0, 4.0, 5.0, 1.0, 2.0, 3.0, 1.0], "bins": [-1.55859375, -1.508209228515625, -1.45782470703125, -1.407440185546875, -1.3570556640625, -1.306671142578125, -1.25628662109375, -1.205902099609375, -1.155517578125, -1.105133056640625, -1.05474853515625, -1.004364013671875, -0.9539794921875, -0.903594970703125, -0.85321044921875, -0.802825927734375, -0.75244140625, -0.702056884765625, -0.65167236328125, -0.601287841796875, -0.5509033203125, -0.500518798828125, -0.45013427734375, -0.399749755859375, -0.349365234375, -0.298980712890625, -0.24859619140625, -0.198211669921875, -0.1478271484375, -0.097442626953125, -0.04705810546875, 0.003326416015625, 0.0537109375, 0.104095458984375, 0.15447998046875, 0.204864501953125, 0.2552490234375, 0.305633544921875, 0.35601806640625, 0.406402587890625, 0.456787109375, 0.507171630859375, 0.55755615234375, 0.607940673828125, 0.6583251953125, 0.708709716796875, 0.75909423828125, 0.809478759765625, 0.85986328125, 0.910247802734375, 0.96063232421875, 1.011016845703125, 1.0614013671875, 1.111785888671875, 1.16217041015625, 1.212554931640625, 1.262939453125, 1.313323974609375, 1.36370849609375, 1.414093017578125, 1.4644775390625, 1.514862060546875, 1.56524658203125, 1.615631103515625, 1.666015625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 4.0, 9.0, 10.0, 9.0, 12.0, 7.0, 15.0, 20.0, 31.0, 21.0, 34.0, 47.0, 57.0, 52.0, 77.0, 66.0, 88.0, 64.0, 66.0, 51.0, 50.0, 38.0, 30.0, 32.0, 22.0, 14.0, 13.0, 10.0, 10.0, 7.0, 9.0, 8.0, 2.0, 0.0, 6.0, 0.0, 3.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.022857666015625, -0.022141218185424805, -0.02142477035522461, -0.020708322525024414, -0.01999187469482422, -0.019275426864624023, -0.018558979034423828, -0.017842531204223633, -0.017126083374023438, -0.016409635543823242, -0.015693187713623047, -0.014976739883422852, -0.014260292053222656, -0.013543844223022461, -0.012827396392822266, -0.01211094856262207, -0.011394500732421875, -0.01067805290222168, -0.009961605072021484, -0.009245157241821289, -0.008528709411621094, -0.0078122615814208984, -0.007095813751220703, -0.006379365921020508, -0.0056629180908203125, -0.004946470260620117, -0.004230022430419922, -0.0035135746002197266, -0.0027971267700195312, -0.002080678939819336, -0.0013642311096191406, -0.0006477832794189453, 6.866455078125e-05, 0.0007851123809814453, 0.0015015602111816406, 0.002218008041381836, 0.0029344558715820312, 0.0036509037017822266, 0.004367351531982422, 0.005083799362182617, 0.0058002471923828125, 0.006516695022583008, 0.007233142852783203, 0.007949590682983398, 0.008666038513183594, 0.009382486343383789, 0.010098934173583984, 0.01081538200378418, 0.011531829833984375, 0.01224827766418457, 0.012964725494384766, 0.013681173324584961, 0.014397621154785156, 0.015114068984985352, 0.015830516815185547, 0.016546964645385742, 0.017263412475585938, 0.017979860305786133, 0.018696308135986328, 0.019412755966186523, 0.02012920379638672, 0.020845651626586914, 0.02156209945678711, 0.022278547286987305, 0.0229949951171875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 4.0, 2.0, 4.0, 3.0, 9.0, 3.0, 7.0, 8.0, 15.0, 18.0, 18.0, 17.0, 23.0, 28.0, 52.0, 62.0, 70.0, 98.0, 161.0, 231.0, 392.0, 809.0, 33253.0, 1009454.0, 2412.0, 477.0, 280.0, 183.0, 124.0, 67.0, 65.0, 45.0, 29.0, 27.0, 16.0, 23.0, 15.0, 15.0, 10.0, 12.0, 8.0, 4.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.4501953125, -0.4362449645996094, -0.42229461669921875, -0.4083442687988281, -0.3943939208984375, -0.3804435729980469, -0.36649322509765625, -0.3525428771972656, -0.338592529296875, -0.3246421813964844, -0.31069183349609375, -0.2967414855957031, -0.2827911376953125, -0.2688407897949219, -0.25489044189453125, -0.24094009399414062, -0.22698974609375, -0.21303939819335938, -0.19908905029296875, -0.18513870239257812, -0.1711883544921875, -0.15723800659179688, -0.14328765869140625, -0.12933731079101562, -0.115386962890625, -0.10143661499023438, -0.08748626708984375, -0.07353591918945312, -0.0595855712890625, -0.045635223388671875, -0.03168487548828125, -0.017734527587890625, -0.0037841796875, 0.010166168212890625, 0.02411651611328125, 0.038066864013671875, 0.0520172119140625, 0.06596755981445312, 0.07991790771484375, 0.09386825561523438, 0.107818603515625, 0.12176895141601562, 0.13571929931640625, 0.14966964721679688, 0.1636199951171875, 0.17757034301757812, 0.19152069091796875, 0.20547103881835938, 0.21942138671875, 0.23337173461914062, 0.24732208251953125, 0.2612724304199219, 0.2752227783203125, 0.2891731262207031, 0.30312347412109375, 0.3170738220214844, 0.331024169921875, 0.3449745178222656, 0.35892486572265625, 0.3728752136230469, 0.3868255615234375, 0.4007759094238281, 0.41472625732421875, 0.4286766052246094, 0.442626953125]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 10.0, 999.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12311657518148422, -0.10840263962745667, -0.0936887115240097, -0.07897477596998215, -0.06426084041595459, -0.04954690486192703, -0.03483297675848007, -0.020119041204452515, -0.005405105650424957, 0.00930882804095745, 0.02402276173233986, 0.03873669356107712, 0.053450629115104675, 0.06816456466913223, 0.0828784927725792, 0.09759242832660675, 0.11230636388063431, 0.12702029943466187, 0.14173422753810883, 0.1564481556415558, 0.17116209864616394, 0.1858760416507721, 0.20058995485305786, 0.21530389785766602, 0.23001784086227417, 0.24473176896572113, 0.2594456970691681, 0.27415964007377625, 0.2888735830783844, 0.30358749628067017, 0.3183014392852783, 0.3330153822898865, 0.34772932529449463, 0.3624432682991028, 0.37715718150138855, 0.3918711245059967, 0.40658506751060486, 0.4212989807128906, 0.4360129237174988, 0.45072686672210693, 0.4654408097267151, 0.48015475273132324, 0.494868665933609, 0.5095826387405396, 0.5242965221405029, 0.5390104651451111, 0.5537244081497192, 0.5684383511543274, 0.5831522941589355, 0.5978662371635437, 0.6125801801681519, 0.6272940635681152, 0.6420080065727234, 0.6567219495773315, 0.6714358925819397, 0.6861498355865479, 0.7008637189865112, 0.7155776619911194, 0.7302916049957275, 0.7450054883956909, 0.7597194314002991, 0.7744333744049072, 0.7891473174095154, 0.8038612604141235, 0.8185752034187317]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 9.0, 5.0, 7.0, 12.0, 20.0, 22.0, 29.0, 37.0, 37.0, 60.0, 36.0, 62.0, 65.0, 55.0, 60.0, 60.0, 55.0, 65.0, 48.0, 51.0, 56.0, 32.0, 32.0, 18.0, 29.0, 18.0, 10.0, 8.0, 8.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03972238302230835, -0.0385768823325634, -0.03743138164281845, -0.0362858846783638, -0.03514038398861885, -0.0339948832988739, -0.03284938633441925, -0.0317038856446743, -0.030558384954929352, -0.029412884265184402, -0.028267385438084602, -0.027121886610984802, -0.025976385921239853, -0.024830885231494904, -0.023685386404395103, -0.022539887577295303, -0.021394386887550354, -0.020248886197805405, -0.019103387370705605, -0.017957888543605804, -0.016812387853860855, -0.015666887164115906, -0.014521388337016106, -0.013375888578593731, -0.012230388820171356, -0.011084889061748981, -0.009939389303326607, -0.008793889544904232, -0.007648389786481857, -0.006502890028059483, -0.005357390269637108, -0.004211890511214733, -0.0030663907527923584, -0.0019208909943699837, -0.000775391235947609, 0.0003701085224747658, 0.0015156082808971405, 0.0026611080393195152, 0.00380660779774189, 0.004952107556164265, 0.006097607314586639, 0.007243107073009014, 0.008388606831431389, 0.009534106589853764, 0.010679606348276138, 0.011825106106698513, 0.012970605865120888, 0.014116105623543262, 0.015261605381965637, 0.016407106071710587, 0.017552604898810387, 0.018698103725910187, 0.019843604415655136, 0.020989105105400085, 0.022134603932499886, 0.023280102759599686, 0.024425603449344635, 0.025571104139089584, 0.026716602966189384, 0.027862101793289185, 0.029007602483034134, 0.030153103172779083, 0.031298600137233734, 0.032444100826978683, 0.03358960151672363]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 5.0, 6.0, 7.0, 9.0, 16.0, 13.0, 15.0, 15.0, 22.0, 19.0, 25.0, 20.0, 20.0, 34.0, 32.0, 33.0, 30.0, 40.0, 40.0, 54.0, 36.0, 38.0, 44.0, 44.0, 37.0, 35.0, 32.0, 30.0, 33.0, 33.0, 33.0, 33.0, 24.0, 21.0, 16.0, 11.0, 11.0, 8.0, 8.0, 7.0, 3.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-20.0, -19.35693359375, -18.7138671875, -18.07080078125, -17.427734375, -16.78466796875, -16.1416015625, -15.49853515625, -14.85546875, -14.21240234375, -13.5693359375, -12.92626953125, -12.283203125, -11.64013671875, -10.9970703125, -10.35400390625, -9.7109375, -9.06787109375, -8.4248046875, -7.78173828125, -7.138671875, -6.49560546875, -5.8525390625, -5.20947265625, -4.56640625, -3.92333984375, -3.2802734375, -2.63720703125, -1.994140625, -1.35107421875, -0.7080078125, -0.06494140625, 0.578125, 1.22119140625, 1.8642578125, 2.50732421875, 3.150390625, 3.79345703125, 4.4365234375, 5.07958984375, 5.72265625, 6.36572265625, 7.0087890625, 7.65185546875, 8.294921875, 8.93798828125, 9.5810546875, 10.22412109375, 10.8671875, 11.51025390625, 12.1533203125, 12.79638671875, 13.439453125, 14.08251953125, 14.7255859375, 15.36865234375, 16.01171875, 16.65478515625, 17.2978515625, 17.94091796875, 18.583984375, 19.22705078125, 19.8701171875, 20.51318359375, 21.15625]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 7.0, 4.0, 10.0, 8.0, 19.0, 20.0, 27.0, 32.0, 48.0, 74.0, 78.0, 126.0, 189.0, 251.0, 397.0, 563.0, 796.0, 1210.0, 1885.0, 2995.0, 6043.0, 16595.0, 73695.0, 609952.0, 272764.0, 38205.0, 10791.0, 4525.0, 2448.0, 1494.0, 963.0, 687.0, 480.0, 351.0, 238.0, 177.0, 109.0, 92.0, 61.0, 46.0, 26.0, 25.0, 18.0, 17.0, 3.0, 7.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-49.625, -48.19921875, -46.7734375, -45.34765625, -43.921875, -42.49609375, -41.0703125, -39.64453125, -38.21875, -36.79296875, -35.3671875, -33.94140625, -32.515625, -31.08984375, -29.6640625, -28.23828125, -26.8125, -25.38671875, -23.9609375, -22.53515625, -21.109375, -19.68359375, -18.2578125, -16.83203125, -15.40625, -13.98046875, -12.5546875, -11.12890625, -9.703125, -8.27734375, -6.8515625, -5.42578125, -4.0, -2.57421875, -1.1484375, 0.27734375, 1.703125, 3.12890625, 4.5546875, 5.98046875, 7.40625, 8.83203125, 10.2578125, 11.68359375, 13.109375, 14.53515625, 15.9609375, 17.38671875, 18.8125, 20.23828125, 21.6640625, 23.08984375, 24.515625, 25.94140625, 27.3671875, 28.79296875, 30.21875, 31.64453125, 33.0703125, 34.49609375, 35.921875, 37.34765625, 38.7734375, 40.19921875, 41.625]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 9.0, 9.0, 4.0, 15.0, 25.0, 28.0, 20.0, 36.0, 29.0, 43.0, 50.0, 66.0, 58.0, 101.0, 209.0, 1598.0, 229.0, 96.0, 89.0, 49.0, 50.0, 23.0, 34.0, 32.0, 24.0, 20.0, 13.0, 10.0, 13.0, 11.0, 12.0, 3.0, 2.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0], "bins": [-66.75, -64.7607421875, -62.771484375, -60.7822265625, -58.79296875, -56.8037109375, -54.814453125, -52.8251953125, -50.8359375, -48.8466796875, -46.857421875, -44.8681640625, -42.87890625, -40.8896484375, -38.900390625, -36.9111328125, -34.921875, -32.9326171875, -30.943359375, -28.9541015625, -26.96484375, -24.9755859375, -22.986328125, -20.9970703125, -19.0078125, -17.0185546875, -15.029296875, -13.0400390625, -11.05078125, -9.0615234375, -7.072265625, -5.0830078125, -3.09375, -1.1044921875, 0.884765625, 2.8740234375, 4.86328125, 6.8525390625, 8.841796875, 10.8310546875, 12.8203125, 14.8095703125, 16.798828125, 18.7880859375, 20.77734375, 22.7666015625, 24.755859375, 26.7451171875, 28.734375, 30.7236328125, 32.712890625, 34.7021484375, 36.69140625, 38.6806640625, 40.669921875, 42.6591796875, 44.6484375, 46.6376953125, 48.626953125, 50.6162109375, 52.60546875, 54.5947265625, 56.583984375, 58.5732421875, 60.5625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 5.0, 6.0, 0.0, 2.0, 2.0, 7.0, 8.0, 6.0, 9.0, 10.0, 16.0, 11.0, 25.0, 31.0, 45.0, 47.0, 77.0, 73.0, 127.0, 187.0, 329.0, 659.0, 1552.0, 48351.0, 3085663.0, 5958.0, 1074.0, 493.0, 285.0, 168.0, 115.0, 93.0, 68.0, 59.0, 41.0, 24.0, 17.0, 19.0, 16.0, 7.0, 10.0, 4.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-168.25, -163.041015625, -157.83203125, -152.623046875, -147.4140625, -142.205078125, -136.99609375, -131.787109375, -126.578125, -121.369140625, -116.16015625, -110.951171875, -105.7421875, -100.533203125, -95.32421875, -90.115234375, -84.90625, -79.697265625, -74.48828125, -69.279296875, -64.0703125, -58.861328125, -53.65234375, -48.443359375, -43.234375, -38.025390625, -32.81640625, -27.607421875, -22.3984375, -17.189453125, -11.98046875, -6.771484375, -1.5625, 3.646484375, 8.85546875, 14.064453125, 19.2734375, 24.482421875, 29.69140625, 34.900390625, 40.109375, 45.318359375, 50.52734375, 55.736328125, 60.9453125, 66.154296875, 71.36328125, 76.572265625, 81.78125, 86.990234375, 92.19921875, 97.408203125, 102.6171875, 107.826171875, 113.03515625, 118.244140625, 123.453125, 128.662109375, 133.87109375, 139.080078125, 144.2890625, 149.498046875, 154.70703125, 159.916015625, 165.125]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 12.0, 42.0, 80.0, 199.0, 303.0, 218.0, 101.0, 34.0, 14.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-271.7008972167969, -263.5650329589844, -255.42913818359375, -247.2932586669922, -239.15737915039062, -231.02151489257812, -222.88563537597656, -214.749755859375, -206.61387634277344, -198.47799682617188, -190.3421173095703, -182.20623779296875, -174.07037353515625, -165.93447875976562, -157.79861450195312, -149.66273498535156, -141.52685546875, -133.39097595214844, -125.25509643554688, -117.11922454833984, -108.98334503173828, -100.84746551513672, -92.71159362792969, -84.57571411132812, -76.43983459472656, -68.303955078125, -60.1680793762207, -52.032203674316406, -43.896324157714844, -35.76044464111328, -27.624568939208984, -19.488693237304688, -11.352828979492188, -3.216951370239258, 4.918926239013672, 13.054803848266602, 21.19068145751953, 29.326560974121094, 37.46243667602539, 45.59831237792969, 53.73419189453125, 61.87007141113281, 70.00595092773438, 78.1418228149414, 86.27770233154297, 94.41358184814453, 102.54945373535156, 110.68533325195312, 118.82121276855469, 126.95709228515625, 135.0929718017578, 143.22885131835938, 151.36471557617188, 159.5006103515625, 167.636474609375, 175.77235412597656, 183.90823364257812, 192.0441131591797, 200.17999267578125, 208.3158721923828, 216.45175170898438, 224.58761596679688, 232.72349548339844, 240.859375, 248.99525451660156]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 2.0, 2.0, 3.0, 8.0, 11.0, 10.0, 10.0, 14.0, 21.0, 15.0, 26.0, 26.0, 39.0, 30.0, 37.0, 41.0, 29.0, 43.0, 49.0, 53.0, 60.0, 51.0, 48.0, 34.0, 40.0, 44.0, 28.0, 38.0, 33.0, 22.0, 26.0, 17.0, 16.0, 16.0, 17.0, 8.0, 8.0, 3.0, 10.0, 3.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-179.334228515625, -173.6168670654297, -167.89950561523438, -162.18214416503906, -156.46478271484375, -150.74742126464844, -145.03005981445312, -139.31268310546875, -133.5953369140625, -127.87797546386719, -122.16061401367188, -116.44325256347656, -110.72589111328125, -105.00852966308594, -99.2911605834961, -93.57379913330078, -87.85643005371094, -82.13906860351562, -76.42170715332031, -70.704345703125, -64.98698425292969, -59.26961898803711, -53.55225372314453, -47.83489227294922, -42.117530822753906, -36.400169372558594, -30.68280601501465, -24.965442657470703, -19.24808120727539, -13.530719757080078, -7.8133544921875, -2.0959930419921875, 3.621368408203125, 9.338730812072754, 15.056093215942383, 20.773456573486328, 26.49081802368164, 32.20817947387695, 37.92554473876953, 43.642906188964844, 49.360267639160156, 55.07762908935547, 60.79499053955078, 66.51235961914062, 72.22972106933594, 77.94708251953125, 83.66444396972656, 89.38180541992188, 95.09916687011719, 100.8165283203125, 106.53388977050781, 112.25125122070312, 117.96861267089844, 123.68597412109375, 129.40335083007812, 135.12069702148438, 140.83807373046875, 146.55543518066406, 152.27279663085938, 157.9901580810547, 163.70751953125, 169.4248809814453, 175.14224243164062, 180.859619140625, 186.57696533203125]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 6.0, 7.0, 7.0, 9.0, 10.0, 23.0, 12.0, 15.0, 21.0, 23.0, 25.0, 37.0, 24.0, 29.0, 25.0, 26.0, 39.0, 36.0, 32.0, 37.0, 49.0, 33.0, 43.0, 33.0, 40.0, 36.0, 42.0, 27.0, 34.0, 31.0, 30.0, 18.0, 21.0, 16.0, 22.0, 11.0, 14.0, 10.0, 10.0, 8.0, 9.0, 4.0, 4.0, 5.0, 4.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-20.8125, -20.165283203125, -19.51806640625, -18.870849609375, -18.2236328125, -17.576416015625, -16.92919921875, -16.281982421875, -15.634765625, -14.987548828125, -14.34033203125, -13.693115234375, -13.0458984375, -12.398681640625, -11.75146484375, -11.104248046875, -10.45703125, -9.809814453125, -9.16259765625, -8.515380859375, -7.8681640625, -7.220947265625, -6.57373046875, -5.926513671875, -5.279296875, -4.632080078125, -3.98486328125, -3.337646484375, -2.6904296875, -2.043212890625, -1.39599609375, -0.748779296875, -0.1015625, 0.545654296875, 1.19287109375, 1.840087890625, 2.4873046875, 3.134521484375, 3.78173828125, 4.428955078125, 5.076171875, 5.723388671875, 6.37060546875, 7.017822265625, 7.6650390625, 8.312255859375, 8.95947265625, 9.606689453125, 10.25390625, 10.901123046875, 11.54833984375, 12.195556640625, 12.8427734375, 13.489990234375, 14.13720703125, 14.784423828125, 15.431640625, 16.078857421875, 16.72607421875, 17.373291015625, 18.0205078125, 18.667724609375, 19.31494140625, 19.962158203125, 20.609375]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 4.0, 5.0, 7.0, 12.0, 15.0, 14.0, 30.0, 19.0, 32.0, 50.0, 57.0, 71.0, 96.0, 107.0, 160.0, 214.0, 308.0, 429.0, 650.0, 981.0, 1741.0, 3518.0, 9691.0, 53385.0, 656224.0, 2800580.0, 603667.0, 44764.0, 8889.0, 3544.0, 1760.0, 1015.0, 652.0, 421.0, 313.0, 205.0, 169.0, 109.0, 96.0, 56.0, 57.0, 32.0, 29.0, 30.0, 17.0, 13.0, 11.0, 11.0, 11.0, 2.0, 4.0, 6.0, 2.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 3.0], "bins": [-40.9375, -39.548828125, -38.16015625, -36.771484375, -35.3828125, -33.994140625, -32.60546875, -31.216796875, -29.828125, -28.439453125, -27.05078125, -25.662109375, -24.2734375, -22.884765625, -21.49609375, -20.107421875, -18.71875, -17.330078125, -15.94140625, -14.552734375, -13.1640625, -11.775390625, -10.38671875, -8.998046875, -7.609375, -6.220703125, -4.83203125, -3.443359375, -2.0546875, -0.666015625, 0.72265625, 2.111328125, 3.5, 4.888671875, 6.27734375, 7.666015625, 9.0546875, 10.443359375, 11.83203125, 13.220703125, 14.609375, 15.998046875, 17.38671875, 18.775390625, 20.1640625, 21.552734375, 22.94140625, 24.330078125, 25.71875, 27.107421875, 28.49609375, 29.884765625, 31.2734375, 32.662109375, 34.05078125, 35.439453125, 36.828125, 38.216796875, 39.60546875, 40.994140625, 42.3828125, 43.771484375, 45.16015625, 46.548828125, 47.9375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 11.0, 21.0, 24.0, 56.0, 147.0, 267.0, 720.0, 1365.0, 861.0, 320.0, 147.0, 73.0, 33.0, 17.0, 12.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.8125, -71.0439453125, -68.275390625, -65.5068359375, -62.73828125, -59.9697265625, -57.201171875, -54.4326171875, -51.6640625, -48.8955078125, -46.126953125, -43.3583984375, -40.58984375, -37.8212890625, -35.052734375, -32.2841796875, -29.515625, -26.7470703125, -23.978515625, -21.2099609375, -18.44140625, -15.6728515625, -12.904296875, -10.1357421875, -7.3671875, -4.5986328125, -1.830078125, 0.9384765625, 3.70703125, 6.4755859375, 9.244140625, 12.0126953125, 14.78125, 17.5498046875, 20.318359375, 23.0869140625, 25.85546875, 28.6240234375, 31.392578125, 34.1611328125, 36.9296875, 39.6982421875, 42.466796875, 45.2353515625, 48.00390625, 50.7724609375, 53.541015625, 56.3095703125, 59.078125, 61.8466796875, 64.615234375, 67.3837890625, 70.15234375, 72.9208984375, 75.689453125, 78.4580078125, 81.2265625, 83.9951171875, 86.763671875, 89.5322265625, 92.30078125, 95.0693359375, 97.837890625, 100.6064453125, 103.375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 10.0, 27.0, 54.0, 161.0, 458.0, 1837.0, 121808.0, 4061301.0, 7277.0, 851.0, 322.0, 103.0, 36.0, 18.0, 12.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-241.0, -234.529296875, -228.05859375, -221.587890625, -215.1171875, -208.646484375, -202.17578125, -195.705078125, -189.234375, -182.763671875, -176.29296875, -169.822265625, -163.3515625, -156.880859375, -150.41015625, -143.939453125, -137.46875, -130.998046875, -124.52734375, -118.056640625, -111.5859375, -105.115234375, -98.64453125, -92.173828125, -85.703125, -79.232421875, -72.76171875, -66.291015625, -59.8203125, -53.349609375, -46.87890625, -40.408203125, -33.9375, -27.466796875, -20.99609375, -14.525390625, -8.0546875, -1.583984375, 4.88671875, 11.357421875, 17.828125, 24.298828125, 30.76953125, 37.240234375, 43.7109375, 50.181640625, 56.65234375, 63.123046875, 69.59375, 76.064453125, 82.53515625, 89.005859375, 95.4765625, 101.947265625, 108.41796875, 114.888671875, 121.359375, 127.830078125, 134.30078125, 140.771484375, 147.2421875, 153.712890625, 160.18359375, 166.654296875, 173.125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 38.0, 152.0, 431.0, 288.0, 79.0, 17.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-599.0835571289062, -583.9814453125, -568.87939453125, -553.77734375, -538.6752319335938, -523.5731201171875, -508.4710693359375, -493.3689880371094, -478.26690673828125, -463.1648254394531, -448.062744140625, -432.9606628417969, -417.85858154296875, -402.7565002441406, -387.6544189453125, -372.5523376464844, -357.45025634765625, -342.3481750488281, -327.24609375, -312.1440124511719, -297.04193115234375, -281.9398498535156, -266.8377685546875, -251.73568725585938, -236.63360595703125, -221.53152465820312, -206.429443359375, -191.32736206054688, -176.22528076171875, -161.12319946289062, -146.0211181640625, -130.91903686523438, -115.81695556640625, -100.71487426757812, -85.61279296875, -70.51071166992188, -55.40863037109375, -40.306549072265625, -25.2044677734375, -10.102386474609375, 4.99969482421875, 20.101776123046875, 35.203857421875, 50.305938720703125, 65.40802001953125, 80.51010131835938, 95.6121826171875, 110.71426391601562, 125.81634521484375, 140.91842651367188, 156.0205078125, 171.12258911132812, 186.22467041015625, 201.32675170898438, 216.4288330078125, 231.53091430664062, 246.63299560546875, 261.7350769042969, 276.837158203125, 291.9392395019531, 307.04132080078125, 322.1434020996094, 337.2454833984375, 352.3475646972656, 367.44964599609375]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 6.0, 4.0, 2.0, 12.0, 5.0, 8.0, 12.0, 16.0, 16.0, 18.0, 20.0, 25.0, 35.0, 23.0, 31.0, 33.0, 35.0, 41.0, 37.0, 34.0, 41.0, 46.0, 53.0, 41.0, 40.0, 28.0, 28.0, 45.0, 29.0, 33.0, 33.0, 27.0, 15.0, 20.0, 18.0, 17.0, 13.0, 12.0, 14.0, 8.0, 5.0, 6.0, 2.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.4825439453125, -111.51422119140625, -107.5458984375, -103.57757568359375, -99.6092529296875, -95.64093017578125, -91.67259979248047, -87.70427703857422, -83.73595428466797, -79.76763153076172, -75.79930877685547, -71.83098602294922, -67.86265563964844, -63.89433670043945, -59.92601013183594, -55.95768737792969, -51.98936462402344, -48.02104187011719, -44.05271911621094, -40.08439254760742, -36.11606979370117, -32.14774703979492, -28.17942237854004, -24.211097717285156, -20.242774963378906, -16.274452209472656, -12.306127548217773, -8.337803840637207, -4.369480133056641, -0.4011573791503906, 3.567167282104492, 7.535491943359375, 11.503814697265625, 15.472138404846191, 19.440462112426758, 23.40878677368164, 27.37710952758789, 31.34543228149414, 35.313758850097656, 39.282081604003906, 43.250404357910156, 47.218727111816406, 51.187049865722656, 55.15537643432617, 59.12369918823242, 63.09202194213867, 67.06034851074219, 71.02867126464844, 74.99699401855469, 78.96531677246094, 82.93363952636719, 86.90196228027344, 90.87028503417969, 94.83860778808594, 98.80693817138672, 102.77526092529297, 106.74358367919922, 110.71190643310547, 114.68022918701172, 118.64855194091797, 122.61688232421875, 126.585205078125, 130.55352783203125, 134.5218505859375, 138.49017333984375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 4.0, 6.0, 6.0, 4.0, 5.0, 14.0, 14.0, 9.0, 12.0, 23.0, 20.0, 14.0, 33.0, 18.0, 32.0, 30.0, 22.0, 26.0, 27.0, 30.0, 32.0, 30.0, 32.0, 39.0, 25.0, 30.0, 46.0, 41.0, 36.0, 40.0, 27.0, 31.0, 24.0, 26.0, 21.0, 26.0, 21.0, 16.0, 14.0, 17.0, 10.0, 14.0, 10.0, 9.0, 9.0, 3.0, 3.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-15.171875, -14.683837890625, -14.19580078125, -13.707763671875, -13.2197265625, -12.731689453125, -12.24365234375, -11.755615234375, -11.267578125, -10.779541015625, -10.29150390625, -9.803466796875, -9.3154296875, -8.827392578125, -8.33935546875, -7.851318359375, -7.36328125, -6.875244140625, -6.38720703125, -5.899169921875, -5.4111328125, -4.923095703125, -4.43505859375, -3.947021484375, -3.458984375, -2.970947265625, -2.48291015625, -1.994873046875, -1.5068359375, -1.018798828125, -0.53076171875, -0.042724609375, 0.4453125, 0.933349609375, 1.42138671875, 1.909423828125, 2.3974609375, 2.885498046875, 3.37353515625, 3.861572265625, 4.349609375, 4.837646484375, 5.32568359375, 5.813720703125, 6.3017578125, 6.789794921875, 7.27783203125, 7.765869140625, 8.25390625, 8.741943359375, 9.22998046875, 9.718017578125, 10.2060546875, 10.694091796875, 11.18212890625, 11.670166015625, 12.158203125, 12.646240234375, 13.13427734375, 13.622314453125, 14.1103515625, 14.598388671875, 15.08642578125, 15.574462890625, 16.0625]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 7.0, 8.0, 8.0, 20.0, 28.0, 33.0, 57.0, 77.0, 127.0, 182.0, 306.0, 529.0, 836.0, 1422.0, 2339.0, 3734.0, 6452.0, 10798.0, 18436.0, 32465.0, 56990.0, 105996.0, 204383.0, 262825.0, 154733.0, 80533.0, 44066.0, 25198.0, 14468.0, 8581.0, 5065.0, 3094.0, 1854.0, 1099.0, 674.0, 431.0, 258.0, 145.0, 116.0, 66.0, 45.0, 21.0, 22.0, 12.0, 11.0, 4.0, 5.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.287109375, -2.211578369140625, -2.13604736328125, -2.060516357421875, -1.9849853515625, -1.909454345703125, -1.83392333984375, -1.758392333984375, -1.682861328125, -1.607330322265625, -1.53179931640625, -1.456268310546875, -1.3807373046875, -1.305206298828125, -1.22967529296875, -1.154144287109375, -1.07861328125, -1.003082275390625, -0.92755126953125, -0.852020263671875, -0.7764892578125, -0.700958251953125, -0.62542724609375, -0.549896240234375, -0.474365234375, -0.398834228515625, -0.32330322265625, -0.247772216796875, -0.1722412109375, -0.096710205078125, -0.02117919921875, 0.054351806640625, 0.1298828125, 0.205413818359375, 0.28094482421875, 0.356475830078125, 0.4320068359375, 0.507537841796875, 0.58306884765625, 0.658599853515625, 0.734130859375, 0.809661865234375, 0.88519287109375, 0.960723876953125, 1.0362548828125, 1.111785888671875, 1.18731689453125, 1.262847900390625, 1.33837890625, 1.413909912109375, 1.48944091796875, 1.564971923828125, 1.6405029296875, 1.716033935546875, 1.79156494140625, 1.867095947265625, 1.942626953125, 2.018157958984375, 2.09368896484375, 2.169219970703125, 2.2447509765625, 2.320281982421875, 2.39581298828125, 2.471343994140625, 2.546875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [4.0, 0.0, 5.0, 3.0, 2.0, 1.0, 4.0, 3.0, 7.0, 9.0, 14.0, 11.0, 9.0, 10.0, 15.0, 17.0, 12.0, 21.0, 28.0, 34.0, 32.0, 30.0, 41.0, 26.0, 34.0, 42.0, 26.0, 37.0, 37.0, 1064.0, 43.0, 46.0, 30.0, 26.0, 28.0, 40.0, 33.0, 26.0, 25.0, 16.0, 22.0, 16.0, 18.0, 10.0, 12.0, 13.0, 10.0, 13.0, 10.0, 5.0, 6.0, 9.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.171875, -9.8216552734375, -9.471435546875, -9.1212158203125, -8.77099609375, -8.4207763671875, -8.070556640625, -7.7203369140625, -7.3701171875, -7.0198974609375, -6.669677734375, -6.3194580078125, -5.96923828125, -5.6190185546875, -5.268798828125, -4.9185791015625, -4.568359375, -4.2181396484375, -3.867919921875, -3.5177001953125, -3.16748046875, -2.8172607421875, -2.467041015625, -2.1168212890625, -1.7666015625, -1.4163818359375, -1.066162109375, -0.7159423828125, -0.36572265625, -0.0155029296875, 0.334716796875, 0.6849365234375, 1.03515625, 1.3853759765625, 1.735595703125, 2.0858154296875, 2.43603515625, 2.7862548828125, 3.136474609375, 3.4866943359375, 3.8369140625, 4.1871337890625, 4.537353515625, 4.8875732421875, 5.23779296875, 5.5880126953125, 5.938232421875, 6.2884521484375, 6.638671875, 6.9888916015625, 7.339111328125, 7.6893310546875, 8.03955078125, 8.3897705078125, 8.739990234375, 9.0902099609375, 9.4404296875, 9.7906494140625, 10.140869140625, 10.4910888671875, 10.84130859375, 11.1915283203125, 11.541748046875, 11.8919677734375, 12.2421875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 0.0, 4.0, 2.0, 3.0, 6.0, 20.0, 20.0, 27.0, 51.0, 65.0, 58.0, 98.0, 174.0, 250.0, 370.0, 487.0, 693.0, 1020.0, 1465.0, 2236.0, 3074.0, 4553.0, 6771.0, 9794.0, 14651.0, 21759.0, 34059.0, 54041.0, 86727.0, 139773.0, 1246072.0, 170646.0, 108085.0, 66791.0, 41885.0, 26905.0, 17598.0, 11627.0, 7823.0, 5448.0, 3825.0, 2547.0, 1682.0, 1235.0, 806.0, 574.0, 415.0, 285.0, 193.0, 154.0, 98.0, 61.0, 44.0, 29.0, 15.0, 13.0, 11.0, 9.0, 8.0, 4.0, 5.0, 2.0], "bins": [-1.45703125, -1.412506103515625, -1.36798095703125, -1.323455810546875, -1.2789306640625, -1.234405517578125, -1.18988037109375, -1.145355224609375, -1.100830078125, -1.056304931640625, -1.01177978515625, -0.967254638671875, -0.9227294921875, -0.878204345703125, -0.83367919921875, -0.789154052734375, -0.74462890625, -0.700103759765625, -0.65557861328125, -0.611053466796875, -0.5665283203125, -0.522003173828125, -0.47747802734375, -0.432952880859375, -0.388427734375, -0.343902587890625, -0.29937744140625, -0.254852294921875, -0.2103271484375, -0.165802001953125, -0.12127685546875, -0.076751708984375, -0.0322265625, 0.012298583984375, 0.05682373046875, 0.101348876953125, 0.1458740234375, 0.190399169921875, 0.23492431640625, 0.279449462890625, 0.323974609375, 0.368499755859375, 0.41302490234375, 0.457550048828125, 0.5020751953125, 0.546600341796875, 0.59112548828125, 0.635650634765625, 0.68017578125, 0.724700927734375, 0.76922607421875, 0.813751220703125, 0.8582763671875, 0.902801513671875, 0.94732666015625, 0.991851806640625, 1.036376953125, 1.080902099609375, 1.12542724609375, 1.169952392578125, 1.2144775390625, 1.259002685546875, 1.30352783203125, 1.348052978515625, 1.392578125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 1.0, 4.0, 7.0, 7.0, 21.0, 19.0, 19.0, 34.0, 32.0, 23.0, 28.0, 43.0, 45.0, 61.0, 91.0, 94.0, 92.0, 57.0, 63.0, 41.0, 46.0, 35.0, 28.0, 21.0, 11.0, 13.0, 15.0, 17.0, 10.0, 8.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.02557373046875, -0.024890661239624023, -0.024207592010498047, -0.02352452278137207, -0.022841453552246094, -0.022158384323120117, -0.02147531509399414, -0.020792245864868164, -0.020109176635742188, -0.01942610740661621, -0.018743038177490234, -0.018059968948364258, -0.01737689971923828, -0.016693830490112305, -0.016010761260986328, -0.015327692031860352, -0.014644622802734375, -0.013961553573608398, -0.013278484344482422, -0.012595415115356445, -0.011912345886230469, -0.011229276657104492, -0.010546207427978516, -0.009863138198852539, -0.009180068969726562, -0.008496999740600586, -0.00781393051147461, -0.007130861282348633, -0.006447792053222656, -0.00576472282409668, -0.005081653594970703, -0.0043985843658447266, -0.00371551513671875, -0.0030324459075927734, -0.002349376678466797, -0.0016663074493408203, -0.0009832382202148438, -0.0003001689910888672, 0.0003829002380371094, 0.001065969467163086, 0.0017490386962890625, 0.002432107925415039, 0.0031151771545410156, 0.003798246383666992, 0.004481315612792969, 0.005164384841918945, 0.005847454071044922, 0.0065305233001708984, 0.007213592529296875, 0.007896661758422852, 0.008579730987548828, 0.009262800216674805, 0.009945869445800781, 0.010628938674926758, 0.011312007904052734, 0.011995077133178711, 0.012678146362304688, 0.013361215591430664, 0.01404428482055664, 0.014727354049682617, 0.015410423278808594, 0.01609349250793457, 0.016776561737060547, 0.017459630966186523, 0.0181427001953125]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 3.0, 1.0, 7.0, 12.0, 19.0, 16.0, 29.0, 37.0, 41.0, 62.0, 79.0, 143.0, 207.0, 333.0, 601.0, 3497.0, 1038680.0, 3221.0, 589.0, 318.0, 195.0, 125.0, 99.0, 67.0, 53.0, 40.0, 27.0, 11.0, 12.0, 8.0, 8.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3740234375, -0.3599090576171875, -0.345794677734375, -0.3316802978515625, -0.31756591796875, -0.3034515380859375, -0.289337158203125, -0.2752227783203125, -0.2611083984375, -0.2469940185546875, -0.232879638671875, -0.2187652587890625, -0.20465087890625, -0.1905364990234375, -0.176422119140625, -0.1623077392578125, -0.148193359375, -0.1340789794921875, -0.119964599609375, -0.1058502197265625, -0.09173583984375, -0.0776214599609375, -0.063507080078125, -0.0493927001953125, -0.0352783203125, -0.0211639404296875, -0.007049560546875, 0.0070648193359375, 0.02117919921875, 0.0352935791015625, 0.049407958984375, 0.0635223388671875, 0.07763671875, 0.0917510986328125, 0.105865478515625, 0.1199798583984375, 0.13409423828125, 0.1482086181640625, 0.162322998046875, 0.1764373779296875, 0.1905517578125, 0.2046661376953125, 0.218780517578125, 0.2328948974609375, 0.24700927734375, 0.2611236572265625, 0.275238037109375, 0.2893524169921875, 0.303466796875, 0.3175811767578125, 0.331695556640625, 0.3458099365234375, 0.35992431640625, 0.3740386962890625, 0.388153076171875, 0.4022674560546875, 0.4163818359375, 0.4304962158203125, 0.444610595703125, 0.4587249755859375, 0.47283935546875, 0.4869537353515625, 0.501068115234375, 0.5151824951171875, 0.529296875]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 947.0, 62.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07114312052726746, -0.06445673853158951, -0.05777035653591156, -0.05108397454023361, -0.044397592544555664, -0.037711214274168015, -0.031024832278490067, -0.02433845028281212, -0.01765206828713417, -0.010965686291456223, -0.004279305227100849, 0.0024070758372545242, 0.009093457832932472, 0.01577983796596527, 0.02246621996164322, 0.029152601957321167, 0.035838983952999115, 0.04252536594867706, 0.04921174794435501, 0.05589812994003296, 0.06258451193571091, 0.06927089393138885, 0.0759572684764862, 0.08264365792274475, 0.0893300324678421, 0.09601641446352005, 0.102702796459198, 0.10938917845487595, 0.1160755604505539, 0.12276193499565125, 0.1294483244419098, 0.13613469898700714, 0.14282108843326569, 0.14950746297836304, 0.15619385242462158, 0.16288022696971893, 0.16956661641597748, 0.17625299096107483, 0.18293938040733337, 0.18962575495243073, 0.19631214439868927, 0.20299851894378662, 0.20968490839004517, 0.21637128293514252, 0.22305767238140106, 0.2297440469264984, 0.23643043637275696, 0.2431168109178543, 0.24980318546295166, 0.2564895749092102, 0.26317593455314636, 0.2698623239994049, 0.27654871344566345, 0.283235102891922, 0.28992146253585815, 0.2966078519821167, 0.30329424142837524, 0.3099806308746338, 0.31666699051856995, 0.3233533799648285, 0.33003976941108704, 0.3367261588573456, 0.34341251850128174, 0.3500989079475403, 0.35678529739379883]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 7.0, 10.0, 8.0, 17.0, 25.0, 26.0, 36.0, 36.0, 46.0, 41.0, 38.0, 46.0, 44.0, 57.0, 53.0, 53.0, 51.0, 48.0, 45.0, 59.0, 37.0, 33.0, 40.0, 35.0, 27.0, 20.0, 19.0, 12.0, 9.0, 1.0, 6.0, 3.0, 7.0, 3.0, 0.0, 5.0, 1.0, 1.0, 2.0], "bins": [-0.026851892471313477, -0.026176083832979202, -0.025500277057290077, -0.024824470281600952, -0.024148661643266678, -0.023472853004932404, -0.02279704622924328, -0.022121239453554153, -0.02144543081521988, -0.020769622176885605, -0.02009381540119648, -0.019418008625507355, -0.01874219998717308, -0.018066391348838806, -0.01739058457314968, -0.016714777797460556, -0.016038969159126282, -0.015363161452114582, -0.014687353745102882, -0.014011546038091183, -0.013335738331079483, -0.012659930624067783, -0.011984122917056084, -0.011308315210044384, -0.010632507503032684, -0.009956699796020985, -0.009280892089009285, -0.008605084381997585, -0.007929276674985886, -0.007253468967974186, -0.006577661260962486, -0.005901853553950787, -0.005226045846939087, -0.004550238139927387, -0.0038744304329156876, -0.003198622725903988, -0.002522815018892288, -0.0018470073118805885, -0.0011711996048688889, -0.0004953918978571892, 0.0001804158091545105, 0.0008562235161662102, 0.0015320312231779099, 0.0022078389301896095, 0.002883646637201309, 0.003559454344213009, 0.0042352620512247086, 0.004911069758236408, 0.005586877465248108, 0.006262685172259808, 0.006938492879271507, 0.007614300586283207, 0.008290108293294907, 0.008965916000306606, 0.009641723707318306, 0.010317531414330006, 0.010993339121341705, 0.011669146828353405, 0.012344954535365105, 0.013020762242376804, 0.013696569949388504, 0.014372377656400204, 0.015048185363411903, 0.01572399213910103, 0.016399800777435303]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 4.0, 6.0, 6.0, 4.0, 5.0, 14.0, 14.0, 9.0, 12.0, 21.0, 22.0, 14.0, 33.0, 16.0, 32.0, 32.0, 22.0, 26.0, 27.0, 30.0, 32.0, 30.0, 31.0, 40.0, 24.0, 31.0, 46.0, 40.0, 37.0, 40.0, 27.0, 31.0, 24.0, 26.0, 21.0, 26.0, 21.0, 15.0, 15.0, 17.0, 10.0, 14.0, 10.0, 9.0, 9.0, 3.0, 3.0, 5.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-15.1796875, -14.6915283203125, -14.203369140625, -13.7152099609375, -13.22705078125, -12.7388916015625, -12.250732421875, -11.7625732421875, -11.2744140625, -10.7862548828125, -10.298095703125, -9.8099365234375, -9.32177734375, -8.8336181640625, -8.345458984375, -7.8572998046875, -7.369140625, -6.8809814453125, -6.392822265625, -5.9046630859375, -5.41650390625, -4.9283447265625, -4.440185546875, -3.9520263671875, -3.4638671875, -2.9757080078125, -2.487548828125, -1.9993896484375, -1.51123046875, -1.0230712890625, -0.534912109375, -0.0467529296875, 0.44140625, 0.9295654296875, 1.417724609375, 1.9058837890625, 2.39404296875, 2.8822021484375, 3.370361328125, 3.8585205078125, 4.3466796875, 4.8348388671875, 5.322998046875, 5.8111572265625, 6.29931640625, 6.7874755859375, 7.275634765625, 7.7637939453125, 8.251953125, 8.7401123046875, 9.228271484375, 9.7164306640625, 10.20458984375, 10.6927490234375, 11.180908203125, 11.6690673828125, 12.1572265625, 12.6453857421875, 13.133544921875, 13.6217041015625, 14.10986328125, 14.5980224609375, 15.086181640625, 15.5743408203125, 16.0625]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 3.0, 1.0, 2.0, 11.0, 5.0, 12.0, 10.0, 17.0, 22.0, 16.0, 30.0, 32.0, 55.0, 58.0, 80.0, 129.0, 155.0, 205.0, 329.0, 463.0, 711.0, 1090.0, 1818.0, 3378.0, 7372.0, 20405.0, 78747.0, 447851.0, 384090.0, 68254.0, 18288.0, 6700.0, 3213.0, 1722.0, 1061.0, 672.0, 442.0, 313.0, 200.0, 162.0, 98.0, 81.0, 52.0, 56.0, 29.0, 25.0, 21.0, 23.0, 17.0, 8.0, 6.0, 9.0, 8.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0], "bins": [-26.796875, -25.958251953125, -25.11962890625, -24.281005859375, -23.4423828125, -22.603759765625, -21.76513671875, -20.926513671875, -20.087890625, -19.249267578125, -18.41064453125, -17.572021484375, -16.7333984375, -15.894775390625, -15.05615234375, -14.217529296875, -13.37890625, -12.540283203125, -11.70166015625, -10.863037109375, -10.0244140625, -9.185791015625, -8.34716796875, -7.508544921875, -6.669921875, -5.831298828125, -4.99267578125, -4.154052734375, -3.3154296875, -2.476806640625, -1.63818359375, -0.799560546875, 0.0390625, 0.877685546875, 1.71630859375, 2.554931640625, 3.3935546875, 4.232177734375, 5.07080078125, 5.909423828125, 6.748046875, 7.586669921875, 8.42529296875, 9.263916015625, 10.1025390625, 10.941162109375, 11.77978515625, 12.618408203125, 13.45703125, 14.295654296875, 15.13427734375, 15.972900390625, 16.8115234375, 17.650146484375, 18.48876953125, 19.327392578125, 20.166015625, 21.004638671875, 21.84326171875, 22.681884765625, 23.5205078125, 24.359130859375, 25.19775390625, 26.036376953125, 26.875]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 4.0, 7.0, 3.0, 7.0, 10.0, 17.0, 23.0, 26.0, 26.0, 15.0, 34.0, 55.0, 60.0, 76.0, 131.0, 354.0, 1574.0, 159.0, 97.0, 84.0, 56.0, 53.0, 41.0, 31.0, 23.0, 17.0, 8.0, 17.0, 7.0, 10.0, 6.0, 4.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.40625, -57.36865234375, -55.3310546875, -53.29345703125, -51.255859375, -49.21826171875, -47.1806640625, -45.14306640625, -43.10546875, -41.06787109375, -39.0302734375, -36.99267578125, -34.955078125, -32.91748046875, -30.8798828125, -28.84228515625, -26.8046875, -24.76708984375, -22.7294921875, -20.69189453125, -18.654296875, -16.61669921875, -14.5791015625, -12.54150390625, -10.50390625, -8.46630859375, -6.4287109375, -4.39111328125, -2.353515625, -0.31591796875, 1.7216796875, 3.75927734375, 5.796875, 7.83447265625, 9.8720703125, 11.90966796875, 13.947265625, 15.98486328125, 18.0224609375, 20.06005859375, 22.09765625, 24.13525390625, 26.1728515625, 28.21044921875, 30.248046875, 32.28564453125, 34.3232421875, 36.36083984375, 38.3984375, 40.43603515625, 42.4736328125, 44.51123046875, 46.548828125, 48.58642578125, 50.6240234375, 52.66162109375, 54.69921875, 56.73681640625, 58.7744140625, 60.81201171875, 62.849609375, 64.88720703125, 66.9248046875, 68.96240234375, 71.0]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 3.0, 9.0, 10.0, 9.0, 15.0, 16.0, 38.0, 43.0, 79.0, 113.0, 246.0, 453.0, 1272.0, 98589.0, 3041483.0, 2119.0, 529.0, 268.0, 135.0, 88.0, 53.0, 29.0, 39.0, 17.0, 12.0, 6.0, 4.0, 14.0, 1.0, 0.0, 2.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-193.25, -187.751953125, -182.25390625, -176.755859375, -171.2578125, -165.759765625, -160.26171875, -154.763671875, -149.265625, -143.767578125, -138.26953125, -132.771484375, -127.2734375, -121.775390625, -116.27734375, -110.779296875, -105.28125, -99.783203125, -94.28515625, -88.787109375, -83.2890625, -77.791015625, -72.29296875, -66.794921875, -61.296875, -55.798828125, -50.30078125, -44.802734375, -39.3046875, -33.806640625, -28.30859375, -22.810546875, -17.3125, -11.814453125, -6.31640625, -0.818359375, 4.6796875, 10.177734375, 15.67578125, 21.173828125, 26.671875, 32.169921875, 37.66796875, 43.166015625, 48.6640625, 54.162109375, 59.66015625, 65.158203125, 70.65625, 76.154296875, 81.65234375, 87.150390625, 92.6484375, 98.146484375, 103.64453125, 109.142578125, 114.640625, 120.138671875, 125.63671875, 131.134765625, 136.6328125, 142.130859375, 147.62890625, 153.126953125, 158.625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [3.0, 457.0, 546.0, 11.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.125770568847656, -26.121835708618164, -0.11790084838867188, 25.886032104492188, 51.88996887207031, 77.8938980102539, 103.89783477783203, 129.90176391601562, 155.90570068359375, 181.90963745117188, 207.91357421875, 233.91751098632812, 259.92144775390625, 285.92535400390625, 311.9293212890625, 337.9332275390625, 363.93719482421875, 389.9411315917969, 415.945068359375, 441.9490051269531, 467.95294189453125, 493.95684814453125, 519.9608154296875, 545.9647216796875, 571.9686889648438, 597.9725952148438, 623.9765625, 649.98046875, 675.9844360351562, 701.9883422851562, 727.9923095703125, 753.9962158203125, 780.0001831054688, 806.0040893554688, 832.008056640625, 858.011962890625, 884.0159301757812, 910.0198364257812, 936.0238037109375, 962.0277099609375, 988.0316772460938, 1014.0355834960938, 1040.03955078125, 1066.04345703125, 1092.04736328125, 1118.0513916015625, 1144.0552978515625, 1170.0592041015625, 1196.0631103515625, 1222.0670166015625, 1248.0709228515625, 1274.074951171875, 1300.078857421875, 1326.082763671875, 1352.086669921875, 1378.0906982421875, 1404.0946044921875, 1430.0985107421875, 1456.1024169921875, 1482.1064453125, 1508.1103515625, 1534.1142578125, 1560.1181640625, 1586.1221923828125, 1612.1260986328125]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 8.0, 8.0, 9.0, 7.0, 6.0, 10.0, 19.0, 18.0, 20.0, 24.0, 23.0, 21.0, 36.0, 46.0, 31.0, 37.0, 37.0, 50.0, 50.0, 42.0, 41.0, 40.0, 53.0, 41.0, 38.0, 39.0, 31.0, 39.0, 24.0, 33.0, 19.0, 11.0, 18.0, 16.0, 14.0, 9.0, 7.0, 4.0, 8.0, 6.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0], "bins": [-126.49910736083984, -122.5952377319336, -118.69137573242188, -114.78750610351562, -110.88363647460938, -106.97976684570312, -103.07589721679688, -99.17203521728516, -95.2681655883789, -91.36429595947266, -87.46043395996094, -83.55656433105469, -79.65269470214844, -75.74882507324219, -71.84495544433594, -67.94109344482422, -64.03722381591797, -60.13335418701172, -56.229488372802734, -52.32562255859375, -48.4217529296875, -44.51788330078125, -40.614017486572266, -36.71015167236328, -32.80628204345703, -28.902414321899414, -24.998546600341797, -21.09467887878418, -17.190811157226562, -13.286943435668945, -9.383075714111328, -5.479207992553711, -1.5753326416015625, 2.3285350799560547, 6.232402801513672, 10.136270523071289, 14.040138244628906, 17.944005966186523, 21.84787368774414, 25.751741409301758, 29.655609130859375, 33.559478759765625, 37.46334457397461, 41.367210388183594, 45.271080017089844, 49.174949645996094, 53.07881546020508, 56.98268127441406, 60.88655090332031, 64.79042053222656, 68.69429016113281, 72.59815216064453, 76.50202178955078, 80.40589141845703, 84.30975341796875, 88.213623046875, 92.11749267578125, 96.0213623046875, 99.92523193359375, 103.82909393310547, 107.73296356201172, 111.63683319091797, 115.54069519042969, 119.44456481933594, 123.34843444824219]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 1.0, 3.0, 6.0, 5.0, 4.0, 12.0, 8.0, 9.0, 16.0, 14.0, 10.0, 13.0, 30.0, 18.0, 23.0, 24.0, 24.0, 43.0, 37.0, 34.0, 36.0, 32.0, 35.0, 48.0, 42.0, 41.0, 35.0, 35.0, 44.0, 44.0, 31.0, 27.0, 33.0, 21.0, 28.0, 29.0, 14.0, 13.0, 15.0, 17.0, 17.0, 12.0, 7.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-21.0625, -20.43017578125, -19.7978515625, -19.16552734375, -18.533203125, -17.90087890625, -17.2685546875, -16.63623046875, -16.00390625, -15.37158203125, -14.7392578125, -14.10693359375, -13.474609375, -12.84228515625, -12.2099609375, -11.57763671875, -10.9453125, -10.31298828125, -9.6806640625, -9.04833984375, -8.416015625, -7.78369140625, -7.1513671875, -6.51904296875, -5.88671875, -5.25439453125, -4.6220703125, -3.98974609375, -3.357421875, -2.72509765625, -2.0927734375, -1.46044921875, -0.828125, -0.19580078125, 0.4365234375, 1.06884765625, 1.701171875, 2.33349609375, 2.9658203125, 3.59814453125, 4.23046875, 4.86279296875, 5.4951171875, 6.12744140625, 6.759765625, 7.39208984375, 8.0244140625, 8.65673828125, 9.2890625, 9.92138671875, 10.5537109375, 11.18603515625, 11.818359375, 12.45068359375, 13.0830078125, 13.71533203125, 14.34765625, 14.97998046875, 15.6123046875, 16.24462890625, 16.876953125, 17.50927734375, 18.1416015625, 18.77392578125, 19.40625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 5.0, 12.0, 10.0, 12.0, 16.0, 24.0, 17.0, 40.0, 35.0, 55.0, 64.0, 97.0, 103.0, 141.0, 161.0, 250.0, 334.0, 495.0, 823.0, 1724.0, 3693.0, 11193.0, 114964.0, 3577199.0, 456246.0, 16448.0, 4950.0, 2054.0, 1079.0, 569.0, 378.0, 269.0, 181.0, 138.0, 106.0, 100.0, 57.0, 48.0, 39.0, 36.0, 22.0, 19.0, 24.0, 16.0, 9.0, 8.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0], "bins": [-97.1875, -94.2978515625, -91.408203125, -88.5185546875, -85.62890625, -82.7392578125, -79.849609375, -76.9599609375, -74.0703125, -71.1806640625, -68.291015625, -65.4013671875, -62.51171875, -59.6220703125, -56.732421875, -53.8427734375, -50.953125, -48.0634765625, -45.173828125, -42.2841796875, -39.39453125, -36.5048828125, -33.615234375, -30.7255859375, -27.8359375, -24.9462890625, -22.056640625, -19.1669921875, -16.27734375, -13.3876953125, -10.498046875, -7.6083984375, -4.71875, -1.8291015625, 1.060546875, 3.9501953125, 6.83984375, 9.7294921875, 12.619140625, 15.5087890625, 18.3984375, 21.2880859375, 24.177734375, 27.0673828125, 29.95703125, 32.8466796875, 35.736328125, 38.6259765625, 41.515625, 44.4052734375, 47.294921875, 50.1845703125, 53.07421875, 55.9638671875, 58.853515625, 61.7431640625, 64.6328125, 67.5224609375, 70.412109375, 73.3017578125, 76.19140625, 79.0810546875, 81.970703125, 84.8603515625, 87.75]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 5.0, 4.0, 6.0, 7.0, 11.0, 15.0, 25.0, 32.0, 78.0, 125.0, 262.0, 575.0, 1123.0, 935.0, 415.0, 205.0, 103.0, 61.0, 26.0, 19.0, 13.0, 6.0, 8.0, 5.0, 2.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.90625, -52.86279296875, -50.8193359375, -48.77587890625, -46.732421875, -44.68896484375, -42.6455078125, -40.60205078125, -38.55859375, -36.51513671875, -34.4716796875, -32.42822265625, -30.384765625, -28.34130859375, -26.2978515625, -24.25439453125, -22.2109375, -20.16748046875, -18.1240234375, -16.08056640625, -14.037109375, -11.99365234375, -9.9501953125, -7.90673828125, -5.86328125, -3.81982421875, -1.7763671875, 0.26708984375, 2.310546875, 4.35400390625, 6.3974609375, 8.44091796875, 10.484375, 12.52783203125, 14.5712890625, 16.61474609375, 18.658203125, 20.70166015625, 22.7451171875, 24.78857421875, 26.83203125, 28.87548828125, 30.9189453125, 32.96240234375, 35.005859375, 37.04931640625, 39.0927734375, 41.13623046875, 43.1796875, 45.22314453125, 47.2666015625, 49.31005859375, 51.353515625, 53.39697265625, 55.4404296875, 57.48388671875, 59.52734375, 61.57080078125, 63.6142578125, 65.65771484375, 67.701171875, 69.74462890625, 71.7880859375, 73.83154296875, 75.875]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 12.0, 4.0, 5.0, 9.0, 15.0, 25.0, 19.0, 30.0, 33.0, 45.0, 71.0, 104.0, 165.0, 243.0, 440.0, 739.0, 1478.0, 3031.0, 6945.0, 21230.0, 97904.0, 1654900.0, 2252119.0, 116316.0, 23815.0, 7683.0, 3298.0, 1563.0, 797.0, 437.0, 242.0, 162.0, 116.0, 76.0, 55.0, 36.0, 25.0, 19.0, 26.0, 9.0, 17.0, 8.0, 4.0, 11.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-45.40625, -43.89501953125, -42.3837890625, -40.87255859375, -39.361328125, -37.85009765625, -36.3388671875, -34.82763671875, -33.31640625, -31.80517578125, -30.2939453125, -28.78271484375, -27.271484375, -25.76025390625, -24.2490234375, -22.73779296875, -21.2265625, -19.71533203125, -18.2041015625, -16.69287109375, -15.181640625, -13.67041015625, -12.1591796875, -10.64794921875, -9.13671875, -7.62548828125, -6.1142578125, -4.60302734375, -3.091796875, -1.58056640625, -0.0693359375, 1.44189453125, 2.953125, 4.46435546875, 5.9755859375, 7.48681640625, 8.998046875, 10.50927734375, 12.0205078125, 13.53173828125, 15.04296875, 16.55419921875, 18.0654296875, 19.57666015625, 21.087890625, 22.59912109375, 24.1103515625, 25.62158203125, 27.1328125, 28.64404296875, 30.1552734375, 31.66650390625, 33.177734375, 34.68896484375, 36.2001953125, 37.71142578125, 39.22265625, 40.73388671875, 42.2451171875, 43.75634765625, 45.267578125, 46.77880859375, 48.2900390625, 49.80126953125, 51.3125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 4.0, 11.0, 12.0, 25.0, 18.0, 35.0, 48.0, 43.0, 64.0, 85.0, 107.0, 106.0, 104.0, 73.0, 60.0, 49.0, 31.0, 23.0, 16.0, 17.0, 11.0, 17.0, 14.0, 7.0, 5.0, 4.0, 6.0, 0.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-268.54449462890625, -261.75665283203125, -254.9688262939453, -248.1809844970703, -241.3931427001953, -234.60531616210938, -227.81747436523438, -221.02963256835938, -214.24180603027344, -207.45396423339844, -200.6661376953125, -193.8782958984375, -187.0904541015625, -180.30262756347656, -173.51478576660156, -166.72695922851562, -159.93911743164062, -153.15127563476562, -146.3634490966797, -139.5756072998047, -132.7877655029297, -125.99993896484375, -119.21209716796875, -112.42426300048828, -105.63641357421875, -98.84857940673828, -92.06073760986328, -85.27290344238281, -78.48506927490234, -71.69723510742188, -64.90939331054688, -58.121559143066406, -51.33372497558594, -44.5458869934082, -37.758052825927734, -30.97021484375, -24.1823787689209, -17.394542694091797, -10.606704711914062, -3.8188705444335938, 2.9689674377441406, 9.756803512573242, 16.544639587402344, 23.332477569580078, 30.12031364440918, 36.90814971923828, 43.695987701416016, 50.483821868896484, 57.27165985107422, 64.05949401855469, 70.84733581542969, 77.63516998291016, 84.42300415039062, 91.21084594726562, 97.9986801147461, 104.78651428222656, 111.57435607910156, 118.36219024658203, 125.15003204345703, 131.9378662109375, 138.7257080078125, 145.51353454589844, 152.30137634277344, 159.08920288085938, 165.87704467773438]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 3.0, 6.0, 9.0, 15.0, 15.0, 13.0, 19.0, 26.0, 27.0, 25.0, 19.0, 38.0, 38.0, 34.0, 30.0, 41.0, 54.0, 43.0, 42.0, 40.0, 45.0, 39.0, 46.0, 28.0, 30.0, 30.0, 36.0, 20.0, 22.0, 22.0, 30.0, 19.0, 19.0, 8.0, 16.0, 11.0, 7.0, 6.0, 3.0, 8.0, 3.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-141.1405029296875, -136.6005859375, -132.06068420410156, -127.52076721191406, -122.9808578491211, -118.44094848632812, -113.90103149414062, -109.36112213134766, -104.82121276855469, -100.28130340576172, -95.74139404296875, -91.20147705078125, -86.66156768798828, -82.12165832519531, -77.58174133300781, -73.04183197021484, -68.50192260742188, -63.962013244628906, -59.42210006713867, -54.88218688964844, -50.34227752685547, -45.8023681640625, -41.262454986572266, -36.72254180908203, -32.18263244628906, -27.64272117614746, -23.10280990600586, -18.562898635864258, -14.022987365722656, -9.483076095581055, -4.943164825439453, -0.40325355529785156, 4.1366424560546875, 8.676553726196289, 13.21646499633789, 17.756376266479492, 22.296287536621094, 26.836198806762695, 31.376110076904297, 35.91602325439453, 40.4559326171875, 44.99584197998047, 49.5357551574707, 54.07566833496094, 58.615577697753906, 63.155487060546875, 67.69540405273438, 72.23531341552734, 76.77522277832031, 81.31513214111328, 85.85504150390625, 90.39495849609375, 94.93486785888672, 99.47477722167969, 104.01469421386719, 108.55460357666016, 113.09451293945312, 117.6344223022461, 122.17433166503906, 126.71424865722656, 131.254150390625, 135.7940673828125, 140.333984375, 144.87388610839844, 149.41380310058594]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 7.0, 5.0, 13.0, 10.0, 13.0, 12.0, 20.0, 23.0, 24.0, 32.0, 37.0, 37.0, 33.0, 42.0, 30.0, 54.0, 52.0, 54.0, 42.0, 41.0, 40.0, 38.0, 40.0, 40.0, 36.0, 23.0, 33.0, 18.0, 18.0, 34.0, 17.0, 16.0, 15.0, 12.0, 8.0, 5.0, 3.0, 1.0, 5.0, 4.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-247.625, -239.181640625, -230.73828125, -222.294921875, -213.8515625, -205.408203125, -196.96484375, -188.521484375, -180.078125, -171.634765625, -163.19140625, -154.748046875, -146.3046875, -137.861328125, -129.41796875, -120.974609375, -112.53125, -104.087890625, -95.64453125, -87.201171875, -78.7578125, -70.314453125, -61.87109375, -53.427734375, -44.984375, -36.541015625, -28.09765625, -19.654296875, -11.2109375, -2.767578125, 5.67578125, 14.119140625, 22.5625, 31.005859375, 39.44921875, 47.892578125, 56.3359375, 64.779296875, 73.22265625, 81.666015625, 90.109375, 98.552734375, 106.99609375, 115.439453125, 123.8828125, 132.326171875, 140.76953125, 149.212890625, 157.65625, 166.099609375, 174.54296875, 182.986328125, 191.4296875, 199.873046875, 208.31640625, 216.759765625, 225.203125, 233.646484375, 242.08984375, 250.533203125, 258.9765625, 267.419921875, 275.86328125, 284.306640625, 292.75]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 7.0, 15.0, 23.0, 51.0, 59.0, 84.0, 124.0, 183.0, 281.0, 445.0, 686.0, 1087.0, 1733.0, 2853.0, 4784.0, 7930.0, 13975.0, 25065.0, 45502.0, 87766.0, 178086.0, 288194.0, 187297.0, 92280.0, 47557.0, 26163.0, 14778.0, 8576.0, 4895.0, 2984.0, 1813.0, 1174.0, 730.0, 469.0, 301.0, 213.0, 134.0, 74.0, 58.0, 43.0, 27.0, 19.0, 9.0, 8.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.59375, -27.657470703125, -26.72119140625, -25.784912109375, -24.8486328125, -23.912353515625, -22.97607421875, -22.039794921875, -21.103515625, -20.167236328125, -19.23095703125, -18.294677734375, -17.3583984375, -16.422119140625, -15.48583984375, -14.549560546875, -13.61328125, -12.677001953125, -11.74072265625, -10.804443359375, -9.8681640625, -8.931884765625, -7.99560546875, -7.059326171875, -6.123046875, -5.186767578125, -4.25048828125, -3.314208984375, -2.3779296875, -1.441650390625, -0.50537109375, 0.430908203125, 1.3671875, 2.303466796875, 3.23974609375, 4.176025390625, 5.1123046875, 6.048583984375, 6.98486328125, 7.921142578125, 8.857421875, 9.793701171875, 10.72998046875, 11.666259765625, 12.6025390625, 13.538818359375, 14.47509765625, 15.411376953125, 16.34765625, 17.283935546875, 18.22021484375, 19.156494140625, 20.0927734375, 21.029052734375, 21.96533203125, 22.901611328125, 23.837890625, 24.774169921875, 25.71044921875, 26.646728515625, 27.5830078125, 28.519287109375, 29.45556640625, 30.391845703125, 31.328125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 1.0, 5.0, 5.0, 5.0, 6.0, 9.0, 13.0, 18.0, 10.0, 21.0, 23.0, 9.0, 22.0, 29.0, 30.0, 32.0, 37.0, 32.0, 31.0, 36.0, 47.0, 32.0, 42.0, 1059.0, 49.0, 31.0, 29.0, 32.0, 36.0, 33.0, 25.0, 28.0, 22.0, 20.0, 22.0, 22.0, 16.0, 22.0, 8.0, 12.0, 12.0, 15.0, 5.0, 8.0, 6.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 3.0, 1.0], "bins": [-154.0, -149.513671875, -145.02734375, -140.541015625, -136.0546875, -131.568359375, -127.08203125, -122.595703125, -118.109375, -113.623046875, -109.13671875, -104.650390625, -100.1640625, -95.677734375, -91.19140625, -86.705078125, -82.21875, -77.732421875, -73.24609375, -68.759765625, -64.2734375, -59.787109375, -55.30078125, -50.814453125, -46.328125, -41.841796875, -37.35546875, -32.869140625, -28.3828125, -23.896484375, -19.41015625, -14.923828125, -10.4375, -5.951171875, -1.46484375, 3.021484375, 7.5078125, 11.994140625, 16.48046875, 20.966796875, 25.453125, 29.939453125, 34.42578125, 38.912109375, 43.3984375, 47.884765625, 52.37109375, 56.857421875, 61.34375, 65.830078125, 70.31640625, 74.802734375, 79.2890625, 83.775390625, 88.26171875, 92.748046875, 97.234375, 101.720703125, 106.20703125, 110.693359375, 115.1796875, 119.666015625, 124.15234375, 128.638671875, 133.125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 5.0, 5.0, 9.0, 17.0, 11.0, 28.0, 39.0, 47.0, 80.0, 109.0, 161.0, 234.0, 366.0, 535.0, 747.0, 1070.0, 1586.0, 2304.0, 3445.0, 5058.0, 7413.0, 10904.0, 16257.0, 24630.0, 38876.0, 63965.0, 107145.0, 175660.0, 1254578.0, 145243.0, 87211.0, 52538.0, 32505.0, 20920.0, 13973.0, 9324.0, 6291.0, 4463.0, 2944.0, 2027.0, 1401.0, 913.0, 667.0, 443.0, 306.0, 223.0, 150.0, 108.0, 73.0, 35.0, 32.0, 24.0, 18.0, 10.0, 8.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-17.875, -17.303955078125, -16.73291015625, -16.161865234375, -15.5908203125, -15.019775390625, -14.44873046875, -13.877685546875, -13.306640625, -12.735595703125, -12.16455078125, -11.593505859375, -11.0224609375, -10.451416015625, -9.88037109375, -9.309326171875, -8.73828125, -8.167236328125, -7.59619140625, -7.025146484375, -6.4541015625, -5.883056640625, -5.31201171875, -4.740966796875, -4.169921875, -3.598876953125, -3.02783203125, -2.456787109375, -1.8857421875, -1.314697265625, -0.74365234375, -0.172607421875, 0.3984375, 0.969482421875, 1.54052734375, 2.111572265625, 2.6826171875, 3.253662109375, 3.82470703125, 4.395751953125, 4.966796875, 5.537841796875, 6.10888671875, 6.679931640625, 7.2509765625, 7.822021484375, 8.39306640625, 8.964111328125, 9.53515625, 10.106201171875, 10.67724609375, 11.248291015625, 11.8193359375, 12.390380859375, 12.96142578125, 13.532470703125, 14.103515625, 14.674560546875, 15.24560546875, 15.816650390625, 16.3876953125, 16.958740234375, 17.52978515625, 18.100830078125, 18.671875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 7.0, 8.0, 7.0, 20.0, 28.0, 32.0, 37.0, 57.0, 74.0, 123.0, 111.0, 105.0, 100.0, 75.0, 76.0, 37.0, 29.0, 21.0, 14.0, 9.0, 5.0, 10.0, 6.0, 2.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.238037109375, -0.22842025756835938, -0.21880340576171875, -0.20918655395507812, -0.1995697021484375, -0.18995285034179688, -0.18033599853515625, -0.17071914672851562, -0.161102294921875, -0.15148544311523438, -0.14186859130859375, -0.13225173950195312, -0.1226348876953125, -0.11301803588867188, -0.10340118408203125, -0.09378433227539062, -0.08416748046875, -0.07455062866210938, -0.06493377685546875, -0.055316925048828125, -0.0457000732421875, -0.036083221435546875, -0.02646636962890625, -0.016849517822265625, -0.007232666015625, 0.002384185791015625, 0.01200103759765625, 0.021617889404296875, 0.0312347412109375, 0.040851593017578125, 0.05046844482421875, 0.060085296630859375, 0.0697021484375, 0.07931900024414062, 0.08893585205078125, 0.09855270385742188, 0.1081695556640625, 0.11778640747070312, 0.12740325927734375, 0.13702011108398438, 0.146636962890625, 0.15625381469726562, 0.16587066650390625, 0.17548751831054688, 0.1851043701171875, 0.19472122192382812, 0.20433807373046875, 0.21395492553710938, 0.22357177734375, 0.23318862915039062, 0.24280548095703125, 0.2524223327636719, 0.2620391845703125, 0.2716560363769531, 0.28127288818359375, 0.2908897399902344, 0.300506591796875, 0.3101234436035156, 0.31974029541015625, 0.3293571472167969, 0.3389739990234375, 0.3485908508300781, 0.35820770263671875, 0.3678245544433594, 0.37744140625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 8.0, 6.0, 9.0, 18.0, 24.0, 32.0, 48.0, 78.0, 123.0, 198.0, 404.0, 821.0, 1916.0, 5397.0, 21064.0, 172065.0, 762978.0, 65463.0, 11732.0, 3427.0, 1352.0, 650.0, 298.0, 163.0, 105.0, 48.0, 38.0, 26.0, 18.0, 12.0, 14.0, 5.0, 5.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.9775390625, -1.923065185546875, -1.86859130859375, -1.814117431640625, -1.7596435546875, -1.705169677734375, -1.65069580078125, -1.596221923828125, -1.541748046875, -1.487274169921875, -1.43280029296875, -1.378326416015625, -1.3238525390625, -1.269378662109375, -1.21490478515625, -1.160430908203125, -1.10595703125, -1.051483154296875, -0.99700927734375, -0.942535400390625, -0.8880615234375, -0.833587646484375, -0.77911376953125, -0.724639892578125, -0.670166015625, -0.615692138671875, -0.56121826171875, -0.506744384765625, -0.4522705078125, -0.397796630859375, -0.34332275390625, -0.288848876953125, -0.234375, -0.179901123046875, -0.12542724609375, -0.070953369140625, -0.0164794921875, 0.037994384765625, 0.09246826171875, 0.146942138671875, 0.201416015625, 0.255889892578125, 0.31036376953125, 0.364837646484375, 0.4193115234375, 0.473785400390625, 0.52825927734375, 0.582733154296875, 0.63720703125, 0.691680908203125, 0.74615478515625, 0.800628662109375, 0.8551025390625, 0.909576416015625, 0.96405029296875, 1.018524169921875, 1.072998046875, 1.127471923828125, 1.18194580078125, 1.236419677734375, 1.2908935546875, 1.345367431640625, 1.39984130859375, 1.454315185546875, 1.5087890625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 3.0, 6.0, 12.0, 20.0, 14.0, 19.0, 29.0, 47.0, 58.0, 111.0, 193.0, 239.0, 122.0, 64.0, 24.0, 14.0, 9.0, 5.0, 4.0, 5.0, 1.0, 0.0, 1.0], "bins": [-0.7018107771873474, -0.6883791089057922, -0.6749473810195923, -0.6615157127380371, -0.6480840444564819, -0.634652316570282, -0.6212206482887268, -0.6077889800071716, -0.5943572521209717, -0.5809255838394165, -0.5674938559532166, -0.5540621876716614, -0.5406305193901062, -0.5271987915039062, -0.5137671232223511, -0.5003354549407959, -0.48690375685691833, -0.47347205877304077, -0.4600403904914856, -0.44660869240760803, -0.43317699432373047, -0.4197453260421753, -0.40631362795829773, -0.39288192987442017, -0.379450261592865, -0.3660185635089874, -0.35258689522743225, -0.3391551971435547, -0.3257234990596771, -0.31229180097579956, -0.2988601326942444, -0.2854284346103668, -0.27199673652648926, -0.2585650384426117, -0.24513335525989532, -0.23170167207717896, -0.2182699739933014, -0.20483829081058502, -0.19140660762786865, -0.1779749095439911, -0.16454321146011353, -0.15111152827739716, -0.1376798301935196, -0.12424814701080322, -0.11081645637750626, -0.09738476574420929, -0.08395308256149292, -0.07052139192819595, -0.05708970129489899, -0.04365801066160202, -0.030226323753595352, -0.016794636845588684, -0.0033629462122917175, 0.010068744421005249, 0.02350042760372162, 0.036932118237018585, 0.05036380887031555, 0.06379549950361252, 0.07722719013690948, 0.09065887331962585, 0.10409056395292282, 0.11752225458621979, 0.13095393776893616, 0.14438563585281372, 0.1578173190355301]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 5.0, 3.0, 13.0, 5.0, 14.0, 20.0, 18.0, 19.0, 29.0, 23.0, 22.0, 26.0, 26.0, 35.0, 38.0, 37.0, 39.0, 41.0, 32.0, 36.0, 45.0, 41.0, 44.0, 44.0, 29.0, 37.0, 28.0, 22.0, 21.0, 31.0, 25.0, 27.0, 23.0, 13.0, 21.0, 16.0, 13.0, 12.0, 9.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.22242134809494019, -0.2160506397485733, -0.20967991650104523, -0.20330920815467834, -0.19693848490715027, -0.1905677765607834, -0.1841970682144165, -0.17782634496688843, -0.17145563662052155, -0.16508492827415466, -0.1587142050266266, -0.1523434966802597, -0.14597278833389282, -0.13960206508636475, -0.13323135673999786, -0.12686064839363098, -0.1204899251461029, -0.11411920934915543, -0.10774849355220795, -0.10137778520584106, -0.09500706940889359, -0.0886363536119461, -0.08226564526557922, -0.07589492946863174, -0.06952421367168427, -0.06315349787473679, -0.056782785803079605, -0.050412073731422424, -0.044041357934474945, -0.037670642137527466, -0.031299930065870285, -0.024929217994213104, -0.018558502197265625, -0.012187788262963295, -0.005817074328660965, 0.000553639605641365, 0.006924353539943695, 0.013295069336891174, 0.019665781408548355, 0.026036493480205536, 0.032407209277153015, 0.038777925074100494, 0.045148637145757675, 0.051519349217414856, 0.057890065014362335, 0.06426078081130981, 0.0706314891576767, 0.07700220495462418, 0.08337292075157166, 0.08974363654851913, 0.09611435234546661, 0.1024850606918335, 0.10885577648878098, 0.11522649228572845, 0.12159720063209534, 0.1279679238796234, 0.1343386322259903, 0.14070934057235718, 0.14708006381988525, 0.15345077216625214, 0.15982148051261902, 0.1661922037601471, 0.17256291210651398, 0.17893362045288086, 0.18530434370040894]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 5.0, 12.0, 11.0, 12.0, 10.0, 23.0, 22.0, 25.0, 35.0, 35.0, 37.0, 31.0, 45.0, 28.0, 53.0, 54.0, 54.0, 45.0, 38.0, 39.0, 38.0, 42.0, 41.0, 32.0, 26.0, 32.0, 17.0, 19.0, 33.0, 17.0, 16.0, 15.0, 11.0, 7.0, 6.0, 3.0, 1.0, 5.0, 5.0, 6.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-247.5, -239.046875, -230.59375, -222.140625, -213.6875, -205.234375, -196.78125, -188.328125, -179.875, -171.421875, -162.96875, -154.515625, -146.0625, -137.609375, -129.15625, -120.703125, -112.25, -103.796875, -95.34375, -86.890625, -78.4375, -69.984375, -61.53125, -53.078125, -44.625, -36.171875, -27.71875, -19.265625, -10.8125, -2.359375, 6.09375, 14.546875, 23.0, 31.453125, 39.90625, 48.359375, 56.8125, 65.265625, 73.71875, 82.171875, 90.625, 99.078125, 107.53125, 115.984375, 124.4375, 132.890625, 141.34375, 149.796875, 158.25, 166.703125, 175.15625, 183.609375, 192.0625, 200.515625, 208.96875, 217.421875, 225.875, 234.328125, 242.78125, 251.234375, 259.6875, 268.140625, 276.59375, 285.046875, 293.5]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 7.0, 3.0, 12.0, 7.0, 8.0, 13.0, 25.0, 30.0, 43.0, 62.0, 90.0, 142.0, 196.0, 279.0, 429.0, 716.0, 1257.0, 2302.0, 4826.0, 11291.0, 32554.0, 121171.0, 501639.0, 274612.0, 62863.0, 19030.0, 7367.0, 3347.0, 1607.0, 941.0, 563.0, 355.0, 221.0, 161.0, 114.0, 64.0, 51.0, 48.0, 34.0, 24.0, 19.0, 12.0, 7.0, 9.0, 7.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.46875, -37.17626953125, -35.8837890625, -34.59130859375, -33.298828125, -32.00634765625, -30.7138671875, -29.42138671875, -28.12890625, -26.83642578125, -25.5439453125, -24.25146484375, -22.958984375, -21.66650390625, -20.3740234375, -19.08154296875, -17.7890625, -16.49658203125, -15.2041015625, -13.91162109375, -12.619140625, -11.32666015625, -10.0341796875, -8.74169921875, -7.44921875, -6.15673828125, -4.8642578125, -3.57177734375, -2.279296875, -0.98681640625, 0.3056640625, 1.59814453125, 2.890625, 4.18310546875, 5.4755859375, 6.76806640625, 8.060546875, 9.35302734375, 10.6455078125, 11.93798828125, 13.23046875, 14.52294921875, 15.8154296875, 17.10791015625, 18.400390625, 19.69287109375, 20.9853515625, 22.27783203125, 23.5703125, 24.86279296875, 26.1552734375, 27.44775390625, 28.740234375, 30.03271484375, 31.3251953125, 32.61767578125, 33.91015625, 35.20263671875, 36.4951171875, 37.78759765625, 39.080078125, 40.37255859375, 41.6650390625, 42.95751953125, 44.25]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 9.0, 15.0, 8.0, 20.0, 18.0, 18.0, 27.0, 34.0, 45.0, 65.0, 61.0, 70.0, 63.0, 2109.0, 78.0, 48.0, 61.0, 58.0, 50.0, 28.0, 33.0, 31.0, 20.0, 18.0, 6.0, 13.0, 1.0, 3.0, 8.0, 5.0, 1.0, 2.0, 5.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-625.0, -607.48828125, -589.9765625, -572.46484375, -554.953125, -537.44140625, -519.9296875, -502.41796875, -484.90625, -467.39453125, -449.8828125, -432.37109375, -414.859375, -397.34765625, -379.8359375, -362.32421875, -344.8125, -327.30078125, -309.7890625, -292.27734375, -274.765625, -257.25390625, -239.7421875, -222.23046875, -204.71875, -187.20703125, -169.6953125, -152.18359375, -134.671875, -117.16015625, -99.6484375, -82.13671875, -64.625, -47.11328125, -29.6015625, -12.08984375, 5.421875, 22.93359375, 40.4453125, 57.95703125, 75.46875, 92.98046875, 110.4921875, 128.00390625, 145.515625, 163.02734375, 180.5390625, 198.05078125, 215.5625, 233.07421875, 250.5859375, 268.09765625, 285.609375, 303.12109375, 320.6328125, 338.14453125, 355.65625, 373.16796875, 390.6796875, 408.19140625, 425.703125, 443.21484375, 460.7265625, 478.23828125, 495.75]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 2.0, 14.0, 15.0, 17.0, 16.0, 34.0, 45.0, 53.0, 87.0, 108.0, 194.0, 314.0, 628.0, 1671.0, 6335.0, 50942.0, 2942457.0, 127857.0, 10656.0, 2346.0, 805.0, 383.0, 220.0, 157.0, 85.0, 62.0, 45.0, 29.0, 37.0, 15.0, 17.0, 7.0, 13.0, 8.0, 4.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-110.75, -107.13671875, -103.5234375, -99.91015625, -96.296875, -92.68359375, -89.0703125, -85.45703125, -81.84375, -78.23046875, -74.6171875, -71.00390625, -67.390625, -63.77734375, -60.1640625, -56.55078125, -52.9375, -49.32421875, -45.7109375, -42.09765625, -38.484375, -34.87109375, -31.2578125, -27.64453125, -24.03125, -20.41796875, -16.8046875, -13.19140625, -9.578125, -5.96484375, -2.3515625, 1.26171875, 4.875, 8.48828125, 12.1015625, 15.71484375, 19.328125, 22.94140625, 26.5546875, 30.16796875, 33.78125, 37.39453125, 41.0078125, 44.62109375, 48.234375, 51.84765625, 55.4609375, 59.07421875, 62.6875, 66.30078125, 69.9140625, 73.52734375, 77.140625, 80.75390625, 84.3671875, 87.98046875, 91.59375, 95.20703125, 98.8203125, 102.43359375, 106.046875, 109.66015625, 113.2734375, 116.88671875, 120.5]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 2.0, 7.0, 8.0, 19.0, 32.0, 44.0, 60.0, 135.0, 173.0, 174.0, 136.0, 68.0, 53.0, 25.0, 16.0, 10.0, 14.0, 11.0, 1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-949.3392944335938, -928.2639770507812, -907.1886596679688, -886.1133422851562, -865.0380249023438, -843.9627075195312, -822.8873901367188, -801.8120727539062, -780.7367553710938, -759.6614379882812, -738.5861206054688, -717.5108032226562, -696.4354858398438, -675.3601684570312, -654.2848510742188, -633.2095336914062, -612.13427734375, -591.0589599609375, -569.983642578125, -548.9083251953125, -527.8330078125, -506.7576904296875, -485.682373046875, -464.6070556640625, -443.53173828125, -422.4564208984375, -401.381103515625, -380.3057861328125, -359.23046875, -338.1551513671875, -317.079833984375, -296.0045166015625, -274.92919921875, -253.8538818359375, -232.778564453125, -211.7032470703125, -190.6279296875, -169.5526123046875, -148.47731018066406, -127.40199279785156, -106.32667541503906, -85.25135803222656, -64.17604064941406, -43.100730895996094, -22.025413513183594, -0.9500961303710938, 20.125213623046875, 41.200531005859375, 62.275848388671875, 83.35116577148438, 104.42648315429688, 125.50179290771484, 146.57711791992188, 167.65243530273438, 188.7277374267578, 209.8030548095703, 230.8783721923828, 251.9536895751953, 273.02899169921875, 294.10430908203125, 315.17962646484375, 336.25494384765625, 357.33026123046875, 378.40557861328125, 399.48089599609375]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 10.0, 10.0, 15.0, 11.0, 18.0, 22.0, 26.0, 21.0, 30.0, 31.0, 29.0, 39.0, 35.0, 40.0, 54.0, 48.0, 54.0, 63.0, 52.0, 50.0, 37.0, 39.0, 34.0, 41.0, 27.0, 22.0, 16.0, 18.0, 15.0, 14.0, 13.0, 9.0, 5.0, 5.0, 7.0, 2.0, 7.0, 7.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-594.61328125, -575.13037109375, -555.6474609375, -536.1644897460938, -516.6815795898438, -497.19866943359375, -477.71575927734375, -458.23284912109375, -438.7499084472656, -419.2669982910156, -399.7840576171875, -380.3011474609375, -360.8182373046875, -341.3352966308594, -321.8523864746094, -302.36944580078125, -282.88653564453125, -263.40362548828125, -243.92068481445312, -224.43777465820312, -204.95484924316406, -185.471923828125, -165.989013671875, -146.50608825683594, -127.02316284179688, -107.54023742675781, -88.05731964111328, -68.57440185546875, -49.09147644042969, -29.608551025390625, -10.125633239746094, 9.357284545898438, 28.8402099609375, 48.3231315612793, 67.8060531616211, 87.28897094726562, 106.77189636230469, 126.25482177734375, 145.73773193359375, 165.2206573486328, 184.70358276367188, 204.18650817871094, 223.66943359375, 243.15234375, 262.63525390625, 282.1181945800781, 301.6011047363281, 321.08404541015625, 340.56695556640625, 360.04986572265625, 379.5328063964844, 399.0157165527344, 418.4986572265625, 437.9815673828125, 457.4644775390625, 476.9473876953125, 496.4303283691406, 515.9132690429688, 535.3961791992188, 554.8790893554688, 574.3619995117188, 593.844970703125, 613.327880859375, 632.810791015625, 652.293701171875]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 9.0, 5.0, 5.0, 8.0, 12.0, 10.0, 17.0, 24.0, 27.0, 39.0, 31.0, 54.0, 58.0, 95.0, 90.0, 124.0, 162.0, 221.0, 323.0, 448.0, 823.0, 1597.0, 1041593.0, 886.0, 559.0, 323.0, 238.0, 167.0, 116.0, 99.0, 82.0, 58.0, 53.0, 42.0, 26.0, 27.0, 18.0, 20.0, 18.0, 14.0, 11.0, 8.0, 7.0, 5.0, 3.0, 4.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-153.81883239746094, -148.34539794921875, -142.87196350097656, -137.39852905273438, -131.92507934570312, -126.45165252685547, -120.97821044921875, -115.50477600097656, -110.03134155273438, -104.55790710449219, -99.08447265625, -93.61103057861328, -88.1375961303711, -82.6641616821289, -77.19071960449219, -71.71728515625, -66.24385070800781, -60.770416259765625, -55.29697799682617, -49.82353973388672, -44.35010528564453, -38.876670837402344, -33.40323257446289, -27.929794311523438, -22.45635986328125, -16.98292350769043, -11.50948715209961, -6.036050796508789, -0.5626144409179688, 4.910821914672852, 10.384258270263672, 15.857696533203125, 21.331146240234375, 26.804582595825195, 32.278018951416016, 37.75145721435547, 43.224891662597656, 48.698326110839844, 54.1717643737793, 59.64520263671875, 65.11863708496094, 70.59207153320312, 76.06550598144531, 81.53894805908203, 87.01238250732422, 92.4858169555664, 97.95925903320312, 103.43269348144531, 108.9061279296875, 114.37956237792969, 119.85299682617188, 125.3264389038086, 130.79986572265625, 136.2733154296875, 141.7467498779297, 147.22018432617188, 152.69361877441406, 158.16705322265625, 163.64048767089844, 169.11392211914062, 174.58737182617188, 180.06080627441406, 185.53424072265625, 191.00767517089844, 196.48110961914062]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 5.0, 3.0, 9.0, 11.0, 9.0, 12.0, 4.0, 9.0, 18.0, 24.0, 76.0, 594.0, 51461156.0, 1060.0, 73.0, 36.0, 17.0, 11.0, 1.0, 3.0, 1.0, 6.0, 4.0, 3.0, 6.0, 0.0, 1.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3195.414794921875, -3100.2216796875, -3005.0283203125, -2909.835205078125, -2814.64208984375, -2719.44873046875, -2624.255615234375, -2529.0625, -2433.869140625, -2338.676025390625, -2243.482666015625, -2148.28955078125, -2053.09619140625, -1957.903076171875, -1862.7099609375, -1767.5167236328125, -1672.323486328125, -1577.1302490234375, -1481.93701171875, -1386.743896484375, -1291.5506591796875, -1196.357421875, -1101.164306640625, -1005.9710693359375, -910.77783203125, -815.5845947265625, -720.3914184570312, -625.1982421875, -530.0050048828125, -434.8117980957031, -339.61859130859375, -244.4254150390625, -149.232177734375, -54.038970947265625, 41.15423583984375, 136.34744262695312, 231.5406494140625, 326.7338562011719, 421.92706298828125, 517.1202392578125, 612.3134765625, 707.5067138671875, 802.6998901367188, 897.89306640625, 993.0863037109375, 1088.279541015625, 1183.47265625, 1278.6658935546875, 1373.859130859375, 1469.0523681640625, 1564.24560546875, 1659.438720703125, 1754.6319580078125, 1849.8251953125, 1945.018310546875, 2040.2115478515625, 2135.40478515625, 2230.597900390625, 2325.791259765625, 2420.984375, 2516.177734375, 2611.370849609375, 2706.56396484375, 2801.75732421875, 2896.950439453125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 10.0, 14.0, 14.0, 22.0, 40.0, 67.0, 92.0, 125.0, 211.0, 290.0, 449.0, 676.0, 988.0, 1488.0, 2251.0, 3391.0, 5151.0, 7745.0, 11692.0, 17469.0, 27471.0, 42158.0, 67282.0, 110593.0, 187931.0, 326438.0, 676907.0, 3685608.0, 465228.0, 257162.0, 149263.0, 88932.0, 54796.0, 34442.0, 22238.0, 14718.0, 9613.0, 6165.0, 4151.0, 2761.0, 1768.0, 1209.0, 846.0, 580.0, 366.0, 234.0, 167.0, 88.0, 47.0, 40.0, 22.0, 13.0, 6.0, 7.0, 1.0, 2.0], "bins": [-7.796875, -7.57598876953125, -7.3551025390625, -7.13421630859375, -6.913330078125, -6.69244384765625, -6.4715576171875, -6.25067138671875, -6.02978515625, -5.80889892578125, -5.5880126953125, -5.36712646484375, -5.146240234375, -4.92535400390625, -4.7044677734375, -4.48358154296875, -4.2626953125, -4.04180908203125, -3.8209228515625, -3.60003662109375, -3.379150390625, -3.15826416015625, -2.9373779296875, -2.71649169921875, -2.49560546875, -2.27471923828125, -2.0538330078125, -1.83294677734375, -1.612060546875, -1.39117431640625, -1.1702880859375, -0.94940185546875, -0.728515625, -0.50762939453125, -0.2867431640625, -0.06585693359375, 0.155029296875, 0.37591552734375, 0.5968017578125, 0.81768798828125, 1.03857421875, 1.25946044921875, 1.4803466796875, 1.70123291015625, 1.922119140625, 2.14300537109375, 2.3638916015625, 2.58477783203125, 2.8056640625, 3.02655029296875, 3.2474365234375, 3.46832275390625, 3.689208984375, 3.91009521484375, 4.1309814453125, 4.35186767578125, 4.57275390625, 4.79364013671875, 5.0145263671875, 5.23541259765625, 5.456298828125, 5.67718505859375, 5.8980712890625, 6.11895751953125, 6.33984375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 4.0, 5.0, 6.0, 11.0, 7.0, 14.0, 7.0, 16.0, 12.0, 18.0, 18.0, 30.0, 34.0, 25.0, 26.0, 35.0, 35.0, 31.0, 30.0, 43.0, 68.0, 840.0, 220.0, 37.0, 37.0, 46.0, 42.0, 27.0, 40.0, 36.0, 39.0, 29.0, 23.0, 24.0, 18.0, 11.0, 15.0, 17.0, 7.0, 7.0, 9.0, 6.0, 5.0, 5.0, 9.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.9375, -62.6728515625, -60.408203125, -58.1435546875, -55.87890625, -53.6142578125, -51.349609375, -49.0849609375, -46.8203125, -44.5556640625, -42.291015625, -40.0263671875, -37.76171875, -35.4970703125, -33.232421875, -30.9677734375, -28.703125, -26.4384765625, -24.173828125, -21.9091796875, -19.64453125, -17.3798828125, -15.115234375, -12.8505859375, -10.5859375, -8.3212890625, -6.056640625, -3.7919921875, -1.52734375, 0.7373046875, 3.001953125, 5.2666015625, 7.53125, 9.7958984375, 12.060546875, 14.3251953125, 16.58984375, 18.8544921875, 21.119140625, 23.3837890625, 25.6484375, 27.9130859375, 30.177734375, 32.4423828125, 34.70703125, 36.9716796875, 39.236328125, 41.5009765625, 43.765625, 46.0302734375, 48.294921875, 50.5595703125, 52.82421875, 55.0888671875, 57.353515625, 59.6181640625, 61.8828125, 64.1474609375, 66.412109375, 68.6767578125, 70.94140625, 73.2060546875, 75.470703125, 77.7353515625, 80.0]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 5.0, 6.0, 4.0, 8.0, 7.0, 14.0, 15.0, 44.0, 49.0, 81.0, 115.0, 193.0, 263.0, 364.0, 604.0, 892.0, 1285.0, 1898.0, 2983.0, 4359.0, 6566.0, 10338.0, 15779.0, 25125.0, 39954.0, 65118.0, 107534.0, 185634.0, 340541.0, 775673.0, 3671455.0, 446311.0, 236934.0, 136069.0, 80606.0, 49004.0, 30258.0, 19381.0, 12369.0, 7990.0, 5183.0, 3377.0, 2288.0, 1606.0, 1035.0, 676.0, 477.0, 336.0, 223.0, 138.0, 100.0, 60.0, 47.0, 23.0, 24.0, 9.0, 3.0, 4.0, 5.0, 6.0, 3.0, 2.0], "bins": [-7.48046875, -7.24822998046875, -7.0159912109375, -6.78375244140625, -6.551513671875, -6.31927490234375, -6.0870361328125, -5.85479736328125, -5.62255859375, -5.39031982421875, -5.1580810546875, -4.92584228515625, -4.693603515625, -4.46136474609375, -4.2291259765625, -3.99688720703125, -3.7646484375, -3.53240966796875, -3.3001708984375, -3.06793212890625, -2.835693359375, -2.60345458984375, -2.3712158203125, -2.13897705078125, -1.90673828125, -1.67449951171875, -1.4422607421875, -1.21002197265625, -0.977783203125, -0.74554443359375, -0.5133056640625, -0.28106689453125, -0.048828125, 0.18341064453125, 0.4156494140625, 0.64788818359375, 0.880126953125, 1.11236572265625, 1.3446044921875, 1.57684326171875, 1.80908203125, 2.04132080078125, 2.2735595703125, 2.50579833984375, 2.738037109375, 2.97027587890625, 3.2025146484375, 3.43475341796875, 3.6669921875, 3.89923095703125, 4.1314697265625, 4.36370849609375, 4.595947265625, 4.82818603515625, 5.0604248046875, 5.29266357421875, 5.52490234375, 5.75714111328125, 5.9893798828125, 6.22161865234375, 6.453857421875, 6.68609619140625, 6.9183349609375, 7.15057373046875, 7.3828125]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 2.0, 6.0, 9.0, 11.0, 10.0, 21.0, 19.0, 24.0, 19.0, 33.0, 41.0, 37.0, 29.0, 35.0, 41.0, 35.0, 34.0, 58.0, 161.0, 926.0, 66.0, 47.0, 35.0, 38.0, 35.0, 25.0, 29.0, 19.0, 27.0, 24.0, 18.0, 19.0, 13.0, 14.0, 7.0, 10.0, 8.0, 6.0, 6.0, 7.0, 1.0, 8.0, 4.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-83.3125, -80.8046875, -78.296875, -75.7890625, -73.28125, -70.7734375, -68.265625, -65.7578125, -63.25, -60.7421875, -58.234375, -55.7265625, -53.21875, -50.7109375, -48.203125, -45.6953125, -43.1875, -40.6796875, -38.171875, -35.6640625, -33.15625, -30.6484375, -28.140625, -25.6328125, -23.125, -20.6171875, -18.109375, -15.6015625, -13.09375, -10.5859375, -8.078125, -5.5703125, -3.0625, -0.5546875, 1.953125, 4.4609375, 6.96875, 9.4765625, 11.984375, 14.4921875, 17.0, 19.5078125, 22.015625, 24.5234375, 27.03125, 29.5390625, 32.046875, 34.5546875, 37.0625, 39.5703125, 42.078125, 44.5859375, 47.09375, 49.6015625, 52.109375, 54.6171875, 57.125, 59.6328125, 62.140625, 64.6484375, 67.15625, 69.6640625, 72.171875, 74.6796875, 77.1875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 12.0, 11.0, 22.0, 22.0, 45.0, 59.0, 145.0, 204.0, 307.0, 504.0, 788.0, 1290.0, 1975.0, 3042.0, 4678.0, 7837.0, 12967.0, 21977.0, 40892.0, 86401.0, 5284123.0, 645993.0, 83728.0, 39787.0, 21402.0, 12551.0, 7712.0, 4761.0, 3032.0, 1921.0, 1279.0, 748.0, 467.0, 298.0, 157.0, 106.0, 84.0, 40.0, 24.0, 18.0, 12.0, 9.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-22.90625, -22.087646484375, -21.26904296875, -20.450439453125, -19.6318359375, -18.813232421875, -17.99462890625, -17.176025390625, -16.357421875, -15.538818359375, -14.72021484375, -13.901611328125, -13.0830078125, -12.264404296875, -11.44580078125, -10.627197265625, -9.80859375, -8.989990234375, -8.17138671875, -7.352783203125, -6.5341796875, -5.715576171875, -4.89697265625, -4.078369140625, -3.259765625, -2.441162109375, -1.62255859375, -0.803955078125, 0.0146484375, 0.833251953125, 1.65185546875, 2.470458984375, 3.2890625, 4.107666015625, 4.92626953125, 5.744873046875, 6.5634765625, 7.382080078125, 8.20068359375, 9.019287109375, 9.837890625, 10.656494140625, 11.47509765625, 12.293701171875, 13.1123046875, 13.930908203125, 14.74951171875, 15.568115234375, 16.38671875, 17.205322265625, 18.02392578125, 18.842529296875, 19.6611328125, 20.479736328125, 21.29833984375, 22.116943359375, 22.935546875, 23.754150390625, 24.57275390625, 25.391357421875, 26.2099609375, 27.028564453125, 27.84716796875, 28.665771484375, 29.484375]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 6.0, 5.0, 4.0, 8.0, 8.0, 10.0, 5.0, 18.0, 11.0, 18.0, 16.0, 13.0, 25.0, 37.0, 23.0, 30.0, 36.0, 30.0, 34.0, 44.0, 46.0, 36.0, 141.0, 922.0, 81.0, 45.0, 44.0, 39.0, 32.0, 23.0, 31.0, 28.0, 22.0, 25.0, 19.0, 26.0, 16.0, 13.0, 16.0, 11.0, 13.0, 4.0, 4.0, 5.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 0.0, 0.0, 1.0], "bins": [-93.8125, -91.072265625, -88.33203125, -85.591796875, -82.8515625, -80.111328125, -77.37109375, -74.630859375, -71.890625, -69.150390625, -66.41015625, -63.669921875, -60.9296875, -58.189453125, -55.44921875, -52.708984375, -49.96875, -47.228515625, -44.48828125, -41.748046875, -39.0078125, -36.267578125, -33.52734375, -30.787109375, -28.046875, -25.306640625, -22.56640625, -19.826171875, -17.0859375, -14.345703125, -11.60546875, -8.865234375, -6.125, -3.384765625, -0.64453125, 2.095703125, 4.8359375, 7.576171875, 10.31640625, 13.056640625, 15.796875, 18.537109375, 21.27734375, 24.017578125, 26.7578125, 29.498046875, 32.23828125, 34.978515625, 37.71875, 40.458984375, 43.19921875, 45.939453125, 48.6796875, 51.419921875, 54.16015625, 56.900390625, 59.640625, 62.380859375, 65.12109375, 67.861328125, 70.6015625, 73.341796875, 76.08203125, 78.822265625, 81.5625]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 20.0, 25.0, 72.0, 228.0, 410.0, 132.0, 49.0, 27.0, 15.0, 5.0, 3.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-279.72393798828125, -269.84014892578125, -259.95635986328125, -250.0725555419922, -240.18875122070312, -230.30496215820312, -220.42117309570312, -210.53738403320312, -200.65357971191406, -190.76979064941406, -180.885986328125, -171.002197265625, -161.118408203125, -151.23460388183594, -141.35081481933594, -131.46701049804688, -121.58322143554688, -111.69942474365234, -101.81562805175781, -91.93183898925781, -82.04804229736328, -72.16424560546875, -62.280452728271484, -52.39665985107422, -42.51286315917969, -32.629066467285156, -22.74527359008789, -12.861478805541992, -2.9776840209960938, 6.9061126708984375, 16.789905548095703, 26.67369842529297, 36.5574951171875, 46.44129180908203, 56.3250846862793, 66.20887756347656, 76.0926742553711, 85.97647094726562, 95.86026000976562, 105.74405670166016, 115.62785339355469, 125.51165008544922, 135.39544677734375, 145.27923583984375, 155.16302490234375, 165.0468292236328, 174.9306182861328, 184.81442260742188, 194.69821166992188, 204.58200073242188, 214.46580505371094, 224.34959411621094, 234.2333984375, 244.1171875, 254.0009765625, 263.884765625, 273.7685546875, 283.65234375, 293.5361328125, 303.4199523925781, 313.3037414550781, 323.1875305175781, 333.0713195800781, 342.9551086425781, 352.83892822265625]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 6.0, 6.0, 4.0, 10.0, 5.0, 21.0, 23.0, 31.0, 39.0, 66.0, 83.0, 111.0, 112.0, 106.0, 105.0, 78.0, 56.0, 46.0, 30.0, 20.0, 17.0, 13.0, 8.0, 2.0, 2.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-523.0494384765625, -510.5206604003906, -497.99188232421875, -485.4631042480469, -472.934326171875, -460.405517578125, -447.8767395019531, -435.34796142578125, -422.8191833496094, -410.2904052734375, -397.7616271972656, -385.23284912109375, -372.70404052734375, -360.1752624511719, -347.646484375, -335.1177062988281, -322.58892822265625, -310.0601501464844, -297.5313720703125, -285.0025939941406, -272.47381591796875, -259.94500732421875, -247.41622924804688, -234.887451171875, -222.35867309570312, -209.82989501953125, -197.30111694335938, -184.77232360839844, -172.24354553222656, -159.7147674560547, -147.18597412109375, -134.65719604492188, -122.12841796875, -109.59963989257812, -97.07085418701172, -84.54206848144531, -72.01329040527344, -59.4845085144043, -46.955726623535156, -34.42694091796875, -21.898162841796875, -9.369380950927734, 3.1594009399414062, 15.688182830810547, 28.216964721679688, 40.74574661254883, 53.27452850341797, 65.80331420898438, 78.33209228515625, 90.86087036132812, 103.38965606689453, 115.91844177246094, 128.4472198486328, 140.9759979248047, 153.50479125976562, 166.0335693359375, 178.56234741210938, 191.09112548828125, 203.61990356445312, 216.14869689941406, 228.67747497558594, 241.2062530517578, 253.73504638671875, 266.2638244628906, 278.7926025390625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 6.0, 5.0, 5.0, 7.0, 12.0, 8.0, 12.0, 18.0, 31.0, 39.0, 51.0, 80.0, 112.0, 137.0, 194.0, 303.0, 434.0, 776.0, 1214.0, 2176.0, 4258.0, 9604.0, 30719.0, 4017755.0, 99846.0, 15112.0, 5448.0, 2613.0, 1328.0, 753.0, 446.0, 276.0, 178.0, 110.0, 59.0, 62.0, 26.0, 26.0, 18.0, 7.0, 9.0, 5.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-4.59375, -4.475189208984375, -4.35662841796875, -4.238067626953125, -4.1195068359375, -4.000946044921875, -3.88238525390625, -3.763824462890625, -3.645263671875, -3.526702880859375, -3.40814208984375, -3.289581298828125, -3.1710205078125, -3.052459716796875, -2.93389892578125, -2.815338134765625, -2.69677734375, -2.578216552734375, -2.45965576171875, -2.341094970703125, -2.2225341796875, -2.103973388671875, -1.98541259765625, -1.866851806640625, -1.748291015625, -1.629730224609375, -1.51116943359375, -1.392608642578125, -1.2740478515625, -1.155487060546875, -1.03692626953125, -0.918365478515625, -0.7998046875, -0.681243896484375, -0.56268310546875, -0.444122314453125, -0.3255615234375, -0.207000732421875, -0.08843994140625, 0.030120849609375, 0.148681640625, 0.267242431640625, 0.38580322265625, 0.504364013671875, 0.6229248046875, 0.741485595703125, 0.86004638671875, 0.978607177734375, 1.09716796875, 1.215728759765625, 1.33428955078125, 1.452850341796875, 1.5714111328125, 1.689971923828125, 1.80853271484375, 1.927093505859375, 2.045654296875, 2.164215087890625, 2.28277587890625, 2.401336669921875, 2.5198974609375, 2.638458251953125, 2.75701904296875, 2.875579833984375, 2.994140625]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 4.0, 4.0, 4.0, 6.0, 6.0, 6.0, 7.0, 10.0, 8.0, 12.0, 18.0, 17.0, 759.0, 33.0, 14.0, 19.0, 11.0, 11.0, 8.0, 10.0, 7.0, 4.0, 3.0, 3.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.578125, -1.537322998046875, -1.49652099609375, -1.455718994140625, -1.4149169921875, -1.374114990234375, -1.33331298828125, -1.292510986328125, -1.251708984375, -1.210906982421875, -1.17010498046875, -1.129302978515625, -1.0885009765625, -1.047698974609375, -1.00689697265625, -0.966094970703125, -0.92529296875, -0.884490966796875, -0.84368896484375, -0.802886962890625, -0.7620849609375, -0.721282958984375, -0.68048095703125, -0.639678955078125, -0.598876953125, -0.558074951171875, -0.51727294921875, -0.476470947265625, -0.4356689453125, -0.394866943359375, -0.35406494140625, -0.313262939453125, -0.2724609375, -0.231658935546875, -0.19085693359375, -0.150054931640625, -0.1092529296875, -0.068450927734375, -0.02764892578125, 0.013153076171875, 0.053955078125, 0.094757080078125, 0.13555908203125, 0.176361083984375, 0.2171630859375, 0.257965087890625, 0.29876708984375, 0.339569091796875, 0.38037109375, 0.421173095703125, 0.46197509765625, 0.502777099609375, 0.5435791015625, 0.584381103515625, 0.62518310546875, 0.665985107421875, 0.706787109375, 0.747589111328125, 0.78839111328125, 0.829193115234375, 0.8699951171875, 0.910797119140625, 0.95159912109375, 0.992401123046875, 1.033203125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 10.0, 8.0, 18.0, 20.0, 26.0, 40.0, 88.0, 168.0, 409.0, 1278.0, 5509.0, 32517.0, 1662916.0, 2442885.0, 38660.0, 6953.0, 1703.0, 515.0, 215.0, 139.0, 69.0, 30.0, 24.0, 22.0, 13.0, 14.0, 10.0, 4.0, 6.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.927734375, -3.787506103515625, -3.64727783203125, -3.507049560546875, -3.3668212890625, -3.226593017578125, -3.08636474609375, -2.946136474609375, -2.805908203125, -2.665679931640625, -2.52545166015625, -2.385223388671875, -2.2449951171875, -2.104766845703125, -1.96453857421875, -1.824310302734375, -1.68408203125, -1.543853759765625, -1.40362548828125, -1.263397216796875, -1.1231689453125, -0.982940673828125, -0.84271240234375, -0.702484130859375, -0.562255859375, -0.422027587890625, -0.28179931640625, -0.141571044921875, -0.0013427734375, 0.138885498046875, 0.27911376953125, 0.419342041015625, 0.5595703125, 0.699798583984375, 0.84002685546875, 0.980255126953125, 1.1204833984375, 1.260711669921875, 1.40093994140625, 1.541168212890625, 1.681396484375, 1.821624755859375, 1.96185302734375, 2.102081298828125, 2.2423095703125, 2.382537841796875, 2.52276611328125, 2.662994384765625, 2.80322265625, 2.943450927734375, 3.08367919921875, 3.223907470703125, 3.3641357421875, 3.504364013671875, 3.64459228515625, 3.784820556640625, 3.925048828125, 4.065277099609375, 4.20550537109375, 4.345733642578125, 4.4859619140625, 4.626190185546875, 4.76641845703125, 4.906646728515625, 5.046875]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 10.0, 14.0, 17.0, 11.0, 17.0, 28.0, 39.0, 41.0, 58.0, 99.0, 144.0, 534.0, 1966.0, 446.0, 192.0, 122.0, 80.0, 47.0, 54.0, 29.0, 23.0, 23.0, 16.0, 13.0, 8.0, 14.0, 7.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.16796875, -1.128265380859375, -1.08856201171875, -1.048858642578125, -1.0091552734375, -0.969451904296875, -0.92974853515625, -0.890045166015625, -0.850341796875, -0.810638427734375, -0.77093505859375, -0.731231689453125, -0.6915283203125, -0.651824951171875, -0.61212158203125, -0.572418212890625, -0.53271484375, -0.493011474609375, -0.45330810546875, -0.413604736328125, -0.3739013671875, -0.334197998046875, -0.29449462890625, -0.254791259765625, -0.215087890625, -0.175384521484375, -0.13568115234375, -0.095977783203125, -0.0562744140625, -0.016571044921875, 0.02313232421875, 0.062835693359375, 0.1025390625, 0.142242431640625, 0.18194580078125, 0.221649169921875, 0.2613525390625, 0.301055908203125, 0.34075927734375, 0.380462646484375, 0.420166015625, 0.459869384765625, 0.49957275390625, 0.539276123046875, 0.5789794921875, 0.618682861328125, 0.65838623046875, 0.698089599609375, 0.73779296875, 0.777496337890625, 0.81719970703125, 0.856903076171875, 0.8966064453125, 0.936309814453125, 0.97601318359375, 1.015716552734375, 1.055419921875, 1.095123291015625, 1.13482666015625, 1.174530029296875, 1.2142333984375, 1.253936767578125, 1.29364013671875, 1.333343505859375, 1.373046875]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [4.0, 1.0, 0.0, 1.0, 4.0, 21.0, 110.0, 608.0, 186.0, 51.0, 11.0, 7.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8753252029418945, -4.22678279876709, -3.578240394592285, -2.9296982288360596, -2.281155824661255, -1.6326134204864502, -0.9840712547302246, -0.3355288505554199, 0.31301355361938477, 0.9615558981895447, 1.6100982427597046, 2.2586405277252197, 2.9071829319000244, 3.555725336074829, 4.204267501831055, 4.852809906005859, 5.501352310180664, 6.149894714355469, 6.798437118530273, 7.446979522705078, 8.095521926879883, 8.744064331054688, 9.392606735229492, 10.041149139404297, 10.689691543579102, 11.338233947753906, 11.986776351928711, 12.635318756103516, 13.28386116027832, 13.932403564453125, 14.58094596862793, 15.229488372802734, 15.878030776977539, 16.526573181152344, 17.17511558532715, 17.823657989501953, 18.472200393676758, 19.120742797851562, 19.769285202026367, 20.417827606201172, 21.066370010375977, 21.71491241455078, 22.363454818725586, 23.01199722290039, 23.660539627075195, 24.30908203125, 24.957624435424805, 25.60616683959961, 26.25470733642578, 26.903249740600586, 27.55179214477539, 28.200334548950195, 28.848876953125, 29.497419357299805, 30.14596176147461, 30.794504165649414, 31.44304656982422, 32.09158706665039, 32.74013137817383, 33.388671875, 34.03721618652344, 34.68575668334961, 35.33430099487305, 35.98284149169922, 36.631385803222656]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 3.0, 8.0, 17.0, 24.0, 39.0, 41.0, 37.0, 35.0, 54.0, 54.0, 56.0, 67.0, 66.0, 78.0, 62.0, 66.0, 53.0, 49.0, 47.0, 24.0, 29.0, 23.0, 14.0, 13.0, 7.0, 8.0, 8.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1167707443237305, -5.892937183380127, -5.669103622436523, -5.44527006149292, -5.221436500549316, -4.997602939605713, -4.773769378662109, -4.549935340881348, -4.326102256774902, -4.102268695831299, -3.8784351348876953, -3.654601573944092, -3.4307680130004883, -3.2069344520568848, -2.983100652694702, -2.7592670917510986, -2.535433292388916, -2.3115997314453125, -2.087766170501709, -1.863932490348816, -1.6400989294052124, -1.4162653684616089, -1.1924316883087158, -0.9685981273651123, -0.7447645664215088, -0.5209310054779053, -0.297097384929657, -0.07326376438140869, 0.15056979656219482, 0.37440335750579834, 0.5982370376586914, 0.8220705986022949, 1.0459041595458984, 1.269737720489502, 1.4935712814331055, 1.7174049615859985, 1.941238522529602, 2.165071964263916, 2.3889057636260986, 2.612739324569702, 2.8365728855133057, 3.060406446456909, 3.2842400074005127, 3.5080738067626953, 3.731907367706299, 3.9557409286499023, 4.179574489593506, 4.403408050537109, 4.627241611480713, 4.851075172424316, 5.07490873336792, 5.298742294311523, 5.522575855255127, 5.7464094161987305, 5.970243453979492, 6.1940765380859375, 6.417910575866699, 6.641744136810303, 6.865577697753906, 7.08941125869751, 7.313244819641113, 7.537078380584717, 7.76091194152832, 7.984745979309082, 8.208579063415527]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 7.0, 12.0, 19.0, 17.0, 32.0, 45.0, 56.0, 93.0, 128.0, 193.0, 300.0, 462.0, 718.0, 1205.0, 1942.0, 3326.0, 5897.0, 11600.0, 26365.0, 780442.0, 170064.0, 22340.0, 10075.0, 5343.0, 3053.0, 1786.0, 1066.0, 695.0, 400.0, 264.0, 164.0, 139.0, 91.0, 62.0, 37.0, 32.0, 21.0, 19.0, 10.0, 5.0, 10.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.45703125, -4.2850341796875, -4.113037109375, -3.9410400390625, -3.76904296875, -3.5970458984375, -3.425048828125, -3.2530517578125, -3.0810546875, -2.9090576171875, -2.737060546875, -2.5650634765625, -2.39306640625, -2.2210693359375, -2.049072265625, -1.8770751953125, -1.705078125, -1.5330810546875, -1.361083984375, -1.1890869140625, -1.01708984375, -0.8450927734375, -0.673095703125, -0.5010986328125, -0.3291015625, -0.1571044921875, 0.014892578125, 0.1868896484375, 0.35888671875, 0.5308837890625, 0.702880859375, 0.8748779296875, 1.046875, 1.2188720703125, 1.390869140625, 1.5628662109375, 1.73486328125, 1.9068603515625, 2.078857421875, 2.2508544921875, 2.4228515625, 2.5948486328125, 2.766845703125, 2.9388427734375, 3.11083984375, 3.2828369140625, 3.454833984375, 3.6268310546875, 3.798828125, 3.9708251953125, 4.142822265625, 4.3148193359375, 4.48681640625, 4.6588134765625, 4.830810546875, 5.0028076171875, 5.1748046875, 5.3468017578125, 5.518798828125, 5.6907958984375, 5.86279296875, 6.0347900390625, 6.206787109375, 6.3787841796875, 6.55078125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 5.0, 6.0, 2.0, 2.0, 9.0, 8.0, 9.0, 7.0, 8.0, 15.0, 15.0, 41.0, 548.0, 213.0, 24.0, 15.0, 16.0, 8.0, 7.0, 8.0, 4.0, 9.0, 3.0, 1.0, 5.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5625, -1.5210418701171875, -1.479583740234375, -1.4381256103515625, -1.39666748046875, -1.3552093505859375, -1.313751220703125, -1.2722930908203125, -1.2308349609375, -1.1893768310546875, -1.147918701171875, -1.1064605712890625, -1.06500244140625, -1.0235443115234375, -0.982086181640625, -0.9406280517578125, -0.899169921875, -0.8577117919921875, -0.816253662109375, -0.7747955322265625, -0.73333740234375, -0.6918792724609375, -0.650421142578125, -0.6089630126953125, -0.5675048828125, -0.5260467529296875, -0.484588623046875, -0.4431304931640625, -0.40167236328125, -0.3602142333984375, -0.318756103515625, -0.2772979736328125, -0.23583984375, -0.1943817138671875, -0.152923583984375, -0.1114654541015625, -0.07000732421875, -0.0285491943359375, 0.012908935546875, 0.0543670654296875, 0.0958251953125, 0.1372833251953125, 0.178741455078125, 0.2201995849609375, 0.26165771484375, 0.3031158447265625, 0.344573974609375, 0.3860321044921875, 0.427490234375, 0.4689483642578125, 0.510406494140625, 0.5518646240234375, 0.59332275390625, 0.6347808837890625, 0.676239013671875, 0.7176971435546875, 0.7591552734375, 0.8006134033203125, 0.842071533203125, 0.8835296630859375, 0.92498779296875, 0.9664459228515625, 1.007904052734375, 1.0493621826171875, 1.0908203125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 7.0, 7.0, 13.0, 19.0, 28.0, 28.0, 56.0, 64.0, 93.0, 132.0, 172.0, 223.0, 342.0, 504.0, 996.0, 1837.0, 3951.0, 8655.0, 21315.0, 56859.0, 201747.0, 533423.0, 142441.0, 44160.0, 17028.0, 7166.0, 3335.0, 1578.0, 882.0, 427.0, 302.0, 210.0, 141.0, 110.0, 77.0, 70.0, 42.0, 39.0, 20.0, 10.0, 20.0, 4.0, 6.0, 5.0, 3.0, 3.0, 1.0, 6.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.8828125, -2.79644775390625, -2.7100830078125, -2.62371826171875, -2.537353515625, -2.45098876953125, -2.3646240234375, -2.27825927734375, -2.19189453125, -2.10552978515625, -2.0191650390625, -1.93280029296875, -1.846435546875, -1.76007080078125, -1.6737060546875, -1.58734130859375, -1.5009765625, -1.41461181640625, -1.3282470703125, -1.24188232421875, -1.155517578125, -1.06915283203125, -0.9827880859375, -0.89642333984375, -0.81005859375, -0.72369384765625, -0.6373291015625, -0.55096435546875, -0.464599609375, -0.37823486328125, -0.2918701171875, -0.20550537109375, -0.119140625, -0.03277587890625, 0.0535888671875, 0.13995361328125, 0.226318359375, 0.31268310546875, 0.3990478515625, 0.48541259765625, 0.57177734375, 0.65814208984375, 0.7445068359375, 0.83087158203125, 0.917236328125, 1.00360107421875, 1.0899658203125, 1.17633056640625, 1.2626953125, 1.34906005859375, 1.4354248046875, 1.52178955078125, 1.608154296875, 1.69451904296875, 1.7808837890625, 1.86724853515625, 1.95361328125, 2.03997802734375, 2.1263427734375, 2.21270751953125, 2.299072265625, 2.38543701171875, 2.4718017578125, 2.55816650390625, 2.64453125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 7.0, 11.0, 9.0, 15.0, 17.0, 17.0, 15.0, 17.0, 24.0, 19.0, 20.0, 31.0, 43.0, 39.0, 40.0, 45.0, 39.0, 40.0, 45.0, 48.0, 45.0, 42.0, 46.0, 34.0, 50.0, 28.0, 34.0, 23.0, 25.0, 21.0, 16.0, 16.0, 14.0, 19.0, 12.0, 5.0, 5.0, 6.0, 6.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-3.720703125, -3.60357666015625, -3.4864501953125, -3.36932373046875, -3.252197265625, -3.13507080078125, -3.0179443359375, -2.90081787109375, -2.78369140625, -2.66656494140625, -2.5494384765625, -2.43231201171875, -2.315185546875, -2.19805908203125, -2.0809326171875, -1.96380615234375, -1.8466796875, -1.72955322265625, -1.6124267578125, -1.49530029296875, -1.378173828125, -1.26104736328125, -1.1439208984375, -1.02679443359375, -0.90966796875, -0.79254150390625, -0.6754150390625, -0.55828857421875, -0.441162109375, -0.32403564453125, -0.2069091796875, -0.08978271484375, 0.02734375, 0.14447021484375, 0.2615966796875, 0.37872314453125, 0.495849609375, 0.61297607421875, 0.7301025390625, 0.84722900390625, 0.96435546875, 1.08148193359375, 1.1986083984375, 1.31573486328125, 1.432861328125, 1.54998779296875, 1.6671142578125, 1.78424072265625, 1.9013671875, 2.01849365234375, 2.1356201171875, 2.25274658203125, 2.369873046875, 2.48699951171875, 2.6041259765625, 2.72125244140625, 2.83837890625, 2.95550537109375, 3.0726318359375, 3.18975830078125, 3.306884765625, 3.42401123046875, 3.5411376953125, 3.65826416015625, 3.775390625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 12.0, 24.0, 25.0, 46.0, 100.0, 204.0, 643.0, 3193.0, 178243.0, 860567.0, 4204.0, 761.0, 269.0, 119.0, 47.0, 32.0, 16.0, 11.0, 9.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3359375, -12.0118408203125, -11.687744140625, -11.3636474609375, -11.03955078125, -10.7154541015625, -10.391357421875, -10.0672607421875, -9.7431640625, -9.4190673828125, -9.094970703125, -8.7708740234375, -8.44677734375, -8.1226806640625, -7.798583984375, -7.4744873046875, -7.150390625, -6.8262939453125, -6.502197265625, -6.1781005859375, -5.85400390625, -5.5299072265625, -5.205810546875, -4.8817138671875, -4.5576171875, -4.2335205078125, -3.909423828125, -3.5853271484375, -3.26123046875, -2.9371337890625, -2.613037109375, -2.2889404296875, -1.96484375, -1.6407470703125, -1.316650390625, -0.9925537109375, -0.66845703125, -0.3443603515625, -0.020263671875, 0.3038330078125, 0.6279296875, 0.9520263671875, 1.276123046875, 1.6002197265625, 1.92431640625, 2.2484130859375, 2.572509765625, 2.8966064453125, 3.220703125, 3.5447998046875, 3.868896484375, 4.1929931640625, 4.51708984375, 4.8411865234375, 5.165283203125, 5.4893798828125, 5.8134765625, 6.1375732421875, 6.461669921875, 6.7857666015625, 7.10986328125, 7.4339599609375, 7.758056640625, 8.0821533203125, 8.40625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 3.0, 8.0, 13.0, 20.0, 49.0, 100.0, 287.0, 289.0, 112.0, 57.0, 19.0, 16.0, 5.0, 7.0, 7.0, 4.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00047397613525390625, -0.0004614889621734619, -0.0004490017890930176, -0.00043651461601257324, -0.0004240274429321289, -0.00041154026985168457, -0.00039905309677124023, -0.0003865659236907959, -0.00037407875061035156, -0.0003615915775299072, -0.0003491044044494629, -0.00033661723136901855, -0.0003241300582885742, -0.0003116428852081299, -0.00029915571212768555, -0.0002866685390472412, -0.0002741813659667969, -0.00026169419288635254, -0.0002492070198059082, -0.00023671984672546387, -0.00022423267364501953, -0.0002117455005645752, -0.00019925832748413086, -0.00018677115440368652, -0.0001742839813232422, -0.00016179680824279785, -0.00014930963516235352, -0.00013682246208190918, -0.00012433528900146484, -0.00011184811592102051, -9.936094284057617e-05, -8.687376976013184e-05, -7.43865966796875e-05, -6.189942359924316e-05, -4.941225051879883e-05, -3.692507743835449e-05, -2.4437904357910156e-05, -1.195073127746582e-05, 5.364418029785156e-07, 1.3023614883422852e-05, 2.5510787963867188e-05, 3.7997961044311523e-05, 5.048513412475586e-05, 6.29723072052002e-05, 7.545948028564453e-05, 8.794665336608887e-05, 0.0001004338264465332, 0.00011292099952697754, 0.00012540817260742188, 0.0001378953456878662, 0.00015038251876831055, 0.00016286969184875488, 0.00017535686492919922, 0.00018784403800964355, 0.0002003312110900879, 0.00021281838417053223, 0.00022530555725097656, 0.0002377927303314209, 0.00025027990341186523, 0.00026276707649230957, 0.0002752542495727539, 0.00028774142265319824, 0.0003002285957336426, 0.0003127157688140869, 0.00032520294189453125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 0.0, 1.0, 6.0, 3.0, 8.0, 7.0, 6.0, 14.0, 31.0, 42.0, 83.0, 136.0, 257.0, 490.0, 1119.0, 3209.0, 11238.0, 77290.0, 847691.0, 88706.0, 12506.0, 3344.0, 1222.0, 539.0, 254.0, 144.0, 75.0, 50.0, 34.0, 14.0, 8.0, 7.0, 9.0, 5.0, 6.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1953125, -3.100006103515625, -3.00469970703125, -2.909393310546875, -2.8140869140625, -2.718780517578125, -2.62347412109375, -2.528167724609375, -2.432861328125, -2.337554931640625, -2.24224853515625, -2.146942138671875, -2.0516357421875, -1.956329345703125, -1.86102294921875, -1.765716552734375, -1.67041015625, -1.575103759765625, -1.47979736328125, -1.384490966796875, -1.2891845703125, -1.193878173828125, -1.09857177734375, -1.003265380859375, -0.907958984375, -0.812652587890625, -0.71734619140625, -0.622039794921875, -0.5267333984375, -0.431427001953125, -0.33612060546875, -0.240814208984375, -0.1455078125, -0.050201416015625, 0.04510498046875, 0.140411376953125, 0.2357177734375, 0.331024169921875, 0.42633056640625, 0.521636962890625, 0.616943359375, 0.712249755859375, 0.80755615234375, 0.902862548828125, 0.9981689453125, 1.093475341796875, 1.18878173828125, 1.284088134765625, 1.37939453125, 1.474700927734375, 1.57000732421875, 1.665313720703125, 1.7606201171875, 1.855926513671875, 1.95123291015625, 2.046539306640625, 2.141845703125, 2.237152099609375, 2.33245849609375, 2.427764892578125, 2.5230712890625, 2.618377685546875, 2.71368408203125, 2.808990478515625, 2.904296875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 2.0, 5.0, 7.0, 17.0, 12.0, 14.0, 24.0, 30.0, 34.0, 39.0, 71.0, 89.0, 121.0, 100.0, 100.0, 92.0, 66.0, 52.0, 38.0, 29.0, 15.0, 8.0, 8.0, 7.0, 5.0, 2.0, 6.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.12109375, -3.03253173828125, -2.9439697265625, -2.85540771484375, -2.766845703125, -2.67828369140625, -2.5897216796875, -2.50115966796875, -2.41259765625, -2.32403564453125, -2.2354736328125, -2.14691162109375, -2.058349609375, -1.96978759765625, -1.8812255859375, -1.79266357421875, -1.7041015625, -1.61553955078125, -1.5269775390625, -1.43841552734375, -1.349853515625, -1.26129150390625, -1.1727294921875, -1.08416748046875, -0.99560546875, -0.90704345703125, -0.8184814453125, -0.72991943359375, -0.641357421875, -0.55279541015625, -0.4642333984375, -0.37567138671875, -0.287109375, -0.19854736328125, -0.1099853515625, -0.02142333984375, 0.067138671875, 0.15570068359375, 0.2442626953125, 0.33282470703125, 0.42138671875, 0.50994873046875, 0.5985107421875, 0.68707275390625, 0.775634765625, 0.86419677734375, 0.9527587890625, 1.04132080078125, 1.1298828125, 1.21844482421875, 1.3070068359375, 1.39556884765625, 1.484130859375, 1.57269287109375, 1.6612548828125, 1.74981689453125, 1.83837890625, 1.92694091796875, 2.0155029296875, 2.10406494140625, 2.192626953125, 2.28118896484375, 2.3697509765625, 2.45831298828125, 2.546875]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 5.0, 2.0, 1.0, 8.0, 4.0, 7.0, 7.0, 18.0, 48.0, 138.0, 338.0, 269.0, 91.0, 35.0, 19.0, 7.0, 4.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-77.83209228515625, -76.24474334716797, -74.65739440917969, -73.0700454711914, -71.48269653320312, -69.89533996582031, -68.30799102783203, -66.72064208984375, -65.13329315185547, -63.54594421386719, -61.958595275878906, -60.37124252319336, -58.78389358520508, -57.1965446472168, -55.60919189453125, -54.02184295654297, -52.43449401855469, -50.847145080566406, -49.259796142578125, -47.67244338989258, -46.0850944519043, -44.497745513916016, -42.91039276123047, -41.32304382324219, -39.735694885253906, -38.148345947265625, -36.560997009277344, -34.9736442565918, -33.386295318603516, -31.798946380615234, -30.21159553527832, -28.624244689941406, -27.03689193725586, -25.449542999267578, -23.862192153930664, -22.27484130859375, -20.68749237060547, -19.100143432617188, -17.512792587280273, -15.925442695617676, -14.338092803955078, -12.75074291229248, -11.163393020629883, -9.576043128967285, -7.9886932373046875, -6.40134334564209, -4.813993453979492, -3.2266435623168945, -1.6392936706542969, -0.05194377899169922, 1.5354061126708984, 3.122756004333496, 4.710105895996094, 6.297455787658691, 7.884805679321289, 9.472155570983887, 11.059505462646484, 12.646855354309082, 14.23420524597168, 15.821555137634277, 17.408905029296875, 18.996253967285156, 20.58360481262207, 22.170955657958984, 23.758304595947266]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 2.0, 4.0, 8.0, 8.0, 11.0, 11.0, 3.0, 12.0, 22.0, 36.0, 55.0, 82.0, 103.0, 119.0, 136.0, 96.0, 80.0, 53.0, 47.0, 25.0, 20.0, 16.0, 6.0, 9.0, 7.0, 3.0, 4.0, 1.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.01615905761719, -61.96639633178711, -59.91663360595703, -57.86686706542969, -55.81710433959961, -53.76734161376953, -51.71757888793945, -49.667816162109375, -47.61804962158203, -45.56828689575195, -43.518524169921875, -41.46875762939453, -39.41899490356445, -37.369232177734375, -35.3194694519043, -33.26970672607422, -31.21994400024414, -29.170181274414062, -27.12041664123535, -25.070653915405273, -23.020889282226562, -20.971126556396484, -18.921363830566406, -16.871601104736328, -14.821836471557617, -12.772072792053223, -10.722309112548828, -8.67254638671875, -6.6227827072143555, -4.573019027709961, -2.523256301879883, -0.4734926223754883, 1.5762710571289062, 3.6260344982147217, 5.675797939300537, 7.725561141967773, 9.775324821472168, 11.825088500976562, 13.87485122680664, 15.924614906311035, 17.97437858581543, 20.024141311645508, 22.07390594482422, 24.123668670654297, 26.173431396484375, 28.223196029663086, 30.272958755493164, 32.322723388671875, 34.37248611450195, 36.42224884033203, 38.47201156616211, 40.52177429199219, 42.57154083251953, 44.62130355834961, 46.67106628417969, 48.720829010009766, 50.770591735839844, 52.82035446166992, 54.8701171875, 56.919883728027344, 58.96964645385742, 61.0194091796875, 63.06917190551758, 65.11893463134766, 67.168701171875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 3.0, 7.0, 5.0, 9.0, 26.0, 27.0, 31.0, 59.0, 101.0, 186.0, 363.0, 827.0, 2101.0, 7581.0, 61495.0, 4088553.0, 27178.0, 3956.0, 1086.0, 374.0, 162.0, 72.0, 34.0, 17.0, 11.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-21.53125, -20.984375, -20.4375, -19.890625, -19.34375, -18.796875, -18.25, -17.703125, -17.15625, -16.609375, -16.0625, -15.515625, -14.96875, -14.421875, -13.875, -13.328125, -12.78125, -12.234375, -11.6875, -11.140625, -10.59375, -10.046875, -9.5, -8.953125, -8.40625, -7.859375, -7.3125, -6.765625, -6.21875, -5.671875, -5.125, -4.578125, -4.03125, -3.484375, -2.9375, -2.390625, -1.84375, -1.296875, -0.75, -0.203125, 0.34375, 0.890625, 1.4375, 1.984375, 2.53125, 3.078125, 3.625, 4.171875, 4.71875, 5.265625, 5.8125, 6.359375, 6.90625, 7.453125, 8.0, 8.546875, 9.09375, 9.640625, 10.1875, 10.734375, 11.28125, 11.828125, 12.375, 12.921875, 13.46875]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 6.0, 7.0, 3.0, 4.0, 5.0, 9.0, 8.0, 7.0, 9.0, 24.0, 73.0, 232.0, 345.0, 149.0, 39.0, 16.0, 14.0, 15.0, 8.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.48046875, -1.44268798828125, -1.4049072265625, -1.36712646484375, -1.329345703125, -1.29156494140625, -1.2537841796875, -1.21600341796875, -1.17822265625, -1.14044189453125, -1.1026611328125, -1.06488037109375, -1.027099609375, -0.98931884765625, -0.9515380859375, -0.91375732421875, -0.8759765625, -0.83819580078125, -0.8004150390625, -0.76263427734375, -0.724853515625, -0.68707275390625, -0.6492919921875, -0.61151123046875, -0.57373046875, -0.53594970703125, -0.4981689453125, -0.46038818359375, -0.422607421875, -0.38482666015625, -0.3470458984375, -0.30926513671875, -0.271484375, -0.23370361328125, -0.1959228515625, -0.15814208984375, -0.120361328125, -0.08258056640625, -0.0447998046875, -0.00701904296875, 0.03076171875, 0.06854248046875, 0.1063232421875, 0.14410400390625, 0.181884765625, 0.21966552734375, 0.2574462890625, 0.29522705078125, 0.3330078125, 0.37078857421875, 0.4085693359375, 0.44635009765625, 0.484130859375, 0.52191162109375, 0.5596923828125, 0.59747314453125, 0.63525390625, 0.67303466796875, 0.7108154296875, 0.74859619140625, 0.786376953125, 0.82415771484375, 0.8619384765625, 0.89971923828125, 0.9375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 7.0, 8.0, 17.0, 29.0, 30.0, 90.0, 143.0, 324.0, 759.0, 2175.0, 8958.0, 69429.0, 3933878.0, 158356.0, 14671.0, 3394.0, 1064.0, 488.0, 197.0, 95.0, 53.0, 39.0, 20.0, 18.0, 10.0, 10.0, 3.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.3203125, -8.0572509765625, -7.794189453125, -7.5311279296875, -7.26806640625, -7.0050048828125, -6.741943359375, -6.4788818359375, -6.2158203125, -5.9527587890625, -5.689697265625, -5.4266357421875, -5.16357421875, -4.9005126953125, -4.637451171875, -4.3743896484375, -4.111328125, -3.8482666015625, -3.585205078125, -3.3221435546875, -3.05908203125, -2.7960205078125, -2.532958984375, -2.2698974609375, -2.0068359375, -1.7437744140625, -1.480712890625, -1.2176513671875, -0.95458984375, -0.6915283203125, -0.428466796875, -0.1654052734375, 0.09765625, 0.3607177734375, 0.623779296875, 0.8868408203125, 1.14990234375, 1.4129638671875, 1.676025390625, 1.9390869140625, 2.2021484375, 2.4652099609375, 2.728271484375, 2.9913330078125, 3.25439453125, 3.5174560546875, 3.780517578125, 4.0435791015625, 4.306640625, 4.5697021484375, 4.832763671875, 5.0958251953125, 5.35888671875, 5.6219482421875, 5.885009765625, 6.1480712890625, 6.4111328125, 6.6741943359375, 6.937255859375, 7.2003173828125, 7.46337890625, 7.7264404296875, 7.989501953125, 8.2525634765625, 8.515625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 5.0, 0.0, 4.0, 3.0, 15.0, 14.0, 19.0, 25.0, 47.0, 52.0, 75.0, 130.0, 245.0, 725.0, 1808.0, 375.0, 158.0, 113.0, 82.0, 40.0, 30.0, 24.0, 14.0, 20.0, 9.0, 9.0, 6.0, 8.0, 3.0, 5.0, 6.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.15625, -1.120361328125, -1.08447265625, -1.048583984375, -1.0126953125, -0.976806640625, -0.94091796875, -0.905029296875, -0.869140625, -0.833251953125, -0.79736328125, -0.761474609375, -0.7255859375, -0.689697265625, -0.65380859375, -0.617919921875, -0.58203125, -0.546142578125, -0.51025390625, -0.474365234375, -0.4384765625, -0.402587890625, -0.36669921875, -0.330810546875, -0.294921875, -0.259033203125, -0.22314453125, -0.187255859375, -0.1513671875, -0.115478515625, -0.07958984375, -0.043701171875, -0.0078125, 0.028076171875, 0.06396484375, 0.099853515625, 0.1357421875, 0.171630859375, 0.20751953125, 0.243408203125, 0.279296875, 0.315185546875, 0.35107421875, 0.386962890625, 0.4228515625, 0.458740234375, 0.49462890625, 0.530517578125, 0.56640625, 0.602294921875, 0.63818359375, 0.674072265625, 0.7099609375, 0.745849609375, 0.78173828125, 0.817626953125, 0.853515625, 0.889404296875, 0.92529296875, 0.961181640625, 0.9970703125, 1.032958984375, 1.06884765625, 1.104736328125, 1.140625]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 29.0, 836.0, 119.0, 10.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.163687705993652, -4.046584129333496, -2.9294800758361816, -1.8123762607574463, -0.6952724456787109, 0.4218311309814453, 1.5389351844787598, 2.656039237976074, 3.7731428146362305, 4.890246391296387, 6.007350444793701, 7.124454498291016, 8.241558074951172, 9.358661651611328, 10.475765228271484, 11.592869758605957, 12.709973335266113, 13.82707691192627, 14.944181442260742, 16.0612850189209, 17.178388595581055, 18.29549217224121, 19.412595748901367, 20.529701232910156, 21.646804809570312, 22.76390838623047, 23.881011962890625, 24.99811553955078, 26.115219116210938, 27.232322692871094, 28.349428176879883, 29.46653175354004, 30.583633422851562, 31.70073699951172, 32.817840576171875, 33.93494415283203, 35.05204772949219, 36.169151306152344, 37.2862548828125, 38.403358459472656, 39.52046203613281, 40.63756561279297, 41.754669189453125, 42.87177276611328, 43.98887634277344, 45.105979919433594, 46.22308349609375, 47.340187072753906, 48.45729446411133, 49.574398040771484, 50.69150161743164, 51.8086051940918, 52.92570877075195, 54.04281234741211, 55.159915924072266, 56.27702331542969, 57.394126892089844, 58.51123046875, 59.628334045410156, 60.74543762207031, 61.86254119873047, 62.979644775390625, 64.09674835205078, 65.21385192871094, 66.3309555053711]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 5.0, 6.0, 12.0, 12.0, 19.0, 22.0, 15.0, 27.0, 35.0, 42.0, 41.0, 43.0, 57.0, 75.0, 74.0, 55.0, 66.0, 58.0, 63.0, 58.0, 37.0, 43.0, 32.0, 18.0, 17.0, 12.0, 9.0, 12.0, 4.0, 9.0, 3.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.042205810546875, -4.890949726104736, -4.739693641662598, -4.588437557220459, -4.43718147277832, -4.285925388336182, -4.134669303894043, -3.9834132194519043, -3.8321571350097656, -3.680901050567627, -3.5296449661254883, -3.3783888816833496, -3.227132797241211, -3.0758767127990723, -2.9246206283569336, -2.773364543914795, -2.622108221054077, -2.4708521366119385, -2.3195960521698, -2.168339967727661, -2.0170838832855225, -1.8658277988433838, -1.7145715951919556, -1.563315510749817, -1.4120594263076782, -1.2608033418655396, -1.1095472574234009, -0.9582911133766174, -0.8070350289344788, -0.6557789444923401, -0.5045228004455566, -0.35326671600341797, -0.2020106315612793, -0.05075453221797943, 0.10050156712532043, 0.2517576813697815, 0.40301376581192017, 0.5542698502540588, 0.7055259943008423, 0.856782078742981, 1.0080381631851196, 1.1592942476272583, 1.310550332069397, 1.4618065357208252, 1.6130626201629639, 1.7643187046051025, 1.9155747890472412, 2.06683087348938, 2.2180869579315186, 2.3693430423736572, 2.520599126815796, 2.6718552112579346, 2.8231112957000732, 2.974367380142212, 3.1256237030029297, 3.2768797874450684, 3.428135871887207, 3.5793919563293457, 3.7306480407714844, 3.881904125213623, 4.033160209655762, 4.1844162940979, 4.335672378540039, 4.486928462982178, 4.638184547424316]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 7.0, 6.0, 12.0, 11.0, 24.0, 26.0, 40.0, 54.0, 65.0, 101.0, 161.0, 220.0, 390.0, 695.0, 1318.0, 2546.0, 5185.0, 12221.0, 48434.0, 871957.0, 77848.0, 14716.0, 5909.0, 2919.0, 1553.0, 836.0, 455.0, 260.0, 163.0, 116.0, 69.0, 52.0, 38.0, 37.0, 21.0, 21.0, 15.0, 11.0, 17.0, 7.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-8.21875, -7.9586181640625, -7.698486328125, -7.4383544921875, -7.17822265625, -6.9180908203125, -6.657958984375, -6.3978271484375, -6.1376953125, -5.8775634765625, -5.617431640625, -5.3572998046875, -5.09716796875, -4.8370361328125, -4.576904296875, -4.3167724609375, -4.056640625, -3.7965087890625, -3.536376953125, -3.2762451171875, -3.01611328125, -2.7559814453125, -2.495849609375, -2.2357177734375, -1.9755859375, -1.7154541015625, -1.455322265625, -1.1951904296875, -0.93505859375, -0.6749267578125, -0.414794921875, -0.1546630859375, 0.10546875, 0.3656005859375, 0.625732421875, 0.8858642578125, 1.14599609375, 1.4061279296875, 1.666259765625, 1.9263916015625, 2.1865234375, 2.4466552734375, 2.706787109375, 2.9669189453125, 3.22705078125, 3.4871826171875, 3.747314453125, 4.0074462890625, 4.267578125, 4.5277099609375, 4.787841796875, 5.0479736328125, 5.30810546875, 5.5682373046875, 5.828369140625, 6.0885009765625, 6.3486328125, 6.6087646484375, 6.868896484375, 7.1290283203125, 7.38916015625, 7.6492919921875, 7.909423828125, 8.1695556640625, 8.4296875]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 6.0, 5.0, 3.0, 4.0, 1.0, 4.0, 5.0, 4.0, 12.0, 12.0, 23.0, 52.0, 173.0, 318.0, 212.0, 77.0, 30.0, 13.0, 12.0, 6.0, 12.0, 5.0, 4.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-1.5654296875, -1.5286026000976562, -1.4917755126953125, -1.4549484252929688, -1.418121337890625, -1.3812942504882812, -1.3444671630859375, -1.3076400756835938, -1.27081298828125, -1.2339859008789062, -1.1971588134765625, -1.1603317260742188, -1.123504638671875, -1.0866775512695312, -1.0498504638671875, -1.0130233764648438, -0.9761962890625, -0.9393692016601562, -0.9025421142578125, -0.8657150268554688, -0.828887939453125, -0.7920608520507812, -0.7552337646484375, -0.7184066772460938, -0.68157958984375, -0.6447525024414062, -0.6079254150390625, -0.5710983276367188, -0.534271240234375, -0.49744415283203125, -0.4606170654296875, -0.42378997802734375, -0.386962890625, -0.35013580322265625, -0.3133087158203125, -0.27648162841796875, -0.239654541015625, -0.20282745361328125, -0.1660003662109375, -0.12917327880859375, -0.09234619140625, -0.05551910400390625, -0.0186920166015625, 0.01813507080078125, 0.054962158203125, 0.09178924560546875, 0.1286163330078125, 0.16544342041015625, 0.2022705078125, 0.23909759521484375, 0.2759246826171875, 0.31275177001953125, 0.349578857421875, 0.38640594482421875, 0.4232330322265625, 0.46006011962890625, 0.49688720703125, 0.5337142944335938, 0.5705413818359375, 0.6073684692382812, 0.644195556640625, 0.6810226440429688, 0.7178497314453125, 0.7546768188476562, 0.79150390625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 4.0, 4.0, 8.0, 11.0, 8.0, 18.0, 13.0, 24.0, 28.0, 38.0, 56.0, 65.0, 132.0, 194.0, 378.0, 723.0, 1588.0, 4278.0, 14141.0, 55328.0, 308039.0, 547742.0, 86044.0, 19983.0, 5811.0, 1964.0, 881.0, 397.0, 232.0, 123.0, 79.0, 57.0, 38.0, 23.0, 23.0, 14.0, 15.0, 15.0, 12.0, 7.0, 1.0, 3.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0859375, -3.9588623046875, -3.831787109375, -3.7047119140625, -3.57763671875, -3.4505615234375, -3.323486328125, -3.1964111328125, -3.0693359375, -2.9422607421875, -2.815185546875, -2.6881103515625, -2.56103515625, -2.4339599609375, -2.306884765625, -2.1798095703125, -2.052734375, -1.9256591796875, -1.798583984375, -1.6715087890625, -1.54443359375, -1.4173583984375, -1.290283203125, -1.1632080078125, -1.0361328125, -0.9090576171875, -0.781982421875, -0.6549072265625, -0.52783203125, -0.4007568359375, -0.273681640625, -0.1466064453125, -0.01953125, 0.1075439453125, 0.234619140625, 0.3616943359375, 0.48876953125, 0.6158447265625, 0.742919921875, 0.8699951171875, 0.9970703125, 1.1241455078125, 1.251220703125, 1.3782958984375, 1.50537109375, 1.6324462890625, 1.759521484375, 1.8865966796875, 2.013671875, 2.1407470703125, 2.267822265625, 2.3948974609375, 2.52197265625, 2.6490478515625, 2.776123046875, 2.9031982421875, 3.0302734375, 3.1573486328125, 3.284423828125, 3.4114990234375, 3.53857421875, 3.6656494140625, 3.792724609375, 3.9197998046875, 4.046875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 6.0, 3.0, 5.0, 4.0, 5.0, 10.0, 11.0, 14.0, 11.0, 21.0, 16.0, 21.0, 27.0, 30.0, 29.0, 26.0, 23.0, 33.0, 44.0, 35.0, 35.0, 42.0, 39.0, 41.0, 41.0, 43.0, 33.0, 38.0, 38.0, 36.0, 37.0, 22.0, 32.0, 28.0, 19.0, 16.0, 14.0, 15.0, 13.0, 15.0, 10.0, 9.0, 3.0, 4.0, 1.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.5234375, -2.445953369140625, -2.36846923828125, -2.290985107421875, -2.2135009765625, -2.136016845703125, -2.05853271484375, -1.981048583984375, -1.903564453125, -1.826080322265625, -1.74859619140625, -1.671112060546875, -1.5936279296875, -1.516143798828125, -1.43865966796875, -1.361175537109375, -1.28369140625, -1.206207275390625, -1.12872314453125, -1.051239013671875, -0.9737548828125, -0.896270751953125, -0.81878662109375, -0.741302490234375, -0.663818359375, -0.586334228515625, -0.50885009765625, -0.431365966796875, -0.3538818359375, -0.276397705078125, -0.19891357421875, -0.121429443359375, -0.0439453125, 0.033538818359375, 0.11102294921875, 0.188507080078125, 0.2659912109375, 0.343475341796875, 0.42095947265625, 0.498443603515625, 0.575927734375, 0.653411865234375, 0.73089599609375, 0.808380126953125, 0.8858642578125, 0.963348388671875, 1.04083251953125, 1.118316650390625, 1.19580078125, 1.273284912109375, 1.35076904296875, 1.428253173828125, 1.5057373046875, 1.583221435546875, 1.66070556640625, 1.738189697265625, 1.815673828125, 1.893157958984375, 1.97064208984375, 2.048126220703125, 2.1256103515625, 2.203094482421875, 2.28057861328125, 2.358062744140625, 2.435546875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 2.0, 4.0, 7.0, 4.0, 11.0, 14.0, 17.0, 26.0, 48.0, 73.0, 130.0, 288.0, 721.0, 2048.0, 12330.0, 971291.0, 56229.0, 3400.0, 1054.0, 374.0, 223.0, 110.0, 48.0, 30.0, 19.0, 17.0, 9.0, 8.0, 7.0, 4.0, 6.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0], "bins": [-7.94921875, -7.73260498046875, -7.5159912109375, -7.29937744140625, -7.082763671875, -6.86614990234375, -6.6495361328125, -6.43292236328125, -6.21630859375, -5.99969482421875, -5.7830810546875, -5.56646728515625, -5.349853515625, -5.13323974609375, -4.9166259765625, -4.70001220703125, -4.4833984375, -4.26678466796875, -4.0501708984375, -3.83355712890625, -3.616943359375, -3.40032958984375, -3.1837158203125, -2.96710205078125, -2.75048828125, -2.53387451171875, -2.3172607421875, -2.10064697265625, -1.884033203125, -1.66741943359375, -1.4508056640625, -1.23419189453125, -1.017578125, -0.80096435546875, -0.5843505859375, -0.36773681640625, -0.151123046875, 0.06549072265625, 0.2821044921875, 0.49871826171875, 0.71533203125, 0.93194580078125, 1.1485595703125, 1.36517333984375, 1.581787109375, 1.79840087890625, 2.0150146484375, 2.23162841796875, 2.4482421875, 2.66485595703125, 2.8814697265625, 3.09808349609375, 3.314697265625, 3.53131103515625, 3.7479248046875, 3.96453857421875, 4.18115234375, 4.39776611328125, 4.6143798828125, 4.83099365234375, 5.047607421875, 5.26422119140625, 5.4808349609375, 5.69744873046875, 5.9140625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 6.0, 6.0, 10.0, 20.0, 36.0, 64.0, 208.0, 354.0, 161.0, 78.0, 31.0, 16.0, 8.0, 6.0, 6.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042366981506347656, -0.00041138753294944763, -0.0003991052508354187, -0.00038682296872138977, -0.00037454068660736084, -0.0003622584044933319, -0.000349976122379303, -0.00033769384026527405, -0.0003254115581512451, -0.0003131292760372162, -0.00030084699392318726, -0.0002885647118091583, -0.0002762824296951294, -0.00026400014758110046, -0.00025171786546707153, -0.0002394355833530426, -0.00022715330123901367, -0.00021487101912498474, -0.0002025887370109558, -0.00019030645489692688, -0.00017802417278289795, -0.00016574189066886902, -0.0001534596085548401, -0.00014117732644081116, -0.00012889504432678223, -0.0001166127622127533, -0.00010433048009872437, -9.204819798469543e-05, -7.97659158706665e-05, -6.748363375663757e-05, -5.520135164260864e-05, -4.291906952857971e-05, -3.063678741455078e-05, -1.835450530052185e-05, -6.07222318649292e-06, 6.210058927536011e-06, 1.849234104156494e-05, 3.077462315559387e-05, 4.30569052696228e-05, 5.5339187383651733e-05, 6.762146949768066e-05, 7.99037516117096e-05, 9.218603372573853e-05, 0.00010446831583976746, 0.00011675059795379639, 0.00012903288006782532, 0.00014131516218185425, 0.00015359744429588318, 0.0001658797264099121, 0.00017816200852394104, 0.00019044429063796997, 0.0002027265727519989, 0.00021500885486602783, 0.00022729113698005676, 0.0002395734190940857, 0.0002518557012081146, 0.00026413798332214355, 0.0002764202654361725, 0.0002887025475502014, 0.00030098482966423035, 0.0003132671117782593, 0.0003255493938922882, 0.00033783167600631714, 0.00035011395812034607, 0.000362396240234375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 1.0, 5.0, 8.0, 7.0, 13.0, 23.0, 41.0, 102.0, 159.0, 307.0, 759.0, 2196.0, 11191.0, 227269.0, 777313.0, 23912.0, 3438.0, 1013.0, 426.0, 182.0, 75.0, 38.0, 26.0, 18.0, 12.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.34375, -4.21661376953125, -4.0894775390625, -3.96234130859375, -3.835205078125, -3.70806884765625, -3.5809326171875, -3.45379638671875, -3.32666015625, -3.19952392578125, -3.0723876953125, -2.94525146484375, -2.818115234375, -2.69097900390625, -2.5638427734375, -2.43670654296875, -2.3095703125, -2.18243408203125, -2.0552978515625, -1.92816162109375, -1.801025390625, -1.67388916015625, -1.5467529296875, -1.41961669921875, -1.29248046875, -1.16534423828125, -1.0382080078125, -0.91107177734375, -0.783935546875, -0.65679931640625, -0.5296630859375, -0.40252685546875, -0.275390625, -0.14825439453125, -0.0211181640625, 0.10601806640625, 0.233154296875, 0.36029052734375, 0.4874267578125, 0.61456298828125, 0.74169921875, 0.86883544921875, 0.9959716796875, 1.12310791015625, 1.250244140625, 1.37738037109375, 1.5045166015625, 1.63165283203125, 1.7587890625, 1.88592529296875, 2.0130615234375, 2.14019775390625, 2.267333984375, 2.39447021484375, 2.5216064453125, 2.64874267578125, 2.77587890625, 2.90301513671875, 3.0301513671875, 3.15728759765625, 3.284423828125, 3.41156005859375, 3.5386962890625, 3.66583251953125, 3.79296875]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 4.0, 10.0, 8.0, 24.0, 26.0, 40.0, 49.0, 72.0, 69.0, 110.0, 170.0, 117.0, 89.0, 77.0, 43.0, 31.0, 20.0, 12.0, 10.0, 7.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.728515625, -2.649261474609375, -2.57000732421875, -2.490753173828125, -2.4114990234375, -2.332244873046875, -2.25299072265625, -2.173736572265625, -2.094482421875, -2.015228271484375, -1.93597412109375, -1.856719970703125, -1.7774658203125, -1.698211669921875, -1.61895751953125, -1.539703369140625, -1.46044921875, -1.381195068359375, -1.30194091796875, -1.222686767578125, -1.1434326171875, -1.064178466796875, -0.98492431640625, -0.905670166015625, -0.826416015625, -0.747161865234375, -0.66790771484375, -0.588653564453125, -0.5093994140625, -0.430145263671875, -0.35089111328125, -0.271636962890625, -0.1923828125, -0.113128662109375, -0.03387451171875, 0.045379638671875, 0.1246337890625, 0.203887939453125, 0.28314208984375, 0.362396240234375, 0.441650390625, 0.520904541015625, 0.60015869140625, 0.679412841796875, 0.7586669921875, 0.837921142578125, 0.91717529296875, 0.996429443359375, 1.07568359375, 1.154937744140625, 1.23419189453125, 1.313446044921875, 1.3927001953125, 1.471954345703125, 1.55120849609375, 1.630462646484375, 1.709716796875, 1.788970947265625, 1.86822509765625, 1.947479248046875, 2.0267333984375, 2.105987548828125, 2.18524169921875, 2.264495849609375, 2.34375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 5.0, 19.0, 44.0, 132.0, 487.0, 232.0, 52.0, 18.0, 5.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-66.1846923828125, -64.59866333007812, -63.012638092041016, -61.426612854003906, -59.84058380126953, -58.25455856323242, -56.66852951049805, -55.08250427246094, -53.49647521972656, -51.91044998168945, -50.32442092895508, -48.73839569091797, -47.152366638183594, -45.566341400146484, -43.98031234741211, -42.394287109375, -40.808258056640625, -39.222232818603516, -37.63620376586914, -36.05017852783203, -34.464149475097656, -32.87812423706055, -31.292095184326172, -29.706069946289062, -28.120044708251953, -26.53401756286621, -24.94799041748047, -23.361963272094727, -21.775936126708984, -20.189908981323242, -18.6038818359375, -17.01785659790039, -15.431827545166016, -13.845800399780273, -12.259773254394531, -10.673746109008789, -9.087718963623047, -7.501692295074463, -5.915665626525879, -4.329638481140137, -2.7436113357543945, -1.157584309577942, 0.42844271659851074, 2.014469623565674, 3.600496768951416, 5.186523914337158, 6.772550582885742, 8.358577728271484, 9.944604873657227, 11.530632019042969, 13.116659164428711, 14.702686309814453, 16.288713455200195, 17.874740600585938, 19.460765838623047, 21.046794891357422, 22.63282012939453, 24.218847274780273, 25.804874420166016, 27.390901565551758, 28.9769287109375, 30.562955856323242, 32.148983001708984, 33.735008239746094, 35.32103729248047]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 3.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 8.0, 9.0, 7.0, 9.0, 27.0, 34.0, 40.0, 48.0, 54.0, 83.0, 70.0, 95.0, 91.0, 85.0, 77.0, 55.0, 46.0, 30.0, 29.0, 18.0, 21.0, 9.0, 7.0, 7.0, 7.0, 4.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-35.79064178466797, -34.79438400268555, -33.79812240600586, -32.80186462402344, -31.80560302734375, -30.809343338012695, -29.81308364868164, -28.81682586669922, -27.82056427001953, -26.824304580688477, -25.828044891357422, -24.831785202026367, -23.835525512695312, -22.839265823364258, -21.843006134033203, -20.84674835205078, -19.850488662719727, -18.854228973388672, -17.857969284057617, -16.861709594726562, -15.865449905395508, -14.869190216064453, -13.872931480407715, -12.87667179107666, -11.880412101745605, -10.88415241241455, -9.887892723083496, -8.891633987426758, -7.895373821258545, -6.89911413192749, -5.902854919433594, -4.906595230102539, -3.9103355407714844, -2.9140758514404297, -1.917816400527954, -0.9215569496154785, 0.07470273971557617, 1.0709624290466309, 2.0672216415405273, 3.063481330871582, 4.059741020202637, 5.056000709533691, 6.052260398864746, 7.048519611358643, 8.044778823852539, 9.041038513183594, 10.037298202514648, 11.033557891845703, 12.029817581176758, 13.026077270507812, 14.022336959838867, 15.018596649169922, 16.014856338500977, 17.01111602783203, 18.007373809814453, 19.00363540649414, 19.999893188476562, 20.996152877807617, 21.992412567138672, 22.988672256469727, 23.98493194580078, 24.981191635131836, 25.97745132446289, 26.973709106445312, 27.969970703125]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 4.0, 3.0, 2.0, 7.0, 5.0, 3.0, 7.0, 4.0, 8.0, 8.0, 6.0, 6.0, 11.0, 10.0, 21.0, 26.0, 27.0, 32.0, 34.0, 44.0, 60.0, 89.0, 80.0, 98.0, 152.0, 172.0, 220.0, 291.0, 448.0, 883.0, 1711.0, 3578.0, 11374.0, 139544.0, 4002693.0, 22634.0, 5071.0, 2162.0, 1084.0, 606.0, 342.0, 238.0, 153.0, 87.0, 67.0, 56.0, 44.0, 22.0, 16.0, 12.0, 12.0, 10.0, 5.0, 5.0], "bins": [-20.15625, -19.7000732421875, -19.243896484375, -18.7877197265625, -18.33154296875, -17.8753662109375, -17.419189453125, -16.9630126953125, -16.5068359375, -16.0506591796875, -15.594482421875, -15.1383056640625, -14.68212890625, -14.2259521484375, -13.769775390625, -13.3135986328125, -12.857421875, -12.4012451171875, -11.945068359375, -11.4888916015625, -11.03271484375, -10.5765380859375, -10.120361328125, -9.6641845703125, -9.2080078125, -8.7518310546875, -8.295654296875, -7.8394775390625, -7.38330078125, -6.9271240234375, -6.470947265625, -6.0147705078125, -5.55859375, -5.1024169921875, -4.646240234375, -4.1900634765625, -3.73388671875, -3.2777099609375, -2.821533203125, -2.3653564453125, -1.9091796875, -1.4530029296875, -0.996826171875, -0.5406494140625, -0.08447265625, 0.3717041015625, 0.827880859375, 1.2840576171875, 1.740234375, 2.1964111328125, 2.652587890625, 3.1087646484375, 3.56494140625, 4.0211181640625, 4.477294921875, 4.9334716796875, 5.3896484375, 5.8458251953125, 6.302001953125, 6.7581787109375, 7.21435546875, 7.6705322265625, 8.126708984375, 8.5828857421875, 9.0390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 13.0, 16.0, 14.0, 34.0, 96.0, 215.0, 266.0, 170.0, 75.0, 32.0, 17.0, 12.0, 11.0, 11.0, 2.0, 3.0, 0.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-1.736328125, -1.6971435546875, -1.657958984375, -1.6187744140625, -1.57958984375, -1.5404052734375, -1.501220703125, -1.4620361328125, -1.4228515625, -1.3836669921875, -1.344482421875, -1.3052978515625, -1.26611328125, -1.2269287109375, -1.187744140625, -1.1485595703125, -1.109375, -1.0701904296875, -1.031005859375, -0.9918212890625, -0.95263671875, -0.9134521484375, -0.874267578125, -0.8350830078125, -0.7958984375, -0.7567138671875, -0.717529296875, -0.6783447265625, -0.63916015625, -0.5999755859375, -0.560791015625, -0.5216064453125, -0.482421875, -0.4432373046875, -0.404052734375, -0.3648681640625, -0.32568359375, -0.2864990234375, -0.247314453125, -0.2081298828125, -0.1689453125, -0.1297607421875, -0.090576171875, -0.0513916015625, -0.01220703125, 0.0269775390625, 0.066162109375, 0.1053466796875, 0.14453125, 0.1837158203125, 0.222900390625, 0.2620849609375, 0.30126953125, 0.3404541015625, 0.379638671875, 0.4188232421875, 0.4580078125, 0.4971923828125, 0.536376953125, 0.5755615234375, 0.61474609375, 0.6539306640625, 0.693115234375, 0.7322998046875, 0.771484375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 5.0, 5.0, 9.0, 13.0, 10.0, 19.0, 20.0, 45.0, 69.0, 110.0, 275.0, 1014.0, 8852.0, 1870234.0, 2303047.0, 8938.0, 1082.0, 239.0, 87.0, 65.0, 47.0, 29.0, 17.0, 13.0, 8.0, 11.0, 4.0, 5.0, 5.0, 1.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.6640625, -13.1385498046875, -12.613037109375, -12.0875244140625, -11.56201171875, -11.0364990234375, -10.510986328125, -9.9854736328125, -9.4599609375, -8.9344482421875, -8.408935546875, -7.8834228515625, -7.35791015625, -6.8323974609375, -6.306884765625, -5.7813720703125, -5.255859375, -4.7303466796875, -4.204833984375, -3.6793212890625, -3.15380859375, -2.6282958984375, -2.102783203125, -1.5772705078125, -1.0517578125, -0.5262451171875, -0.000732421875, 0.5247802734375, 1.05029296875, 1.5758056640625, 2.101318359375, 2.6268310546875, 3.15234375, 3.6778564453125, 4.203369140625, 4.7288818359375, 5.25439453125, 5.7799072265625, 6.305419921875, 6.8309326171875, 7.3564453125, 7.8819580078125, 8.407470703125, 8.9329833984375, 9.45849609375, 9.9840087890625, 10.509521484375, 11.0350341796875, 11.560546875, 12.0860595703125, 12.611572265625, 13.1370849609375, 13.66259765625, 14.1881103515625, 14.713623046875, 15.2391357421875, 15.7646484375, 16.2901611328125, 16.815673828125, 17.3411865234375, 17.86669921875, 18.3922119140625, 18.917724609375, 19.4432373046875, 19.96875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 5.0, 2.0, 6.0, 4.0, 11.0, 13.0, 18.0, 20.0, 28.0, 38.0, 62.0, 129.0, 346.0, 2299.0, 652.0, 179.0, 87.0, 47.0, 35.0, 30.0, 9.0, 11.0, 9.0, 9.0, 8.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-2.068359375, -2.018768310546875, -1.96917724609375, -1.919586181640625, -1.8699951171875, -1.820404052734375, -1.77081298828125, -1.721221923828125, -1.671630859375, -1.622039794921875, -1.57244873046875, -1.522857666015625, -1.4732666015625, -1.423675537109375, -1.37408447265625, -1.324493408203125, -1.27490234375, -1.225311279296875, -1.17572021484375, -1.126129150390625, -1.0765380859375, -1.026947021484375, -0.97735595703125, -0.927764892578125, -0.878173828125, -0.828582763671875, -0.77899169921875, -0.729400634765625, -0.6798095703125, -0.630218505859375, -0.58062744140625, -0.531036376953125, -0.4814453125, -0.431854248046875, -0.38226318359375, -0.332672119140625, -0.2830810546875, -0.233489990234375, -0.18389892578125, -0.134307861328125, -0.084716796875, -0.035125732421875, 0.01446533203125, 0.064056396484375, 0.1136474609375, 0.163238525390625, 0.21282958984375, 0.262420654296875, 0.31201171875, 0.361602783203125, 0.41119384765625, 0.460784912109375, 0.5103759765625, 0.559967041015625, 0.60955810546875, 0.659149169921875, 0.708740234375, 0.758331298828125, 0.80792236328125, 0.857513427734375, 0.9071044921875, 0.956695556640625, 1.00628662109375, 1.055877685546875, 1.10546875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 10.0, 35.0, 159.0, 571.0, 183.0, 34.0, 9.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5868446826934814, -3.0413684844970703, -2.495892286300659, -1.950416088104248, -1.404939889907837, -0.8594636917114258, -0.31398749351501465, 0.23148870468139648, 0.7769649028778076, 1.3224411010742188, 1.8679172992706299, 2.413393497467041, 2.958869695663452, 3.5043458938598633, 4.049821853637695, 4.5952982902526855, 5.140774726867676, 5.686250686645508, 6.231727123260498, 6.777203559875488, 7.32267951965332, 7.868155479431152, 8.413631439208984, 8.959108352661133, 9.504584312438965, 10.050060272216797, 10.595537185668945, 11.141013145446777, 11.68648910522461, 12.231965065002441, 12.777441024780273, 13.322917938232422, 13.86839485168457, 14.413870811462402, 14.959346771240234, 15.504823684692383, 16.05030059814453, 16.595775604248047, 17.141252517700195, 17.68672752380371, 18.23220443725586, 18.777681350708008, 19.323156356811523, 19.868633270263672, 20.414108276367188, 20.959585189819336, 21.505062103271484, 22.050537109375, 22.59601402282715, 23.141490936279297, 23.686965942382812, 24.23244285583496, 24.77791976928711, 25.323394775390625, 25.868871688842773, 26.41434669494629, 26.959823608398438, 27.505300521850586, 28.0507755279541, 28.59625244140625, 29.141727447509766, 29.687204360961914, 30.232681274414062, 30.778156280517578, 31.323633193969727]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 2.0, 1.0, 4.0, 7.0, 7.0, 5.0, 4.0, 15.0, 17.0, 12.0, 22.0, 25.0, 32.0, 26.0, 40.0, 43.0, 54.0, 45.0, 62.0, 51.0, 66.0, 63.0, 51.0, 57.0, 60.0, 32.0, 38.0, 29.0, 26.0, 22.0, 17.0, 23.0, 8.0, 6.0, 8.0, 8.0, 3.0, 2.0, 7.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.2804365158081055, -5.115255355834961, -4.950074672698975, -4.78489351272583, -4.619712829589844, -4.454531669616699, -4.289350509643555, -4.124169826507568, -3.958988666534424, -3.7938077449798584, -3.628626823425293, -3.4634456634521484, -3.298264741897583, -3.1330838203430176, -2.967902898788452, -2.8027219772338867, -2.6375410556793213, -2.472360134124756, -2.3071792125701904, -2.141998291015625, -1.9768171310424805, -1.811636209487915, -1.6464552879333496, -1.4812742471694946, -1.3160933256149292, -1.1509124040603638, -0.9857313632965088, -0.8205504417419434, -0.6553694605827332, -0.49018847942352295, -0.3250075578689575, -0.15982651710510254, 0.005354404449462891, 0.1705353707075119, 0.3357163369655609, 0.5008972883224487, 0.6660782694816589, 0.8312592506408691, 0.9964401721954346, 1.1616212129592896, 1.326802134513855, 1.4919830560684204, 1.6571640968322754, 1.8223450183868408, 1.9875259399414062, 2.152707099914551, 2.317887783050537, 2.4830689430236816, 2.648249864578247, 2.8134307861328125, 2.978611707687378, 3.1437926292419434, 3.308973789215088, 3.4741547107696533, 3.6393356323242188, 3.8045167922973633, 3.9696974754333496, 4.134878635406494, 4.3000593185424805, 4.465240478515625, 4.630421161651611, 4.795602321624756, 4.960783004760742, 5.125964164733887, 5.291145324707031]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 9.0, 8.0, 8.0, 12.0, 22.0, 29.0, 34.0, 65.0, 102.0, 171.0, 339.0, 617.0, 1259.0, 3605.0, 26275.0, 948354.0, 59387.0, 5136.0, 1597.0, 666.0, 375.0, 193.0, 103.0, 59.0, 43.0, 28.0, 18.0, 18.0, 8.0, 5.0, 7.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.65625, -13.237548828125, -12.81884765625, -12.400146484375, -11.9814453125, -11.562744140625, -11.14404296875, -10.725341796875, -10.306640625, -9.887939453125, -9.46923828125, -9.050537109375, -8.6318359375, -8.213134765625, -7.79443359375, -7.375732421875, -6.95703125, -6.538330078125, -6.11962890625, -5.700927734375, -5.2822265625, -4.863525390625, -4.44482421875, -4.026123046875, -3.607421875, -3.188720703125, -2.77001953125, -2.351318359375, -1.9326171875, -1.513916015625, -1.09521484375, -0.676513671875, -0.2578125, 0.160888671875, 0.57958984375, 0.998291015625, 1.4169921875, 1.835693359375, 2.25439453125, 2.673095703125, 3.091796875, 3.510498046875, 3.92919921875, 4.347900390625, 4.7666015625, 5.185302734375, 5.60400390625, 6.022705078125, 6.44140625, 6.860107421875, 7.27880859375, 7.697509765625, 8.1162109375, 8.534912109375, 8.95361328125, 9.372314453125, 9.791015625, 10.209716796875, 10.62841796875, 11.047119140625, 11.4658203125, 11.884521484375, 12.30322265625, 12.721923828125, 13.140625]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 18.0, 39.0, 87.0, 200.0, 214.0, 192.0, 136.0, 48.0, 24.0, 4.0, 12.0, 5.0, 5.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6923828125, -1.6535186767578125, -1.614654541015625, -1.5757904052734375, -1.53692626953125, -1.4980621337890625, -1.459197998046875, -1.4203338623046875, -1.3814697265625, -1.3426055908203125, -1.303741455078125, -1.2648773193359375, -1.22601318359375, -1.1871490478515625, -1.148284912109375, -1.1094207763671875, -1.070556640625, -1.0316925048828125, -0.992828369140625, -0.9539642333984375, -0.91510009765625, -0.8762359619140625, -0.837371826171875, -0.7985076904296875, -0.7596435546875, -0.7207794189453125, -0.681915283203125, -0.6430511474609375, -0.60418701171875, -0.5653228759765625, -0.526458740234375, -0.4875946044921875, -0.44873046875, -0.4098663330078125, -0.371002197265625, -0.3321380615234375, -0.29327392578125, -0.2544097900390625, -0.215545654296875, -0.1766815185546875, -0.1378173828125, -0.0989532470703125, -0.060089111328125, -0.0212249755859375, 0.01763916015625, 0.0565032958984375, 0.095367431640625, 0.1342315673828125, 0.173095703125, 0.2119598388671875, 0.250823974609375, 0.2896881103515625, 0.32855224609375, 0.3674163818359375, 0.406280517578125, 0.4451446533203125, 0.4840087890625, 0.5228729248046875, 0.561737060546875, 0.6006011962890625, 0.63946533203125, 0.6783294677734375, 0.717193603515625, 0.7560577392578125, 0.794921875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 1.0, 0.0, 4.0, 5.0, 4.0, 7.0, 11.0, 10.0, 10.0, 13.0, 17.0, 25.0, 34.0, 39.0, 79.0, 125.0, 200.0, 414.0, 1024.0, 2709.0, 13348.0, 152380.0, 803582.0, 63178.0, 7733.0, 1910.0, 724.0, 364.0, 198.0, 131.0, 71.0, 43.0, 32.0, 19.0, 15.0, 18.0, 17.0, 13.0, 7.0, 15.0, 7.0, 4.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.66015625, -7.41571044921875, -7.1712646484375, -6.92681884765625, -6.682373046875, -6.43792724609375, -6.1934814453125, -5.94903564453125, -5.70458984375, -5.46014404296875, -5.2156982421875, -4.97125244140625, -4.726806640625, -4.48236083984375, -4.2379150390625, -3.99346923828125, -3.7490234375, -3.50457763671875, -3.2601318359375, -3.01568603515625, -2.771240234375, -2.52679443359375, -2.2823486328125, -2.03790283203125, -1.79345703125, -1.54901123046875, -1.3045654296875, -1.06011962890625, -0.815673828125, -0.57122802734375, -0.3267822265625, -0.08233642578125, 0.162109375, 0.40655517578125, 0.6510009765625, 0.89544677734375, 1.139892578125, 1.38433837890625, 1.6287841796875, 1.87322998046875, 2.11767578125, 2.36212158203125, 2.6065673828125, 2.85101318359375, 3.095458984375, 3.33990478515625, 3.5843505859375, 3.82879638671875, 4.0732421875, 4.31768798828125, 4.5621337890625, 4.80657958984375, 5.051025390625, 5.29547119140625, 5.5399169921875, 5.78436279296875, 6.02880859375, 6.27325439453125, 6.5177001953125, 6.76214599609375, 7.006591796875, 7.25103759765625, 7.4954833984375, 7.73992919921875, 7.984375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0, 6.0, 4.0, 11.0, 8.0, 7.0, 14.0, 15.0, 22.0, 19.0, 25.0, 26.0, 24.0, 26.0, 28.0, 26.0, 38.0, 38.0, 39.0, 48.0, 41.0, 51.0, 48.0, 40.0, 38.0, 30.0, 38.0, 32.0, 38.0, 25.0, 25.0, 30.0, 16.0, 14.0, 28.0, 15.0, 15.0, 12.0, 11.0, 5.0, 9.0, 7.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.470703125, -2.390838623046875, -2.31097412109375, -2.231109619140625, -2.1512451171875, -2.071380615234375, -1.99151611328125, -1.911651611328125, -1.831787109375, -1.751922607421875, -1.67205810546875, -1.592193603515625, -1.5123291015625, -1.432464599609375, -1.35260009765625, -1.272735595703125, -1.19287109375, -1.113006591796875, -1.03314208984375, -0.953277587890625, -0.8734130859375, -0.793548583984375, -0.71368408203125, -0.633819580078125, -0.553955078125, -0.474090576171875, -0.39422607421875, -0.314361572265625, -0.2344970703125, -0.154632568359375, -0.07476806640625, 0.005096435546875, 0.0849609375, 0.164825439453125, 0.24468994140625, 0.324554443359375, 0.4044189453125, 0.484283447265625, 0.56414794921875, 0.644012451171875, 0.723876953125, 0.803741455078125, 0.88360595703125, 0.963470458984375, 1.0433349609375, 1.123199462890625, 1.20306396484375, 1.282928466796875, 1.36279296875, 1.442657470703125, 1.52252197265625, 1.602386474609375, 1.6822509765625, 1.762115478515625, 1.84197998046875, 1.921844482421875, 2.001708984375, 2.081573486328125, 2.16143798828125, 2.241302490234375, 2.3211669921875, 2.401031494140625, 2.48089599609375, 2.560760498046875, 2.640625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 10.0, 16.0, 15.0, 28.0, 38.0, 73.0, 140.0, 301.0, 652.0, 1776.0, 10689.0, 426258.0, 592424.0, 12791.0, 2014.0, 672.0, 290.0, 141.0, 82.0, 49.0, 32.0, 22.0, 6.0, 8.0, 3.0, 5.0, 1.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09765625, -3.96124267578125, -3.8248291015625, -3.68841552734375, -3.552001953125, -3.41558837890625, -3.2791748046875, -3.14276123046875, -3.00634765625, -2.86993408203125, -2.7335205078125, -2.59710693359375, -2.460693359375, -2.32427978515625, -2.1878662109375, -2.05145263671875, -1.9150390625, -1.77862548828125, -1.6422119140625, -1.50579833984375, -1.369384765625, -1.23297119140625, -1.0965576171875, -0.96014404296875, -0.82373046875, -0.68731689453125, -0.5509033203125, -0.41448974609375, -0.278076171875, -0.14166259765625, -0.0052490234375, 0.13116455078125, 0.267578125, 0.40399169921875, 0.5404052734375, 0.67681884765625, 0.813232421875, 0.94964599609375, 1.0860595703125, 1.22247314453125, 1.35888671875, 1.49530029296875, 1.6317138671875, 1.76812744140625, 1.904541015625, 2.04095458984375, 2.1773681640625, 2.31378173828125, 2.4501953125, 2.58660888671875, 2.7230224609375, 2.85943603515625, 2.995849609375, 3.13226318359375, 3.2686767578125, 3.40509033203125, 3.54150390625, 3.67791748046875, 3.8143310546875, 3.95074462890625, 4.087158203125, 4.22357177734375, 4.3599853515625, 4.49639892578125, 4.6328125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 9.0, 12.0, 7.0, 19.0, 27.0, 26.0, 39.0, 48.0, 47.0, 104.0, 134.0, 121.0, 95.0, 83.0, 55.0, 43.0, 35.0, 18.0, 21.0, 15.0, 8.0, 12.0, 4.0, 4.0, 1.0, 3.0, 5.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014448165893554688, -0.00013848207890987396, -0.00013248249888420105, -0.00012648291885852814, -0.00012048333883285522, -0.00011448375880718231, -0.0001084841787815094, -0.00010248459875583649, -9.648501873016357e-05, -9.048543870449066e-05, -8.448585867881775e-05, -7.848627865314484e-05, -7.248669862747192e-05, -6.648711860179901e-05, -6.04875385761261e-05, -5.4487958550453186e-05, -4.8488378524780273e-05, -4.248879849910736e-05, -3.648921847343445e-05, -3.0489638447761536e-05, -2.4490058422088623e-05, -1.849047839641571e-05, -1.2490898370742798e-05, -6.491318345069885e-06, -4.917383193969727e-07, 5.50784170627594e-06, 1.1507421731948853e-05, 1.7507001757621765e-05, 2.3506581783294678e-05, 2.950616180896759e-05, 3.55057418346405e-05, 4.1505321860313416e-05, 4.750490188598633e-05, 5.350448191165924e-05, 5.950406193733215e-05, 6.550364196300507e-05, 7.150322198867798e-05, 7.750280201435089e-05, 8.35023820400238e-05, 8.950196206569672e-05, 9.550154209136963e-05, 0.00010150112211704254, 0.00010750070214271545, 0.00011350028216838837, 0.00011949986219406128, 0.0001254994422197342, 0.0001314990222454071, 0.00013749860227108002, 0.00014349818229675293, 0.00014949776232242584, 0.00015549734234809875, 0.00016149692237377167, 0.00016749650239944458, 0.0001734960824251175, 0.0001794956624507904, 0.00018549524247646332, 0.00019149482250213623, 0.00019749440252780914, 0.00020349398255348206, 0.00020949356257915497, 0.00021549314260482788, 0.0002214927226305008, 0.0002274923026561737, 0.00023349188268184662, 0.00023949146270751953]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 6.0, 4.0, 7.0, 11.0, 30.0, 35.0, 62.0, 82.0, 142.0, 352.0, 867.0, 3336.0, 26340.0, 852579.0, 153768.0, 8032.0, 1737.0, 566.0, 257.0, 119.0, 65.0, 43.0, 38.0, 22.0, 11.0, 10.0, 4.0, 8.0, 8.0, 1.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8828125, -4.73370361328125, -4.5845947265625, -4.43548583984375, -4.286376953125, -4.13726806640625, -3.9881591796875, -3.83905029296875, -3.68994140625, -3.54083251953125, -3.3917236328125, -3.24261474609375, -3.093505859375, -2.94439697265625, -2.7952880859375, -2.64617919921875, -2.4970703125, -2.34796142578125, -2.1988525390625, -2.04974365234375, -1.900634765625, -1.75152587890625, -1.6024169921875, -1.45330810546875, -1.30419921875, -1.15509033203125, -1.0059814453125, -0.85687255859375, -0.707763671875, -0.55865478515625, -0.4095458984375, -0.26043701171875, -0.111328125, 0.03778076171875, 0.1868896484375, 0.33599853515625, 0.485107421875, 0.63421630859375, 0.7833251953125, 0.93243408203125, 1.08154296875, 1.23065185546875, 1.3797607421875, 1.52886962890625, 1.677978515625, 1.82708740234375, 1.9761962890625, 2.12530517578125, 2.2744140625, 2.42352294921875, 2.5726318359375, 2.72174072265625, 2.870849609375, 3.01995849609375, 3.1690673828125, 3.31817626953125, 3.46728515625, 3.61639404296875, 3.7655029296875, 3.91461181640625, 4.063720703125, 4.21282958984375, 4.3619384765625, 4.51104736328125, 4.66015625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 5.0, 5.0, 9.0, 11.0, 21.0, 20.0, 37.0, 39.0, 59.0, 55.0, 84.0, 89.0, 107.0, 106.0, 76.0, 74.0, 50.0, 36.0, 39.0, 14.0, 9.0, 20.0, 8.0, 7.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 5.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5048828125, -1.4523773193359375, -1.399871826171875, -1.3473663330078125, -1.29486083984375, -1.2423553466796875, -1.189849853515625, -1.1373443603515625, -1.0848388671875, -1.0323333740234375, -0.979827880859375, -0.9273223876953125, -0.87481689453125, -0.8223114013671875, -0.769805908203125, -0.7173004150390625, -0.664794921875, -0.6122894287109375, -0.559783935546875, -0.5072784423828125, -0.45477294921875, -0.4022674560546875, -0.349761962890625, -0.2972564697265625, -0.2447509765625, -0.1922454833984375, -0.139739990234375, -0.0872344970703125, -0.03472900390625, 0.0177764892578125, 0.070281982421875, 0.1227874755859375, 0.17529296875, 0.2277984619140625, 0.280303955078125, 0.3328094482421875, 0.38531494140625, 0.4378204345703125, 0.490325927734375, 0.5428314208984375, 0.5953369140625, 0.6478424072265625, 0.700347900390625, 0.7528533935546875, 0.80535888671875, 0.8578643798828125, 0.910369873046875, 0.9628753662109375, 1.015380859375, 1.0678863525390625, 1.120391845703125, 1.1728973388671875, 1.22540283203125, 1.2779083251953125, 1.330413818359375, 1.3829193115234375, 1.4354248046875, 1.4879302978515625, 1.540435791015625, 1.5929412841796875, 1.64544677734375, 1.6979522705078125, 1.750457763671875, 1.8029632568359375, 1.85546875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 1.0, 9.0, 17.0, 119.0, 577.0, 236.0, 33.0, 11.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.367431640625, -17.71942901611328, -15.07142448425293, -12.423420906066895, -9.77541732788086, -7.127413749694824, -4.479410171508789, -1.8314056396484375, 0.8165969848632812, 3.4646005630493164, 6.112604141235352, 8.760607719421387, 11.408611297607422, 14.056614875793457, 16.704618453979492, 19.352622985839844, 22.000625610351562, 24.64862823486328, 27.296632766723633, 29.944637298583984, 32.5926399230957, 35.24064254760742, 37.888648986816406, 40.536651611328125, 43.184654235839844, 45.83265686035156, 48.48065948486328, 51.128665924072266, 53.776668548583984, 56.4246711730957, 59.07267761230469, 61.720680236816406, 64.36868286132812, 67.01668548583984, 69.66468811035156, 72.31269073486328, 74.960693359375, 77.60870361328125, 80.25670623779297, 82.90470886230469, 85.5527114868164, 88.20071411132812, 90.84871673583984, 93.49671936035156, 96.14472961425781, 98.79273223876953, 101.44073486328125, 104.08873748779297, 106.73674011230469, 109.3847427368164, 112.03274536132812, 114.68074798583984, 117.32875061035156, 119.97676086425781, 122.62476348876953, 125.27276611328125, 127.92076873779297, 130.5687713623047, 133.21678161621094, 135.86477661132812, 138.51278686523438, 141.16078186035156, 143.8087921142578, 146.456787109375, 149.10479736328125]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 4.0, 7.0, 9.0, 11.0, 5.0, 16.0, 16.0, 16.0, 30.0, 48.0, 52.0, 51.0, 68.0, 73.0, 76.0, 66.0, 61.0, 56.0, 67.0, 48.0, 46.0, 37.0, 38.0, 27.0, 17.0, 18.0, 10.0, 12.0, 5.0, 4.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.94731521606445, -34.030887603759766, -33.11445617675781, -32.198028564453125, -31.281600952148438, -30.365171432495117, -29.44874382019043, -28.53231430053711, -27.615886688232422, -26.6994571685791, -25.783029556274414, -24.866600036621094, -23.950172424316406, -23.033742904663086, -22.1173152923584, -21.200885772705078, -20.28445816040039, -19.36802864074707, -18.451601028442383, -17.535171508789062, -16.618743896484375, -15.702314376831055, -14.785886764526367, -13.869457244873047, -12.953027725219727, -12.036599159240723, -11.120170593261719, -10.203742027282715, -9.287313461303711, -8.37088394165039, -7.454455852508545, -6.538027286529541, -5.621599197387695, -4.705170631408691, -3.7887420654296875, -2.8723132610321045, -1.9558846950531006, -1.0394558906555176, -0.12302732467651367, 0.7934012413024902, 1.7098298072814941, 2.626258373260498, 3.542686939239502, 4.459115982055664, 5.375544548034668, 6.291973114013672, 7.208401679992676, 8.12483024597168, 9.041258811950684, 9.957687377929688, 10.874115943908691, 11.790544509887695, 12.7069730758667, 13.623401641845703, 14.539831161499023, 15.456258773803711, 16.37268829345703, 17.28911781311035, 18.20554542541504, 19.12197494506836, 20.038402557373047, 20.954832077026367, 21.871259689331055, 22.787689208984375, 23.704116821289062]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 7.0, 4.0, 11.0, 18.0, 41.0, 96.0, 203.0, 594.0, 3567.0, 4179329.0, 9745.0, 438.0, 140.0, 48.0, 29.0, 4.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-79.6875, -77.90283203125, -76.1181640625, -74.33349609375, -72.548828125, -70.76416015625, -68.9794921875, -67.19482421875, -65.41015625, -63.62548828125, -61.8408203125, -60.05615234375, -58.271484375, -56.48681640625, -54.7021484375, -52.91748046875, -51.1328125, -49.34814453125, -47.5634765625, -45.77880859375, -43.994140625, -42.20947265625, -40.4248046875, -38.64013671875, -36.85546875, -35.07080078125, -33.2861328125, -31.50146484375, -29.716796875, -27.93212890625, -26.1474609375, -24.36279296875, -22.578125, -20.79345703125, -19.0087890625, -17.22412109375, -15.439453125, -13.65478515625, -11.8701171875, -10.08544921875, -8.30078125, -6.51611328125, -4.7314453125, -2.94677734375, -1.162109375, 0.62255859375, 2.4072265625, 4.19189453125, 5.9765625, 7.76123046875, 9.5458984375, 11.33056640625, 13.115234375, 14.89990234375, 16.6845703125, 18.46923828125, 20.25390625, 22.03857421875, 23.8232421875, 25.60791015625, 27.392578125, 29.17724609375, 30.9619140625, 32.74658203125, 34.53125]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 11.0, 18.0, 37.0, 78.0, 158.0, 197.0, 207.0, 140.0, 79.0, 29.0, 26.0, 9.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.294921875, -2.24371337890625, -2.1925048828125, -2.14129638671875, -2.090087890625, -2.03887939453125, -1.9876708984375, -1.93646240234375, -1.88525390625, -1.83404541015625, -1.7828369140625, -1.73162841796875, -1.680419921875, -1.62921142578125, -1.5780029296875, -1.52679443359375, -1.4755859375, -1.42437744140625, -1.3731689453125, -1.32196044921875, -1.270751953125, -1.21954345703125, -1.1683349609375, -1.11712646484375, -1.06591796875, -1.01470947265625, -0.9635009765625, -0.91229248046875, -0.861083984375, -0.80987548828125, -0.7586669921875, -0.70745849609375, -0.65625, -0.60504150390625, -0.5538330078125, -0.50262451171875, -0.451416015625, -0.40020751953125, -0.3489990234375, -0.29779052734375, -0.24658203125, -0.19537353515625, -0.1441650390625, -0.09295654296875, -0.041748046875, 0.00946044921875, 0.0606689453125, 0.11187744140625, 0.1630859375, 0.21429443359375, 0.2655029296875, 0.31671142578125, 0.367919921875, 0.41912841796875, 0.4703369140625, 0.52154541015625, 0.57275390625, 0.62396240234375, 0.6751708984375, 0.72637939453125, 0.777587890625, 0.82879638671875, 0.8800048828125, 0.93121337890625, 0.982421875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 4.0, 1.0, 4.0, 16.0, 12.0, 9.0, 24.0, 43.0, 50.0, 108.0, 212.0, 447.0, 1626.0, 10193.0, 1577217.0, 2592209.0, 9945.0, 1516.0, 345.0, 133.0, 65.0, 41.0, 29.0, 17.0, 7.0, 5.0, 4.0, 3.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.34375, -19.8814697265625, -19.419189453125, -18.9569091796875, -18.49462890625, -18.0323486328125, -17.570068359375, -17.1077880859375, -16.6455078125, -16.1832275390625, -15.720947265625, -15.2586669921875, -14.79638671875, -14.3341064453125, -13.871826171875, -13.4095458984375, -12.947265625, -12.4849853515625, -12.022705078125, -11.5604248046875, -11.09814453125, -10.6358642578125, -10.173583984375, -9.7113037109375, -9.2490234375, -8.7867431640625, -8.324462890625, -7.8621826171875, -7.39990234375, -6.9376220703125, -6.475341796875, -6.0130615234375, -5.55078125, -5.0885009765625, -4.626220703125, -4.1639404296875, -3.70166015625, -3.2393798828125, -2.777099609375, -2.3148193359375, -1.8525390625, -1.3902587890625, -0.927978515625, -0.4656982421875, -0.00341796875, 0.4588623046875, 0.921142578125, 1.3834228515625, 1.845703125, 2.3079833984375, 2.770263671875, 3.2325439453125, 3.69482421875, 4.1571044921875, 4.619384765625, 5.0816650390625, 5.5439453125, 6.0062255859375, 6.468505859375, 6.9307861328125, 7.39306640625, 7.8553466796875, 8.317626953125, 8.7799072265625, 9.2421875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 5.0, 1.0, 1.0, 2.0, 1.0, 7.0, 6.0, 10.0, 25.0, 36.0, 46.0, 95.0, 247.0, 2262.0, 976.0, 172.0, 89.0, 41.0, 21.0, 14.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.75390625, -3.6738433837890625, -3.593780517578125, -3.5137176513671875, -3.43365478515625, -3.3535919189453125, -3.273529052734375, -3.1934661865234375, -3.1134033203125, -3.0333404541015625, -2.953277587890625, -2.8732147216796875, -2.79315185546875, -2.7130889892578125, -2.633026123046875, -2.5529632568359375, -2.472900390625, -2.3928375244140625, -2.312774658203125, -2.2327117919921875, -2.15264892578125, -2.0725860595703125, -1.992523193359375, -1.9124603271484375, -1.8323974609375, -1.7523345947265625, -1.672271728515625, -1.5922088623046875, -1.51214599609375, -1.4320831298828125, -1.352020263671875, -1.2719573974609375, -1.19189453125, -1.1118316650390625, -1.031768798828125, -0.9517059326171875, -0.87164306640625, -0.7915802001953125, -0.711517333984375, -0.6314544677734375, -0.5513916015625, -0.4713287353515625, -0.391265869140625, -0.3112030029296875, -0.23114013671875, -0.1510772705078125, -0.071014404296875, 0.0090484619140625, 0.089111328125, 0.1691741943359375, 0.249237060546875, 0.3292999267578125, 0.40936279296875, 0.4894256591796875, 0.569488525390625, 0.6495513916015625, 0.7296142578125, 0.8096771240234375, 0.889739990234375, 0.9698028564453125, 1.04986572265625, 1.1299285888671875, 1.209991455078125, 1.2900543212890625, 1.3701171875]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 8.0, 14.0, 42.0, 92.0, 300.0, 343.0, 132.0, 40.0, 19.0, 10.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-20.79538917541504, -20.381046295166016, -19.96670150756836, -19.552358627319336, -19.138015747070312, -18.723670959472656, -18.309328079223633, -17.89498519897461, -17.480640411376953, -17.06629753112793, -16.651952743530273, -16.23760986328125, -15.82326602935791, -15.408923149108887, -14.994579315185547, -14.580236434936523, -14.1658935546875, -13.75154972076416, -13.337206840515137, -12.922863006591797, -12.508519172668457, -12.094176292419434, -11.679832458496094, -11.26548957824707, -10.851144790649414, -10.436800956726074, -10.02245807647705, -9.608114242553711, -9.193770408630371, -8.779427528381348, -8.365083694458008, -7.950740337371826, -7.536397457122803, -7.122054100036621, -6.707710266113281, -6.2933669090271, -5.879023551940918, -5.464679718017578, -5.0503363609313965, -4.635993003845215, -4.221649169921875, -3.8073055744171143, -3.3929622173309326, -2.978618621826172, -2.5642752647399902, -2.1499316692352295, -1.7355880737304688, -1.321244716644287, -0.9069013595581055, -0.4925578534603119, -0.07821434736251831, 0.33612918853759766, 0.7504726648330688, 1.16481614112854, 1.5791597366333008, 1.9935030937194824, 2.407846689224243, 2.822190284729004, 3.2365336418151855, 3.6508772373199463, 4.065220832824707, 4.479564189910889, 4.89390754699707, 5.30825138092041, 5.722594738006592]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 2.0, 1.0, 5.0, 10.0, 8.0, 8.0, 8.0, 16.0, 17.0, 20.0, 27.0, 21.0, 33.0, 39.0, 40.0, 41.0, 37.0, 36.0, 51.0, 41.0, 45.0, 48.0, 65.0, 48.0, 39.0, 34.0, 34.0, 33.0, 34.0, 23.0, 26.0, 28.0, 9.0, 13.0, 17.0, 11.0, 5.0, 7.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.436602592468262, -5.275496482849121, -5.1143903732299805, -4.95328426361084, -4.792178153991699, -4.631072521209717, -4.469966411590576, -4.3088603019714355, -4.147754192352295, -3.9866480827331543, -3.8255419731140137, -3.664436101913452, -3.5033299922943115, -3.342223882675171, -3.1811180114746094, -3.0200119018554688, -2.858905792236328, -2.6977996826171875, -2.536693572998047, -2.3755877017974854, -2.2144815921783447, -2.053375482559204, -1.892269492149353, -1.731163501739502, -1.5700573921203613, -1.4089512825012207, -1.2478452920913696, -1.0867393016815186, -0.9256331920623779, -0.7645271420478821, -0.6034210920333862, -0.44231510162353516, -0.28120899200439453, -0.12010294198989868, 0.04100310802459717, 0.20210915803909302, 0.36321520805358887, 0.5243212580680847, 0.6854273080825806, 0.8465332984924316, 1.0076394081115723, 1.168745517730713, 1.329851508140564, 1.490957498550415, 1.6520636081695557, 1.8131697177886963, 1.9742757081985474, 2.1353816986083984, 2.296487808227539, 2.4575939178466797, 2.6187000274658203, 2.779805898666382, 2.9409120082855225, 3.102018117904663, 3.2631239891052246, 3.4242300987243652, 3.585336208343506, 3.7464423179626465, 3.907548427581787, 4.068654537200928, 4.22976016998291, 4.390866279602051, 4.551972389221191, 4.713078498840332, 4.874184608459473]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 2.0, 9.0, 11.0, 16.0, 22.0, 18.0, 36.0, 61.0, 96.0, 179.0, 337.0, 666.0, 1645.0, 5504.0, 98169.0, 918031.0, 18741.0, 3037.0, 1000.0, 431.0, 205.0, 104.0, 83.0, 46.0, 18.0, 28.0, 17.0, 14.0, 7.0, 7.0, 4.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.953125, -12.56396484375, -12.1748046875, -11.78564453125, -11.396484375, -11.00732421875, -10.6181640625, -10.22900390625, -9.83984375, -9.45068359375, -9.0615234375, -8.67236328125, -8.283203125, -7.89404296875, -7.5048828125, -7.11572265625, -6.7265625, -6.33740234375, -5.9482421875, -5.55908203125, -5.169921875, -4.78076171875, -4.3916015625, -4.00244140625, -3.61328125, -3.22412109375, -2.8349609375, -2.44580078125, -2.056640625, -1.66748046875, -1.2783203125, -0.88916015625, -0.5, -0.11083984375, 0.2783203125, 0.66748046875, 1.056640625, 1.44580078125, 1.8349609375, 2.22412109375, 2.61328125, 3.00244140625, 3.3916015625, 3.78076171875, 4.169921875, 4.55908203125, 4.9482421875, 5.33740234375, 5.7265625, 6.11572265625, 6.5048828125, 6.89404296875, 7.283203125, 7.67236328125, 8.0615234375, 8.45068359375, 8.83984375, 9.22900390625, 9.6181640625, 10.00732421875, 10.396484375, 10.78564453125, 11.1748046875, 11.56396484375, 11.953125]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 11.0, 21.0, 55.0, 114.0, 164.0, 191.0, 191.0, 116.0, 69.0, 40.0, 11.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.177734375, -2.1287765502929688, -2.0798187255859375, -2.0308609008789062, -1.981903076171875, -1.9329452514648438, -1.8839874267578125, -1.8350296020507812, -1.78607177734375, -1.7371139526367188, -1.6881561279296875, -1.6391983032226562, -1.590240478515625, -1.5412826538085938, -1.4923248291015625, -1.4433670043945312, -1.3944091796875, -1.3454513549804688, -1.2964935302734375, -1.2475357055664062, -1.198577880859375, -1.1496200561523438, -1.1006622314453125, -1.0517044067382812, -1.00274658203125, -0.9537887573242188, -0.9048309326171875, -0.8558731079101562, -0.806915283203125, -0.7579574584960938, -0.7089996337890625, -0.6600418090820312, -0.611083984375, -0.5621261596679688, -0.5131683349609375, -0.46421051025390625, -0.415252685546875, -0.36629486083984375, -0.3173370361328125, -0.26837921142578125, -0.21942138671875, -0.17046356201171875, -0.1215057373046875, -0.07254791259765625, -0.023590087890625, 0.02536773681640625, 0.0743255615234375, 0.12328338623046875, 0.1722412109375, 0.22119903564453125, 0.2701568603515625, 0.31911468505859375, 0.368072509765625, 0.41703033447265625, 0.4659881591796875, 0.5149459838867188, 0.56390380859375, 0.6128616333007812, 0.6618194580078125, 0.7107772827148438, 0.759735107421875, 0.8086929321289062, 0.8576507568359375, 0.9066085815429688, 0.95556640625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 7.0, 7.0, 3.0, 4.0, 9.0, 4.0, 10.0, 4.0, 9.0, 21.0, 23.0, 23.0, 26.0, 43.0, 58.0, 80.0, 129.0, 221.0, 374.0, 767.0, 2012.0, 7279.0, 41879.0, 538411.0, 414507.0, 33242.0, 6052.0, 1700.0, 736.0, 319.0, 208.0, 107.0, 79.0, 50.0, 24.0, 28.0, 19.0, 17.0, 10.0, 9.0, 10.0, 8.0, 6.0, 7.0, 3.0, 6.0, 1.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0], "bins": [-7.33203125, -7.1025390625, -6.873046875, -6.6435546875, -6.4140625, -6.1845703125, -5.955078125, -5.7255859375, -5.49609375, -5.2666015625, -5.037109375, -4.8076171875, -4.578125, -4.3486328125, -4.119140625, -3.8896484375, -3.66015625, -3.4306640625, -3.201171875, -2.9716796875, -2.7421875, -2.5126953125, -2.283203125, -2.0537109375, -1.82421875, -1.5947265625, -1.365234375, -1.1357421875, -0.90625, -0.6767578125, -0.447265625, -0.2177734375, 0.01171875, 0.2412109375, 0.470703125, 0.7001953125, 0.9296875, 1.1591796875, 1.388671875, 1.6181640625, 1.84765625, 2.0771484375, 2.306640625, 2.5361328125, 2.765625, 2.9951171875, 3.224609375, 3.4541015625, 3.68359375, 3.9130859375, 4.142578125, 4.3720703125, 4.6015625, 4.8310546875, 5.060546875, 5.2900390625, 5.51953125, 5.7490234375, 5.978515625, 6.2080078125, 6.4375, 6.6669921875, 6.896484375, 7.1259765625, 7.35546875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 7.0, 3.0, 7.0, 7.0, 15.0, 8.0, 12.0, 16.0, 17.0, 28.0, 28.0, 29.0, 41.0, 33.0, 30.0, 49.0, 46.0, 52.0, 37.0, 53.0, 48.0, 44.0, 52.0, 46.0, 35.0, 45.0, 26.0, 40.0, 22.0, 23.0, 17.0, 22.0, 16.0, 9.0, 10.0, 6.0, 5.0, 8.0, 5.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.5390625, -3.421478271484375, -3.30389404296875, -3.186309814453125, -3.0687255859375, -2.951141357421875, -2.83355712890625, -2.715972900390625, -2.598388671875, -2.480804443359375, -2.36322021484375, -2.245635986328125, -2.1280517578125, -2.010467529296875, -1.89288330078125, -1.775299072265625, -1.65771484375, -1.540130615234375, -1.42254638671875, -1.304962158203125, -1.1873779296875, -1.069793701171875, -0.95220947265625, -0.834625244140625, -0.717041015625, -0.599456787109375, -0.48187255859375, -0.364288330078125, -0.2467041015625, -0.129119873046875, -0.01153564453125, 0.106048583984375, 0.2236328125, 0.341217041015625, 0.45880126953125, 0.576385498046875, 0.6939697265625, 0.811553955078125, 0.92913818359375, 1.046722412109375, 1.164306640625, 1.281890869140625, 1.39947509765625, 1.517059326171875, 1.6346435546875, 1.752227783203125, 1.86981201171875, 1.987396240234375, 2.10498046875, 2.222564697265625, 2.34014892578125, 2.457733154296875, 2.5753173828125, 2.692901611328125, 2.81048583984375, 2.928070068359375, 3.045654296875, 3.163238525390625, 3.28082275390625, 3.398406982421875, 3.5159912109375, 3.633575439453125, 3.75115966796875, 3.868743896484375, 3.986328125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 6.0, 2.0, 6.0, 8.0, 8.0, 26.0, 35.0, 69.0, 150.0, 354.0, 1057.0, 5428.0, 176480.0, 845112.0, 16939.0, 1881.0, 539.0, 202.0, 123.0, 59.0, 33.0, 14.0, 14.0, 5.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.48828125, -4.36083984375, -4.2333984375, -4.10595703125, -3.978515625, -3.85107421875, -3.7236328125, -3.59619140625, -3.46875, -3.34130859375, -3.2138671875, -3.08642578125, -2.958984375, -2.83154296875, -2.7041015625, -2.57666015625, -2.44921875, -2.32177734375, -2.1943359375, -2.06689453125, -1.939453125, -1.81201171875, -1.6845703125, -1.55712890625, -1.4296875, -1.30224609375, -1.1748046875, -1.04736328125, -0.919921875, -0.79248046875, -0.6650390625, -0.53759765625, -0.41015625, -0.28271484375, -0.1552734375, -0.02783203125, 0.099609375, 0.22705078125, 0.3544921875, 0.48193359375, 0.609375, 0.73681640625, 0.8642578125, 0.99169921875, 1.119140625, 1.24658203125, 1.3740234375, 1.50146484375, 1.62890625, 1.75634765625, 1.8837890625, 2.01123046875, 2.138671875, 2.26611328125, 2.3935546875, 2.52099609375, 2.6484375, 2.77587890625, 2.9033203125, 3.03076171875, 3.158203125, 3.28564453125, 3.4130859375, 3.54052734375, 3.66796875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 5.0, 8.0, 4.0, 8.0, 11.0, 16.0, 18.0, 20.0, 32.0, 40.0, 56.0, 55.0, 89.0, 107.0, 110.0, 100.0, 85.0, 53.0, 49.0, 25.0, 23.0, 20.0, 16.0, 9.0, 11.0, 7.0, 8.0, 2.0, 4.0, 3.0, 9.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0001691579818725586, -0.00016393326222896576, -0.00015870854258537292, -0.0001534838229417801, -0.00014825910329818726, -0.00014303438365459442, -0.0001378096640110016, -0.00013258494436740875, -0.00012736022472381592, -0.00012213550508022308, -0.00011691078543663025, -0.00011168606579303741, -0.00010646134614944458, -0.00010123662650585175, -9.601190686225891e-05, -9.078718721866608e-05, -8.556246757507324e-05, -8.033774793148041e-05, -7.511302828788757e-05, -6.988830864429474e-05, -6.46635890007019e-05, -5.943886935710907e-05, -5.4214149713516235e-05, -4.89894300699234e-05, -4.3764710426330566e-05, -3.853999078273773e-05, -3.33152711391449e-05, -2.8090551495552063e-05, -2.286583185195923e-05, -1.7641112208366394e-05, -1.241639256477356e-05, -7.191672921180725e-06, -1.9669532775878906e-06, 3.257766366004944e-06, 8.482486009597778e-06, 1.3707205653190613e-05, 1.8931925296783447e-05, 2.4156644940376282e-05, 2.9381364583969116e-05, 3.460608422756195e-05, 3.9830803871154785e-05, 4.505552351474762e-05, 5.0280243158340454e-05, 5.550496280193329e-05, 6.072968244552612e-05, 6.595440208911896e-05, 7.117912173271179e-05, 7.640384137630463e-05, 8.162856101989746e-05, 8.68532806634903e-05, 9.207800030708313e-05, 9.730271995067596e-05, 0.0001025274395942688, 0.00010775215923786163, 0.00011297687888145447, 0.0001182015985250473, 0.00012342631816864014, 0.00012865103781223297, 0.0001338757574558258, 0.00013910047709941864, 0.00014432519674301147, 0.0001495499163866043, 0.00015477463603019714, 0.00015999935567378998, 0.0001652240753173828]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 5.0, 3.0, 1.0, 10.0, 10.0, 15.0, 26.0, 50.0, 100.0, 276.0, 836.0, 4815.0, 296575.0, 736439.0, 7674.0, 1136.0, 315.0, 135.0, 55.0, 34.0, 23.0, 7.0, 9.0, 13.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.859375, -3.6763916015625, -3.493408203125, -3.3104248046875, -3.12744140625, -2.9444580078125, -2.761474609375, -2.5784912109375, -2.3955078125, -2.2125244140625, -2.029541015625, -1.8465576171875, -1.66357421875, -1.4805908203125, -1.297607421875, -1.1146240234375, -0.931640625, -0.7486572265625, -0.565673828125, -0.3826904296875, -0.19970703125, -0.0167236328125, 0.166259765625, 0.3492431640625, 0.5322265625, 0.7152099609375, 0.898193359375, 1.0811767578125, 1.26416015625, 1.4471435546875, 1.630126953125, 1.8131103515625, 1.99609375, 2.1790771484375, 2.362060546875, 2.5450439453125, 2.72802734375, 2.9110107421875, 3.093994140625, 3.2769775390625, 3.4599609375, 3.6429443359375, 3.825927734375, 4.0089111328125, 4.19189453125, 4.3748779296875, 4.557861328125, 4.7408447265625, 4.923828125, 5.1068115234375, 5.289794921875, 5.4727783203125, 5.65576171875, 5.8387451171875, 6.021728515625, 6.2047119140625, 6.3876953125, 6.5706787109375, 6.753662109375, 6.9366455078125, 7.11962890625, 7.3026123046875, 7.485595703125, 7.6685791015625, 7.8515625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 1.0, 4.0, 8.0, 12.0, 21.0, 28.0, 54.0, 61.0, 91.0, 151.0, 147.0, 127.0, 105.0, 72.0, 45.0, 28.0, 21.0, 15.0, 7.0, 7.0, 5.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.580078125, -1.50323486328125, -1.4263916015625, -1.34954833984375, -1.272705078125, -1.19586181640625, -1.1190185546875, -1.04217529296875, -0.96533203125, -0.88848876953125, -0.8116455078125, -0.73480224609375, -0.657958984375, -0.58111572265625, -0.5042724609375, -0.42742919921875, -0.3505859375, -0.27374267578125, -0.1968994140625, -0.12005615234375, -0.043212890625, 0.03363037109375, 0.1104736328125, 0.18731689453125, 0.26416015625, 0.34100341796875, 0.4178466796875, 0.49468994140625, 0.571533203125, 0.64837646484375, 0.7252197265625, 0.80206298828125, 0.87890625, 0.95574951171875, 1.0325927734375, 1.10943603515625, 1.186279296875, 1.26312255859375, 1.3399658203125, 1.41680908203125, 1.49365234375, 1.57049560546875, 1.6473388671875, 1.72418212890625, 1.801025390625, 1.87786865234375, 1.9547119140625, 2.03155517578125, 2.1083984375, 2.18524169921875, 2.2620849609375, 2.33892822265625, 2.415771484375, 2.49261474609375, 2.5694580078125, 2.64630126953125, 2.72314453125, 2.79998779296875, 2.8768310546875, 2.95367431640625, 3.030517578125, 3.10736083984375, 3.1842041015625, 3.26104736328125, 3.337890625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 9.0, 52.0, 472.0, 431.0, 37.0, 11.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.870460510253906, -30.08580780029297, -26.30115509033203, -22.516504287719727, -18.73185157775879, -14.947198867797852, -11.162548065185547, -7.377895355224609, -3.593242645263672, 0.19140958786010742, 3.9760618209838867, 7.760713577270508, 11.545366287231445, 15.330018997192383, 19.114669799804688, 22.899322509765625, 26.683975219726562, 30.4686279296875, 34.25328063964844, 38.037933349609375, 41.82258605957031, 45.60723876953125, 49.39188766479492, 53.17654037475586, 56.9611930847168, 60.745845794677734, 64.5304946899414, 68.31514739990234, 72.09980010986328, 75.88445281982422, 79.66910552978516, 83.4537582397461, 87.2384033203125, 91.02305603027344, 94.80770874023438, 98.59236145019531, 102.37701416015625, 106.16166687011719, 109.94631958007812, 113.73097229003906, 117.515625, 121.30027770996094, 125.08493041992188, 128.8695831298828, 132.65423583984375, 136.4388885498047, 140.22354125976562, 144.00819396972656, 147.7928466796875, 151.57749938964844, 155.36215209960938, 159.1468048095703, 162.93145751953125, 166.7161102294922, 170.50076293945312, 174.28541564941406, 178.07005310058594, 181.85470581054688, 185.6393585205078, 189.42401123046875, 193.2086639404297, 196.99331665039062, 200.77796936035156, 204.5626220703125, 208.34727478027344]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 9.0, 3.0, 6.0, 2.0, 4.0, 3.0, 2.0, 7.0, 4.0, 10.0, 13.0, 22.0, 23.0, 20.0, 30.0, 32.0, 41.0, 39.0, 27.0, 46.0, 61.0, 57.0, 65.0, 41.0, 41.0, 41.0, 46.0, 38.0, 39.0, 23.0, 39.0, 36.0, 25.0, 19.0, 23.0, 23.0, 12.0, 11.0, 11.0, 5.0, 3.0, 4.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.824403762817383, -21.04537582397461, -20.266345977783203, -19.48731803894043, -18.708288192749023, -17.92926025390625, -17.150230407714844, -16.37120246887207, -15.592172622680664, -14.813143730163574, -14.034114837646484, -13.255085945129395, -12.476057052612305, -11.697028160095215, -10.917999267578125, -10.138971328735352, -9.359942436218262, -8.580913543701172, -7.801884651184082, -7.022855758666992, -6.243826866149902, -5.4647979736328125, -4.685769557952881, -3.906740665435791, -3.127711772918701, -2.3486828804016113, -1.569654107093811, -0.7906253337860107, -0.011596441268920898, 0.767432451248169, 1.5464611053466797, 2.3254899978637695, 3.1045188903808594, 3.883547782897949, 4.662576675415039, 5.441605567932129, 6.220634460449219, 6.999663352966309, 7.77869176864624, 8.557720184326172, 9.336750030517578, 10.115778923034668, 10.894807815551758, 11.673836708068848, 12.452865600585938, 13.231894493103027, 14.010923385620117, 14.78995132446289, 15.56898021697998, 16.34800910949707, 17.127037048339844, 17.90606689453125, 18.685094833374023, 19.46412467956543, 20.243152618408203, 21.02218246459961, 21.801210403442383, 22.580238342285156, 23.359268188476562, 24.138296127319336, 24.917325973510742, 25.696353912353516, 26.475383758544922, 27.254411697387695, 28.0334415435791]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 6.0, 3.0, 4.0, 5.0, 2.0, 4.0, 9.0, 7.0, 18.0, 20.0, 21.0, 28.0, 30.0, 34.0, 59.0, 99.0, 128.0, 248.0, 341.0, 745.0, 1533.0, 3721.0, 17996.0, 3418532.0, 731802.0, 14593.0, 2715.0, 893.0, 350.0, 166.0, 65.0, 31.0, 26.0, 14.0, 11.0, 7.0, 8.0, 2.0, 6.0, 0.0, 3.0, 2.0, 2.0], "bins": [-15.0859375, -14.7503662109375, -14.414794921875, -14.0792236328125, -13.74365234375, -13.4080810546875, -13.072509765625, -12.7369384765625, -12.4013671875, -12.0657958984375, -11.730224609375, -11.3946533203125, -11.05908203125, -10.7235107421875, -10.387939453125, -10.0523681640625, -9.716796875, -9.3812255859375, -9.045654296875, -8.7100830078125, -8.37451171875, -8.0389404296875, -7.703369140625, -7.3677978515625, -7.0322265625, -6.6966552734375, -6.361083984375, -6.0255126953125, -5.68994140625, -5.3543701171875, -5.018798828125, -4.6832275390625, -4.34765625, -4.0120849609375, -3.676513671875, -3.3409423828125, -3.00537109375, -2.6697998046875, -2.334228515625, -1.9986572265625, -1.6630859375, -1.3275146484375, -0.991943359375, -0.6563720703125, -0.32080078125, 0.0147705078125, 0.350341796875, 0.6859130859375, 1.021484375, 1.3570556640625, 1.692626953125, 2.0281982421875, 2.36376953125, 2.6993408203125, 3.034912109375, 3.3704833984375, 3.7060546875, 4.0416259765625, 4.377197265625, 4.7127685546875, 5.04833984375, 5.3839111328125, 5.719482421875, 6.0550537109375, 6.390625]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 5.0, 8.0, 16.0, 29.0, 40.0, 69.0, 115.0, 132.0, 148.0, 139.0, 124.0, 82.0, 38.0, 31.0, 14.0, 7.0, 2.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.251953125, -2.2012100219726562, -2.1504669189453125, -2.0997238159179688, -2.048980712890625, -1.9982376098632812, -1.9474945068359375, -1.8967514038085938, -1.84600830078125, -1.7952651977539062, -1.7445220947265625, -1.6937789916992188, -1.643035888671875, -1.5922927856445312, -1.5415496826171875, -1.4908065795898438, -1.4400634765625, -1.3893203735351562, -1.3385772705078125, -1.2878341674804688, -1.237091064453125, -1.1863479614257812, -1.1356048583984375, -1.0848617553710938, -1.03411865234375, -0.9833755493164062, -0.9326324462890625, -0.8818893432617188, -0.831146240234375, -0.7804031372070312, -0.7296600341796875, -0.6789169311523438, -0.628173828125, -0.5774307250976562, -0.5266876220703125, -0.47594451904296875, -0.425201416015625, -0.37445831298828125, -0.3237152099609375, -0.27297210693359375, -0.22222900390625, -0.17148590087890625, -0.1207427978515625, -0.06999969482421875, -0.019256591796875, 0.03148651123046875, 0.0822296142578125, 0.13297271728515625, 0.1837158203125, 0.23445892333984375, 0.2852020263671875, 0.33594512939453125, 0.386688232421875, 0.43743133544921875, 0.4881744384765625, 0.5389175415039062, 0.58966064453125, 0.6404037475585938, 0.6911468505859375, 0.7418899536132812, 0.792633056640625, 0.8433761596679688, 0.8941192626953125, 0.9448623657226562, 0.99560546875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 4.0, 8.0, 11.0, 22.0, 28.0, 62.0, 97.0, 196.0, 432.0, 971.0, 2644.0, 11263.0, 135526.0, 3972864.0, 59594.0, 7257.0, 1894.0, 735.0, 325.0, 163.0, 80.0, 44.0, 23.0, 11.0, 9.0, 3.0, 6.0, 4.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.4609375, -8.182373046875, -7.90380859375, -7.625244140625, -7.3466796875, -7.068115234375, -6.78955078125, -6.510986328125, -6.232421875, -5.953857421875, -5.67529296875, -5.396728515625, -5.1181640625, -4.839599609375, -4.56103515625, -4.282470703125, -4.00390625, -3.725341796875, -3.44677734375, -3.168212890625, -2.8896484375, -2.611083984375, -2.33251953125, -2.053955078125, -1.775390625, -1.496826171875, -1.21826171875, -0.939697265625, -0.6611328125, -0.382568359375, -0.10400390625, 0.174560546875, 0.453125, 0.731689453125, 1.01025390625, 1.288818359375, 1.5673828125, 1.845947265625, 2.12451171875, 2.403076171875, 2.681640625, 2.960205078125, 3.23876953125, 3.517333984375, 3.7958984375, 4.074462890625, 4.35302734375, 4.631591796875, 4.91015625, 5.188720703125, 5.46728515625, 5.745849609375, 6.0244140625, 6.302978515625, 6.58154296875, 6.860107421875, 7.138671875, 7.417236328125, 7.69580078125, 7.974365234375, 8.2529296875, 8.531494140625, 8.81005859375, 9.088623046875, 9.3671875]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 9.0, 3.0, 6.0, 13.0, 18.0, 19.0, 31.0, 40.0, 74.0, 158.0, 450.0, 2375.0, 492.0, 152.0, 73.0, 57.0, 37.0, 17.0, 13.0, 13.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.990234375, -1.9271240234375, -1.864013671875, -1.8009033203125, -1.73779296875, -1.6746826171875, -1.611572265625, -1.5484619140625, -1.4853515625, -1.4222412109375, -1.359130859375, -1.2960205078125, -1.23291015625, -1.1697998046875, -1.106689453125, -1.0435791015625, -0.98046875, -0.9173583984375, -0.854248046875, -0.7911376953125, -0.72802734375, -0.6649169921875, -0.601806640625, -0.5386962890625, -0.4755859375, -0.4124755859375, -0.349365234375, -0.2862548828125, -0.22314453125, -0.1600341796875, -0.096923828125, -0.0338134765625, 0.029296875, 0.0924072265625, 0.155517578125, 0.2186279296875, 0.28173828125, 0.3448486328125, 0.407958984375, 0.4710693359375, 0.5341796875, 0.5972900390625, 0.660400390625, 0.7235107421875, 0.78662109375, 0.8497314453125, 0.912841796875, 0.9759521484375, 1.0390625, 1.1021728515625, 1.165283203125, 1.2283935546875, 1.29150390625, 1.3546142578125, 1.417724609375, 1.4808349609375, 1.5439453125, 1.6070556640625, 1.670166015625, 1.7332763671875, 1.79638671875, 1.8594970703125, 1.922607421875, 1.9857177734375, 2.048828125]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 4.0, 13.0, 20.0, 29.0, 66.0, 159.0, 216.0, 228.0, 140.0, 62.0, 25.0, 13.0, 17.0, 8.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.367212295532227, -6.088510990142822, -5.80980920791626, -5.5311079025268555, -5.252406597137451, -4.973705291748047, -4.695003509521484, -4.41630220413208, -4.137600898742676, -3.8588993549346924, -3.580198049545288, -3.3014965057373047, -3.0227952003479004, -2.744093656539917, -2.4653921127319336, -2.1866908073425293, -1.9079890251159668, -1.629287600517273, -1.350586175918579, -1.0718846321105957, -0.7931832075119019, -0.514481782913208, -0.2357802391052246, 0.04292118549346924, 0.3216226100921631, 0.6003240346908569, 0.8790255188941956, 1.1577270030975342, 1.436428427696228, 1.7151298522949219, 1.9938313961029053, 2.2725329399108887, 2.551234245300293, 2.8299357891082764, 3.1086370944976807, 3.387338638305664, 3.6660399436950684, 3.9447414875030518, 4.223443031311035, 4.5021443367004395, 4.780845642089844, 5.059546947479248, 5.3382487297058105, 5.616950035095215, 5.895651340484619, 6.174352645874023, 6.453054428100586, 6.73175573348999, 7.010457515716553, 7.289158821105957, 7.5678606033325195, 7.846561908721924, 8.125263214111328, 8.40396499633789, 8.682666778564453, 8.9613676071167, 9.240069389343262, 9.518771171569824, 9.79747200012207, 10.076173782348633, 10.354875564575195, 10.633576393127441, 10.912278175354004, 11.190979957580566, 11.469680786132812]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 0.0, 5.0, 5.0, 3.0, 10.0, 6.0, 14.0, 9.0, 17.0, 13.0, 19.0, 21.0, 30.0, 27.0, 30.0, 42.0, 39.0, 31.0, 48.0, 35.0, 27.0, 34.0, 27.0, 44.0, 39.0, 37.0, 34.0, 31.0, 33.0, 39.0, 33.0, 28.0, 30.0, 30.0, 19.0, 13.0, 16.0, 18.0, 10.0, 15.0, 8.0, 10.0, 9.0, 1.0, 3.0, 2.0, 4.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.42619514465332, -4.284749984741211, -4.143304824829102, -4.001859188079834, -3.8604140281677246, -3.7189688682556152, -3.5775234699249268, -3.4360780715942383, -3.294632911682129, -3.1531877517700195, -3.011742353439331, -2.8702969551086426, -2.728851795196533, -2.587406635284424, -2.4459612369537354, -2.304515838623047, -2.1630706787109375, -2.021625518798828, -1.8801801204681396, -1.7387348413467407, -1.5972895622253418, -1.4558442831039429, -1.314399003982544, -1.172953724861145, -1.031508445739746, -0.8900631666183472, -0.7486178874969482, -0.6071726083755493, -0.4657273292541504, -0.32428205013275146, -0.18283677101135254, -0.04139149188995361, 0.10005378723144531, 0.24149906635284424, 0.38294434547424316, 0.5243896245956421, 0.665834903717041, 0.8072801828384399, 0.9487254619598389, 1.0901707410812378, 1.2316160202026367, 1.3730612993240356, 1.5145065784454346, 1.6559518575668335, 1.7973971366882324, 1.9388424158096313, 2.0802876949310303, 2.2217330932617188, 2.363178253173828, 2.5046234130859375, 2.646068811416626, 2.7875142097473145, 2.928959369659424, 3.070404529571533, 3.2118499279022217, 3.35329532623291, 3.4947404861450195, 3.636185646057129, 3.7776310443878174, 3.919076442718506, 4.060521602630615, 4.201966762542725, 4.343412399291992, 4.484857559204102, 4.626302719116211]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 10.0, 6.0, 12.0, 13.0, 9.0, 26.0, 21.0, 37.0, 44.0, 57.0, 103.0, 146.0, 195.0, 278.0, 467.0, 793.0, 1371.0, 3182.0, 11432.0, 65076.0, 592767.0, 323502.0, 36128.0, 7426.0, 2363.0, 1106.0, 644.0, 428.0, 294.0, 193.0, 109.0, 74.0, 57.0, 40.0, 37.0, 25.0, 32.0, 8.0, 14.0, 9.0, 9.0, 5.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0], "bins": [-5.7265625, -5.557373046875, -5.38818359375, -5.218994140625, -5.0498046875, -4.880615234375, -4.71142578125, -4.542236328125, -4.373046875, -4.203857421875, -4.03466796875, -3.865478515625, -3.6962890625, -3.527099609375, -3.35791015625, -3.188720703125, -3.01953125, -2.850341796875, -2.68115234375, -2.511962890625, -2.3427734375, -2.173583984375, -2.00439453125, -1.835205078125, -1.666015625, -1.496826171875, -1.32763671875, -1.158447265625, -0.9892578125, -0.820068359375, -0.65087890625, -0.481689453125, -0.3125, -0.143310546875, 0.02587890625, 0.195068359375, 0.3642578125, 0.533447265625, 0.70263671875, 0.871826171875, 1.041015625, 1.210205078125, 1.37939453125, 1.548583984375, 1.7177734375, 1.886962890625, 2.05615234375, 2.225341796875, 2.39453125, 2.563720703125, 2.73291015625, 2.902099609375, 3.0712890625, 3.240478515625, 3.40966796875, 3.578857421875, 3.748046875, 3.917236328125, 4.08642578125, 4.255615234375, 4.4248046875, 4.593994140625, 4.76318359375, 4.932373046875, 5.1015625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 11.0, 28.0, 40.0, 64.0, 99.0, 144.0, 148.0, 145.0, 108.0, 78.0, 63.0, 30.0, 15.0, 10.0, 7.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.279296875, -2.2292938232421875, -2.179290771484375, -2.1292877197265625, -2.07928466796875, -2.0292816162109375, -1.979278564453125, -1.9292755126953125, -1.8792724609375, -1.8292694091796875, -1.779266357421875, -1.7292633056640625, -1.67926025390625, -1.6292572021484375, -1.579254150390625, -1.5292510986328125, -1.479248046875, -1.4292449951171875, -1.379241943359375, -1.3292388916015625, -1.27923583984375, -1.2292327880859375, -1.179229736328125, -1.1292266845703125, -1.0792236328125, -1.0292205810546875, -0.979217529296875, -0.9292144775390625, -0.87921142578125, -0.8292083740234375, -0.779205322265625, -0.7292022705078125, -0.67919921875, -0.6291961669921875, -0.579193115234375, -0.5291900634765625, -0.47918701171875, -0.4291839599609375, -0.379180908203125, -0.3291778564453125, -0.2791748046875, -0.2291717529296875, -0.179168701171875, -0.1291656494140625, -0.07916259765625, -0.0291595458984375, 0.020843505859375, 0.0708465576171875, 0.120849609375, 0.1708526611328125, 0.220855712890625, 0.2708587646484375, 0.32086181640625, 0.3708648681640625, 0.420867919921875, 0.4708709716796875, 0.5208740234375, 0.5708770751953125, 0.620880126953125, 0.6708831787109375, 0.72088623046875, 0.7708892822265625, 0.820892333984375, 0.8708953857421875, 0.9208984375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 2.0, 5.0, 6.0, 6.0, 12.0, 16.0, 17.0, 21.0, 32.0, 37.0, 69.0, 76.0, 110.0, 197.0, 333.0, 560.0, 1136.0, 2669.0, 7762.0, 29026.0, 178786.0, 679566.0, 115427.0, 21965.0, 6173.0, 2304.0, 972.0, 463.0, 275.0, 165.0, 108.0, 75.0, 56.0, 34.0, 24.0, 21.0, 18.0, 6.0, 7.0, 8.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.70703125, -5.5252685546875, -5.343505859375, -5.1617431640625, -4.97998046875, -4.7982177734375, -4.616455078125, -4.4346923828125, -4.2529296875, -4.0711669921875, -3.889404296875, -3.7076416015625, -3.52587890625, -3.3441162109375, -3.162353515625, -2.9805908203125, -2.798828125, -2.6170654296875, -2.435302734375, -2.2535400390625, -2.07177734375, -1.8900146484375, -1.708251953125, -1.5264892578125, -1.3447265625, -1.1629638671875, -0.981201171875, -0.7994384765625, -0.61767578125, -0.4359130859375, -0.254150390625, -0.0723876953125, 0.109375, 0.2911376953125, 0.472900390625, 0.6546630859375, 0.83642578125, 1.0181884765625, 1.199951171875, 1.3817138671875, 1.5634765625, 1.7452392578125, 1.927001953125, 2.1087646484375, 2.29052734375, 2.4722900390625, 2.654052734375, 2.8358154296875, 3.017578125, 3.1993408203125, 3.381103515625, 3.5628662109375, 3.74462890625, 3.9263916015625, 4.108154296875, 4.2899169921875, 4.4716796875, 4.6534423828125, 4.835205078125, 5.0169677734375, 5.19873046875, 5.3804931640625, 5.562255859375, 5.7440185546875, 5.92578125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 2.0, 10.0, 2.0, 5.0, 6.0, 6.0, 10.0, 16.0, 17.0, 19.0, 30.0, 27.0, 27.0, 26.0, 49.0, 42.0, 50.0, 50.0, 59.0, 46.0, 45.0, 47.0, 57.0, 39.0, 43.0, 49.0, 40.0, 36.0, 33.0, 21.0, 13.0, 11.0, 16.0, 11.0, 11.0, 9.0, 8.0, 2.0, 5.0, 4.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.8125, -4.67315673828125, -4.5338134765625, -4.39447021484375, -4.255126953125, -4.11578369140625, -3.9764404296875, -3.83709716796875, -3.69775390625, -3.55841064453125, -3.4190673828125, -3.27972412109375, -3.140380859375, -3.00103759765625, -2.8616943359375, -2.72235107421875, -2.5830078125, -2.44366455078125, -2.3043212890625, -2.16497802734375, -2.025634765625, -1.88629150390625, -1.7469482421875, -1.60760498046875, -1.46826171875, -1.32891845703125, -1.1895751953125, -1.05023193359375, -0.910888671875, -0.77154541015625, -0.6322021484375, -0.49285888671875, -0.353515625, -0.21417236328125, -0.0748291015625, 0.06451416015625, 0.203857421875, 0.34320068359375, 0.4825439453125, 0.62188720703125, 0.76123046875, 0.90057373046875, 1.0399169921875, 1.17926025390625, 1.318603515625, 1.45794677734375, 1.5972900390625, 1.73663330078125, 1.8759765625, 2.01531982421875, 2.1546630859375, 2.29400634765625, 2.433349609375, 2.57269287109375, 2.7120361328125, 2.85137939453125, 2.99072265625, 3.13006591796875, 3.2694091796875, 3.40875244140625, 3.548095703125, 3.68743896484375, 3.8267822265625, 3.96612548828125, 4.10546875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 6.0, 11.0, 12.0, 15.0, 20.0, 28.0, 41.0, 79.0, 100.0, 163.0, 331.0, 677.0, 1458.0, 3581.0, 11665.0, 72371.0, 768172.0, 163102.0, 18095.0, 5050.0, 1827.0, 800.0, 391.0, 212.0, 121.0, 73.0, 43.0, 29.0, 22.0, 20.0, 13.0, 10.0, 6.0, 2.0, 5.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.857421875, -1.802215576171875, -1.74700927734375, -1.691802978515625, -1.6365966796875, -1.581390380859375, -1.52618408203125, -1.470977783203125, -1.415771484375, -1.360565185546875, -1.30535888671875, -1.250152587890625, -1.1949462890625, -1.139739990234375, -1.08453369140625, -1.029327392578125, -0.97412109375, -0.918914794921875, -0.86370849609375, -0.808502197265625, -0.7532958984375, -0.698089599609375, -0.64288330078125, -0.587677001953125, -0.532470703125, -0.477264404296875, -0.42205810546875, -0.366851806640625, -0.3116455078125, -0.256439208984375, -0.20123291015625, -0.146026611328125, -0.0908203125, -0.035614013671875, 0.01959228515625, 0.074798583984375, 0.1300048828125, 0.185211181640625, 0.24041748046875, 0.295623779296875, 0.350830078125, 0.406036376953125, 0.46124267578125, 0.516448974609375, 0.5716552734375, 0.626861572265625, 0.68206787109375, 0.737274169921875, 0.79248046875, 0.847686767578125, 0.90289306640625, 0.958099365234375, 1.0133056640625, 1.068511962890625, 1.12371826171875, 1.178924560546875, 1.234130859375, 1.289337158203125, 1.34454345703125, 1.399749755859375, 1.4549560546875, 1.510162353515625, 1.56536865234375, 1.620574951171875, 1.67578125]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 7.0, 4.0, 2.0, 11.0, 12.0, 7.0, 10.0, 18.0, 32.0, 37.0, 60.0, 65.0, 80.0, 108.0, 104.0, 119.0, 87.0, 75.0, 44.0, 32.0, 23.0, 18.0, 17.0, 9.0, 3.0, 2.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001747608184814453, -0.00016954168677330017, -0.00016432255506515503, -0.0001591034233570099, -0.00015388429164886475, -0.0001486651599407196, -0.00014344602823257446, -0.00013822689652442932, -0.00013300776481628418, -0.00012778863310813904, -0.0001225695013999939, -0.00011735036969184875, -0.00011213123798370361, -0.00010691210627555847, -0.00010169297456741333, -9.647384285926819e-05, -9.125471115112305e-05, -8.60355794429779e-05, -8.081644773483276e-05, -7.559731602668762e-05, -7.037818431854248e-05, -6.515905261039734e-05, -5.99399209022522e-05, -5.4720789194107056e-05, -4.9501657485961914e-05, -4.428252577781677e-05, -3.906339406967163e-05, -3.384426236152649e-05, -2.8625130653381348e-05, -2.3405998945236206e-05, -1.8186867237091064e-05, -1.2967735528945923e-05, -7.748603820800781e-06, -2.5294721126556396e-06, 2.689659595489502e-06, 7.908791303634644e-06, 1.3127923011779785e-05, 1.8347054719924927e-05, 2.356618642807007e-05, 2.878531813621521e-05, 3.400444984436035e-05, 3.922358155250549e-05, 4.4442713260650635e-05, 4.9661844968795776e-05, 5.488097667694092e-05, 6.010010838508606e-05, 6.53192400932312e-05, 7.053837180137634e-05, 7.575750350952148e-05, 8.097663521766663e-05, 8.619576692581177e-05, 9.141489863395691e-05, 9.663403034210205e-05, 0.00010185316205024719, 0.00010707229375839233, 0.00011229142546653748, 0.00011751055717468262, 0.00012272968888282776, 0.0001279488205909729, 0.00013316795229911804, 0.00013838708400726318, 0.00014360621571540833, 0.00014882534742355347, 0.0001540444791316986, 0.00015926361083984375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 5.0, 3.0, 13.0, 24.0, 18.0, 22.0, 37.0, 66.0, 121.0, 191.0, 420.0, 918.0, 2602.0, 9819.0, 71547.0, 806281.0, 136755.0, 13926.0, 3500.0, 1214.0, 476.0, 225.0, 131.0, 83.0, 54.0, 37.0, 17.0, 9.0, 10.0, 8.0, 4.0, 6.0, 3.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.900390625, -1.836212158203125, -1.77203369140625, -1.707855224609375, -1.6436767578125, -1.579498291015625, -1.51531982421875, -1.451141357421875, -1.386962890625, -1.322784423828125, -1.25860595703125, -1.194427490234375, -1.1302490234375, -1.066070556640625, -1.00189208984375, -0.937713623046875, -0.87353515625, -0.809356689453125, -0.74517822265625, -0.680999755859375, -0.6168212890625, -0.552642822265625, -0.48846435546875, -0.424285888671875, -0.360107421875, -0.295928955078125, -0.23175048828125, -0.167572021484375, -0.1033935546875, -0.039215087890625, 0.02496337890625, 0.089141845703125, 0.1533203125, 0.217498779296875, 0.28167724609375, 0.345855712890625, 0.4100341796875, 0.474212646484375, 0.53839111328125, 0.602569580078125, 0.666748046875, 0.730926513671875, 0.79510498046875, 0.859283447265625, 0.9234619140625, 0.987640380859375, 1.05181884765625, 1.115997314453125, 1.18017578125, 1.244354248046875, 1.30853271484375, 1.372711181640625, 1.4368896484375, 1.501068115234375, 1.56524658203125, 1.629425048828125, 1.693603515625, 1.757781982421875, 1.82196044921875, 1.886138916015625, 1.9503173828125, 2.014495849609375, 2.07867431640625, 2.142852783203125, 2.20703125]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 9.0, 8.0, 15.0, 16.0, 28.0, 51.0, 69.0, 65.0, 121.0, 123.0, 109.0, 104.0, 69.0, 57.0, 52.0, 29.0, 18.0, 9.0, 12.0, 9.0, 7.0, 1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2822265625, -1.237762451171875, -1.19329833984375, -1.148834228515625, -1.1043701171875, -1.059906005859375, -1.01544189453125, -0.970977783203125, -0.926513671875, -0.882049560546875, -0.83758544921875, -0.793121337890625, -0.7486572265625, -0.704193115234375, -0.65972900390625, -0.615264892578125, -0.57080078125, -0.526336669921875, -0.48187255859375, -0.437408447265625, -0.3929443359375, -0.348480224609375, -0.30401611328125, -0.259552001953125, -0.215087890625, -0.170623779296875, -0.12615966796875, -0.081695556640625, -0.0372314453125, 0.007232666015625, 0.05169677734375, 0.096160888671875, 0.140625, 0.185089111328125, 0.22955322265625, 0.274017333984375, 0.3184814453125, 0.362945556640625, 0.40740966796875, 0.451873779296875, 0.496337890625, 0.540802001953125, 0.58526611328125, 0.629730224609375, 0.6741943359375, 0.718658447265625, 0.76312255859375, 0.807586669921875, 0.85205078125, 0.896514892578125, 0.94097900390625, 0.985443115234375, 1.0299072265625, 1.074371337890625, 1.11883544921875, 1.163299560546875, 1.207763671875, 1.252227783203125, 1.29669189453125, 1.341156005859375, 1.3856201171875, 1.430084228515625, 1.47454833984375, 1.519012451171875, 1.5634765625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 8.0, 10.0, 10.0, 39.0, 71.0, 123.0, 256.0, 214.0, 128.0, 65.0, 33.0, 24.0, 16.0, 8.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-56.603397369384766, -55.40073013305664, -54.19806671142578, -52.995399475097656, -51.79273223876953, -50.590065002441406, -49.38739776611328, -48.18473434448242, -46.9820671081543, -45.77939987182617, -44.57673645019531, -43.37406921386719, -42.17140197753906, -40.96873474121094, -39.76606750488281, -38.56340408325195, -37.36073684692383, -36.1580696105957, -34.955406188964844, -33.75273895263672, -32.550071716308594, -31.34740447998047, -30.144739151000977, -28.942073822021484, -27.73940658569336, -26.536739349365234, -25.334074020385742, -24.13140869140625, -22.928741455078125, -21.72607421875, -20.523408889770508, -19.320743560791016, -18.118072509765625, -16.9154052734375, -15.712739944458008, -14.5100736618042, -13.30740737915039, -12.104741096496582, -10.902074813842773, -9.699408531188965, -8.496742248535156, -7.294075965881348, -6.091409683227539, -4.8887434005737305, -3.686077117919922, -2.4834108352661133, -1.2807445526123047, -0.0780782699584961, 1.1245880126953125, 2.327254295349121, 3.5299205780029297, 4.732586860656738, 5.935253143310547, 7.1379194259643555, 8.340585708618164, 9.543251991271973, 10.745918273925781, 11.94858455657959, 13.151250839233398, 14.353917121887207, 15.556583404541016, 16.75925064086914, 17.961915969848633, 19.164581298828125, 20.36724853515625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 4.0, 4.0, 7.0, 8.0, 10.0, 9.0, 16.0, 15.0, 17.0, 28.0, 37.0, 40.0, 47.0, 42.0, 38.0, 66.0, 60.0, 56.0, 62.0, 61.0, 59.0, 46.0, 47.0, 27.0, 45.0, 33.0, 20.0, 16.0, 22.0, 14.0, 13.0, 11.0, 7.0, 5.0, 4.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.730220794677734, -26.736408233642578, -25.742595672607422, -24.748783111572266, -23.75497055053711, -22.761157989501953, -21.767345428466797, -20.773530960083008, -19.77971839904785, -18.785905838012695, -17.79209327697754, -16.798280715942383, -15.80446720123291, -14.810654640197754, -13.816842079162598, -12.823028564453125, -11.829216957092285, -10.835404396057129, -9.841591835021973, -8.8477783203125, -7.853965759277344, -6.8601531982421875, -5.866340637207031, -4.872527599334717, -3.8787150382995605, -2.884902238845825, -1.8910895586013794, -0.8972768783569336, 0.09653592109680176, 1.090348720550537, 2.0841612815856934, 3.077974319458008, 4.071786880493164, 5.06559944152832, 6.059412479400635, 7.053225040435791, 8.047038078308105, 9.040850639343262, 10.034663200378418, 11.02847671508789, 12.022289276123047, 13.016101837158203, 14.00991439819336, 15.003726959228516, 15.997540473937988, 16.991352081298828, 17.985164642333984, 18.978979110717773, 19.972789764404297, 20.966602325439453, 21.96041488647461, 22.954227447509766, 23.948040008544922, 24.941852569580078, 25.935665130615234, 26.929479598999023, 27.92329216003418, 28.917104721069336, 29.910917282104492, 30.90472984313965, 31.898542404174805, 32.892356872558594, 33.88616943359375, 34.879981994628906, 35.87379455566406]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 4.0, 5.0, 3.0, 12.0, 8.0, 11.0, 9.0, 16.0, 18.0, 21.0, 39.0, 45.0, 64.0, 70.0, 117.0, 207.0, 359.0, 622.0, 1449.0, 3878.0, 16860.0, 883026.0, 3262336.0, 18818.0, 3960.0, 1302.0, 517.0, 245.0, 134.0, 49.0, 29.0, 14.0, 13.0, 13.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.8125, -9.589599609375, -9.36669921875, -9.143798828125, -8.9208984375, -8.697998046875, -8.47509765625, -8.252197265625, -8.029296875, -7.806396484375, -7.58349609375, -7.360595703125, -7.1376953125, -6.914794921875, -6.69189453125, -6.468994140625, -6.24609375, -6.023193359375, -5.80029296875, -5.577392578125, -5.3544921875, -5.131591796875, -4.90869140625, -4.685791015625, -4.462890625, -4.239990234375, -4.01708984375, -3.794189453125, -3.5712890625, -3.348388671875, -3.12548828125, -2.902587890625, -2.6796875, -2.456787109375, -2.23388671875, -2.010986328125, -1.7880859375, -1.565185546875, -1.34228515625, -1.119384765625, -0.896484375, -0.673583984375, -0.45068359375, -0.227783203125, -0.0048828125, 0.218017578125, 0.44091796875, 0.663818359375, 0.88671875, 1.109619140625, 1.33251953125, 1.555419921875, 1.7783203125, 2.001220703125, 2.22412109375, 2.447021484375, 2.669921875, 2.892822265625, 3.11572265625, 3.338623046875, 3.5615234375, 3.784423828125, 4.00732421875, 4.230224609375, 4.453125]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 10.0, 10.0, 18.0, 27.0, 49.0, 67.0, 95.0, 118.0, 119.0, 110.0, 93.0, 94.0, 64.0, 49.0, 31.0, 22.0, 6.0, 8.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.212890625, -2.163421630859375, -2.11395263671875, -2.064483642578125, -2.0150146484375, -1.965545654296875, -1.91607666015625, -1.866607666015625, -1.817138671875, -1.767669677734375, -1.71820068359375, -1.668731689453125, -1.6192626953125, -1.569793701171875, -1.52032470703125, -1.470855712890625, -1.42138671875, -1.371917724609375, -1.32244873046875, -1.272979736328125, -1.2235107421875, -1.174041748046875, -1.12457275390625, -1.075103759765625, -1.025634765625, -0.976165771484375, -0.92669677734375, -0.877227783203125, -0.8277587890625, -0.778289794921875, -0.72882080078125, -0.679351806640625, -0.6298828125, -0.580413818359375, -0.53094482421875, -0.481475830078125, -0.4320068359375, -0.382537841796875, -0.33306884765625, -0.283599853515625, -0.234130859375, -0.184661865234375, -0.13519287109375, -0.085723876953125, -0.0362548828125, 0.013214111328125, 0.06268310546875, 0.112152099609375, 0.16162109375, 0.211090087890625, 0.26055908203125, 0.310028076171875, 0.3594970703125, 0.408966064453125, 0.45843505859375, 0.507904052734375, 0.557373046875, 0.606842041015625, 0.65631103515625, 0.705780029296875, 0.7552490234375, 0.804718017578125, 0.85418701171875, 0.903656005859375, 0.953125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 6.0, 8.0, 17.0, 26.0, 37.0, 63.0, 181.0, 402.0, 1301.0, 5229.0, 43490.0, 4082617.0, 53471.0, 5503.0, 1238.0, 400.0, 142.0, 69.0, 41.0, 16.0, 13.0, 11.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1484375, -11.81591796875, -11.4833984375, -11.15087890625, -10.818359375, -10.48583984375, -10.1533203125, -9.82080078125, -9.48828125, -9.15576171875, -8.8232421875, -8.49072265625, -8.158203125, -7.82568359375, -7.4931640625, -7.16064453125, -6.828125, -6.49560546875, -6.1630859375, -5.83056640625, -5.498046875, -5.16552734375, -4.8330078125, -4.50048828125, -4.16796875, -3.83544921875, -3.5029296875, -3.17041015625, -2.837890625, -2.50537109375, -2.1728515625, -1.84033203125, -1.5078125, -1.17529296875, -0.8427734375, -0.51025390625, -0.177734375, 0.15478515625, 0.4873046875, 0.81982421875, 1.15234375, 1.48486328125, 1.8173828125, 2.14990234375, 2.482421875, 2.81494140625, 3.1474609375, 3.47998046875, 3.8125, 4.14501953125, 4.4775390625, 4.81005859375, 5.142578125, 5.47509765625, 5.8076171875, 6.14013671875, 6.47265625, 6.80517578125, 7.1376953125, 7.47021484375, 7.802734375, 8.13525390625, 8.4677734375, 8.80029296875, 9.1328125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 7.0, 4.0, 4.0, 3.0, 5.0, 9.0, 16.0, 13.0, 33.0, 55.0, 116.0, 401.0, 2759.0, 405.0, 116.0, 46.0, 24.0, 20.0, 12.0, 8.0, 9.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.48828125, -2.42193603515625, -2.3555908203125, -2.28924560546875, -2.222900390625, -2.15655517578125, -2.0902099609375, -2.02386474609375, -1.95751953125, -1.89117431640625, -1.8248291015625, -1.75848388671875, -1.692138671875, -1.62579345703125, -1.5594482421875, -1.49310302734375, -1.4267578125, -1.36041259765625, -1.2940673828125, -1.22772216796875, -1.161376953125, -1.09503173828125, -1.0286865234375, -0.96234130859375, -0.89599609375, -0.82965087890625, -0.7633056640625, -0.69696044921875, -0.630615234375, -0.56427001953125, -0.4979248046875, -0.43157958984375, -0.365234375, -0.29888916015625, -0.2325439453125, -0.16619873046875, -0.099853515625, -0.03350830078125, 0.0328369140625, 0.09918212890625, 0.16552734375, 0.23187255859375, 0.2982177734375, 0.36456298828125, 0.430908203125, 0.49725341796875, 0.5635986328125, 0.62994384765625, 0.6962890625, 0.76263427734375, 0.8289794921875, 0.89532470703125, 0.961669921875, 1.02801513671875, 1.0943603515625, 1.16070556640625, 1.22705078125, 1.29339599609375, 1.3597412109375, 1.42608642578125, 1.492431640625, 1.55877685546875, 1.6251220703125, 1.69146728515625, 1.7578125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 9.0, 26.0, 80.0, 282.0, 397.0, 153.0, 37.0, 10.0, 5.0, 9.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.171379566192627, -6.702581882476807, -6.233784198760986, -5.764986991882324, -5.296189308166504, -4.827391624450684, -4.358593940734863, -3.889796257019043, -3.4209985733032227, -2.9522008895874023, -2.483403205871582, -2.014605760574341, -1.5458080768585205, -1.0770103931427002, -0.608212947845459, -0.13941526412963867, 0.32938241958618164, 0.7981800436973572, 1.2669776678085327, 1.7357752323150635, 2.204572916030884, 2.673370599746704, 3.1421680450439453, 3.6109657287597656, 4.079763412475586, 4.548561096191406, 5.017358779907227, 5.486156463623047, 5.954954147338867, 6.4237518310546875, 6.89254903793335, 7.36134672164917, 7.830144882202148, 8.298942565917969, 8.767740249633789, 9.23653793334961, 9.70533561706543, 10.17413330078125, 10.64293098449707, 11.11172866821289, 11.580526351928711, 12.049324035644531, 12.518121719360352, 12.986919403076172, 13.455717086791992, 13.924514770507812, 14.393312454223633, 14.862110137939453, 15.330906867980957, 15.799704551696777, 16.26850128173828, 16.7372989654541, 17.206096649169922, 17.674894332885742, 18.143692016601562, 18.612489700317383, 19.081287384033203, 19.550085067749023, 20.018882751464844, 20.487680435180664, 20.956478118896484, 21.425275802612305, 21.894073486328125, 22.362871170043945, 22.831668853759766]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 3.0, 5.0, 7.0, 19.0, 10.0, 16.0, 10.0, 17.0, 21.0, 26.0, 34.0, 36.0, 32.0, 41.0, 55.0, 54.0, 41.0, 35.0, 43.0, 45.0, 54.0, 46.0, 35.0, 46.0, 38.0, 33.0, 45.0, 25.0, 26.0, 15.0, 16.0, 13.0, 15.0, 12.0, 8.0, 6.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.1745686531066895, -4.03913688659668, -3.9037046432495117, -3.768272638320923, -3.632840633392334, -3.497408628463745, -3.3619766235351562, -3.2265448570251465, -3.0911126136779785, -2.9556806087493896, -2.820248603820801, -2.684816598892212, -2.549384593963623, -2.413952589035034, -2.2785205841064453, -2.1430888175964355, -2.0076568126678467, -1.8722248077392578, -1.736792802810669, -1.60136079788208, -1.4659287929534912, -1.3304967880249023, -1.195064902305603, -1.0596328973770142, -0.9242008924484253, -0.7887688875198364, -0.6533368825912476, -0.5179049372673035, -0.3824729323387146, -0.24704092741012573, -0.11160898208618164, 0.023823022842407227, 0.1592550277709961, 0.29468703269958496, 0.43011900782585144, 0.5655509829521179, 0.7009829878807068, 0.8364149928092957, 0.9718469381332397, 1.1072789430618286, 1.2427109479904175, 1.3781429529190063, 1.5135749578475952, 1.6490068435668945, 1.7844388484954834, 1.9198708534240723, 2.055302858352661, 2.19073486328125, 2.326166868209839, 2.4615988731384277, 2.5970308780670166, 2.7324628829956055, 2.8678948879241943, 3.003326892852783, 3.138758659362793, 3.274190902709961, 3.4096226692199707, 3.5450546741485596, 3.6804866790771484, 3.8159186840057373, 3.951350688934326, 4.086782455444336, 4.222214698791504, 4.357646465301514, 4.493078708648682]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 8.0, 10.0, 7.0, 14.0, 15.0, 20.0, 28.0, 60.0, 57.0, 95.0, 156.0, 207.0, 392.0, 744.0, 1658.0, 4591.0, 19668.0, 166799.0, 729114.0, 104044.0, 14325.0, 3618.0, 1362.0, 650.0, 319.0, 195.0, 125.0, 85.0, 65.0, 33.0, 28.0, 19.0, 16.0, 12.0, 9.0, 0.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.0078125, -6.8153076171875, -6.622802734375, -6.4302978515625, -6.23779296875, -6.0452880859375, -5.852783203125, -5.6602783203125, -5.4677734375, -5.2752685546875, -5.082763671875, -4.8902587890625, -4.69775390625, -4.5052490234375, -4.312744140625, -4.1202392578125, -3.927734375, -3.7352294921875, -3.542724609375, -3.3502197265625, -3.15771484375, -2.9652099609375, -2.772705078125, -2.5802001953125, -2.3876953125, -2.1951904296875, -2.002685546875, -1.8101806640625, -1.61767578125, -1.4251708984375, -1.232666015625, -1.0401611328125, -0.84765625, -0.6551513671875, -0.462646484375, -0.2701416015625, -0.07763671875, 0.1148681640625, 0.307373046875, 0.4998779296875, 0.6923828125, 0.8848876953125, 1.077392578125, 1.2698974609375, 1.46240234375, 1.6549072265625, 1.847412109375, 2.0399169921875, 2.232421875, 2.4249267578125, 2.617431640625, 2.8099365234375, 3.00244140625, 3.1949462890625, 3.387451171875, 3.5799560546875, 3.7724609375, 3.9649658203125, 4.157470703125, 4.3499755859375, 4.54248046875, 4.7349853515625, 4.927490234375, 5.1199951171875, 5.3125]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 8.0, 12.0, 18.0, 30.0, 52.0, 78.0, 89.0, 118.0, 101.0, 108.0, 119.0, 87.0, 68.0, 49.0, 26.0, 14.0, 9.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.208984375, -2.159576416015625, -2.11016845703125, -2.060760498046875, -2.0113525390625, -1.961944580078125, -1.91253662109375, -1.863128662109375, -1.813720703125, -1.764312744140625, -1.71490478515625, -1.665496826171875, -1.6160888671875, -1.566680908203125, -1.51727294921875, -1.467864990234375, -1.41845703125, -1.369049072265625, -1.31964111328125, -1.270233154296875, -1.2208251953125, -1.171417236328125, -1.12200927734375, -1.072601318359375, -1.023193359375, -0.973785400390625, -0.92437744140625, -0.874969482421875, -0.8255615234375, -0.776153564453125, -0.72674560546875, -0.677337646484375, -0.6279296875, -0.578521728515625, -0.52911376953125, -0.479705810546875, -0.4302978515625, -0.380889892578125, -0.33148193359375, -0.282073974609375, -0.232666015625, -0.183258056640625, -0.13385009765625, -0.084442138671875, -0.0350341796875, 0.014373779296875, 0.06378173828125, 0.113189697265625, 0.16259765625, 0.212005615234375, 0.26141357421875, 0.310821533203125, 0.3602294921875, 0.409637451171875, 0.45904541015625, 0.508453369140625, 0.557861328125, 0.607269287109375, 0.65667724609375, 0.706085205078125, 0.7554931640625, 0.804901123046875, 0.85430908203125, 0.903717041015625, 0.953125]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 4.0, 2.0, 6.0, 6.0, 5.0, 11.0, 12.0, 17.0, 17.0, 20.0, 28.0, 40.0, 76.0, 115.0, 207.0, 492.0, 1081.0, 3011.0, 12714.0, 81161.0, 693694.0, 221158.0, 26266.0, 5384.0, 1645.0, 621.0, 286.0, 158.0, 91.0, 54.0, 38.0, 26.0, 30.0, 19.0, 10.0, 16.0, 12.0, 11.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.17578125, -5.95294189453125, -5.7301025390625, -5.50726318359375, -5.284423828125, -5.06158447265625, -4.8387451171875, -4.61590576171875, -4.39306640625, -4.17022705078125, -3.9473876953125, -3.72454833984375, -3.501708984375, -3.27886962890625, -3.0560302734375, -2.83319091796875, -2.6103515625, -2.38751220703125, -2.1646728515625, -1.94183349609375, -1.718994140625, -1.49615478515625, -1.2733154296875, -1.05047607421875, -0.82763671875, -0.60479736328125, -0.3819580078125, -0.15911865234375, 0.063720703125, 0.28656005859375, 0.5093994140625, 0.73223876953125, 0.955078125, 1.17791748046875, 1.4007568359375, 1.62359619140625, 1.846435546875, 2.06927490234375, 2.2921142578125, 2.51495361328125, 2.73779296875, 2.96063232421875, 3.1834716796875, 3.40631103515625, 3.629150390625, 3.85198974609375, 4.0748291015625, 4.29766845703125, 4.5205078125, 4.74334716796875, 4.9661865234375, 5.18902587890625, 5.411865234375, 5.63470458984375, 5.8575439453125, 6.08038330078125, 6.30322265625, 6.52606201171875, 6.7489013671875, 6.97174072265625, 7.194580078125, 7.41741943359375, 7.6402587890625, 7.86309814453125, 8.0859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 13.0, 14.0, 15.0, 17.0, 17.0, 23.0, 23.0, 29.0, 32.0, 37.0, 37.0, 31.0, 52.0, 48.0, 52.0, 47.0, 38.0, 45.0, 41.0, 50.0, 48.0, 25.0, 41.0, 37.0, 14.0, 30.0, 29.0, 13.0, 26.0, 15.0, 9.0, 10.0, 4.0, 9.0, 10.0, 2.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.40625, -4.27191162109375, -4.1375732421875, -4.00323486328125, -3.868896484375, -3.73455810546875, -3.6002197265625, -3.46588134765625, -3.33154296875, -3.19720458984375, -3.0628662109375, -2.92852783203125, -2.794189453125, -2.65985107421875, -2.5255126953125, -2.39117431640625, -2.2568359375, -2.12249755859375, -1.9881591796875, -1.85382080078125, -1.719482421875, -1.58514404296875, -1.4508056640625, -1.31646728515625, -1.18212890625, -1.04779052734375, -0.9134521484375, -0.77911376953125, -0.644775390625, -0.51043701171875, -0.3760986328125, -0.24176025390625, -0.107421875, 0.02691650390625, 0.1612548828125, 0.29559326171875, 0.429931640625, 0.56427001953125, 0.6986083984375, 0.83294677734375, 0.96728515625, 1.10162353515625, 1.2359619140625, 1.37030029296875, 1.504638671875, 1.63897705078125, 1.7733154296875, 1.90765380859375, 2.0419921875, 2.17633056640625, 2.3106689453125, 2.44500732421875, 2.579345703125, 2.71368408203125, 2.8480224609375, 2.98236083984375, 3.11669921875, 3.25103759765625, 3.3853759765625, 3.51971435546875, 3.654052734375, 3.78839111328125, 3.9227294921875, 4.05706787109375, 4.19140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 4.0, 5.0, 6.0, 11.0, 18.0, 23.0, 49.0, 45.0, 87.0, 120.0, 220.0, 390.0, 823.0, 1847.0, 5409.0, 23428.0, 213738.0, 697873.0, 85221.0, 12781.0, 3639.0, 1375.0, 614.0, 308.0, 182.0, 111.0, 66.0, 48.0, 36.0, 19.0, 14.0, 13.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6103515625, -1.558929443359375, -1.50750732421875, -1.456085205078125, -1.4046630859375, -1.353240966796875, -1.30181884765625, -1.250396728515625, -1.198974609375, -1.147552490234375, -1.09613037109375, -1.044708251953125, -0.9932861328125, -0.941864013671875, -0.89044189453125, -0.839019775390625, -0.78759765625, -0.736175537109375, -0.68475341796875, -0.633331298828125, -0.5819091796875, -0.530487060546875, -0.47906494140625, -0.427642822265625, -0.376220703125, -0.324798583984375, -0.27337646484375, -0.221954345703125, -0.1705322265625, -0.119110107421875, -0.06768798828125, -0.016265869140625, 0.03515625, 0.086578369140625, 0.13800048828125, 0.189422607421875, 0.2408447265625, 0.292266845703125, 0.34368896484375, 0.395111083984375, 0.446533203125, 0.497955322265625, 0.54937744140625, 0.600799560546875, 0.6522216796875, 0.703643798828125, 0.75506591796875, 0.806488037109375, 0.85791015625, 0.909332275390625, 0.96075439453125, 1.012176513671875, 1.0635986328125, 1.115020751953125, 1.16644287109375, 1.217864990234375, 1.269287109375, 1.320709228515625, 1.37213134765625, 1.423553466796875, 1.4749755859375, 1.526397705078125, 1.57781982421875, 1.629241943359375, 1.6806640625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 9.0, 5.0, 6.0, 4.0, 8.0, 19.0, 17.0, 37.0, 35.0, 42.0, 66.0, 84.0, 103.0, 111.0, 115.0, 93.0, 66.0, 56.0, 37.0, 31.0, 15.0, 14.0, 9.0, 5.0, 5.0, 4.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.00023698806762695312, -0.0002310425043106079, -0.0002250969409942627, -0.00021915137767791748, -0.00021320581436157227, -0.00020726025104522705, -0.00020131468772888184, -0.00019536912441253662, -0.0001894235610961914, -0.0001834779977798462, -0.00017753243446350098, -0.00017158687114715576, -0.00016564130783081055, -0.00015969574451446533, -0.00015375018119812012, -0.0001478046178817749, -0.0001418590545654297, -0.00013591349124908447, -0.00012996792793273926, -0.00012402236461639404, -0.00011807680130004883, -0.00011213123798370361, -0.0001061856746673584, -0.00010024011135101318, -9.429454803466797e-05, -8.834898471832275e-05, -8.240342140197754e-05, -7.645785808563232e-05, -7.051229476928711e-05, -6.45667314529419e-05, -5.862116813659668e-05, -5.2675604820251465e-05, -4.673004150390625e-05, -4.0784478187561035e-05, -3.483891487121582e-05, -2.8893351554870605e-05, -2.294778823852539e-05, -1.7002224922180176e-05, -1.1056661605834961e-05, -5.111098289489746e-06, 8.344650268554688e-07, 6.780028343200684e-06, 1.2725591659545898e-05, 1.8671154975891113e-05, 2.4616718292236328e-05, 3.056228160858154e-05, 3.650784492492676e-05, 4.245340824127197e-05, 4.839897155761719e-05, 5.43445348739624e-05, 6.029009819030762e-05, 6.623566150665283e-05, 7.218122482299805e-05, 7.812678813934326e-05, 8.407235145568848e-05, 9.001791477203369e-05, 9.59634780883789e-05, 0.00010190904140472412, 0.00010785460472106934, 0.00011380016803741455, 0.00011974573135375977, 0.00012569129467010498, 0.0001316368579864502, 0.0001375824213027954, 0.00014352798461914062]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 8.0, 5.0, 12.0, 12.0, 16.0, 21.0, 39.0, 45.0, 99.0, 206.0, 475.0, 1467.0, 6483.0, 67782.0, 868546.0, 93096.0, 7572.0, 1600.0, 574.0, 236.0, 111.0, 54.0, 32.0, 28.0, 13.0, 5.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.857421875, -2.772247314453125, -2.68707275390625, -2.601898193359375, -2.5167236328125, -2.431549072265625, -2.34637451171875, -2.261199951171875, -2.176025390625, -2.090850830078125, -2.00567626953125, -1.920501708984375, -1.8353271484375, -1.750152587890625, -1.66497802734375, -1.579803466796875, -1.49462890625, -1.409454345703125, -1.32427978515625, -1.239105224609375, -1.1539306640625, -1.068756103515625, -0.98358154296875, -0.898406982421875, -0.813232421875, -0.728057861328125, -0.64288330078125, -0.557708740234375, -0.4725341796875, -0.387359619140625, -0.30218505859375, -0.217010498046875, -0.1318359375, -0.046661376953125, 0.03851318359375, 0.123687744140625, 0.2088623046875, 0.294036865234375, 0.37921142578125, 0.464385986328125, 0.549560546875, 0.634735107421875, 0.71990966796875, 0.805084228515625, 0.8902587890625, 0.975433349609375, 1.06060791015625, 1.145782470703125, 1.23095703125, 1.316131591796875, 1.40130615234375, 1.486480712890625, 1.5716552734375, 1.656829833984375, 1.74200439453125, 1.827178955078125, 1.912353515625, 1.997528076171875, 2.08270263671875, 2.167877197265625, 2.2530517578125, 2.338226318359375, 2.42340087890625, 2.508575439453125, 2.59375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0, 4.0, 11.0, 15.0, 14.0, 18.0, 13.0, 20.0, 33.0, 33.0, 47.0, 80.0, 90.0, 81.0, 103.0, 100.0, 88.0, 80.0, 46.0, 41.0, 24.0, 16.0, 15.0, 9.0, 6.0, 2.0, 7.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5146484375, -1.4716644287109375, -1.428680419921875, -1.3856964111328125, -1.34271240234375, -1.2997283935546875, -1.256744384765625, -1.2137603759765625, -1.1707763671875, -1.1277923583984375, -1.084808349609375, -1.0418243408203125, -0.99884033203125, -0.9558563232421875, -0.912872314453125, -0.8698883056640625, -0.826904296875, -0.7839202880859375, -0.740936279296875, -0.6979522705078125, -0.65496826171875, -0.6119842529296875, -0.569000244140625, -0.5260162353515625, -0.4830322265625, -0.4400482177734375, -0.397064208984375, -0.3540802001953125, -0.31109619140625, -0.2681121826171875, -0.225128173828125, -0.1821441650390625, -0.13916015625, -0.0961761474609375, -0.053192138671875, -0.0102081298828125, 0.03277587890625, 0.0757598876953125, 0.118743896484375, 0.1617279052734375, 0.2047119140625, 0.2476959228515625, 0.290679931640625, 0.3336639404296875, 0.37664794921875, 0.4196319580078125, 0.462615966796875, 0.5055999755859375, 0.548583984375, 0.5915679931640625, 0.634552001953125, 0.6775360107421875, 0.72052001953125, 0.7635040283203125, 0.806488037109375, 0.8494720458984375, 0.8924560546875, 0.9354400634765625, 0.978424072265625, 1.0214080810546875, 1.06439208984375, 1.1073760986328125, 1.150360107421875, 1.1933441162109375, 1.236328125]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 8.0, 12.0, 13.0, 48.0, 128.0, 336.0, 294.0, 90.0, 37.0, 28.0, 11.0, 2.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.10966491699219, -57.464717864990234, -55.819766998291016, -54.17481994628906, -52.529869079589844, -50.88492202758789, -49.23997497558594, -47.59502410888672, -45.950077056884766, -44.30513000488281, -42.660179138183594, -41.01523208618164, -39.37028503417969, -37.72533416748047, -36.080387115478516, -34.43544006347656, -32.790489196777344, -31.145540237426758, -29.500591278076172, -27.85564422607422, -26.210695266723633, -24.565746307373047, -22.920799255371094, -21.275850296020508, -19.630901336669922, -17.985952377319336, -16.34100341796875, -14.696056365966797, -13.051107406616211, -11.406158447265625, -9.761210441589355, -8.116262435913086, -6.471317291259766, -4.826368808746338, -3.18142032623291, -1.5364718437194824, 0.10847663879394531, 1.7534255981445312, 3.398373603820801, 5.04332160949707, 6.688270568847656, 8.333219528198242, 9.978167533874512, 11.623115539550781, 13.268064498901367, 14.913013458251953, 16.557960510253906, 18.202909469604492, 19.847858428955078, 21.492807388305664, 23.13775634765625, 24.782703399658203, 26.42765235900879, 28.072601318359375, 29.717548370361328, 31.362497329711914, 33.0074462890625, 34.65239334106445, 36.29734420776367, 37.942291259765625, 39.587242126464844, 41.2321891784668, 42.87713623046875, 44.52208709716797, 46.16703414916992]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 12.0, 8.0, 14.0, 20.0, 17.0, 22.0, 32.0, 42.0, 56.0, 57.0, 70.0, 71.0, 70.0, 70.0, 66.0, 55.0, 56.0, 44.0, 50.0, 47.0, 32.0, 23.0, 19.0, 18.0, 9.0, 8.0, 8.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.40410614013672, -23.30684471130371, -22.209583282470703, -21.112323760986328, -20.01506233215332, -18.917800903320312, -17.820541381835938, -16.72327995300293, -15.626018524169922, -14.528757095336914, -13.431496620178223, -12.334236145019531, -11.236974716186523, -10.139713287353516, -9.042452812194824, -7.945191860198975, -6.847930908203125, -5.750669956207275, -4.653409004211426, -3.556148052215576, -2.4588871002197266, -1.361626148223877, -0.26436519622802734, 0.8328957557678223, 1.9301567077636719, 3.0274176597595215, 4.124678611755371, 5.221939563751221, 6.31920051574707, 7.41646146774292, 8.51372241973877, 9.610982894897461, 10.708248138427734, 11.805509567260742, 12.902770042419434, 14.000030517578125, 15.097291946411133, 16.19455337524414, 17.291812896728516, 18.389074325561523, 19.48633575439453, 20.58359718322754, 21.680858612060547, 22.778118133544922, 23.87537956237793, 24.972640991210938, 26.069900512695312, 27.16716194152832, 28.264423370361328, 29.361684799194336, 30.458946228027344, 31.55620574951172, 32.653465270996094, 33.750728607177734, 34.84798812866211, 35.94525146484375, 37.042510986328125, 38.1397705078125, 39.23703384399414, 40.334293365478516, 41.431556701660156, 42.52881622314453, 43.626075744628906, 44.72333908081055, 45.82059860229492]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 7.0, 4.0, 1.0, 5.0, 6.0, 9.0, 8.0, 7.0, 10.0, 12.0, 23.0, 31.0, 43.0, 45.0, 58.0, 87.0, 138.0, 201.0, 349.0, 615.0, 1305.0, 3436.0, 11807.0, 95584.0, 3964518.0, 98936.0, 11909.0, 3109.0, 1103.0, 477.0, 205.0, 93.0, 51.0, 41.0, 25.0, 12.0, 4.0, 4.0, 9.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-9.140625, -8.93048095703125, -8.7203369140625, -8.51019287109375, -8.300048828125, -8.08990478515625, -7.8797607421875, -7.66961669921875, -7.45947265625, -7.24932861328125, -7.0391845703125, -6.82904052734375, -6.618896484375, -6.40875244140625, -6.1986083984375, -5.98846435546875, -5.7783203125, -5.56817626953125, -5.3580322265625, -5.14788818359375, -4.937744140625, -4.72760009765625, -4.5174560546875, -4.30731201171875, -4.09716796875, -3.88702392578125, -3.6768798828125, -3.46673583984375, -3.256591796875, -3.04644775390625, -2.8363037109375, -2.62615966796875, -2.416015625, -2.20587158203125, -1.9957275390625, -1.78558349609375, -1.575439453125, -1.36529541015625, -1.1551513671875, -0.94500732421875, -0.73486328125, -0.52471923828125, -0.3145751953125, -0.10443115234375, 0.105712890625, 0.31585693359375, 0.5260009765625, 0.73614501953125, 0.9462890625, 1.15643310546875, 1.3665771484375, 1.57672119140625, 1.786865234375, 1.99700927734375, 2.2071533203125, 2.41729736328125, 2.62744140625, 2.83758544921875, 3.0477294921875, 3.25787353515625, 3.468017578125, 3.67816162109375, 3.8883056640625, 4.09844970703125, 4.30859375]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 7.0, 16.0, 29.0, 38.0, 56.0, 77.0, 114.0, 106.0, 128.0, 115.0, 96.0, 73.0, 62.0, 34.0, 22.0, 12.0, 9.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.193359375, -2.1389007568359375, -2.084442138671875, -2.0299835205078125, -1.97552490234375, -1.9210662841796875, -1.866607666015625, -1.8121490478515625, -1.7576904296875, -1.7032318115234375, -1.648773193359375, -1.5943145751953125, -1.53985595703125, -1.4853973388671875, -1.430938720703125, -1.3764801025390625, -1.322021484375, -1.2675628662109375, -1.213104248046875, -1.1586456298828125, -1.10418701171875, -1.0497283935546875, -0.995269775390625, -0.9408111572265625, -0.8863525390625, -0.8318939208984375, -0.777435302734375, -0.7229766845703125, -0.66851806640625, -0.6140594482421875, -0.559600830078125, -0.5051422119140625, -0.45068359375, -0.3962249755859375, -0.341766357421875, -0.2873077392578125, -0.23284912109375, -0.1783905029296875, -0.123931884765625, -0.0694732666015625, -0.0150146484375, 0.0394439697265625, 0.093902587890625, 0.1483612060546875, 0.20281982421875, 0.2572784423828125, 0.311737060546875, 0.3661956787109375, 0.420654296875, 0.4751129150390625, 0.529571533203125, 0.5840301513671875, 0.63848876953125, 0.6929473876953125, 0.747406005859375, 0.8018646240234375, 0.8563232421875, 0.9107818603515625, 0.965240478515625, 1.0196990966796875, 1.07415771484375, 1.1286163330078125, 1.183074951171875, 1.2375335693359375, 1.2919921875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 3.0, 10.0, 5.0, 14.0, 15.0, 20.0, 32.0, 49.0, 134.0, 290.0, 567.0, 1480.0, 5356.0, 32799.0, 3665627.0, 464369.0, 17880.0, 3469.0, 1159.0, 489.0, 249.0, 112.0, 66.0, 25.0, 14.0, 15.0, 11.0, 5.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.35546875, -7.11712646484375, -6.8787841796875, -6.64044189453125, -6.402099609375, -6.16375732421875, -5.9254150390625, -5.68707275390625, -5.44873046875, -5.21038818359375, -4.9720458984375, -4.73370361328125, -4.495361328125, -4.25701904296875, -4.0186767578125, -3.78033447265625, -3.5419921875, -3.30364990234375, -3.0653076171875, -2.82696533203125, -2.588623046875, -2.35028076171875, -2.1119384765625, -1.87359619140625, -1.63525390625, -1.39691162109375, -1.1585693359375, -0.92022705078125, -0.681884765625, -0.44354248046875, -0.2052001953125, 0.03314208984375, 0.271484375, 0.50982666015625, 0.7481689453125, 0.98651123046875, 1.224853515625, 1.46319580078125, 1.7015380859375, 1.93988037109375, 2.17822265625, 2.41656494140625, 2.6549072265625, 2.89324951171875, 3.131591796875, 3.36993408203125, 3.6082763671875, 3.84661865234375, 4.0849609375, 4.32330322265625, 4.5616455078125, 4.79998779296875, 5.038330078125, 5.27667236328125, 5.5150146484375, 5.75335693359375, 5.99169921875, 6.23004150390625, 6.4683837890625, 6.70672607421875, 6.945068359375, 7.18341064453125, 7.4217529296875, 7.66009521484375, 7.8984375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 3.0, 3.0, 11.0, 8.0, 11.0, 19.0, 36.0, 44.0, 95.0, 166.0, 493.0, 2179.0, 539.0, 211.0, 89.0, 49.0, 33.0, 21.0, 16.0, 13.0, 7.0, 5.0, 6.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.341796875, -2.269775390625, -2.19775390625, -2.125732421875, -2.0537109375, -1.981689453125, -1.90966796875, -1.837646484375, -1.765625, -1.693603515625, -1.62158203125, -1.549560546875, -1.4775390625, -1.405517578125, -1.33349609375, -1.261474609375, -1.189453125, -1.117431640625, -1.04541015625, -0.973388671875, -0.9013671875, -0.829345703125, -0.75732421875, -0.685302734375, -0.61328125, -0.541259765625, -0.46923828125, -0.397216796875, -0.3251953125, -0.253173828125, -0.18115234375, -0.109130859375, -0.037109375, 0.034912109375, 0.10693359375, 0.178955078125, 0.2509765625, 0.322998046875, 0.39501953125, 0.467041015625, 0.5390625, 0.611083984375, 0.68310546875, 0.755126953125, 0.8271484375, 0.899169921875, 0.97119140625, 1.043212890625, 1.115234375, 1.187255859375, 1.25927734375, 1.331298828125, 1.4033203125, 1.475341796875, 1.54736328125, 1.619384765625, 1.69140625, 1.763427734375, 1.83544921875, 1.907470703125, 1.9794921875, 2.051513671875, 2.12353515625, 2.195556640625, 2.267578125]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 8.0, 6.0, 33.0, 115.0, 292.0, 350.0, 144.0, 42.0, 11.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.84033203125, -18.169384002685547, -17.498435974121094, -16.82748794555664, -16.15654182434082, -15.485593795776367, -14.814645767211914, -14.143697738647461, -13.472749710083008, -12.801801681518555, -12.130854606628418, -11.459906578063965, -10.788958549499512, -10.118011474609375, -9.447063446044922, -8.776115417480469, -8.105168342590332, -7.434220790863037, -6.763272762298584, -6.092325210571289, -5.421377182006836, -4.750429630279541, -4.079482078552246, -3.408534049987793, -2.737586498260498, -2.066638708114624, -1.3956910371780396, -0.7247433662414551, -0.053795576095581055, 0.617152214050293, 1.288099765777588, 1.959047794342041, 2.629995346069336, 3.30094313621521, 3.971890926361084, 4.642838478088379, 5.313786506652832, 5.984734058380127, 6.655681610107422, 7.326629638671875, 7.99757719039917, 8.668524742126465, 9.339472770690918, 10.010419845581055, 10.681367874145508, 11.352315902709961, 12.023263931274414, 12.694211959838867, 13.365159034729004, 14.036107063293457, 14.707054138183594, 15.378002166748047, 16.0489501953125, 16.719898223876953, 17.390846252441406, 18.06179428100586, 18.73274040222168, 19.403688430786133, 20.074636459350586, 20.745582580566406, 21.41653060913086, 22.087478637695312, 22.758426666259766, 23.42937469482422, 24.100322723388672]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 4.0, 3.0, 4.0, 11.0, 12.0, 15.0, 15.0, 19.0, 22.0, 19.0, 27.0, 27.0, 26.0, 32.0, 37.0, 50.0, 37.0, 34.0, 46.0, 35.0, 33.0, 50.0, 50.0, 47.0, 49.0, 28.0, 42.0, 37.0, 27.0, 27.0, 20.0, 17.0, 20.0, 11.0, 15.0, 10.0, 6.0, 10.0, 6.0, 1.0, 2.0, 5.0, 4.0, 0.0, 1.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.818304061889648, -5.642192363739014, -5.466080665588379, -5.289968490600586, -5.113856792449951, -4.937745094299316, -4.761633396148682, -4.585521697998047, -4.409409999847412, -4.233298301696777, -4.057186603546143, -3.8810746669769287, -3.704962968826294, -3.52885103225708, -3.3527393341064453, -3.1766276359558105, -3.0005156993865967, -2.824404001235962, -2.648292064666748, -2.4721803665161133, -2.2960686683654785, -2.1199569702148438, -1.9438450336456299, -1.7677333354949951, -1.5916215181350708, -1.4155097007751465, -1.2393980026245117, -1.0632861852645874, -0.8871744275093079, -0.7110626697540283, -0.534950852394104, -0.35883915424346924, -0.18272733688354492, -0.006615564227104187, 0.16949620842933655, 0.3456079959869385, 0.521719753742218, 0.6978315114974976, 0.8739433288574219, 1.0500550270080566, 1.226166844367981, 1.4022786617279053, 1.57839035987854, 1.7545021772384644, 1.9306139945983887, 2.1067256927490234, 2.282837390899658, 2.458949089050293, 2.635061025619507, 2.8111727237701416, 2.9872846603393555, 3.1633963584899902, 3.339508056640625, 3.5156197547912598, 3.6917316913604736, 3.8678433895111084, 4.043955326080322, 4.220067024230957, 4.396178722381592, 4.572290420532227, 4.7484025955200195, 4.924514293670654, 5.100625991821289, 5.276737689971924, 5.452849388122559]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 4.0, 5.0, 14.0, 8.0, 13.0, 23.0, 30.0, 40.0, 62.0, 90.0, 157.0, 241.0, 459.0, 825.0, 1736.0, 5273.0, 26074.0, 229131.0, 698101.0, 69653.0, 11191.0, 2882.0, 1121.0, 587.0, 297.0, 191.0, 107.0, 81.0, 39.0, 26.0, 19.0, 29.0, 19.0, 11.0, 5.0, 9.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7265625, -5.5084228515625, -5.290283203125, -5.0721435546875, -4.85400390625, -4.6358642578125, -4.417724609375, -4.1995849609375, -3.9814453125, -3.7633056640625, -3.545166015625, -3.3270263671875, -3.10888671875, -2.8907470703125, -2.672607421875, -2.4544677734375, -2.236328125, -2.0181884765625, -1.800048828125, -1.5819091796875, -1.36376953125, -1.1456298828125, -0.927490234375, -0.7093505859375, -0.4912109375, -0.2730712890625, -0.054931640625, 0.1632080078125, 0.38134765625, 0.5994873046875, 0.817626953125, 1.0357666015625, 1.25390625, 1.4720458984375, 1.690185546875, 1.9083251953125, 2.12646484375, 2.3446044921875, 2.562744140625, 2.7808837890625, 2.9990234375, 3.2171630859375, 3.435302734375, 3.6534423828125, 3.87158203125, 4.0897216796875, 4.307861328125, 4.5260009765625, 4.744140625, 4.9622802734375, 5.180419921875, 5.3985595703125, 5.61669921875, 5.8348388671875, 6.052978515625, 6.2711181640625, 6.4892578125, 6.7073974609375, 6.925537109375, 7.1436767578125, 7.36181640625, 7.5799560546875, 7.798095703125, 8.0162353515625, 8.234375]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 9.0, 13.0, 34.0, 40.0, 52.0, 84.0, 97.0, 132.0, 122.0, 103.0, 97.0, 68.0, 57.0, 38.0, 22.0, 18.0, 6.0, 3.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.296875, -2.243682861328125, -2.19049072265625, -2.137298583984375, -2.0841064453125, -2.030914306640625, -1.97772216796875, -1.924530029296875, -1.871337890625, -1.818145751953125, -1.76495361328125, -1.711761474609375, -1.6585693359375, -1.605377197265625, -1.55218505859375, -1.498992919921875, -1.44580078125, -1.392608642578125, -1.33941650390625, -1.286224365234375, -1.2330322265625, -1.179840087890625, -1.12664794921875, -1.073455810546875, -1.020263671875, -0.967071533203125, -0.91387939453125, -0.860687255859375, -0.8074951171875, -0.754302978515625, -0.70111083984375, -0.647918701171875, -0.5947265625, -0.541534423828125, -0.48834228515625, -0.435150146484375, -0.3819580078125, -0.328765869140625, -0.27557373046875, -0.222381591796875, -0.169189453125, -0.115997314453125, -0.06280517578125, -0.009613037109375, 0.0435791015625, 0.096771240234375, 0.14996337890625, 0.203155517578125, 0.25634765625, 0.309539794921875, 0.36273193359375, 0.415924072265625, 0.4691162109375, 0.522308349609375, 0.57550048828125, 0.628692626953125, 0.681884765625, 0.735076904296875, 0.78826904296875, 0.841461181640625, 0.8946533203125, 0.947845458984375, 1.00103759765625, 1.054229736328125, 1.107421875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 7.0, 4.0, 7.0, 5.0, 12.0, 20.0, 28.0, 38.0, 57.0, 85.0, 178.0, 340.0, 750.0, 1863.0, 6613.0, 30869.0, 260508.0, 659036.0, 70118.0, 12319.0, 3510.0, 1125.0, 494.0, 254.0, 120.0, 80.0, 35.0, 34.0, 17.0, 11.0, 6.0, 4.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84765625, -7.6182861328125, -7.388916015625, -7.1595458984375, -6.93017578125, -6.7008056640625, -6.471435546875, -6.2420654296875, -6.0126953125, -5.7833251953125, -5.553955078125, -5.3245849609375, -5.09521484375, -4.8658447265625, -4.636474609375, -4.4071044921875, -4.177734375, -3.9483642578125, -3.718994140625, -3.4896240234375, -3.26025390625, -3.0308837890625, -2.801513671875, -2.5721435546875, -2.3427734375, -2.1134033203125, -1.884033203125, -1.6546630859375, -1.42529296875, -1.1959228515625, -0.966552734375, -0.7371826171875, -0.5078125, -0.2784423828125, -0.049072265625, 0.1802978515625, 0.40966796875, 0.6390380859375, 0.868408203125, 1.0977783203125, 1.3271484375, 1.5565185546875, 1.785888671875, 2.0152587890625, 2.24462890625, 2.4739990234375, 2.703369140625, 2.9327392578125, 3.162109375, 3.3914794921875, 3.620849609375, 3.8502197265625, 4.07958984375, 4.3089599609375, 4.538330078125, 4.7677001953125, 4.9970703125, 5.2264404296875, 5.455810546875, 5.6851806640625, 5.91455078125, 6.1439208984375, 6.373291015625, 6.6026611328125, 6.83203125]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 5.0, 7.0, 10.0, 12.0, 16.0, 13.0, 16.0, 25.0, 28.0, 36.0, 33.0, 44.0, 40.0, 49.0, 67.0, 43.0, 62.0, 56.0, 70.0, 57.0, 52.0, 37.0, 45.0, 34.0, 38.0, 25.0, 27.0, 18.0, 6.0, 11.0, 11.0, 3.0, 7.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.64453125, -5.47845458984375, -5.3123779296875, -5.14630126953125, -4.980224609375, -4.81414794921875, -4.6480712890625, -4.48199462890625, -4.31591796875, -4.14984130859375, -3.9837646484375, -3.81768798828125, -3.651611328125, -3.48553466796875, -3.3194580078125, -3.15338134765625, -2.9873046875, -2.82122802734375, -2.6551513671875, -2.48907470703125, -2.322998046875, -2.15692138671875, -1.9908447265625, -1.82476806640625, -1.65869140625, -1.49261474609375, -1.3265380859375, -1.16046142578125, -0.994384765625, -0.82830810546875, -0.6622314453125, -0.49615478515625, -0.330078125, -0.16400146484375, 0.0020751953125, 0.16815185546875, 0.334228515625, 0.50030517578125, 0.6663818359375, 0.83245849609375, 0.99853515625, 1.16461181640625, 1.3306884765625, 1.49676513671875, 1.662841796875, 1.82891845703125, 1.9949951171875, 2.16107177734375, 2.3271484375, 2.49322509765625, 2.6593017578125, 2.82537841796875, 2.991455078125, 3.15753173828125, 3.3236083984375, 3.48968505859375, 3.65576171875, 3.82183837890625, 3.9879150390625, 4.15399169921875, 4.320068359375, 4.48614501953125, 4.6522216796875, 4.81829833984375, 4.984375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 9.0, 5.0, 12.0, 13.0, 17.0, 31.0, 48.0, 71.0, 134.0, 219.0, 493.0, 898.0, 2059.0, 5669.0, 37052.0, 963520.0, 29456.0, 5098.0, 1859.0, 840.0, 428.0, 239.0, 140.0, 82.0, 59.0, 27.0, 22.0, 14.0, 13.0, 7.0, 3.0, 4.0, 4.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.62109375, -4.43218994140625, -4.2432861328125, -4.05438232421875, -3.865478515625, -3.67657470703125, -3.4876708984375, -3.29876708984375, -3.10986328125, -2.92095947265625, -2.7320556640625, -2.54315185546875, -2.354248046875, -2.16534423828125, -1.9764404296875, -1.78753662109375, -1.5986328125, -1.40972900390625, -1.2208251953125, -1.03192138671875, -0.843017578125, -0.65411376953125, -0.4652099609375, -0.27630615234375, -0.08740234375, 0.10150146484375, 0.2904052734375, 0.47930908203125, 0.668212890625, 0.85711669921875, 1.0460205078125, 1.23492431640625, 1.423828125, 1.61273193359375, 1.8016357421875, 1.99053955078125, 2.179443359375, 2.36834716796875, 2.5572509765625, 2.74615478515625, 2.93505859375, 3.12396240234375, 3.3128662109375, 3.50177001953125, 3.690673828125, 3.87957763671875, 4.0684814453125, 4.25738525390625, 4.4462890625, 4.63519287109375, 4.8240966796875, 5.01300048828125, 5.201904296875, 5.39080810546875, 5.5797119140625, 5.76861572265625, 5.95751953125, 6.14642333984375, 6.3353271484375, 6.52423095703125, 6.713134765625, 6.90203857421875, 7.0909423828125, 7.27984619140625, 7.46875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 8.0, 8.0, 21.0, 42.0, 85.0, 169.0, 306.0, 208.0, 81.0, 33.0, 16.0, 5.0, 11.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007257461547851562, -0.00070943683385849, -0.0006931275129318237, -0.0006768181920051575, -0.0006605088710784912, -0.000644199550151825, -0.0006278902292251587, -0.0006115809082984924, -0.0005952715873718262, -0.0005789622664451599, -0.0005626529455184937, -0.0005463436245918274, -0.0005300343036651611, -0.0005137249827384949, -0.0004974156618118286, -0.00048110634088516235, -0.0004647970199584961, -0.00044848769903182983, -0.0004321783781051636, -0.0004158690571784973, -0.00039955973625183105, -0.0003832504153251648, -0.00036694109439849854, -0.0003506317734718323, -0.000334322452545166, -0.00031801313161849976, -0.0003017038106918335, -0.00028539448976516724, -0.000269085168838501, -0.0002527758479118347, -0.00023646652698516846, -0.0002201572060585022, -0.00020384788513183594, -0.00018753856420516968, -0.00017122924327850342, -0.00015491992235183716, -0.0001386106014251709, -0.00012230128049850464, -0.00010599195957183838, -8.968263864517212e-05, -7.337331771850586e-05, -5.70639967918396e-05, -4.075467586517334e-05, -2.444535493850708e-05, -8.13603401184082e-06, 8.17328691482544e-06, 2.44826078414917e-05, 4.079192876815796e-05, 5.710124969482422e-05, 7.341057062149048e-05, 8.971989154815674e-05, 0.000106029212474823, 0.00012233853340148926, 0.00013864785432815552, 0.00015495717525482178, 0.00017126649618148804, 0.0001875758171081543, 0.00020388513803482056, 0.00022019445896148682, 0.00023650377988815308, 0.00025281310081481934, 0.0002691224217414856, 0.00028543174266815186, 0.0003017410635948181, 0.0003180503845214844]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 11.0, 14.0, 13.0, 36.0, 64.0, 140.0, 263.0, 530.0, 1314.0, 4138.0, 23714.0, 837813.0, 166161.0, 10310.0, 2419.0, 795.0, 399.0, 170.0, 100.0, 47.0, 32.0, 15.0, 17.0, 12.0, 5.0, 6.0, 6.0, 4.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.734375, -4.59429931640625, -4.4542236328125, -4.31414794921875, -4.174072265625, -4.03399658203125, -3.8939208984375, -3.75384521484375, -3.61376953125, -3.47369384765625, -3.3336181640625, -3.19354248046875, -3.053466796875, -2.91339111328125, -2.7733154296875, -2.63323974609375, -2.4931640625, -2.35308837890625, -2.2130126953125, -2.07293701171875, -1.932861328125, -1.79278564453125, -1.6527099609375, -1.51263427734375, -1.37255859375, -1.23248291015625, -1.0924072265625, -0.95233154296875, -0.812255859375, -0.67218017578125, -0.5321044921875, -0.39202880859375, -0.251953125, -0.11187744140625, 0.0281982421875, 0.16827392578125, 0.308349609375, 0.44842529296875, 0.5885009765625, 0.72857666015625, 0.86865234375, 1.00872802734375, 1.1488037109375, 1.28887939453125, 1.428955078125, 1.56903076171875, 1.7091064453125, 1.84918212890625, 1.9892578125, 2.12933349609375, 2.2694091796875, 2.40948486328125, 2.549560546875, 2.68963623046875, 2.8297119140625, 2.96978759765625, 3.10986328125, 3.24993896484375, 3.3900146484375, 3.53009033203125, 3.670166015625, 3.81024169921875, 3.9503173828125, 4.09039306640625, 4.23046875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 9.0, 7.0, 8.0, 8.0, 25.0, 31.0, 73.0, 162.0, 223.0, 199.0, 111.0, 48.0, 31.0, 17.0, 8.0, 8.0, 7.0, 8.0, 3.0, 2.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.439453125, -3.3404541015625, -3.241455078125, -3.1424560546875, -3.04345703125, -2.9444580078125, -2.845458984375, -2.7464599609375, -2.6474609375, -2.5484619140625, -2.449462890625, -2.3504638671875, -2.25146484375, -2.1524658203125, -2.053466796875, -1.9544677734375, -1.85546875, -1.7564697265625, -1.657470703125, -1.5584716796875, -1.45947265625, -1.3604736328125, -1.261474609375, -1.1624755859375, -1.0634765625, -0.9644775390625, -0.865478515625, -0.7664794921875, -0.66748046875, -0.5684814453125, -0.469482421875, -0.3704833984375, -0.271484375, -0.1724853515625, -0.073486328125, 0.0255126953125, 0.12451171875, 0.2235107421875, 0.322509765625, 0.4215087890625, 0.5205078125, 0.6195068359375, 0.718505859375, 0.8175048828125, 0.91650390625, 1.0155029296875, 1.114501953125, 1.2135009765625, 1.3125, 1.4114990234375, 1.510498046875, 1.6094970703125, 1.70849609375, 1.8074951171875, 1.906494140625, 2.0054931640625, 2.1044921875, 2.2034912109375, 2.302490234375, 2.4014892578125, 2.50048828125, 2.5994873046875, 2.698486328125, 2.7974853515625, 2.896484375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 10.0, 24.0, 52.0, 143.0, 330.0, 279.0, 111.0, 38.0, 9.0, 8.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.33234405517578, -37.259361267089844, -35.186378479003906, -33.11339569091797, -31.040416717529297, -28.96743392944336, -26.894451141357422, -24.821468353271484, -22.74848747253418, -20.675504684448242, -18.602523803710938, -16.529541015625, -14.456559181213379, -12.383577346801758, -10.31059455871582, -8.2376127243042, -6.164630889892578, -4.091649055480957, -2.0186667442321777, 0.05431556701660156, 2.1272974014282227, 4.200279235839844, 6.273262023925781, 8.346243858337402, 10.419225692749023, 12.492207527160645, 14.565189361572266, 16.638172149658203, 18.71115493774414, 20.784135818481445, 22.857118606567383, 24.930099487304688, 27.003082275390625, 29.076065063476562, 31.149045944213867, 33.22203063964844, 35.29500961303711, 37.36799240112305, 39.440975189208984, 41.51395797729492, 43.586936950683594, 45.65991973876953, 47.73290252685547, 49.805885314941406, 51.87886428833008, 53.951847076416016, 56.02482986450195, 58.09781265258789, 60.17079544067383, 62.243778228759766, 64.31675720214844, 66.38973999023438, 68.46272277832031, 70.53570556640625, 72.60868835449219, 74.68167114257812, 76.75465393066406, 78.82763671875, 80.90061950683594, 82.97360229492188, 85.04658508300781, 87.11956787109375, 89.19255065917969, 91.2655258178711, 93.33850860595703]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 3.0, 6.0, 13.0, 7.0, 10.0, 13.0, 15.0, 24.0, 33.0, 38.0, 25.0, 54.0, 44.0, 55.0, 65.0, 74.0, 48.0, 49.0, 51.0, 53.0, 53.0, 47.0, 52.0, 34.0, 33.0, 22.0, 20.0, 18.0, 8.0, 8.0, 6.0, 7.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.87354278564453, -24.869884490966797, -23.866228103637695, -22.86256980895996, -21.85891342163086, -20.855255126953125, -19.85159683227539, -18.84794044494629, -17.844284057617188, -16.840625762939453, -15.836969375610352, -14.833311080932617, -13.829654693603516, -12.825996398925781, -11.822339057922363, -10.818681716918945, -9.815023422241211, -8.811366081237793, -7.807708740234375, -6.804050922393799, -5.800393581390381, -4.796736240386963, -3.7930784225463867, -2.7894210815429688, -1.7857637405395508, -0.7821062803268433, 0.22155117988586426, 1.2252087593078613, 2.2288661003112793, 3.2325234413146973, 4.236181259155273, 5.239838600158691, 6.243495941162109, 7.247153282165527, 8.250810623168945, 9.25446891784668, 10.258125305175781, 11.261783599853516, 12.265440940856934, 13.269098281860352, 14.27275562286377, 15.276412963867188, 16.280071258544922, 17.283727645874023, 18.287385940551758, 19.29104232788086, 20.294700622558594, 21.298358917236328, 22.30201530456543, 23.305673599243164, 24.309329986572266, 25.31298828125, 26.3166446685791, 27.320302963256836, 28.323959350585938, 29.327617645263672, 30.331275939941406, 31.33493423461914, 32.338592529296875, 33.342247009277344, 34.34590530395508, 35.34956359863281, 36.35322189331055, 37.35688018798828, 38.36053466796875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 1.0, 5.0, 6.0, 5.0, 5.0, 10.0, 6.0, 10.0, 15.0, 23.0, 30.0, 40.0, 61.0, 116.0, 168.0, 363.0, 707.0, 1641.0, 5440.0, 37384.0, 4027779.0, 106448.0, 9997.0, 2395.0, 838.0, 352.0, 205.0, 99.0, 59.0, 21.0, 25.0, 17.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.8203125, -9.578857421875, -9.33740234375, -9.095947265625, -8.8544921875, -8.613037109375, -8.37158203125, -8.130126953125, -7.888671875, -7.647216796875, -7.40576171875, -7.164306640625, -6.9228515625, -6.681396484375, -6.43994140625, -6.198486328125, -5.95703125, -5.715576171875, -5.47412109375, -5.232666015625, -4.9912109375, -4.749755859375, -4.50830078125, -4.266845703125, -4.025390625, -3.783935546875, -3.54248046875, -3.301025390625, -3.0595703125, -2.818115234375, -2.57666015625, -2.335205078125, -2.09375, -1.852294921875, -1.61083984375, -1.369384765625, -1.1279296875, -0.886474609375, -0.64501953125, -0.403564453125, -0.162109375, 0.079345703125, 0.32080078125, 0.562255859375, 0.8037109375, 1.045166015625, 1.28662109375, 1.528076171875, 1.76953125, 2.010986328125, 2.25244140625, 2.493896484375, 2.7353515625, 2.976806640625, 3.21826171875, 3.459716796875, 3.701171875, 3.942626953125, 4.18408203125, 4.425537109375, 4.6669921875, 4.908447265625, 5.14990234375, 5.391357421875, 5.6328125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 2.0, 9.0, 15.0, 33.0, 47.0, 62.0, 105.0, 111.0, 116.0, 117.0, 124.0, 83.0, 65.0, 49.0, 21.0, 21.0, 15.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40625, -2.3409576416015625, -2.275665283203125, -2.2103729248046875, -2.14508056640625, -2.0797882080078125, -2.014495849609375, -1.9492034912109375, -1.8839111328125, -1.8186187744140625, -1.753326416015625, -1.6880340576171875, -1.62274169921875, -1.5574493408203125, -1.492156982421875, -1.4268646240234375, -1.361572265625, -1.2962799072265625, -1.230987548828125, -1.1656951904296875, -1.10040283203125, -1.0351104736328125, -0.969818115234375, -0.9045257568359375, -0.8392333984375, -0.7739410400390625, -0.708648681640625, -0.6433563232421875, -0.57806396484375, -0.5127716064453125, -0.447479248046875, -0.3821868896484375, -0.31689453125, -0.2516021728515625, -0.186309814453125, -0.1210174560546875, -0.05572509765625, 0.0095672607421875, 0.074859619140625, 0.1401519775390625, 0.2054443359375, 0.2707366943359375, 0.336029052734375, 0.4013214111328125, 0.46661376953125, 0.5319061279296875, 0.597198486328125, 0.6624908447265625, 0.727783203125, 0.7930755615234375, 0.858367919921875, 0.9236602783203125, 0.98895263671875, 1.0542449951171875, 1.119537353515625, 1.1848297119140625, 1.2501220703125, 1.3154144287109375, 1.380706787109375, 1.4459991455078125, 1.51129150390625, 1.5765838623046875, 1.641876220703125, 1.7071685791015625, 1.7724609375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 3.0, 11.0, 11.0, 19.0, 25.0, 44.0, 80.0, 131.0, 239.0, 609.0, 1385.0, 4407.0, 21766.0, 3003017.0, 1135343.0, 20454.0, 4328.0, 1252.0, 514.0, 291.0, 136.0, 80.0, 45.0, 39.0, 17.0, 17.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.3515625, -6.086669921875, -5.82177734375, -5.556884765625, -5.2919921875, -5.027099609375, -4.76220703125, -4.497314453125, -4.232421875, -3.967529296875, -3.70263671875, -3.437744140625, -3.1728515625, -2.907958984375, -2.64306640625, -2.378173828125, -2.11328125, -1.848388671875, -1.58349609375, -1.318603515625, -1.0537109375, -0.788818359375, -0.52392578125, -0.259033203125, 0.005859375, 0.270751953125, 0.53564453125, 0.800537109375, 1.0654296875, 1.330322265625, 1.59521484375, 1.860107421875, 2.125, 2.389892578125, 2.65478515625, 2.919677734375, 3.1845703125, 3.449462890625, 3.71435546875, 3.979248046875, 4.244140625, 4.509033203125, 4.77392578125, 5.038818359375, 5.3037109375, 5.568603515625, 5.83349609375, 6.098388671875, 6.36328125, 6.628173828125, 6.89306640625, 7.157958984375, 7.4228515625, 7.687744140625, 7.95263671875, 8.217529296875, 8.482421875, 8.747314453125, 9.01220703125, 9.277099609375, 9.5419921875, 9.806884765625, 10.07177734375, 10.336669921875, 10.6015625]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 2.0, 2.0, 4.0, 8.0, 9.0, 12.0, 26.0, 58.0, 115.0, 567.0, 2839.0, 242.0, 87.0, 46.0, 18.0, 12.0, 7.0, 8.0, 6.0, 5.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.564453125, -2.4630126953125, -2.361572265625, -2.2601318359375, -2.15869140625, -2.0572509765625, -1.955810546875, -1.8543701171875, -1.7529296875, -1.6514892578125, -1.550048828125, -1.4486083984375, -1.34716796875, -1.2457275390625, -1.144287109375, -1.0428466796875, -0.94140625, -0.8399658203125, -0.738525390625, -0.6370849609375, -0.53564453125, -0.4342041015625, -0.332763671875, -0.2313232421875, -0.1298828125, -0.0284423828125, 0.072998046875, 0.1744384765625, 0.27587890625, 0.3773193359375, 0.478759765625, 0.5802001953125, 0.681640625, 0.7830810546875, 0.884521484375, 0.9859619140625, 1.08740234375, 1.1888427734375, 1.290283203125, 1.3917236328125, 1.4931640625, 1.5946044921875, 1.696044921875, 1.7974853515625, 1.89892578125, 2.0003662109375, 2.101806640625, 2.2032470703125, 2.3046875, 2.4061279296875, 2.507568359375, 2.6090087890625, 2.71044921875, 2.8118896484375, 2.913330078125, 3.0147705078125, 3.1162109375, 3.2176513671875, 3.319091796875, 3.4205322265625, 3.52197265625, 3.6234130859375, 3.724853515625, 3.8262939453125, 3.927734375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 11.0, 104.0, 598.0, 253.0, 40.0, 6.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.666475296020508, -16.371662139892578, -15.076849937438965, -13.782037734985352, -12.487224578857422, -11.192411422729492, -9.897599220275879, -8.602787017822266, -7.307973861694336, -6.0131611824035645, -4.718348503112793, -3.4235358238220215, -2.12872314453125, -0.8339104652404785, 0.46090221405029297, 1.7557144165039062, 3.050527572631836, 4.345340251922607, 5.640152931213379, 6.93496561050415, 8.229778289794922, 9.524591445922852, 10.819403648376465, 12.114215850830078, 13.409029006958008, 14.703842163085938, 15.99865436553955, 17.293466567993164, 18.588279724121094, 19.883092880249023, 21.177906036376953, 22.47271728515625, 23.767532348632812, 25.062345504760742, 26.357158660888672, 27.65196990966797, 28.9467830657959, 30.241596221923828, 31.536407470703125, 32.83122253417969, 34.126033782958984, 35.42084503173828, 36.715660095214844, 38.01047134399414, 39.30528259277344, 40.60009765625, 41.8949089050293, 43.189720153808594, 44.484535217285156, 45.77934646606445, 47.074161529541016, 48.36897277832031, 49.663787841796875, 50.95859909057617, 52.25341033935547, 53.54822540283203, 54.84303665161133, 56.137847900390625, 57.43266296386719, 58.727474212646484, 60.02228546142578, 61.317100524902344, 62.61191177368164, 63.90672302246094, 65.2015380859375]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 1.0, 3.0, 9.0, 10.0, 14.0, 19.0, 7.0, 16.0, 17.0, 21.0, 17.0, 25.0, 23.0, 26.0, 30.0, 21.0, 41.0, 31.0, 31.0, 46.0, 36.0, 35.0, 40.0, 36.0, 35.0, 37.0, 30.0, 39.0, 42.0, 29.0, 34.0, 28.0, 23.0, 17.0, 21.0, 26.0, 16.0, 11.0, 8.0, 8.0, 8.0, 4.0, 8.0, 5.0, 5.0, 4.0, 5.0, 2.0, 3.0, 3.0, 0.0, 3.0], "bins": [-5.686957359313965, -5.52431058883667, -5.361663341522217, -5.199016571044922, -5.036369800567627, -4.873723030090332, -4.711075782775879, -4.548429012298584, -4.385782241821289, -4.223135471343994, -4.060488224029541, -3.897841453552246, -3.735194683074951, -3.572547674179077, -3.409900665283203, -3.247253894805908, -3.084606647491455, -2.921959638595581, -2.759312868118286, -2.596665859222412, -2.434019088745117, -2.271372079849243, -2.108725070953369, -1.9460781812667847, -1.7834312915802002, -1.6207844018936157, -1.4581375122070312, -1.2954905033111572, -1.1328436136245728, -0.9701967239379883, -0.807549774646759, -0.6449028253555298, -0.4822559356689453, -0.31960901618003845, -0.1569620966911316, 0.0056848227977752686, 0.16833174228668213, 0.3309786319732666, 0.49362558126449585, 0.6562725305557251, 0.8189194202423096, 0.981566309928894, 1.1442131996154785, 1.3068602085113525, 1.469507098197937, 1.6321539878845215, 1.7948009967803955, 1.95744788646698, 2.1200947761535645, 2.2827417850494385, 2.4453885555267334, 2.6080355644226074, 2.7706823348999023, 2.9333293437957764, 3.0959763526916504, 3.2586231231689453, 3.4212701320648193, 3.5839171409606934, 3.7465639114379883, 3.9092109203338623, 4.071857929229736, 4.234504699707031, 4.397151470184326, 4.559798717498779, 4.722445487976074]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 5.0, 3.0, 7.0, 4.0, 9.0, 8.0, 18.0, 20.0, 27.0, 33.0, 52.0, 68.0, 90.0, 144.0, 197.0, 347.0, 601.0, 1070.0, 2316.0, 5606.0, 17574.0, 74816.0, 445608.0, 405618.0, 67875.0, 16481.0, 5296.0, 2198.0, 983.0, 525.0, 277.0, 208.0, 136.0, 84.0, 85.0, 43.0, 32.0, 19.0, 16.0, 18.0, 10.0, 7.0, 4.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.44921875, -5.26739501953125, -5.0855712890625, -4.90374755859375, -4.721923828125, -4.54010009765625, -4.3582763671875, -4.17645263671875, -3.99462890625, -3.81280517578125, -3.6309814453125, -3.44915771484375, -3.267333984375, -3.08551025390625, -2.9036865234375, -2.72186279296875, -2.5400390625, -2.35821533203125, -2.1763916015625, -1.99456787109375, -1.812744140625, -1.63092041015625, -1.4490966796875, -1.26727294921875, -1.08544921875, -0.90362548828125, -0.7218017578125, -0.53997802734375, -0.358154296875, -0.17633056640625, 0.0054931640625, 0.18731689453125, 0.369140625, 0.55096435546875, 0.7327880859375, 0.91461181640625, 1.096435546875, 1.27825927734375, 1.4600830078125, 1.64190673828125, 1.82373046875, 2.00555419921875, 2.1873779296875, 2.36920166015625, 2.551025390625, 2.73284912109375, 2.9146728515625, 3.09649658203125, 3.2783203125, 3.46014404296875, 3.6419677734375, 3.82379150390625, 4.005615234375, 4.18743896484375, 4.3692626953125, 4.55108642578125, 4.73291015625, 4.91473388671875, 5.0965576171875, 5.27838134765625, 5.460205078125, 5.64202880859375, 5.8238525390625, 6.00567626953125, 6.1875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 7.0, 7.0, 19.0, 34.0, 44.0, 71.0, 104.0, 93.0, 133.0, 112.0, 100.0, 88.0, 78.0, 36.0, 34.0, 16.0, 18.0, 4.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.41015625, -2.34649658203125, -2.2828369140625, -2.21917724609375, -2.155517578125, -2.09185791015625, -2.0281982421875, -1.96453857421875, -1.90087890625, -1.83721923828125, -1.7735595703125, -1.70989990234375, -1.646240234375, -1.58258056640625, -1.5189208984375, -1.45526123046875, -1.3916015625, -1.32794189453125, -1.2642822265625, -1.20062255859375, -1.136962890625, -1.07330322265625, -1.0096435546875, -0.94598388671875, -0.88232421875, -0.81866455078125, -0.7550048828125, -0.69134521484375, -0.627685546875, -0.56402587890625, -0.5003662109375, -0.43670654296875, -0.373046875, -0.30938720703125, -0.2457275390625, -0.18206787109375, -0.118408203125, -0.05474853515625, 0.0089111328125, 0.07257080078125, 0.13623046875, 0.19989013671875, 0.2635498046875, 0.32720947265625, 0.390869140625, 0.45452880859375, 0.5181884765625, 0.58184814453125, 0.6455078125, 0.70916748046875, 0.7728271484375, 0.83648681640625, 0.900146484375, 0.96380615234375, 1.0274658203125, 1.09112548828125, 1.15478515625, 1.21844482421875, 1.2821044921875, 1.34576416015625, 1.409423828125, 1.47308349609375, 1.5367431640625, 1.60040283203125, 1.6640625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 0.0, 6.0, 3.0, 8.0, 14.0, 11.0, 16.0, 17.0, 29.0, 29.0, 38.0, 54.0, 68.0, 100.0, 126.0, 188.0, 315.0, 546.0, 1033.0, 2043.0, 4481.0, 11827.0, 34421.0, 126937.0, 502262.0, 269437.0, 61784.0, 19431.0, 7065.0, 2997.0, 1331.0, 665.0, 353.0, 258.0, 179.0, 131.0, 82.0, 66.0, 49.0, 43.0, 27.0, 20.0, 17.0, 12.0, 11.0, 8.0, 6.0, 8.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.5546875, -4.41119384765625, -4.2677001953125, -4.12420654296875, -3.980712890625, -3.83721923828125, -3.6937255859375, -3.55023193359375, -3.40673828125, -3.26324462890625, -3.1197509765625, -2.97625732421875, -2.832763671875, -2.68927001953125, -2.5457763671875, -2.40228271484375, -2.2587890625, -2.11529541015625, -1.9718017578125, -1.82830810546875, -1.684814453125, -1.54132080078125, -1.3978271484375, -1.25433349609375, -1.11083984375, -0.96734619140625, -0.8238525390625, -0.68035888671875, -0.536865234375, -0.39337158203125, -0.2498779296875, -0.10638427734375, 0.037109375, 0.18060302734375, 0.3240966796875, 0.46759033203125, 0.611083984375, 0.75457763671875, 0.8980712890625, 1.04156494140625, 1.18505859375, 1.32855224609375, 1.4720458984375, 1.61553955078125, 1.759033203125, 1.90252685546875, 2.0460205078125, 2.18951416015625, 2.3330078125, 2.47650146484375, 2.6199951171875, 2.76348876953125, 2.906982421875, 3.05047607421875, 3.1939697265625, 3.33746337890625, 3.48095703125, 3.62445068359375, 3.7679443359375, 3.91143798828125, 4.054931640625, 4.19842529296875, 4.3419189453125, 4.48541259765625, 4.62890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 4.0, 6.0, 8.0, 9.0, 11.0, 7.0, 7.0, 11.0, 17.0, 15.0, 23.0, 36.0, 32.0, 42.0, 37.0, 49.0, 35.0, 48.0, 48.0, 49.0, 39.0, 49.0, 45.0, 50.0, 24.0, 47.0, 37.0, 35.0, 26.0, 17.0, 24.0, 21.0, 13.0, 25.0, 8.0, 9.0, 10.0, 4.0, 6.0, 3.0, 3.0, 5.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-4.68359375, -4.5411376953125, -4.398681640625, -4.2562255859375, -4.11376953125, -3.9713134765625, -3.828857421875, -3.6864013671875, -3.5439453125, -3.4014892578125, -3.259033203125, -3.1165771484375, -2.97412109375, -2.8316650390625, -2.689208984375, -2.5467529296875, -2.404296875, -2.2618408203125, -2.119384765625, -1.9769287109375, -1.83447265625, -1.6920166015625, -1.549560546875, -1.4071044921875, -1.2646484375, -1.1221923828125, -0.979736328125, -0.8372802734375, -0.69482421875, -0.5523681640625, -0.409912109375, -0.2674560546875, -0.125, 0.0174560546875, 0.159912109375, 0.3023681640625, 0.44482421875, 0.5872802734375, 0.729736328125, 0.8721923828125, 1.0146484375, 1.1571044921875, 1.299560546875, 1.4420166015625, 1.58447265625, 1.7269287109375, 1.869384765625, 2.0118408203125, 2.154296875, 2.2967529296875, 2.439208984375, 2.5816650390625, 2.72412109375, 2.8665771484375, 3.009033203125, 3.1514892578125, 3.2939453125, 3.4364013671875, 3.578857421875, 3.7213134765625, 3.86376953125, 4.0062255859375, 4.148681640625, 4.2911376953125, 4.43359375]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 2.0, 6.0, 16.0, 18.0, 20.0, 28.0, 44.0, 75.0, 115.0, 167.0, 288.0, 563.0, 1154.0, 2595.0, 6450.0, 21239.0, 232126.0, 723258.0, 43509.0, 9929.0, 3602.0, 1579.0, 748.0, 374.0, 222.0, 129.0, 110.0, 58.0, 42.0, 26.0, 15.0, 9.0, 4.0, 11.0, 4.0, 3.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0], "bins": [-3.30078125, -3.20428466796875, -3.1077880859375, -3.01129150390625, -2.914794921875, -2.81829833984375, -2.7218017578125, -2.62530517578125, -2.52880859375, -2.43231201171875, -2.3358154296875, -2.23931884765625, -2.142822265625, -2.04632568359375, -1.9498291015625, -1.85333251953125, -1.7568359375, -1.66033935546875, -1.5638427734375, -1.46734619140625, -1.370849609375, -1.27435302734375, -1.1778564453125, -1.08135986328125, -0.98486328125, -0.88836669921875, -0.7918701171875, -0.69537353515625, -0.598876953125, -0.50238037109375, -0.4058837890625, -0.30938720703125, -0.212890625, -0.11639404296875, -0.0198974609375, 0.07659912109375, 0.173095703125, 0.26959228515625, 0.3660888671875, 0.46258544921875, 0.55908203125, 0.65557861328125, 0.7520751953125, 0.84857177734375, 0.945068359375, 1.04156494140625, 1.1380615234375, 1.23455810546875, 1.3310546875, 1.42755126953125, 1.5240478515625, 1.62054443359375, 1.717041015625, 1.81353759765625, 1.9100341796875, 2.00653076171875, 2.10302734375, 2.19952392578125, 2.2960205078125, 2.39251708984375, 2.489013671875, 2.58551025390625, 2.6820068359375, 2.77850341796875, 2.875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 6.0, 7.0, 7.0, 16.0, 28.0, 60.0, 114.0, 177.0, 202.0, 163.0, 108.0, 67.0, 22.0, 16.0, 10.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003464221954345703, -0.00033332034945487976, -0.0003202185034751892, -0.00030711665749549866, -0.0002940148115158081, -0.00028091296553611755, -0.000267811119556427, -0.00025470927357673645, -0.0002416074275970459, -0.00022850558161735535, -0.0002154037356376648, -0.00020230188965797424, -0.0001892000436782837, -0.00017609819769859314, -0.0001629963517189026, -0.00014989450573921204, -0.00013679265975952148, -0.00012369081377983093, -0.00011058896780014038, -9.748712182044983e-05, -8.438527584075928e-05, -7.128342986106873e-05, -5.8181583881378174e-05, -4.507973790168762e-05, -3.197789192199707e-05, -1.887604594230652e-05, -5.774199962615967e-06, 7.327646017074585e-06, 2.0429491996765137e-05, 3.353133797645569e-05, 4.663318395614624e-05, 5.973502993583679e-05, 7.283687591552734e-05, 8.59387218952179e-05, 9.904056787490845e-05, 0.000112142413854599, 0.00012524425983428955, 0.0001383461058139801, 0.00015144795179367065, 0.0001645497977733612, 0.00017765164375305176, 0.0001907534897327423, 0.00020385533571243286, 0.0002169571816921234, 0.00023005902767181396, 0.00024316087365150452, 0.00025626271963119507, 0.0002693645656108856, 0.00028246641159057617, 0.0002955682575702667, 0.0003086701035499573, 0.00032177194952964783, 0.0003348737955093384, 0.00034797564148902893, 0.0003610774874687195, 0.00037417933344841003, 0.0003872811794281006, 0.00040038302540779114, 0.0004134848713874817, 0.00042658671736717224, 0.0004396885633468628, 0.00045279040932655334, 0.0004658922553062439, 0.00047899410128593445, 0.000492095947265625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 12.0, 16.0, 16.0, 20.0, 31.0, 25.0, 46.0, 72.0, 133.0, 237.0, 524.0, 1205.0, 2924.0, 8318.0, 36486.0, 444259.0, 499798.0, 40095.0, 8729.0, 3121.0, 1191.0, 583.0, 274.0, 139.0, 74.0, 64.0, 41.0, 37.0, 13.0, 10.0, 12.0, 10.0, 8.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.509765625, -2.431396484375, -2.35302734375, -2.274658203125, -2.1962890625, -2.117919921875, -2.03955078125, -1.961181640625, -1.8828125, -1.804443359375, -1.72607421875, -1.647705078125, -1.5693359375, -1.490966796875, -1.41259765625, -1.334228515625, -1.255859375, -1.177490234375, -1.09912109375, -1.020751953125, -0.9423828125, -0.864013671875, -0.78564453125, -0.707275390625, -0.62890625, -0.550537109375, -0.47216796875, -0.393798828125, -0.3154296875, -0.237060546875, -0.15869140625, -0.080322265625, -0.001953125, 0.076416015625, 0.15478515625, 0.233154296875, 0.3115234375, 0.389892578125, 0.46826171875, 0.546630859375, 0.625, 0.703369140625, 0.78173828125, 0.860107421875, 0.9384765625, 1.016845703125, 1.09521484375, 1.173583984375, 1.251953125, 1.330322265625, 1.40869140625, 1.487060546875, 1.5654296875, 1.643798828125, 1.72216796875, 1.800537109375, 1.87890625, 1.957275390625, 2.03564453125, 2.114013671875, 2.1923828125, 2.270751953125, 2.34912109375, 2.427490234375, 2.505859375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 3.0, 4.0, 4.0, 8.0, 7.0, 5.0, 10.0, 11.0, 16.0, 20.0, 35.0, 51.0, 66.0, 88.0, 98.0, 108.0, 110.0, 92.0, 60.0, 42.0, 45.0, 25.0, 27.0, 16.0, 9.0, 7.0, 7.0, 4.0, 3.0, 1.0, 2.0, 1.0, 3.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.6962890625, -1.638824462890625, -1.58135986328125, -1.523895263671875, -1.4664306640625, -1.408966064453125, -1.35150146484375, -1.294036865234375, -1.236572265625, -1.179107666015625, -1.12164306640625, -1.064178466796875, -1.0067138671875, -0.949249267578125, -0.89178466796875, -0.834320068359375, -0.77685546875, -0.719390869140625, -0.66192626953125, -0.604461669921875, -0.5469970703125, -0.489532470703125, -0.43206787109375, -0.374603271484375, -0.317138671875, -0.259674072265625, -0.20220947265625, -0.144744873046875, -0.0872802734375, -0.029815673828125, 0.02764892578125, 0.085113525390625, 0.142578125, 0.200042724609375, 0.25750732421875, 0.314971923828125, 0.3724365234375, 0.429901123046875, 0.48736572265625, 0.544830322265625, 0.602294921875, 0.659759521484375, 0.71722412109375, 0.774688720703125, 0.8321533203125, 0.889617919921875, 0.94708251953125, 1.004547119140625, 1.06201171875, 1.119476318359375, 1.17694091796875, 1.234405517578125, 1.2918701171875, 1.349334716796875, 1.40679931640625, 1.464263916015625, 1.521728515625, 1.579193115234375, 1.63665771484375, 1.694122314453125, 1.7515869140625, 1.809051513671875, 1.86651611328125, 1.923980712890625, 1.9814453125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 5.0, 6.0, 20.0, 31.0, 40.0, 62.0, 113.0, 145.0, 196.0, 167.0, 83.0, 54.0, 29.0, 23.0, 16.0, 3.0, 7.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.765317916870117, -24.51405906677246, -23.262798309326172, -22.011539459228516, -20.760278701782227, -19.50901985168457, -18.25775909423828, -17.006500244140625, -15.755240440368652, -14.50398063659668, -13.252720832824707, -12.001461029052734, -10.750202178955078, -9.498941421508789, -8.247682571411133, -6.99642276763916, -5.7451629638671875, -4.493903160095215, -3.2426435947418213, -1.9913840293884277, -0.7401242256164551, 0.5111355781555176, 1.762394905090332, 3.0136547088623047, 4.264914512634277, 5.51617431640625, 6.767434120178223, 8.018693923950195, 9.269952774047852, 10.52121353149414, 11.772472381591797, 13.02373218536377, 14.27499008178711, 15.526249885559082, 16.777509689331055, 18.02876853942871, 19.280029296875, 20.531288146972656, 21.782546997070312, 23.0338077545166, 24.28506851196289, 25.536327362060547, 26.787588119506836, 28.038846969604492, 29.29010772705078, 30.541366577148438, 31.792625427246094, 33.04388427734375, 34.295143127441406, 35.54640197753906, 36.79766082763672, 38.04892349243164, 39.3001823425293, 40.55144119262695, 41.80270004272461, 43.05396270751953, 44.30522155761719, 45.556480407714844, 46.8077392578125, 48.05900192260742, 49.31026077270508, 50.561519622802734, 51.81277847290039, 53.06404113769531, 54.31529998779297]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 4.0, 8.0, 8.0, 10.0, 14.0, 17.0, 18.0, 14.0, 27.0, 26.0, 27.0, 25.0, 39.0, 33.0, 45.0, 51.0, 54.0, 57.0, 55.0, 49.0, 53.0, 57.0, 42.0, 37.0, 29.0, 38.0, 27.0, 24.0, 15.0, 23.0, 20.0, 12.0, 15.0, 6.0, 8.0, 4.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.067604064941406, -26.041175842285156, -25.014747619628906, -23.988319396972656, -22.961891174316406, -21.935462951660156, -20.909034729003906, -19.882606506347656, -18.856178283691406, -17.829750061035156, -16.803321838378906, -15.776893615722656, -14.750465393066406, -13.724037170410156, -12.697608947753906, -11.671180725097656, -10.644752502441406, -9.618324279785156, -8.591896057128906, -7.565467834472656, -6.539039611816406, -5.512611389160156, -4.486183166503906, -3.4597549438476562, -2.4333267211914062, -1.4068984985351562, -0.38047027587890625, 0.6459579467773438, 1.6723861694335938, 2.6988143920898438, 3.7252426147460938, 4.751670837402344, 5.778102874755859, 6.804531097412109, 7.830959320068359, 8.85738754272461, 9.88381576538086, 10.91024398803711, 11.93667221069336, 12.96310043334961, 13.98952865600586, 15.01595687866211, 16.04238510131836, 17.06881332397461, 18.09524154663086, 19.12166976928711, 20.14809799194336, 21.17452621459961, 22.20095443725586, 23.22738265991211, 24.25381088256836, 25.28023910522461, 26.30666732788086, 27.33309555053711, 28.35952377319336, 29.38595199584961, 30.41238021850586, 31.43880844116211, 32.46523666381836, 33.49166488647461, 34.51809310913086, 35.54452133178711, 36.57094955444336, 37.59737777709961, 38.62380599975586]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 6.0, 5.0, 4.0, 8.0, 3.0, 10.0, 16.0, 23.0, 26.0, 24.0, 35.0, 77.0, 140.0, 222.0, 410.0, 878.0, 1981.0, 5985.0, 34261.0, 3962197.0, 168029.0, 13859.0, 3402.0, 1333.0, 631.0, 342.0, 159.0, 92.0, 46.0, 19.0, 18.0, 7.0, 9.0, 6.0, 6.0, 1.0, 3.0, 6.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.71875, -8.46795654296875, -8.2171630859375, -7.96636962890625, -7.715576171875, -7.46478271484375, -7.2139892578125, -6.96319580078125, -6.71240234375, -6.46160888671875, -6.2108154296875, -5.96002197265625, -5.709228515625, -5.45843505859375, -5.2076416015625, -4.95684814453125, -4.7060546875, -4.45526123046875, -4.2044677734375, -3.95367431640625, -3.702880859375, -3.45208740234375, -3.2012939453125, -2.95050048828125, -2.69970703125, -2.44891357421875, -2.1981201171875, -1.94732666015625, -1.696533203125, -1.44573974609375, -1.1949462890625, -0.94415283203125, -0.693359375, -0.44256591796875, -0.1917724609375, 0.05902099609375, 0.309814453125, 0.56060791015625, 0.8114013671875, 1.06219482421875, 1.31298828125, 1.56378173828125, 1.8145751953125, 2.06536865234375, 2.316162109375, 2.56695556640625, 2.8177490234375, 3.06854248046875, 3.3193359375, 3.57012939453125, 3.8209228515625, 4.07171630859375, 4.322509765625, 4.57330322265625, 4.8240966796875, 5.07489013671875, 5.32568359375, 5.57647705078125, 5.8272705078125, 6.07806396484375, 6.328857421875, 6.57965087890625, 6.8304443359375, 7.08123779296875, 7.33203125]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 5.0, 6.0, 13.0, 18.0, 31.0, 52.0, 76.0, 88.0, 95.0, 102.0, 128.0, 110.0, 91.0, 64.0, 46.0, 32.0, 26.0, 13.0, 6.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6171875, -2.54229736328125, -2.4674072265625, -2.39251708984375, -2.317626953125, -2.24273681640625, -2.1678466796875, -2.09295654296875, -2.01806640625, -1.94317626953125, -1.8682861328125, -1.79339599609375, -1.718505859375, -1.64361572265625, -1.5687255859375, -1.49383544921875, -1.4189453125, -1.34405517578125, -1.2691650390625, -1.19427490234375, -1.119384765625, -1.04449462890625, -0.9696044921875, -0.89471435546875, -0.81982421875, -0.74493408203125, -0.6700439453125, -0.59515380859375, -0.520263671875, -0.44537353515625, -0.3704833984375, -0.29559326171875, -0.220703125, -0.14581298828125, -0.0709228515625, 0.00396728515625, 0.078857421875, 0.15374755859375, 0.2286376953125, 0.30352783203125, 0.37841796875, 0.45330810546875, 0.5281982421875, 0.60308837890625, 0.677978515625, 0.75286865234375, 0.8277587890625, 0.90264892578125, 0.9775390625, 1.05242919921875, 1.1273193359375, 1.20220947265625, 1.277099609375, 1.35198974609375, 1.4268798828125, 1.50177001953125, 1.57666015625, 1.65155029296875, 1.7264404296875, 1.80133056640625, 1.876220703125, 1.95111083984375, 2.0260009765625, 2.10089111328125, 2.17578125]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 5.0, 2.0, 7.0, 7.0, 12.0, 19.0, 25.0, 36.0, 64.0, 94.0, 150.0, 259.0, 348.0, 594.0, 1019.0, 1886.0, 3569.0, 8299.0, 24831.0, 140795.0, 3789540.0, 176475.0, 28283.0, 9179.0, 3959.0, 1999.0, 1079.0, 599.0, 424.0, 261.0, 154.0, 110.0, 60.0, 51.0, 31.0, 29.0, 18.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.15625, -4.00537109375, -3.8544921875, -3.70361328125, -3.552734375, -3.40185546875, -3.2509765625, -3.10009765625, -2.94921875, -2.79833984375, -2.6474609375, -2.49658203125, -2.345703125, -2.19482421875, -2.0439453125, -1.89306640625, -1.7421875, -1.59130859375, -1.4404296875, -1.28955078125, -1.138671875, -0.98779296875, -0.8369140625, -0.68603515625, -0.53515625, -0.38427734375, -0.2333984375, -0.08251953125, 0.068359375, 0.21923828125, 0.3701171875, 0.52099609375, 0.671875, 0.82275390625, 0.9736328125, 1.12451171875, 1.275390625, 1.42626953125, 1.5771484375, 1.72802734375, 1.87890625, 2.02978515625, 2.1806640625, 2.33154296875, 2.482421875, 2.63330078125, 2.7841796875, 2.93505859375, 3.0859375, 3.23681640625, 3.3876953125, 3.53857421875, 3.689453125, 3.84033203125, 3.9912109375, 4.14208984375, 4.29296875, 4.44384765625, 4.5947265625, 4.74560546875, 4.896484375, 5.04736328125, 5.1982421875, 5.34912109375, 5.5]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 8.0, 0.0, 7.0, 11.0, 15.0, 22.0, 39.0, 49.0, 127.0, 279.0, 2379.0, 759.0, 163.0, 70.0, 48.0, 23.0, 20.0, 12.0, 8.0, 6.0, 4.0, 4.0, 5.0, 2.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.658203125, -2.56903076171875, -2.4798583984375, -2.39068603515625, -2.301513671875, -2.21234130859375, -2.1231689453125, -2.03399658203125, -1.94482421875, -1.85565185546875, -1.7664794921875, -1.67730712890625, -1.588134765625, -1.49896240234375, -1.4097900390625, -1.32061767578125, -1.2314453125, -1.14227294921875, -1.0531005859375, -0.96392822265625, -0.874755859375, -0.78558349609375, -0.6964111328125, -0.60723876953125, -0.51806640625, -0.42889404296875, -0.3397216796875, -0.25054931640625, -0.161376953125, -0.07220458984375, 0.0169677734375, 0.10614013671875, 0.1953125, 0.28448486328125, 0.3736572265625, 0.46282958984375, 0.552001953125, 0.64117431640625, 0.7303466796875, 0.81951904296875, 0.90869140625, 0.99786376953125, 1.0870361328125, 1.17620849609375, 1.265380859375, 1.35455322265625, 1.4437255859375, 1.53289794921875, 1.6220703125, 1.71124267578125, 1.8004150390625, 1.88958740234375, 1.978759765625, 2.06793212890625, 2.1571044921875, 2.24627685546875, 2.33544921875, 2.42462158203125, 2.5137939453125, 2.60296630859375, 2.692138671875, 2.78131103515625, 2.8704833984375, 2.95965576171875, 3.048828125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 19.0, 92.0, 414.0, 391.0, 67.0, 19.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.033733367919922, -20.808725357055664, -19.58371925354004, -18.35871124267578, -17.133705139160156, -15.908697128295898, -14.68368911743164, -13.4586820602417, -12.233675003051758, -11.008667945861816, -9.783660888671875, -8.558652877807617, -7.333645820617676, -6.108638763427734, -4.883631229400635, -3.658623695373535, -2.4336166381835938, -1.2086093425750732, 0.016397953033447266, 1.2414052486419678, 2.4664125442504883, 3.6914196014404297, 4.916427135467529, 6.141434669494629, 7.36644172668457, 8.591448783874512, 9.816455841064453, 11.041463851928711, 12.266470909118652, 13.491477966308594, 14.716485977172852, 15.941493034362793, 17.16650390625, 18.391511917114258, 19.616518020629883, 20.84152603149414, 22.066532135009766, 23.291540145874023, 24.51654815673828, 25.741554260253906, 26.966562271118164, 28.191570281982422, 29.416576385498047, 30.641584396362305, 31.866592407226562, 33.09159851074219, 34.31660461425781, 35.5416145324707, 36.76662063598633, 37.99162673950195, 39.216636657714844, 40.44164276123047, 41.666648864746094, 42.89165496826172, 44.11666488647461, 45.341670989990234, 46.566680908203125, 47.79168701171875, 49.01669692993164, 50.241703033447266, 51.46670913696289, 52.69171905517578, 53.916725158691406, 55.14173126220703, 56.366737365722656]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 5.0, 7.0, 9.0, 5.0, 14.0, 10.0, 15.0, 32.0, 36.0, 29.0, 33.0, 45.0, 43.0, 54.0, 59.0, 65.0, 69.0, 55.0, 65.0, 51.0, 45.0, 45.0, 44.0, 33.0, 40.0, 35.0, 16.0, 17.0, 6.0, 7.0, 5.0, 4.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.296586990356445, -8.014235496520996, -7.731884002685547, -7.449532985687256, -7.167181491851807, -6.884829998016357, -6.602478981018066, -6.320127487182617, -6.037775993347168, -5.755424499511719, -5.4730730056762695, -5.1907219886779785, -4.908370494842529, -4.62601900100708, -4.343667984008789, -4.06131649017334, -3.7789649963378906, -3.4966135025024414, -3.2142622470855713, -2.931910991668701, -2.649559497833252, -2.3672080039978027, -2.0848567485809326, -1.802505373954773, -1.5201539993286133, -1.2378026247024536, -0.955451250076294, -0.6730998754501343, -0.3907485008239746, -0.10839712619781494, 0.17395424842834473, 0.4563056230545044, 0.7386579513549805, 1.0210093259811401, 1.3033607006072998, 1.5857120752334595, 1.8680634498596191, 2.1504149436950684, 2.4327661991119385, 2.7151174545288086, 2.997468948364258, 3.279820442199707, 3.562171697616577, 3.8445229530334473, 4.1268744468688965, 4.409225940704346, 4.691576957702637, 4.973928451538086, 5.256279945373535, 5.538631439208984, 5.820982933044434, 6.103333950042725, 6.385685443878174, 6.668036937713623, 6.950387954711914, 7.232739448547363, 7.5150909423828125, 7.797442436218262, 8.079793930053711, 8.36214542388916, 8.64449691772461, 8.926847457885742, 9.209198951721191, 9.49155044555664, 9.77390193939209]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 6.0, 4.0, 9.0, 10.0, 10.0, 17.0, 24.0, 30.0, 46.0, 54.0, 66.0, 128.0, 204.0, 291.0, 567.0, 1123.0, 2620.0, 7264.0, 24773.0, 128883.0, 739217.0, 109442.0, 22064.0, 6711.0, 2491.0, 1092.0, 528.0, 296.0, 182.0, 111.0, 75.0, 50.0, 43.0, 35.0, 14.0, 22.0, 13.0, 6.0, 4.0, 10.0, 7.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-6.37890625, -6.16949462890625, -5.9600830078125, -5.75067138671875, -5.541259765625, -5.33184814453125, -5.1224365234375, -4.91302490234375, -4.70361328125, -4.49420166015625, -4.2847900390625, -4.07537841796875, -3.865966796875, -3.65655517578125, -3.4471435546875, -3.23773193359375, -3.0283203125, -2.81890869140625, -2.6094970703125, -2.40008544921875, -2.190673828125, -1.98126220703125, -1.7718505859375, -1.56243896484375, -1.35302734375, -1.14361572265625, -0.9342041015625, -0.72479248046875, -0.515380859375, -0.30596923828125, -0.0965576171875, 0.11285400390625, 0.322265625, 0.53167724609375, 0.7410888671875, 0.95050048828125, 1.159912109375, 1.36932373046875, 1.5787353515625, 1.78814697265625, 1.99755859375, 2.20697021484375, 2.4163818359375, 2.62579345703125, 2.835205078125, 3.04461669921875, 3.2540283203125, 3.46343994140625, 3.6728515625, 3.88226318359375, 4.0916748046875, 4.30108642578125, 4.510498046875, 4.71990966796875, 4.9293212890625, 5.13873291015625, 5.34814453125, 5.55755615234375, 5.7669677734375, 5.97637939453125, 6.185791015625, 6.39520263671875, 6.6046142578125, 6.81402587890625, 7.0234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 15.0, 20.0, 47.0, 64.0, 73.0, 93.0, 130.0, 123.0, 126.0, 85.0, 80.0, 55.0, 26.0, 33.0, 10.0, 9.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.669921875, -2.592041015625, -2.51416015625, -2.436279296875, -2.3583984375, -2.280517578125, -2.20263671875, -2.124755859375, -2.046875, -1.968994140625, -1.89111328125, -1.813232421875, -1.7353515625, -1.657470703125, -1.57958984375, -1.501708984375, -1.423828125, -1.345947265625, -1.26806640625, -1.190185546875, -1.1123046875, -1.034423828125, -0.95654296875, -0.878662109375, -0.80078125, -0.722900390625, -0.64501953125, -0.567138671875, -0.4892578125, -0.411376953125, -0.33349609375, -0.255615234375, -0.177734375, -0.099853515625, -0.02197265625, 0.055908203125, 0.1337890625, 0.211669921875, 0.28955078125, 0.367431640625, 0.4453125, 0.523193359375, 0.60107421875, 0.678955078125, 0.7568359375, 0.834716796875, 0.91259765625, 0.990478515625, 1.068359375, 1.146240234375, 1.22412109375, 1.302001953125, 1.3798828125, 1.457763671875, 1.53564453125, 1.613525390625, 1.69140625, 1.769287109375, 1.84716796875, 1.925048828125, 2.0029296875, 2.080810546875, 2.15869140625, 2.236572265625, 2.314453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 7.0, 8.0, 11.0, 17.0, 17.0, 18.0, 32.0, 43.0, 71.0, 120.0, 211.0, 354.0, 672.0, 1541.0, 4295.0, 15582.0, 88291.0, 786975.0, 122230.0, 19498.0, 5057.0, 1711.0, 808.0, 400.0, 221.0, 117.0, 77.0, 44.0, 41.0, 25.0, 22.0, 10.0, 8.0, 7.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.22265625, -5.98846435546875, -5.7542724609375, -5.52008056640625, -5.285888671875, -5.05169677734375, -4.8175048828125, -4.58331298828125, -4.34912109375, -4.11492919921875, -3.8807373046875, -3.64654541015625, -3.412353515625, -3.17816162109375, -2.9439697265625, -2.70977783203125, -2.4755859375, -2.24139404296875, -2.0072021484375, -1.77301025390625, -1.538818359375, -1.30462646484375, -1.0704345703125, -0.83624267578125, -0.60205078125, -0.36785888671875, -0.1336669921875, 0.10052490234375, 0.334716796875, 0.56890869140625, 0.8031005859375, 1.03729248046875, 1.271484375, 1.50567626953125, 1.7398681640625, 1.97406005859375, 2.208251953125, 2.44244384765625, 2.6766357421875, 2.91082763671875, 3.14501953125, 3.37921142578125, 3.6134033203125, 3.84759521484375, 4.081787109375, 4.31597900390625, 4.5501708984375, 4.78436279296875, 5.0185546875, 5.25274658203125, 5.4869384765625, 5.72113037109375, 5.955322265625, 6.18951416015625, 6.4237060546875, 6.65789794921875, 6.89208984375, 7.12628173828125, 7.3604736328125, 7.59466552734375, 7.828857421875, 8.06304931640625, 8.2972412109375, 8.53143310546875, 8.765625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 8.0, 11.0, 14.0, 19.0, 17.0, 28.0, 33.0, 36.0, 36.0, 46.0, 56.0, 60.0, 78.0, 82.0, 68.0, 81.0, 61.0, 44.0, 44.0, 45.0, 33.0, 27.0, 18.0, 17.0, 13.0, 6.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.71484375, -5.49835205078125, -5.2818603515625, -5.06536865234375, -4.848876953125, -4.63238525390625, -4.4158935546875, -4.19940185546875, -3.98291015625, -3.76641845703125, -3.5499267578125, -3.33343505859375, -3.116943359375, -2.90045166015625, -2.6839599609375, -2.46746826171875, -2.2509765625, -2.03448486328125, -1.8179931640625, -1.60150146484375, -1.385009765625, -1.16851806640625, -0.9520263671875, -0.73553466796875, -0.51904296875, -0.30255126953125, -0.0860595703125, 0.13043212890625, 0.346923828125, 0.56341552734375, 0.7799072265625, 0.99639892578125, 1.212890625, 1.42938232421875, 1.6458740234375, 1.86236572265625, 2.078857421875, 2.29534912109375, 2.5118408203125, 2.72833251953125, 2.94482421875, 3.16131591796875, 3.3778076171875, 3.59429931640625, 3.810791015625, 4.02728271484375, 4.2437744140625, 4.46026611328125, 4.6767578125, 4.89324951171875, 5.1097412109375, 5.32623291015625, 5.542724609375, 5.75921630859375, 5.9757080078125, 6.19219970703125, 6.40869140625, 6.62518310546875, 6.8416748046875, 7.05816650390625, 7.274658203125, 7.49114990234375, 7.7076416015625, 7.92413330078125, 8.140625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 7.0, 4.0, 7.0, 9.0, 16.0, 32.0, 77.0, 170.0, 461.0, 2336.0, 41966.0, 989578.0, 12017.0, 1289.0, 339.0, 139.0, 55.0, 24.0, 17.0, 5.0, 6.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.265625, -8.04998779296875, -7.8343505859375, -7.61871337890625, -7.403076171875, -7.18743896484375, -6.9718017578125, -6.75616455078125, -6.54052734375, -6.32489013671875, -6.1092529296875, -5.89361572265625, -5.677978515625, -5.46234130859375, -5.2467041015625, -5.03106689453125, -4.8154296875, -4.59979248046875, -4.3841552734375, -4.16851806640625, -3.952880859375, -3.73724365234375, -3.5216064453125, -3.30596923828125, -3.09033203125, -2.87469482421875, -2.6590576171875, -2.44342041015625, -2.227783203125, -2.01214599609375, -1.7965087890625, -1.58087158203125, -1.365234375, -1.14959716796875, -0.9339599609375, -0.71832275390625, -0.502685546875, -0.28704833984375, -0.0714111328125, 0.14422607421875, 0.35986328125, 0.57550048828125, 0.7911376953125, 1.00677490234375, 1.222412109375, 1.43804931640625, 1.6536865234375, 1.86932373046875, 2.0849609375, 2.30059814453125, 2.5162353515625, 2.73187255859375, 2.947509765625, 3.16314697265625, 3.3787841796875, 3.59442138671875, 3.81005859375, 4.02569580078125, 4.2413330078125, 4.45697021484375, 4.672607421875, 4.88824462890625, 5.1038818359375, 5.31951904296875, 5.53515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 4.0, 3.0, 5.0, 7.0, 6.0, 7.0, 20.0, 28.0, 33.0, 42.0, 103.0, 201.0, 238.0, 118.0, 61.0, 40.0, 22.0, 27.0, 8.0, 8.0, 8.0, 7.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00027370452880859375, -0.00026428326964378357, -0.0002548620104789734, -0.0002454407513141632, -0.00023601949214935303, -0.00022659823298454285, -0.00021717697381973267, -0.00020775571465492249, -0.0001983344554901123, -0.00018891319632530212, -0.00017949193716049194, -0.00017007067799568176, -0.00016064941883087158, -0.0001512281596660614, -0.00014180690050125122, -0.00013238564133644104, -0.00012296438217163086, -0.00011354312300682068, -0.0001041218638420105, -9.470060467720032e-05, -8.527934551239014e-05, -7.585808634757996e-05, -6.643682718276978e-05, -5.7015568017959595e-05, -4.7594308853149414e-05, -3.8173049688339233e-05, -2.8751790523529053e-05, -1.9330531358718872e-05, -9.909272193908691e-06, -4.880130290985107e-07, 8.93324613571167e-06, 1.835450530052185e-05, 2.777576446533203e-05, 3.719702363014221e-05, 4.661828279495239e-05, 5.603954195976257e-05, 6.546080112457275e-05, 7.488206028938293e-05, 8.430331945419312e-05, 9.37245786190033e-05, 0.00010314583778381348, 0.00011256709694862366, 0.00012198835611343384, 0.00013140961527824402, 0.0001408308744430542, 0.00015025213360786438, 0.00015967339277267456, 0.00016909465193748474, 0.00017851591110229492, 0.0001879371702671051, 0.00019735842943191528, 0.00020677968859672546, 0.00021620094776153564, 0.00022562220692634583, 0.000235043466091156, 0.0002444647252559662, 0.00025388598442077637, 0.00026330724358558655, 0.00027272850275039673, 0.0002821497619152069, 0.0002915710210800171, 0.00030099228024482727, 0.00031041353940963745, 0.00031983479857444763, 0.0003292560577392578]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 20.0, 31.0, 66.0, 136.0, 234.0, 574.0, 5153.0, 906893.0, 131955.0, 2583.0, 477.0, 189.0, 94.0, 64.0, 40.0, 18.0, 7.0, 9.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.234375, -6.98388671875, -6.7333984375, -6.48291015625, -6.232421875, -5.98193359375, -5.7314453125, -5.48095703125, -5.23046875, -4.97998046875, -4.7294921875, -4.47900390625, -4.228515625, -3.97802734375, -3.7275390625, -3.47705078125, -3.2265625, -2.97607421875, -2.7255859375, -2.47509765625, -2.224609375, -1.97412109375, -1.7236328125, -1.47314453125, -1.22265625, -0.97216796875, -0.7216796875, -0.47119140625, -0.220703125, 0.02978515625, 0.2802734375, 0.53076171875, 0.78125, 1.03173828125, 1.2822265625, 1.53271484375, 1.783203125, 2.03369140625, 2.2841796875, 2.53466796875, 2.78515625, 3.03564453125, 3.2861328125, 3.53662109375, 3.787109375, 4.03759765625, 4.2880859375, 4.53857421875, 4.7890625, 5.03955078125, 5.2900390625, 5.54052734375, 5.791015625, 6.04150390625, 6.2919921875, 6.54248046875, 6.79296875, 7.04345703125, 7.2939453125, 7.54443359375, 7.794921875, 8.04541015625, 8.2958984375, 8.54638671875, 8.796875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 12.0, 34.0, 51.0, 142.0, 564.0, 102.0, 48.0, 21.0, 14.0, 5.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3984375, -5.22113037109375, -5.0438232421875, -4.86651611328125, -4.689208984375, -4.51190185546875, -4.3345947265625, -4.15728759765625, -3.97998046875, -3.80267333984375, -3.6253662109375, -3.44805908203125, -3.270751953125, -3.09344482421875, -2.9161376953125, -2.73883056640625, -2.5615234375, -2.38421630859375, -2.2069091796875, -2.02960205078125, -1.852294921875, -1.67498779296875, -1.4976806640625, -1.32037353515625, -1.14306640625, -0.96575927734375, -0.7884521484375, -0.61114501953125, -0.433837890625, -0.25653076171875, -0.0792236328125, 0.09808349609375, 0.275390625, 0.45269775390625, 0.6300048828125, 0.80731201171875, 0.984619140625, 1.16192626953125, 1.3392333984375, 1.51654052734375, 1.69384765625, 1.87115478515625, 2.0484619140625, 2.22576904296875, 2.403076171875, 2.58038330078125, 2.7576904296875, 2.93499755859375, 3.1123046875, 3.28961181640625, 3.4669189453125, 3.64422607421875, 3.821533203125, 3.99884033203125, 4.1761474609375, 4.35345458984375, 4.53076171875, 4.70806884765625, 4.8853759765625, 5.06268310546875, 5.239990234375, 5.41729736328125, 5.5946044921875, 5.77191162109375, 5.94921875]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 6.0, 23.0, 26.0, 70.0, 196.0, 315.0, 229.0, 83.0, 33.0, 14.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.58467864990234, -64.49268341064453, -62.40068435668945, -60.308685302734375, -58.21669006347656, -56.124691009521484, -54.032691955566406, -51.940696716308594, -49.848697662353516, -47.75669860839844, -45.664703369140625, -43.57270431518555, -41.48070526123047, -39.388710021972656, -37.29671096801758, -35.2047119140625, -33.11271667480469, -31.020719528198242, -28.928722381591797, -26.83672332763672, -24.744726181030273, -22.652729034423828, -20.56072998046875, -18.468732833862305, -16.37673568725586, -14.284738540649414, -12.192740440368652, -10.10074234008789, -8.008745193481445, -5.916748046875, -3.8247499465942383, -1.7327518463134766, 0.3592529296875, 2.4512505531311035, 4.543248176574707, 6.6352458000183105, 8.727243423461914, 10.81924057006836, 12.911238670349121, 15.003236770629883, 17.095233917236328, 19.187231063842773, 21.27922821044922, 23.371227264404297, 25.463224411010742, 27.555221557617188, 29.647220611572266, 31.73921775817871, 33.831214904785156, 35.923213958740234, 38.01520919799805, 40.107208251953125, 42.19920349121094, 44.291202545166016, 46.383201599121094, 48.475196838378906, 50.567195892333984, 52.65919494628906, 54.751190185546875, 56.84318923950195, 58.93518829345703, 61.027183532714844, 63.11918258666992, 65.211181640625, 67.30317687988281]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 4.0, 3.0, 3.0, 3.0, 7.0, 8.0, 9.0, 14.0, 22.0, 20.0, 23.0, 24.0, 35.0, 38.0, 42.0, 40.0, 47.0, 50.0, 53.0, 65.0, 58.0, 55.0, 49.0, 48.0, 49.0, 37.0, 39.0, 31.0, 28.0, 24.0, 23.0, 18.0, 11.0, 13.0, 3.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.08418846130371, -30.067859649658203, -29.051528930664062, -28.035200119018555, -27.018869400024414, -26.002540588378906, -24.986209869384766, -23.969881057739258, -22.95355224609375, -21.937223434448242, -20.9208927154541, -19.904563903808594, -18.888233184814453, -17.871904373168945, -16.855575561523438, -15.839244842529297, -14.822914123535156, -13.806584358215332, -12.790254592895508, -11.77392578125, -10.75759506225586, -9.741266250610352, -8.724936485290527, -7.708606719970703, -6.692276954650879, -5.675947189331055, -4.6596174240112305, -3.6432881355285645, -2.6269583702087402, -1.610628604888916, -0.59429931640625, 0.4220304489135742, 1.4383583068847656, 2.45468807220459, 3.471017599105835, 4.48734712600708, 5.503676891326904, 6.5200066566467285, 7.5363359451293945, 8.552665710449219, 9.568995475769043, 10.585325241088867, 11.601655006408691, 12.617984771728516, 13.634313583374023, 14.650644302368164, 15.666973114013672, 16.683303833007812, 17.69963264465332, 18.715961456298828, 19.73229217529297, 20.748620986938477, 21.764951705932617, 22.781280517578125, 23.797611236572266, 24.813940048217773, 25.83026885986328, 26.84659767150879, 27.86292839050293, 28.879257202148438, 29.895587921142578, 30.911916732788086, 31.928245544433594, 32.944576263427734, 33.960906982421875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 2.0, 2.0, 5.0, 10.0, 11.0, 18.0, 21.0, 26.0, 51.0, 87.0, 128.0, 302.0, 616.0, 1646.0, 5346.0, 31541.0, 4074078.0, 68912.0, 7878.0, 2130.0, 780.0, 341.0, 139.0, 90.0, 48.0, 30.0, 13.0, 7.0, 10.0, 2.0, 3.0, 7.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.5625, -10.2286376953125, -9.894775390625, -9.5609130859375, -9.22705078125, -8.8931884765625, -8.559326171875, -8.2254638671875, -7.8916015625, -7.5577392578125, -7.223876953125, -6.8900146484375, -6.55615234375, -6.2222900390625, -5.888427734375, -5.5545654296875, -5.220703125, -4.8868408203125, -4.552978515625, -4.2191162109375, -3.88525390625, -3.5513916015625, -3.217529296875, -2.8836669921875, -2.5498046875, -2.2159423828125, -1.882080078125, -1.5482177734375, -1.21435546875, -0.8804931640625, -0.546630859375, -0.2127685546875, 0.12109375, 0.4549560546875, 0.788818359375, 1.1226806640625, 1.45654296875, 1.7904052734375, 2.124267578125, 2.4581298828125, 2.7919921875, 3.1258544921875, 3.459716796875, 3.7935791015625, 4.12744140625, 4.4613037109375, 4.795166015625, 5.1290283203125, 5.462890625, 5.7967529296875, 6.130615234375, 6.4644775390625, 6.79833984375, 7.1322021484375, 7.466064453125, 7.7999267578125, 8.1337890625, 8.4676513671875, 8.801513671875, 9.1353759765625, 9.46923828125, 9.8031005859375, 10.136962890625, 10.4708251953125, 10.8046875]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 4.0, 3.0, 11.0, 11.0, 24.0, 35.0, 50.0, 85.0, 97.0, 126.0, 138.0, 124.0, 107.0, 77.0, 58.0, 22.0, 14.0, 9.0, 9.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.95703125, -2.86822509765625, -2.7794189453125, -2.69061279296875, -2.601806640625, -2.51300048828125, -2.4241943359375, -2.33538818359375, -2.24658203125, -2.15777587890625, -2.0689697265625, -1.98016357421875, -1.891357421875, -1.80255126953125, -1.7137451171875, -1.62493896484375, -1.5361328125, -1.44732666015625, -1.3585205078125, -1.26971435546875, -1.180908203125, -1.09210205078125, -1.0032958984375, -0.91448974609375, -0.82568359375, -0.73687744140625, -0.6480712890625, -0.55926513671875, -0.470458984375, -0.38165283203125, -0.2928466796875, -0.20404052734375, -0.115234375, -0.02642822265625, 0.0623779296875, 0.15118408203125, 0.239990234375, 0.32879638671875, 0.4176025390625, 0.50640869140625, 0.59521484375, 0.68402099609375, 0.7728271484375, 0.86163330078125, 0.950439453125, 1.03924560546875, 1.1280517578125, 1.21685791015625, 1.3056640625, 1.39447021484375, 1.4832763671875, 1.57208251953125, 1.660888671875, 1.74969482421875, 1.8385009765625, 1.92730712890625, 2.01611328125, 2.10491943359375, 2.1937255859375, 2.28253173828125, 2.371337890625, 2.46014404296875, 2.5489501953125, 2.63775634765625, 2.7265625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 2.0, 10.0, 9.0, 11.0, 20.0, 24.0, 41.0, 52.0, 84.0, 112.0, 139.0, 183.0, 271.0, 377.0, 592.0, 944.0, 1708.0, 3527.0, 9149.0, 34443.0, 916496.0, 3168556.0, 38833.0, 9802.0, 3897.0, 1849.0, 1017.0, 642.0, 412.0, 291.0, 209.0, 164.0, 124.0, 72.0, 73.0, 47.0, 33.0, 29.0, 15.0, 6.0, 3.0, 3.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.23828125, -6.0494384765625, -5.860595703125, -5.6717529296875, -5.48291015625, -5.2940673828125, -5.105224609375, -4.9163818359375, -4.7275390625, -4.5386962890625, -4.349853515625, -4.1610107421875, -3.97216796875, -3.7833251953125, -3.594482421875, -3.4056396484375, -3.216796875, -3.0279541015625, -2.839111328125, -2.6502685546875, -2.46142578125, -2.2725830078125, -2.083740234375, -1.8948974609375, -1.7060546875, -1.5172119140625, -1.328369140625, -1.1395263671875, -0.95068359375, -0.7618408203125, -0.572998046875, -0.3841552734375, -0.1953125, -0.0064697265625, 0.182373046875, 0.3712158203125, 0.56005859375, 0.7489013671875, 0.937744140625, 1.1265869140625, 1.3154296875, 1.5042724609375, 1.693115234375, 1.8819580078125, 2.07080078125, 2.2596435546875, 2.448486328125, 2.6373291015625, 2.826171875, 3.0150146484375, 3.203857421875, 3.3927001953125, 3.58154296875, 3.7703857421875, 3.959228515625, 4.1480712890625, 4.3369140625, 4.5257568359375, 4.714599609375, 4.9034423828125, 5.09228515625, 5.2811279296875, 5.469970703125, 5.6588134765625, 5.84765625]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 13.0, 12.0, 30.0, 46.0, 131.0, 859.0, 2675.0, 152.0, 57.0, 28.0, 22.0, 12.0, 6.0, 5.0, 7.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.751953125, -3.638641357421875, -3.52532958984375, -3.412017822265625, -3.2987060546875, -3.185394287109375, -3.07208251953125, -2.958770751953125, -2.845458984375, -2.732147216796875, -2.61883544921875, -2.505523681640625, -2.3922119140625, -2.278900146484375, -2.16558837890625, -2.052276611328125, -1.93896484375, -1.825653076171875, -1.71234130859375, -1.599029541015625, -1.4857177734375, -1.372406005859375, -1.25909423828125, -1.145782470703125, -1.032470703125, -0.919158935546875, -0.80584716796875, -0.692535400390625, -0.5792236328125, -0.465911865234375, -0.35260009765625, -0.239288330078125, -0.1259765625, -0.012664794921875, 0.10064697265625, 0.213958740234375, 0.3272705078125, 0.440582275390625, 0.55389404296875, 0.667205810546875, 0.780517578125, 0.893829345703125, 1.00714111328125, 1.120452880859375, 1.2337646484375, 1.347076416015625, 1.46038818359375, 1.573699951171875, 1.68701171875, 1.800323486328125, 1.91363525390625, 2.026947021484375, 2.1402587890625, 2.253570556640625, 2.36688232421875, 2.480194091796875, 2.593505859375, 2.706817626953125, 2.82012939453125, 2.933441162109375, 3.0467529296875, 3.160064697265625, 3.27337646484375, 3.386688232421875, 3.5]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 5.0, 17.0, 112.0, 602.0, 228.0, 45.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.793275833129883, -10.251688003540039, -8.710100173950195, -7.168511390686035, -5.626923561096191, -4.085335731506348, -2.5437469482421875, -1.0021591186523438, 0.5394287109375, 2.081016778945923, 3.6226048469543457, 5.164193153381348, 6.705780982971191, 8.247368812561035, 9.788957595825195, 11.330545425415039, 12.872133255004883, 14.413721084594727, 15.95530891418457, 17.496898651123047, 19.03848648071289, 20.580074310302734, 22.121662139892578, 23.663249969482422, 25.204837799072266, 26.74642562866211, 28.288013458251953, 29.829601287841797, 31.37118911743164, 32.912776947021484, 34.454368591308594, 35.99595642089844, 37.53754425048828, 39.079132080078125, 40.62071990966797, 42.16230773925781, 43.703895568847656, 45.2454833984375, 46.787071228027344, 48.32865905761719, 49.87024688720703, 51.411834716796875, 52.95342254638672, 54.49501037597656, 56.036598205566406, 57.57818603515625, 59.119773864746094, 60.66136169433594, 62.20295333862305, 63.74454116821289, 65.2861328125, 66.82772064208984, 68.36930847167969, 69.91089630126953, 71.45248413085938, 72.99407196044922, 74.53565979003906, 76.0772476196289, 77.61883544921875, 79.1604232788086, 80.70201110839844, 82.24359893798828, 83.78518676757812, 85.32677459716797, 86.86836242675781]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 2.0, 8.0, 10.0, 9.0, 24.0, 18.0, 28.0, 29.0, 35.0, 44.0, 43.0, 52.0, 61.0, 62.0, 45.0, 61.0, 36.0, 62.0, 49.0, 58.0, 43.0, 32.0, 37.0, 34.0, 27.0, 15.0, 12.0, 14.0, 16.0, 8.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-7.504338264465332, -7.247499465942383, -6.990660190582275, -6.733821392059326, -6.476982116699219, -6.2201433181762695, -5.96330451965332, -5.706465244293213, -5.4496259689331055, -5.192787170410156, -4.935947895050049, -4.6791090965271, -4.422269821166992, -4.165431022644043, -3.9085919857025146, -3.6517529487609863, -3.394914150238037, -3.138075113296509, -2.8812360763549805, -2.6243972778320312, -2.367558002471924, -2.1107192039489746, -1.8538801670074463, -1.597041130065918, -1.3402020931243896, -1.0833630561828613, -0.8265240788459778, -0.5696851015090942, -0.3128460645675659, -0.0560070276260376, 0.20083189010620117, 0.4576709270477295, 0.7145099639892578, 0.9713490009307861, 1.2281880378723145, 1.4850269556045532, 1.7418659925460815, 1.9987050294876099, 2.2555439472198486, 2.512382984161377, 2.7692220211029053, 3.0260610580444336, 3.282900094985962, 3.5397391319274902, 3.7965779304504395, 4.053417205810547, 4.310256004333496, 4.567094802856445, 4.823934078216553, 5.080772876739502, 5.337612152099609, 5.594450950622559, 5.851290225982666, 6.108129024505615, 6.364968299865723, 6.621807098388672, 6.878645896911621, 7.13548469543457, 7.392323970794678, 7.649162769317627, 7.906002044677734, 8.162840843200684, 8.419679641723633, 8.676519393920898, 8.933358192443848]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 7.0, 6.0, 11.0, 14.0, 32.0, 50.0, 80.0, 162.0, 289.0, 864.0, 2897.0, 20344.0, 600293.0, 402599.0, 16870.0, 2606.0, 796.0, 296.0, 149.0, 68.0, 55.0, 24.0, 22.0, 10.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.296875, -11.912109375, -11.52734375, -11.142578125, -10.7578125, -10.373046875, -9.98828125, -9.603515625, -9.21875, -8.833984375, -8.44921875, -8.064453125, -7.6796875, -7.294921875, -6.91015625, -6.525390625, -6.140625, -5.755859375, -5.37109375, -4.986328125, -4.6015625, -4.216796875, -3.83203125, -3.447265625, -3.0625, -2.677734375, -2.29296875, -1.908203125, -1.5234375, -1.138671875, -0.75390625, -0.369140625, 0.015625, 0.400390625, 0.78515625, 1.169921875, 1.5546875, 1.939453125, 2.32421875, 2.708984375, 3.09375, 3.478515625, 3.86328125, 4.248046875, 4.6328125, 5.017578125, 5.40234375, 5.787109375, 6.171875, 6.556640625, 6.94140625, 7.326171875, 7.7109375, 8.095703125, 8.48046875, 8.865234375, 9.25, 9.634765625, 10.01953125, 10.404296875, 10.7890625, 11.173828125, 11.55859375, 11.943359375, 12.328125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 7.0, 11.0, 22.0, 26.0, 55.0, 70.0, 104.0, 141.0, 138.0, 125.0, 103.0, 81.0, 60.0, 27.0, 12.0, 9.0, 10.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.064453125, -2.969879150390625, -2.87530517578125, -2.780731201171875, -2.6861572265625, -2.591583251953125, -2.49700927734375, -2.402435302734375, -2.307861328125, -2.213287353515625, -2.11871337890625, -2.024139404296875, -1.9295654296875, -1.834991455078125, -1.74041748046875, -1.645843505859375, -1.55126953125, -1.456695556640625, -1.36212158203125, -1.267547607421875, -1.1729736328125, -1.078399658203125, -0.98382568359375, -0.889251708984375, -0.794677734375, -0.700103759765625, -0.60552978515625, -0.510955810546875, -0.4163818359375, -0.321807861328125, -0.22723388671875, -0.132659912109375, -0.0380859375, 0.056488037109375, 0.15106201171875, 0.245635986328125, 0.3402099609375, 0.434783935546875, 0.52935791015625, 0.623931884765625, 0.718505859375, 0.813079833984375, 0.90765380859375, 1.002227783203125, 1.0968017578125, 1.191375732421875, 1.28594970703125, 1.380523681640625, 1.47509765625, 1.569671630859375, 1.66424560546875, 1.758819580078125, 1.8533935546875, 1.947967529296875, 2.04254150390625, 2.137115478515625, 2.231689453125, 2.326263427734375, 2.42083740234375, 2.515411376953125, 2.6099853515625, 2.704559326171875, 2.79913330078125, 2.893707275390625, 2.98828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 6.0, 9.0, 11.0, 11.0, 18.0, 36.0, 20.0, 51.0, 77.0, 143.0, 260.0, 553.0, 1248.0, 2932.0, 7553.0, 22534.0, 91966.0, 689675.0, 179202.0, 34522.0, 10585.0, 3952.0, 1641.0, 738.0, 359.0, 154.0, 102.0, 56.0, 42.0, 19.0, 15.0, 13.0, 10.0, 13.0, 8.0, 1.0, 2.0, 6.0, 3.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.5703125, -6.36920166015625, -6.1680908203125, -5.96697998046875, -5.765869140625, -5.56475830078125, -5.3636474609375, -5.16253662109375, -4.96142578125, -4.76031494140625, -4.5592041015625, -4.35809326171875, -4.156982421875, -3.95587158203125, -3.7547607421875, -3.55364990234375, -3.3525390625, -3.15142822265625, -2.9503173828125, -2.74920654296875, -2.548095703125, -2.34698486328125, -2.1458740234375, -1.94476318359375, -1.74365234375, -1.54254150390625, -1.3414306640625, -1.14031982421875, -0.939208984375, -0.73809814453125, -0.5369873046875, -0.33587646484375, -0.134765625, 0.06634521484375, 0.2674560546875, 0.46856689453125, 0.669677734375, 0.87078857421875, 1.0718994140625, 1.27301025390625, 1.47412109375, 1.67523193359375, 1.8763427734375, 2.07745361328125, 2.278564453125, 2.47967529296875, 2.6807861328125, 2.88189697265625, 3.0830078125, 3.28411865234375, 3.4852294921875, 3.68634033203125, 3.887451171875, 4.08856201171875, 4.2896728515625, 4.49078369140625, 4.69189453125, 4.89300537109375, 5.0941162109375, 5.29522705078125, 5.496337890625, 5.69744873046875, 5.8985595703125, 6.09967041015625, 6.30078125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 5.0, 3.0, 4.0, 4.0, 4.0, 5.0, 8.0, 17.0, 14.0, 20.0, 17.0, 22.0, 24.0, 41.0, 51.0, 49.0, 54.0, 49.0, 64.0, 60.0, 53.0, 57.0, 60.0, 48.0, 38.0, 38.0, 37.0, 30.0, 21.0, 18.0, 12.0, 19.0, 15.0, 7.0, 11.0, 13.0, 2.0, 0.0, 4.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.7421875, -5.5511474609375, -5.360107421875, -5.1690673828125, -4.97802734375, -4.7869873046875, -4.595947265625, -4.4049072265625, -4.2138671875, -4.0228271484375, -3.831787109375, -3.6407470703125, -3.44970703125, -3.2586669921875, -3.067626953125, -2.8765869140625, -2.685546875, -2.4945068359375, -2.303466796875, -2.1124267578125, -1.92138671875, -1.7303466796875, -1.539306640625, -1.3482666015625, -1.1572265625, -0.9661865234375, -0.775146484375, -0.5841064453125, -0.39306640625, -0.2020263671875, -0.010986328125, 0.1800537109375, 0.37109375, 0.5621337890625, 0.753173828125, 0.9442138671875, 1.13525390625, 1.3262939453125, 1.517333984375, 1.7083740234375, 1.8994140625, 2.0904541015625, 2.281494140625, 2.4725341796875, 2.66357421875, 2.8546142578125, 3.045654296875, 3.2366943359375, 3.427734375, 3.6187744140625, 3.809814453125, 4.0008544921875, 4.19189453125, 4.3829345703125, 4.573974609375, 4.7650146484375, 4.9560546875, 5.1470947265625, 5.338134765625, 5.5291748046875, 5.72021484375, 5.9112548828125, 6.102294921875, 6.2933349609375, 6.484375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 5.0, 4.0, 4.0, 9.0, 10.0, 17.0, 16.0, 26.0, 42.0, 46.0, 79.0, 130.0, 210.0, 378.0, 658.0, 1144.0, 2340.0, 5094.0, 12779.0, 43396.0, 304202.0, 584018.0, 64215.0, 17135.0, 6466.0, 2925.0, 1400.0, 730.0, 412.0, 252.0, 135.0, 89.0, 60.0, 34.0, 30.0, 19.0, 11.0, 13.0, 5.0, 6.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.7568359375, -1.7038116455078125, -1.650787353515625, -1.5977630615234375, -1.54473876953125, -1.4917144775390625, -1.438690185546875, -1.3856658935546875, -1.3326416015625, -1.2796173095703125, -1.226593017578125, -1.1735687255859375, -1.12054443359375, -1.0675201416015625, -1.014495849609375, -0.9614715576171875, -0.908447265625, -0.8554229736328125, -0.802398681640625, -0.7493743896484375, -0.69635009765625, -0.6433258056640625, -0.590301513671875, -0.5372772216796875, -0.4842529296875, -0.4312286376953125, -0.378204345703125, -0.3251800537109375, -0.27215576171875, -0.2191314697265625, -0.166107177734375, -0.1130828857421875, -0.06005859375, -0.0070343017578125, 0.045989990234375, 0.0990142822265625, 0.15203857421875, 0.2050628662109375, 0.258087158203125, 0.3111114501953125, 0.3641357421875, 0.4171600341796875, 0.470184326171875, 0.5232086181640625, 0.57623291015625, 0.6292572021484375, 0.682281494140625, 0.7353057861328125, 0.788330078125, 0.8413543701171875, 0.894378662109375, 0.9474029541015625, 1.00042724609375, 1.0534515380859375, 1.106475830078125, 1.1595001220703125, 1.2125244140625, 1.2655487060546875, 1.318572998046875, 1.3715972900390625, 1.42462158203125, 1.4776458740234375, 1.530670166015625, 1.5836944580078125, 1.63671875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 4.0, 6.0, 4.0, 16.0, 18.0, 19.0, 36.0, 40.0, 62.0, 104.0, 166.0, 151.0, 124.0, 74.0, 45.0, 26.0, 31.0, 14.0, 16.0, 9.0, 5.0, 2.0, 7.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00022530555725097656, -0.00021779164671897888, -0.0002102777361869812, -0.00020276382565498352, -0.00019524991512298584, -0.00018773600459098816, -0.00018022209405899048, -0.0001727081835269928, -0.00016519427299499512, -0.00015768036246299744, -0.00015016645193099976, -0.00014265254139900208, -0.0001351386308670044, -0.00012762472033500671, -0.00012011080980300903, -0.00011259689927101135, -0.00010508298873901367, -9.756907820701599e-05, -9.005516767501831e-05, -8.254125714302063e-05, -7.502734661102295e-05, -6.751343607902527e-05, -5.999952554702759e-05, -5.248561501502991e-05, -4.4971704483032227e-05, -3.7457793951034546e-05, -2.9943883419036865e-05, -2.2429972887039185e-05, -1.4916062355041504e-05, -7.402151823043823e-06, 1.1175870895385742e-07, 7.625669240951538e-06, 1.5139579772949219e-05, 2.26534903049469e-05, 3.016740083694458e-05, 3.768131136894226e-05, 4.519522190093994e-05, 5.270913243293762e-05, 6.02230429649353e-05, 6.773695349693298e-05, 7.525086402893066e-05, 8.276477456092834e-05, 9.027868509292603e-05, 9.77925956249237e-05, 0.00010530650615692139, 0.00011282041668891907, 0.00012033432722091675, 0.00012784823775291443, 0.0001353621482849121, 0.0001428760588169098, 0.00015038996934890747, 0.00015790387988090515, 0.00016541779041290283, 0.0001729317009449005, 0.0001804456114768982, 0.00018795952200889587, 0.00019547343254089355, 0.00020298734307289124, 0.00021050125360488892, 0.0002180151641368866, 0.00022552907466888428, 0.00023304298520088196, 0.00024055689573287964, 0.0002480708062648773, 0.000255584716796875]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 0.0, 3.0, 3.0, 3.0, 7.0, 10.0, 12.0, 28.0, 61.0, 85.0, 150.0, 412.0, 827.0, 2265.0, 7807.0, 59569.0, 880936.0, 82492.0, 9450.0, 2613.0, 989.0, 427.0, 173.0, 108.0, 64.0, 20.0, 10.0, 11.0, 12.0, 7.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.259765625, -3.162628173828125, -3.06549072265625, -2.968353271484375, -2.8712158203125, -2.774078369140625, -2.67694091796875, -2.579803466796875, -2.482666015625, -2.385528564453125, -2.28839111328125, -2.191253662109375, -2.0941162109375, -1.996978759765625, -1.89984130859375, -1.802703857421875, -1.70556640625, -1.608428955078125, -1.51129150390625, -1.414154052734375, -1.3170166015625, -1.219879150390625, -1.12274169921875, -1.025604248046875, -0.928466796875, -0.831329345703125, -0.73419189453125, -0.637054443359375, -0.5399169921875, -0.442779541015625, -0.34564208984375, -0.248504638671875, -0.1513671875, -0.054229736328125, 0.04290771484375, 0.140045166015625, 0.2371826171875, 0.334320068359375, 0.43145751953125, 0.528594970703125, 0.625732421875, 0.722869873046875, 0.82000732421875, 0.917144775390625, 1.0142822265625, 1.111419677734375, 1.20855712890625, 1.305694580078125, 1.40283203125, 1.499969482421875, 1.59710693359375, 1.694244384765625, 1.7913818359375, 1.888519287109375, 1.98565673828125, 2.082794189453125, 2.179931640625, 2.277069091796875, 2.37420654296875, 2.471343994140625, 2.5684814453125, 2.665618896484375, 2.76275634765625, 2.859893798828125, 2.95703125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 1.0, 5.0, 3.0, 2.0, 1.0, 6.0, 9.0, 18.0, 23.0, 41.0, 44.0, 70.0, 98.0, 205.0, 175.0, 122.0, 53.0, 39.0, 24.0, 22.0, 15.0, 7.0, 2.0, 7.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.029296875, -1.954254150390625, -1.87921142578125, -1.804168701171875, -1.7291259765625, -1.654083251953125, -1.57904052734375, -1.503997802734375, -1.428955078125, -1.353912353515625, -1.27886962890625, -1.203826904296875, -1.1287841796875, -1.053741455078125, -0.97869873046875, -0.903656005859375, -0.82861328125, -0.753570556640625, -0.67852783203125, -0.603485107421875, -0.5284423828125, -0.453399658203125, -0.37835693359375, -0.303314208984375, -0.228271484375, -0.153228759765625, -0.07818603515625, -0.003143310546875, 0.0718994140625, 0.146942138671875, 0.22198486328125, 0.297027587890625, 0.3720703125, 0.447113037109375, 0.52215576171875, 0.597198486328125, 0.6722412109375, 0.747283935546875, 0.82232666015625, 0.897369384765625, 0.972412109375, 1.047454833984375, 1.12249755859375, 1.197540283203125, 1.2725830078125, 1.347625732421875, 1.42266845703125, 1.497711181640625, 1.57275390625, 1.647796630859375, 1.72283935546875, 1.797882080078125, 1.8729248046875, 1.947967529296875, 2.02301025390625, 2.098052978515625, 2.173095703125, 2.248138427734375, 2.32318115234375, 2.398223876953125, 2.4732666015625, 2.548309326171875, 2.62335205078125, 2.698394775390625, 2.7734375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 11.0, 20.0, 82.0, 369.0, 385.0, 110.0, 26.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.17121124267578, -44.05184555053711, -40.93247985839844, -37.813114166259766, -34.693748474121094, -31.574382781982422, -28.45501708984375, -25.335651397705078, -22.216285705566406, -19.096920013427734, -15.977554321289062, -12.85818862915039, -9.738822937011719, -6.619457244873047, -3.500091552734375, -0.3807258605957031, 2.7386398315429688, 5.858005523681641, 8.977371215820312, 12.096736907958984, 15.216102600097656, 18.335468292236328, 21.454833984375, 24.574199676513672, 27.693565368652344, 30.812931060791016, 33.93229675292969, 37.05166244506836, 40.17102813720703, 43.2903938293457, 46.409759521484375, 49.52912521362305, 52.64849853515625, 55.76786422729492, 58.887229919433594, 62.006595611572266, 65.12596130371094, 68.24533081054688, 71.36469268798828, 74.48405456542969, 77.60342407226562, 80.72279357910156, 83.84215545654297, 86.96151733398438, 90.08088684082031, 93.20025634765625, 96.31961822509766, 99.43898010253906, 102.558349609375, 105.67771911621094, 108.79708099365234, 111.91644287109375, 115.03581237792969, 118.15518188476562, 121.27454376220703, 124.39390563964844, 127.51327514648438, 130.6326446533203, 133.75201416015625, 136.87136840820312, 139.99073791503906, 143.110107421875, 146.22946166992188, 149.3488311767578, 152.46820068359375]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 7.0, 13.0, 6.0, 18.0, 6.0, 10.0, 19.0, 22.0, 17.0, 28.0, 21.0, 25.0, 44.0, 28.0, 23.0, 36.0, 41.0, 43.0, 47.0, 47.0, 41.0, 35.0, 39.0, 39.0, 38.0, 39.0, 27.0, 32.0, 32.0, 22.0, 20.0, 19.0, 13.0, 17.0, 14.0, 9.0, 14.0, 8.0, 15.0, 5.0, 5.0, 4.0, 7.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-21.87316131591797, -21.203048706054688, -20.532936096191406, -19.862823486328125, -19.19270896911621, -18.52259635925293, -17.85248374938965, -17.182371139526367, -16.512256622314453, -15.842144012451172, -15.172030448913574, -14.501917839050293, -13.831804275512695, -13.161691665649414, -12.491579055786133, -11.821466445922852, -11.15135383605957, -10.481241226196289, -9.811127662658691, -9.14101505279541, -8.470901489257812, -7.800788879394531, -7.13067626953125, -6.4605631828308105, -5.790450096130371, -5.120337009429932, -4.450223922729492, -3.780111312866211, -3.1099982261657715, -2.439885139465332, -1.7697725296020508, -1.0996594429016113, -0.4295482635498047, 0.24056470394134521, 0.9106776714324951, 1.5807905197143555, 2.250903606414795, 2.9210166931152344, 3.5911293029785156, 4.261242389678955, 4.9313554763793945, 5.601468563079834, 6.271581649780273, 6.941694259643555, 7.611807346343994, 8.281920433044434, 8.952033042907715, 9.622146606445312, 10.292259216308594, 10.962371826171875, 11.632485389709473, 12.302597999572754, 12.972711563110352, 13.642824172973633, 14.312936782836914, 14.983049392700195, 15.653162956237793, 16.32327651977539, 16.993389129638672, 17.663501739501953, 18.333614349365234, 19.003726959228516, 19.673839569091797, 20.34395408630371, 21.014066696166992]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 5.0, 9.0, 6.0, 11.0, 13.0, 21.0, 26.0, 41.0, 82.0, 146.0, 254.0, 522.0, 1128.0, 3176.0, 12679.0, 206098.0, 3944629.0, 18815.0, 4146.0, 1329.0, 553.0, 271.0, 117.0, 78.0, 39.0, 29.0, 17.0, 14.0, 6.0, 6.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.359375, -15.865234375, -15.37109375, -14.876953125, -14.3828125, -13.888671875, -13.39453125, -12.900390625, -12.40625, -11.912109375, -11.41796875, -10.923828125, -10.4296875, -9.935546875, -9.44140625, -8.947265625, -8.453125, -7.958984375, -7.46484375, -6.970703125, -6.4765625, -5.982421875, -5.48828125, -4.994140625, -4.5, -4.005859375, -3.51171875, -3.017578125, -2.5234375, -2.029296875, -1.53515625, -1.041015625, -0.546875, -0.052734375, 0.44140625, 0.935546875, 1.4296875, 1.923828125, 2.41796875, 2.912109375, 3.40625, 3.900390625, 4.39453125, 4.888671875, 5.3828125, 5.876953125, 6.37109375, 6.865234375, 7.359375, 7.853515625, 8.34765625, 8.841796875, 9.3359375, 9.830078125, 10.32421875, 10.818359375, 11.3125, 11.806640625, 12.30078125, 12.794921875, 13.2890625, 13.783203125, 14.27734375, 14.771484375, 15.265625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 1.0, 6.0, 9.0, 20.0, 23.0, 46.0, 61.0, 77.0, 108.0, 134.0, 134.0, 117.0, 93.0, 66.0, 45.0, 30.0, 11.0, 15.0, 10.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.09765625, -3.00103759765625, -2.9044189453125, -2.80780029296875, -2.711181640625, -2.61456298828125, -2.5179443359375, -2.42132568359375, -2.32470703125, -2.22808837890625, -2.1314697265625, -2.03485107421875, -1.938232421875, -1.84161376953125, -1.7449951171875, -1.64837646484375, -1.5517578125, -1.45513916015625, -1.3585205078125, -1.26190185546875, -1.165283203125, -1.06866455078125, -0.9720458984375, -0.87542724609375, -0.77880859375, -0.68218994140625, -0.5855712890625, -0.48895263671875, -0.392333984375, -0.29571533203125, -0.1990966796875, -0.10247802734375, -0.005859375, 0.09075927734375, 0.1873779296875, 0.28399658203125, 0.380615234375, 0.47723388671875, 0.5738525390625, 0.67047119140625, 0.76708984375, 0.86370849609375, 0.9603271484375, 1.05694580078125, 1.153564453125, 1.25018310546875, 1.3468017578125, 1.44342041015625, 1.5400390625, 1.63665771484375, 1.7332763671875, 1.82989501953125, 1.926513671875, 2.02313232421875, 2.1197509765625, 2.21636962890625, 2.31298828125, 2.40960693359375, 2.5062255859375, 2.60284423828125, 2.699462890625, 2.79608154296875, 2.8927001953125, 2.98931884765625, 3.0859375]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 10.0, 5.0, 16.0, 14.0, 16.0, 38.0, 34.0, 59.0, 67.0, 92.0, 127.0, 176.0, 284.0, 381.0, 544.0, 855.0, 1377.0, 2189.0, 3507.0, 6118.0, 12625.0, 31575.0, 148624.0, 3831950.0, 101584.0, 26355.0, 11158.0, 5680.0, 3170.0, 1957.0, 1174.0, 799.0, 496.0, 315.0, 243.0, 164.0, 137.0, 92.0, 69.0, 55.0, 40.0, 30.0, 25.0, 14.0, 10.0, 13.0, 5.0, 4.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0], "bins": [-6.48046875, -6.280517578125, -6.08056640625, -5.880615234375, -5.6806640625, -5.480712890625, -5.28076171875, -5.080810546875, -4.880859375, -4.680908203125, -4.48095703125, -4.281005859375, -4.0810546875, -3.881103515625, -3.68115234375, -3.481201171875, -3.28125, -3.081298828125, -2.88134765625, -2.681396484375, -2.4814453125, -2.281494140625, -2.08154296875, -1.881591796875, -1.681640625, -1.481689453125, -1.28173828125, -1.081787109375, -0.8818359375, -0.681884765625, -0.48193359375, -0.281982421875, -0.08203125, 0.117919921875, 0.31787109375, 0.517822265625, 0.7177734375, 0.917724609375, 1.11767578125, 1.317626953125, 1.517578125, 1.717529296875, 1.91748046875, 2.117431640625, 2.3173828125, 2.517333984375, 2.71728515625, 2.917236328125, 3.1171875, 3.317138671875, 3.51708984375, 3.717041015625, 3.9169921875, 4.116943359375, 4.31689453125, 4.516845703125, 4.716796875, 4.916748046875, 5.11669921875, 5.316650390625, 5.5166015625, 5.716552734375, 5.91650390625, 6.116455078125, 6.31640625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 1.0, 4.0, 7.0, 4.0, 4.0, 9.0, 5.0, 14.0, 16.0, 30.0, 52.0, 145.0, 3194.0, 351.0, 93.0, 48.0, 27.0, 17.0, 16.0, 11.0, 4.0, 10.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44140625, -4.296875, -4.15234375, -4.0078125, -3.86328125, -3.71875, -3.57421875, -3.4296875, -3.28515625, -3.140625, -2.99609375, -2.8515625, -2.70703125, -2.5625, -2.41796875, -2.2734375, -2.12890625, -1.984375, -1.83984375, -1.6953125, -1.55078125, -1.40625, -1.26171875, -1.1171875, -0.97265625, -0.828125, -0.68359375, -0.5390625, -0.39453125, -0.25, -0.10546875, 0.0390625, 0.18359375, 0.328125, 0.47265625, 0.6171875, 0.76171875, 0.90625, 1.05078125, 1.1953125, 1.33984375, 1.484375, 1.62890625, 1.7734375, 1.91796875, 2.0625, 2.20703125, 2.3515625, 2.49609375, 2.640625, 2.78515625, 2.9296875, 3.07421875, 3.21875, 3.36328125, 3.5078125, 3.65234375, 3.796875, 3.94140625, 4.0859375, 4.23046875, 4.375, 4.51953125, 4.6640625, 4.80859375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 7.0, 14.0, 18.0, 42.0, 84.0, 220.0, 269.0, 186.0, 90.0, 44.0, 16.0, 12.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.05235481262207, -14.3546142578125, -13.65687370300293, -12.959134101867676, -12.261393547058105, -11.563652992248535, -10.865913391113281, -10.168172836303711, -9.47043228149414, -8.77269172668457, -8.074951171875, -7.377211570739746, -6.679471015930176, -5.9817304611206055, -5.283990383148193, -4.586250305175781, -3.888509750366211, -3.1907694339752197, -2.4930291175842285, -1.7952888011932373, -1.097548484802246, -0.3998081684112549, 0.29793214797973633, 0.9956722259521484, 1.6934127807617188, 2.39115309715271, 3.088893413543701, 3.7866337299346924, 4.484374046325684, 5.182114601135254, 5.879854679107666, 6.577594757080078, 7.275333404541016, 7.973073959350586, 8.670814514160156, 9.36855411529541, 10.06629467010498, 10.76403522491455, 11.461774826049805, 12.159515380859375, 12.857255935668945, 13.554996490478516, 14.252737045288086, 14.95047664642334, 15.64821720123291, 16.345956802368164, 17.043697357177734, 17.741437911987305, 18.439178466796875, 19.136919021606445, 19.834659576416016, 20.532400131225586, 21.230140686035156, 21.927879333496094, 22.625619888305664, 23.323360443115234, 24.021100997924805, 24.718841552734375, 25.416582107543945, 26.114322662353516, 26.812061309814453, 27.509801864624023, 28.207542419433594, 28.905282974243164, 29.603023529052734]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 8.0, 6.0, 7.0, 25.0, 24.0, 28.0, 46.0, 44.0, 66.0, 54.0, 61.0, 89.0, 55.0, 76.0, 54.0, 69.0, 55.0, 54.0, 37.0, 33.0, 28.0, 27.0, 18.0, 9.0, 4.0, 5.0, 5.0, 5.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.620869636535645, -11.232672691345215, -10.844475746154785, -10.456278800964355, -10.068081855773926, -9.679884910583496, -9.29168701171875, -8.90349006652832, -8.51529312133789, -8.127096176147461, -7.738899230957031, -7.350702285766602, -6.962505340576172, -6.574308395385742, -6.186110973358154, -5.797914028167725, -5.409717559814453, -5.021520614624023, -4.633323669433594, -4.245126724243164, -3.8569295406341553, -3.4687325954437256, -3.080535411834717, -2.692338466644287, -2.3041415214538574, -1.9159445762634277, -1.5277475118637085, -1.1395504474639893, -0.7513535022735596, -0.3631565570831299, 0.025040626525878906, 0.4132375717163086, 0.8014335632324219, 1.1896305084228516, 1.5778275728225708, 1.96602463722229, 2.3542215824127197, 2.7424185276031494, 3.130615711212158, 3.518812656402588, 3.9070096015930176, 4.295206546783447, 4.683403491973877, 5.071600914001465, 5.4597978591918945, 5.847994804382324, 6.236191749572754, 6.624388694763184, 7.012585639953613, 7.400782585144043, 7.788979530334473, 8.177176475524902, 8.565373420715332, 8.953570365905762, 9.341768264770508, 9.729965209960938, 10.118162155151367, 10.506359100341797, 10.894556045532227, 11.282752990722656, 11.670949935913086, 12.059146881103516, 12.447343826293945, 12.835540771484375, 13.223737716674805]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 10.0, 14.0, 16.0, 32.0, 52.0, 88.0, 122.0, 261.0, 554.0, 1542.0, 6060.0, 42047.0, 724486.0, 248605.0, 19217.0, 3604.0, 1001.0, 391.0, 190.0, 95.0, 44.0, 38.0, 29.0, 22.0, 11.0, 5.0, 7.0, 5.0, 5.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.796875, -16.2850341796875, -15.773193359375, -15.2613525390625, -14.74951171875, -14.2376708984375, -13.725830078125, -13.2139892578125, -12.7021484375, -12.1903076171875, -11.678466796875, -11.1666259765625, -10.65478515625, -10.1429443359375, -9.631103515625, -9.1192626953125, -8.607421875, -8.0955810546875, -7.583740234375, -7.0718994140625, -6.56005859375, -6.0482177734375, -5.536376953125, -5.0245361328125, -4.5126953125, -4.0008544921875, -3.489013671875, -2.9771728515625, -2.46533203125, -1.9534912109375, -1.441650390625, -0.9298095703125, -0.41796875, 0.0938720703125, 0.605712890625, 1.1175537109375, 1.62939453125, 2.1412353515625, 2.653076171875, 3.1649169921875, 3.6767578125, 4.1885986328125, 4.700439453125, 5.2122802734375, 5.72412109375, 6.2359619140625, 6.747802734375, 7.2596435546875, 7.771484375, 8.2833251953125, 8.795166015625, 9.3070068359375, 9.81884765625, 10.3306884765625, 10.842529296875, 11.3543701171875, 11.8662109375, 12.3780517578125, 12.889892578125, 13.4017333984375, 13.91357421875, 14.4254150390625, 14.937255859375, 15.4490966796875, 15.9609375]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 6.0, 7.0, 22.0, 25.0, 47.0, 70.0, 89.0, 121.0, 144.0, 120.0, 118.0, 83.0, 61.0, 44.0, 21.0, 13.0, 8.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.279296875, -3.17596435546875, -3.0726318359375, -2.96929931640625, -2.865966796875, -2.76263427734375, -2.6593017578125, -2.55596923828125, -2.45263671875, -2.34930419921875, -2.2459716796875, -2.14263916015625, -2.039306640625, -1.93597412109375, -1.8326416015625, -1.72930908203125, -1.6259765625, -1.52264404296875, -1.4193115234375, -1.31597900390625, -1.212646484375, -1.10931396484375, -1.0059814453125, -0.90264892578125, -0.79931640625, -0.69598388671875, -0.5926513671875, -0.48931884765625, -0.385986328125, -0.28265380859375, -0.1793212890625, -0.07598876953125, 0.02734375, 0.13067626953125, 0.2340087890625, 0.33734130859375, 0.440673828125, 0.54400634765625, 0.6473388671875, 0.75067138671875, 0.85400390625, 0.95733642578125, 1.0606689453125, 1.16400146484375, 1.267333984375, 1.37066650390625, 1.4739990234375, 1.57733154296875, 1.6806640625, 1.78399658203125, 1.8873291015625, 1.99066162109375, 2.093994140625, 2.19732666015625, 2.3006591796875, 2.40399169921875, 2.50732421875, 2.61065673828125, 2.7139892578125, 2.81732177734375, 2.920654296875, 3.02398681640625, 3.1273193359375, 3.23065185546875, 3.333984375]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 9.0, 3.0, 6.0, 14.0, 4.0, 23.0, 14.0, 28.0, 37.0, 64.0, 71.0, 108.0, 186.0, 333.0, 491.0, 1057.0, 2065.0, 4681.0, 11687.0, 39187.0, 210514.0, 635449.0, 102945.0, 24263.0, 8186.0, 3478.0, 1635.0, 790.0, 460.0, 251.0, 156.0, 105.0, 85.0, 40.0, 33.0, 15.0, 20.0, 20.0, 10.0, 8.0, 5.0, 2.0, 5.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.4453125, -8.1839599609375, -7.922607421875, -7.6612548828125, -7.39990234375, -7.1385498046875, -6.877197265625, -6.6158447265625, -6.3544921875, -6.0931396484375, -5.831787109375, -5.5704345703125, -5.30908203125, -5.0477294921875, -4.786376953125, -4.5250244140625, -4.263671875, -4.0023193359375, -3.740966796875, -3.4796142578125, -3.21826171875, -2.9569091796875, -2.695556640625, -2.4342041015625, -2.1728515625, -1.9114990234375, -1.650146484375, -1.3887939453125, -1.12744140625, -0.8660888671875, -0.604736328125, -0.3433837890625, -0.08203125, 0.1793212890625, 0.440673828125, 0.7020263671875, 0.96337890625, 1.2247314453125, 1.486083984375, 1.7474365234375, 2.0087890625, 2.2701416015625, 2.531494140625, 2.7928466796875, 3.05419921875, 3.3155517578125, 3.576904296875, 3.8382568359375, 4.099609375, 4.3609619140625, 4.622314453125, 4.8836669921875, 5.14501953125, 5.4063720703125, 5.667724609375, 5.9290771484375, 6.1904296875, 6.4517822265625, 6.713134765625, 6.9744873046875, 7.23583984375, 7.4971923828125, 7.758544921875, 8.0198974609375, 8.28125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 2.0, 2.0, 5.0, 9.0, 4.0, 7.0, 10.0, 10.0, 15.0, 17.0, 17.0, 29.0, 29.0, 45.0, 37.0, 43.0, 43.0, 61.0, 54.0, 57.0, 46.0, 58.0, 53.0, 42.0, 53.0, 33.0, 40.0, 39.0, 28.0, 13.0, 19.0, 13.0, 17.0, 11.0, 8.0, 6.0, 6.0, 1.0, 6.0, 1.0, 2.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.62890625, -7.3880615234375, -7.147216796875, -6.9063720703125, -6.66552734375, -6.4246826171875, -6.183837890625, -5.9429931640625, -5.7021484375, -5.4613037109375, -5.220458984375, -4.9796142578125, -4.73876953125, -4.4979248046875, -4.257080078125, -4.0162353515625, -3.775390625, -3.5345458984375, -3.293701171875, -3.0528564453125, -2.81201171875, -2.5711669921875, -2.330322265625, -2.0894775390625, -1.8486328125, -1.6077880859375, -1.366943359375, -1.1260986328125, -0.88525390625, -0.6444091796875, -0.403564453125, -0.1627197265625, 0.078125, 0.3189697265625, 0.559814453125, 0.8006591796875, 1.04150390625, 1.2823486328125, 1.523193359375, 1.7640380859375, 2.0048828125, 2.2457275390625, 2.486572265625, 2.7274169921875, 2.96826171875, 3.2091064453125, 3.449951171875, 3.6907958984375, 3.931640625, 4.1724853515625, 4.413330078125, 4.6541748046875, 4.89501953125, 5.1358642578125, 5.376708984375, 5.6175537109375, 5.8583984375, 6.0992431640625, 6.340087890625, 6.5809326171875, 6.82177734375, 7.0626220703125, 7.303466796875, 7.5443115234375, 7.78515625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 15.0, 10.0, 15.0, 33.0, 42.0, 63.0, 122.0, 186.0, 341.0, 744.0, 1728.0, 4847.0, 17889.0, 130555.0, 790538.0, 81319.0, 13166.0, 3906.0, 1605.0, 653.0, 344.0, 164.0, 101.0, 61.0, 35.0, 17.0, 15.0, 12.0, 6.0, 2.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.078125, -3.9522705078125, -3.826416015625, -3.7005615234375, -3.57470703125, -3.4488525390625, -3.322998046875, -3.1971435546875, -3.0712890625, -2.9454345703125, -2.819580078125, -2.6937255859375, -2.56787109375, -2.4420166015625, -2.316162109375, -2.1903076171875, -2.064453125, -1.9385986328125, -1.812744140625, -1.6868896484375, -1.56103515625, -1.4351806640625, -1.309326171875, -1.1834716796875, -1.0576171875, -0.9317626953125, -0.805908203125, -0.6800537109375, -0.55419921875, -0.4283447265625, -0.302490234375, -0.1766357421875, -0.05078125, 0.0750732421875, 0.200927734375, 0.3267822265625, 0.45263671875, 0.5784912109375, 0.704345703125, 0.8302001953125, 0.9560546875, 1.0819091796875, 1.207763671875, 1.3336181640625, 1.45947265625, 1.5853271484375, 1.711181640625, 1.8370361328125, 1.962890625, 2.0887451171875, 2.214599609375, 2.3404541015625, 2.46630859375, 2.5921630859375, 2.718017578125, 2.8438720703125, 2.9697265625, 3.0955810546875, 3.221435546875, 3.3472900390625, 3.47314453125, 3.5989990234375, 3.724853515625, 3.8507080078125, 3.9765625]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 6.0, 10.0, 10.0, 15.0, 22.0, 43.0, 71.0, 88.0, 141.0, 182.0, 136.0, 97.0, 67.0, 43.0, 25.0, 15.0, 12.0, 6.0, 8.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0004038810729980469, -0.0003892257809638977, -0.00037457048892974854, -0.00035991519689559937, -0.0003452599048614502, -0.000330604612827301, -0.00031594932079315186, -0.0003012940287590027, -0.0002866387367248535, -0.00027198344469070435, -0.0002573281526565552, -0.000242672860622406, -0.00022801756858825684, -0.00021336227655410767, -0.0001987069845199585, -0.00018405169248580933, -0.00016939640045166016, -0.00015474110841751099, -0.00014008581638336182, -0.00012543052434921265, -0.00011077523231506348, -9.61199402809143e-05, -8.146464824676514e-05, -6.680935621261597e-05, -5.21540641784668e-05, -3.749877214431763e-05, -2.2843480110168457e-05, -8.188188076019287e-06, 6.467103958129883e-06, 2.1122395992279053e-05, 3.577768802642822e-05, 5.043298006057739e-05, 6.508827209472656e-05, 7.974356412887573e-05, 9.43988561630249e-05, 0.00010905414819717407, 0.00012370944023132324, 0.0001383647322654724, 0.00015302002429962158, 0.00016767531633377075, 0.00018233060836791992, 0.0001969859004020691, 0.00021164119243621826, 0.00022629648447036743, 0.0002409517765045166, 0.00025560706853866577, 0.00027026236057281494, 0.0002849176526069641, 0.0002995729446411133, 0.00031422823667526245, 0.0003288835287094116, 0.0003435388207435608, 0.00035819411277770996, 0.00037284940481185913, 0.0003875046968460083, 0.00040215998888015747, 0.00041681528091430664, 0.0004314705729484558, 0.000446125864982605, 0.00046078115701675415, 0.0004754364490509033, 0.0004900917410850525, 0.0005047470331192017, 0.0005194023251533508, 0.0005340576171875]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 4.0, 1.0, 6.0, 5.0, 12.0, 12.0, 12.0, 20.0, 28.0, 48.0, 71.0, 101.0, 171.0, 356.0, 656.0, 1443.0, 3852.0, 15527.0, 117652.0, 760472.0, 125145.0, 15946.0, 4003.0, 1435.0, 718.0, 329.0, 208.0, 111.0, 55.0, 44.0, 34.0, 24.0, 13.0, 18.0, 10.0, 3.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.216796875, -3.103973388671875, -2.99114990234375, -2.878326416015625, -2.7655029296875, -2.652679443359375, -2.53985595703125, -2.427032470703125, -2.314208984375, -2.201385498046875, -2.08856201171875, -1.975738525390625, -1.8629150390625, -1.750091552734375, -1.63726806640625, -1.524444580078125, -1.41162109375, -1.298797607421875, -1.18597412109375, -1.073150634765625, -0.9603271484375, -0.847503662109375, -0.73468017578125, -0.621856689453125, -0.509033203125, -0.396209716796875, -0.28338623046875, -0.170562744140625, -0.0577392578125, 0.055084228515625, 0.16790771484375, 0.280731201171875, 0.3935546875, 0.506378173828125, 0.61920166015625, 0.732025146484375, 0.8448486328125, 0.957672119140625, 1.07049560546875, 1.183319091796875, 1.296142578125, 1.408966064453125, 1.52178955078125, 1.634613037109375, 1.7474365234375, 1.860260009765625, 1.97308349609375, 2.085906982421875, 2.19873046875, 2.311553955078125, 2.42437744140625, 2.537200927734375, 2.6500244140625, 2.762847900390625, 2.87567138671875, 2.988494873046875, 3.101318359375, 3.214141845703125, 3.32696533203125, 3.439788818359375, 3.5526123046875, 3.665435791015625, 3.77825927734375, 3.891082763671875, 4.00390625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 4.0, 3.0, 4.0, 4.0, 7.0, 14.0, 22.0, 19.0, 39.0, 42.0, 54.0, 77.0, 100.0, 119.0, 136.0, 96.0, 81.0, 58.0, 35.0, 35.0, 15.0, 13.0, 9.0, 10.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.705078125, -2.595977783203125, -2.48687744140625, -2.377777099609375, -2.2686767578125, -2.159576416015625, -2.05047607421875, -1.941375732421875, -1.832275390625, -1.723175048828125, -1.61407470703125, -1.504974365234375, -1.3958740234375, -1.286773681640625, -1.17767333984375, -1.068572998046875, -0.95947265625, -0.850372314453125, -0.74127197265625, -0.632171630859375, -0.5230712890625, -0.413970947265625, -0.30487060546875, -0.195770263671875, -0.086669921875, 0.022430419921875, 0.13153076171875, 0.240631103515625, 0.3497314453125, 0.458831787109375, 0.56793212890625, 0.677032470703125, 0.7861328125, 0.895233154296875, 1.00433349609375, 1.113433837890625, 1.2225341796875, 1.331634521484375, 1.44073486328125, 1.549835205078125, 1.658935546875, 1.768035888671875, 1.87713623046875, 1.986236572265625, 2.0953369140625, 2.204437255859375, 2.31353759765625, 2.422637939453125, 2.53173828125, 2.640838623046875, 2.74993896484375, 2.859039306640625, 2.9681396484375, 3.077239990234375, 3.18634033203125, 3.295440673828125, 3.404541015625, 3.513641357421875, 3.62274169921875, 3.731842041015625, 3.8409423828125, 3.950042724609375, 4.05914306640625, 4.168243408203125, 4.27734375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 9.0, 13.0, 13.0, 36.0, 78.0, 140.0, 251.0, 208.0, 132.0, 60.0, 28.0, 16.0, 10.0, 6.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.96219253540039, -60.32707595825195, -57.691959381103516, -55.05684280395508, -52.421730041503906, -49.78661346435547, -47.15149688720703, -44.516380310058594, -41.881263732910156, -39.24614715576172, -36.61103057861328, -33.975914001464844, -31.34079933166504, -28.7056827545166, -26.070568084716797, -23.43545150756836, -20.800334930419922, -18.165218353271484, -15.530102729797363, -12.894987106323242, -10.259870529174805, -7.624753952026367, -4.989638328552246, -2.354522705078125, 0.2805938720703125, 2.915709972381592, 5.550826072692871, 8.185941696166992, 10.82105827331543, 13.456174850463867, 16.091289520263672, 18.72640609741211, 21.361526489257812, 23.99664306640625, 26.631759643554688, 29.266874313354492, 31.90199089050293, 34.537109375, 37.17222213745117, 39.80733871459961, 42.44245529174805, 45.077571868896484, 47.71268844604492, 50.34780502319336, 52.98291778564453, 55.61803436279297, 58.253150939941406, 60.888267517089844, 63.52338409423828, 66.15850067138672, 68.79361724853516, 71.4287338256836, 74.06385040283203, 76.69896697998047, 79.3340835571289, 81.96919250488281, 84.60430908203125, 87.23942565917969, 89.87454223632812, 92.50965881347656, 95.144775390625, 97.77989196777344, 100.41500854492188, 103.05012512207031, 105.68524169921875]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 5.0, 2.0, 0.0, 3.0, 3.0, 9.0, 3.0, 7.0, 9.0, 8.0, 7.0, 19.0, 19.0, 16.0, 24.0, 26.0, 28.0, 33.0, 37.0, 35.0, 38.0, 33.0, 31.0, 33.0, 52.0, 43.0, 36.0, 48.0, 36.0, 36.0, 39.0, 40.0, 28.0, 23.0, 28.0, 27.0, 13.0, 23.0, 15.0, 13.0, 13.0, 11.0, 7.0, 12.0, 7.0, 5.0, 7.0, 7.0, 8.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.39800262451172, -32.280540466308594, -31.16307830810547, -30.045618057250977, -28.92815589904785, -27.810693740844727, -26.693233489990234, -25.57577133178711, -24.458309173583984, -23.34084701538086, -22.223384857177734, -21.105924606323242, -19.988462448120117, -18.871000289916992, -17.7535400390625, -16.636077880859375, -15.51861572265625, -14.401153564453125, -13.283692359924316, -12.166231155395508, -11.048768997192383, -9.931306838989258, -8.81384563446045, -7.696383953094482, -6.578922271728516, -5.461460590362549, -4.343998908996582, -3.2265372276306152, -2.1090755462646484, -0.9916138648986816, 0.12584781646728516, 1.243309497833252, 2.360767364501953, 3.47822904586792, 4.595690727233887, 5.7131524085998535, 6.83061408996582, 7.948075771331787, 9.065537452697754, 10.182998657226562, 11.300460815429688, 12.417922973632812, 13.535384178161621, 14.65284538269043, 15.770307540893555, 16.88776969909668, 18.005229949951172, 19.122692108154297, 20.240154266357422, 21.357616424560547, 22.475078582763672, 23.592538833618164, 24.71000099182129, 25.827463150024414, 26.944923400878906, 28.06238555908203, 29.179847717285156, 30.29730987548828, 31.414772033691406, 32.53223419189453, 33.649696350097656, 34.767154693603516, 35.88461685180664, 37.002079010009766, 38.11954116821289]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 5.0, 3.0, 11.0, 12.0, 21.0, 20.0, 61.0, 97.0, 148.0, 321.0, 657.0, 1434.0, 4048.0, 18658.0, 3667568.0, 479240.0, 15581.0, 3671.0, 1400.0, 608.0, 319.0, 169.0, 91.0, 53.0, 30.0, 20.0, 9.0, 7.0, 5.0, 7.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.34375, -18.73828125, -18.1328125, -17.52734375, -16.921875, -16.31640625, -15.7109375, -15.10546875, -14.5, -13.89453125, -13.2890625, -12.68359375, -12.078125, -11.47265625, -10.8671875, -10.26171875, -9.65625, -9.05078125, -8.4453125, -7.83984375, -7.234375, -6.62890625, -6.0234375, -5.41796875, -4.8125, -4.20703125, -3.6015625, -2.99609375, -2.390625, -1.78515625, -1.1796875, -0.57421875, 0.03125, 0.63671875, 1.2421875, 1.84765625, 2.453125, 3.05859375, 3.6640625, 4.26953125, 4.875, 5.48046875, 6.0859375, 6.69140625, 7.296875, 7.90234375, 8.5078125, 9.11328125, 9.71875, 10.32421875, 10.9296875, 11.53515625, 12.140625, 12.74609375, 13.3515625, 13.95703125, 14.5625, 15.16796875, 15.7734375, 16.37890625, 16.984375, 17.58984375, 18.1953125, 18.80078125, 19.40625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 3.0, 11.0, 19.0, 20.0, 44.0, 55.0, 63.0, 107.0, 100.0, 107.0, 104.0, 82.0, 91.0, 61.0, 42.0, 32.0, 16.0, 19.0, 13.0, 9.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.251953125, -3.14630126953125, -3.0406494140625, -2.93499755859375, -2.829345703125, -2.72369384765625, -2.6180419921875, -2.51239013671875, -2.40673828125, -2.30108642578125, -2.1954345703125, -2.08978271484375, -1.984130859375, -1.87847900390625, -1.7728271484375, -1.66717529296875, -1.5615234375, -1.45587158203125, -1.3502197265625, -1.24456787109375, -1.138916015625, -1.03326416015625, -0.9276123046875, -0.82196044921875, -0.71630859375, -0.61065673828125, -0.5050048828125, -0.39935302734375, -0.293701171875, -0.18804931640625, -0.0823974609375, 0.02325439453125, 0.12890625, 0.23455810546875, 0.3402099609375, 0.44586181640625, 0.551513671875, 0.65716552734375, 0.7628173828125, 0.86846923828125, 0.97412109375, 1.07977294921875, 1.1854248046875, 1.29107666015625, 1.396728515625, 1.50238037109375, 1.6080322265625, 1.71368408203125, 1.8193359375, 1.92498779296875, 2.0306396484375, 2.13629150390625, 2.241943359375, 2.34759521484375, 2.4532470703125, 2.55889892578125, 2.66455078125, 2.77020263671875, 2.8758544921875, 2.98150634765625, 3.087158203125, 3.19281005859375, 3.2984619140625, 3.40411376953125, 3.509765625]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 12.0, 12.0, 18.0, 25.0, 45.0, 75.0, 94.0, 111.0, 189.0, 295.0, 384.0, 612.0, 951.0, 1737.0, 3125.0, 6849.0, 20775.0, 122413.0, 3858641.0, 140307.0, 22306.0, 7417.0, 3216.0, 1714.0, 990.0, 660.0, 421.0, 255.0, 203.0, 142.0, 87.0, 64.0, 38.0, 26.0, 19.0, 19.0, 13.0, 6.0, 7.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.0625, -11.713134765625, -11.36376953125, -11.014404296875, -10.6650390625, -10.315673828125, -9.96630859375, -9.616943359375, -9.267578125, -8.918212890625, -8.56884765625, -8.219482421875, -7.8701171875, -7.520751953125, -7.17138671875, -6.822021484375, -6.47265625, -6.123291015625, -5.77392578125, -5.424560546875, -5.0751953125, -4.725830078125, -4.37646484375, -4.027099609375, -3.677734375, -3.328369140625, -2.97900390625, -2.629638671875, -2.2802734375, -1.930908203125, -1.58154296875, -1.232177734375, -0.8828125, -0.533447265625, -0.18408203125, 0.165283203125, 0.5146484375, 0.864013671875, 1.21337890625, 1.562744140625, 1.912109375, 2.261474609375, 2.61083984375, 2.960205078125, 3.3095703125, 3.658935546875, 4.00830078125, 4.357666015625, 4.70703125, 5.056396484375, 5.40576171875, 5.755126953125, 6.1044921875, 6.453857421875, 6.80322265625, 7.152587890625, 7.501953125, 7.851318359375, 8.20068359375, 8.550048828125, 8.8994140625, 9.248779296875, 9.59814453125, 9.947509765625, 10.296875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 4.0, 6.0, 5.0, 6.0, 9.0, 16.0, 26.0, 38.0, 83.0, 196.0, 2251.0, 1048.0, 186.0, 69.0, 42.0, 23.0, 17.0, 12.0, 8.0, 6.0, 2.0, 4.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.1640625, -5.95098876953125, -5.7379150390625, -5.52484130859375, -5.311767578125, -5.09869384765625, -4.8856201171875, -4.67254638671875, -4.45947265625, -4.24639892578125, -4.0333251953125, -3.82025146484375, -3.607177734375, -3.39410400390625, -3.1810302734375, -2.96795654296875, -2.7548828125, -2.54180908203125, -2.3287353515625, -2.11566162109375, -1.902587890625, -1.68951416015625, -1.4764404296875, -1.26336669921875, -1.05029296875, -0.83721923828125, -0.6241455078125, -0.41107177734375, -0.197998046875, 0.01507568359375, 0.2281494140625, 0.44122314453125, 0.654296875, 0.86737060546875, 1.0804443359375, 1.29351806640625, 1.506591796875, 1.71966552734375, 1.9327392578125, 2.14581298828125, 2.35888671875, 2.57196044921875, 2.7850341796875, 2.99810791015625, 3.211181640625, 3.42425537109375, 3.6373291015625, 3.85040283203125, 4.0634765625, 4.27655029296875, 4.4896240234375, 4.70269775390625, 4.915771484375, 5.12884521484375, 5.3419189453125, 5.55499267578125, 5.76806640625, 5.98114013671875, 6.1942138671875, 6.40728759765625, 6.620361328125, 6.83343505859375, 7.0465087890625, 7.25958251953125, 7.47265625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 15.0, 55.0, 185.0, 358.0, 240.0, 87.0, 34.0, 16.0, 10.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.696670532226562, -12.765999794006348, -10.835329055786133, -8.904659271240234, -6.973988056182861, -5.043317794799805, -3.11264705657959, -1.181976318359375, 0.7486944198608398, 2.6793651580810547, 4.6100358963012695, 6.540706157684326, 8.471376419067383, 10.402047157287598, 12.332717895507812, 14.263388633728027, 16.194059371948242, 18.12472915649414, 20.055400848388672, 21.98607063293457, 23.9167423248291, 25.847412109375, 27.77808380126953, 29.70875358581543, 31.639423370361328, 33.57009506225586, 35.500762939453125, 37.431434631347656, 39.36210632324219, 41.29277801513672, 43.223445892333984, 45.154117584228516, 47.08478927612305, 49.01546096801758, 50.946128845214844, 52.876800537109375, 54.807472229003906, 56.73814392089844, 58.6688117980957, 60.599483489990234, 62.530155181884766, 64.46082305908203, 66.39149475097656, 68.3221664428711, 70.25283813476562, 72.18350982666016, 74.11418151855469, 76.04484558105469, 77.97551727294922, 79.90618896484375, 81.83686065673828, 83.76753234863281, 85.69819641113281, 87.62886810302734, 89.55953979492188, 91.4902114868164, 93.42088317871094, 95.35155487060547, 97.2822265625, 99.21289825439453, 101.14356231689453, 103.07423400878906, 105.0049057006836, 106.93557739257812, 108.86624908447266]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 2.0, 6.0, 5.0, 8.0, 12.0, 8.0, 14.0, 13.0, 14.0, 19.0, 15.0, 12.0, 20.0, 32.0, 22.0, 38.0, 38.0, 39.0, 36.0, 47.0, 50.0, 41.0, 44.0, 44.0, 39.0, 43.0, 33.0, 46.0, 43.0, 25.0, 25.0, 22.0, 25.0, 26.0, 17.0, 14.0, 9.0, 15.0, 13.0, 5.0, 6.0, 5.0, 4.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 2.0], "bins": [-17.335174560546875, -16.855005264282227, -16.374835968017578, -15.894665718078613, -15.414496421813965, -14.934326171875, -14.454156875610352, -13.973987579345703, -13.493818283081055, -13.013648986816406, -12.533478736877441, -12.053309440612793, -11.573140144348145, -11.09296989440918, -10.612800598144531, -10.132631301879883, -9.652461051940918, -9.17229175567627, -8.692121505737305, -8.211952209472656, -7.731782913208008, -7.251613140106201, -6.7714433670043945, -6.291274070739746, -5.8111042976379395, -5.330934524536133, -4.850765228271484, -4.370595455169678, -3.89042592048645, -3.4102563858032227, -2.930086612701416, -2.4499170780181885, -1.9697484970092773, -1.4895789623260498, -1.0094093084335327, -0.5292396545410156, -0.049070119857788086, 0.43109941482543945, 0.9112691879272461, 1.3914387226104736, 1.8716082572937012, 2.3517777919769287, 2.8319473266601562, 3.312117099761963, 3.7922866344451904, 4.272456169128418, 4.752625942230225, 5.232795715332031, 5.71296501159668, 6.193134784698486, 6.673304080963135, 7.153473854064941, 7.63364315032959, 8.113813400268555, 8.593982696533203, 9.074151992797852, 9.5543212890625, 10.034490585327148, 10.514660835266113, 10.994830131530762, 11.47499942779541, 11.955169677734375, 12.435338973999023, 12.915508270263672, 13.395678520202637]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 11.0, 13.0, 13.0, 22.0, 17.0, 32.0, 45.0, 75.0, 91.0, 160.0, 271.0, 481.0, 924.0, 1863.0, 3998.0, 8945.0, 21954.0, 59135.0, 217640.0, 505034.0, 151104.0, 45214.0, 17431.0, 7328.0, 3248.0, 1595.0, 806.0, 436.0, 262.0, 127.0, 87.0, 43.0, 45.0, 25.0, 19.0, 15.0, 14.0, 10.0, 5.0, 4.0, 5.0, 6.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.546875, -8.2655029296875, -7.984130859375, -7.7027587890625, -7.42138671875, -7.1400146484375, -6.858642578125, -6.5772705078125, -6.2958984375, -6.0145263671875, -5.733154296875, -5.4517822265625, -5.17041015625, -4.8890380859375, -4.607666015625, -4.3262939453125, -4.044921875, -3.7635498046875, -3.482177734375, -3.2008056640625, -2.91943359375, -2.6380615234375, -2.356689453125, -2.0753173828125, -1.7939453125, -1.5125732421875, -1.231201171875, -0.9498291015625, -0.66845703125, -0.3870849609375, -0.105712890625, 0.1756591796875, 0.45703125, 0.7384033203125, 1.019775390625, 1.3011474609375, 1.58251953125, 1.8638916015625, 2.145263671875, 2.4266357421875, 2.7080078125, 2.9893798828125, 3.270751953125, 3.5521240234375, 3.83349609375, 4.1148681640625, 4.396240234375, 4.6776123046875, 4.958984375, 5.2403564453125, 5.521728515625, 5.8031005859375, 6.08447265625, 6.3658447265625, 6.647216796875, 6.9285888671875, 7.2099609375, 7.4913330078125, 7.772705078125, 8.0540771484375, 8.33544921875, 8.6168212890625, 8.898193359375, 9.1795654296875, 9.4609375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 15.0, 14.0, 31.0, 49.0, 48.0, 63.0, 80.0, 106.0, 103.0, 114.0, 80.0, 70.0, 53.0, 38.0, 33.0, 38.0, 24.0, 12.0, 7.0, 8.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.234375, -3.125701904296875, -3.01702880859375, -2.908355712890625, -2.7996826171875, -2.691009521484375, -2.58233642578125, -2.473663330078125, -2.364990234375, -2.256317138671875, -2.14764404296875, -2.038970947265625, -1.9302978515625, -1.821624755859375, -1.71295166015625, -1.604278564453125, -1.49560546875, -1.386932373046875, -1.27825927734375, -1.169586181640625, -1.0609130859375, -0.952239990234375, -0.84356689453125, -0.734893798828125, -0.626220703125, -0.517547607421875, -0.40887451171875, -0.300201416015625, -0.1915283203125, -0.082855224609375, 0.02581787109375, 0.134490966796875, 0.2431640625, 0.351837158203125, 0.46051025390625, 0.569183349609375, 0.6778564453125, 0.786529541015625, 0.89520263671875, 1.003875732421875, 1.112548828125, 1.221221923828125, 1.32989501953125, 1.438568115234375, 1.5472412109375, 1.655914306640625, 1.76458740234375, 1.873260498046875, 1.98193359375, 2.090606689453125, 2.19927978515625, 2.307952880859375, 2.4166259765625, 2.525299072265625, 2.63397216796875, 2.742645263671875, 2.851318359375, 2.959991455078125, 3.06866455078125, 3.177337646484375, 3.2860107421875, 3.394683837890625, 3.50335693359375, 3.612030029296875, 3.720703125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 8.0, 6.0, 6.0, 10.0, 9.0, 15.0, 20.0, 28.0, 32.0, 37.0, 73.0, 119.0, 158.0, 232.0, 342.0, 621.0, 1048.0, 2069.0, 4200.0, 9976.0, 25603.0, 82223.0, 392792.0, 399898.0, 83949.0, 26029.0, 9955.0, 4296.0, 2017.0, 1106.0, 610.0, 344.0, 230.0, 153.0, 104.0, 75.0, 54.0, 30.0, 29.0, 18.0, 8.0, 5.0, 6.0, 6.0, 5.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.6015625, -10.2596435546875, -9.917724609375, -9.5758056640625, -9.23388671875, -8.8919677734375, -8.550048828125, -8.2081298828125, -7.8662109375, -7.5242919921875, -7.182373046875, -6.8404541015625, -6.49853515625, -6.1566162109375, -5.814697265625, -5.4727783203125, -5.130859375, -4.7889404296875, -4.447021484375, -4.1051025390625, -3.76318359375, -3.4212646484375, -3.079345703125, -2.7374267578125, -2.3955078125, -2.0535888671875, -1.711669921875, -1.3697509765625, -1.02783203125, -0.6859130859375, -0.343994140625, -0.0020751953125, 0.33984375, 0.6817626953125, 1.023681640625, 1.3656005859375, 1.70751953125, 2.0494384765625, 2.391357421875, 2.7332763671875, 3.0751953125, 3.4171142578125, 3.759033203125, 4.1009521484375, 4.44287109375, 4.7847900390625, 5.126708984375, 5.4686279296875, 5.810546875, 6.1524658203125, 6.494384765625, 6.8363037109375, 7.17822265625, 7.5201416015625, 7.862060546875, 8.2039794921875, 8.5458984375, 8.8878173828125, 9.229736328125, 9.5716552734375, 9.91357421875, 10.2554931640625, 10.597412109375, 10.9393310546875, 11.28125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 4.0, 6.0, 7.0, 13.0, 8.0, 6.0, 15.0, 17.0, 18.0, 25.0, 31.0, 28.0, 32.0, 43.0, 43.0, 47.0, 60.0, 56.0, 54.0, 50.0, 49.0, 40.0, 41.0, 45.0, 32.0, 40.0, 28.0, 26.0, 21.0, 28.0, 13.0, 15.0, 12.0, 16.0, 7.0, 8.0, 7.0, 2.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-11.8671875, -11.483154296875, -11.09912109375, -10.715087890625, -10.3310546875, -9.947021484375, -9.56298828125, -9.178955078125, -8.794921875, -8.410888671875, -8.02685546875, -7.642822265625, -7.2587890625, -6.874755859375, -6.49072265625, -6.106689453125, -5.72265625, -5.338623046875, -4.95458984375, -4.570556640625, -4.1865234375, -3.802490234375, -3.41845703125, -3.034423828125, -2.650390625, -2.266357421875, -1.88232421875, -1.498291015625, -1.1142578125, -0.730224609375, -0.34619140625, 0.037841796875, 0.421875, 0.805908203125, 1.18994140625, 1.573974609375, 1.9580078125, 2.342041015625, 2.72607421875, 3.110107421875, 3.494140625, 3.878173828125, 4.26220703125, 4.646240234375, 5.0302734375, 5.414306640625, 5.79833984375, 6.182373046875, 6.56640625, 6.950439453125, 7.33447265625, 7.718505859375, 8.1025390625, 8.486572265625, 8.87060546875, 9.254638671875, 9.638671875, 10.022705078125, 10.40673828125, 10.790771484375, 11.1748046875, 11.558837890625, 11.94287109375, 12.326904296875, 12.7109375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 6.0, 8.0, 12.0, 14.0, 25.0, 34.0, 29.0, 70.0, 102.0, 149.0, 317.0, 687.0, 1597.0, 5266.0, 31245.0, 740977.0, 246393.0, 15831.0, 3468.0, 1190.0, 488.0, 249.0, 145.0, 78.0, 52.0, 38.0, 20.0, 26.0, 11.0, 8.0, 6.0, 7.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.34765625, -7.09283447265625, -6.8380126953125, -6.58319091796875, -6.328369140625, -6.07354736328125, -5.8187255859375, -5.56390380859375, -5.30908203125, -5.05426025390625, -4.7994384765625, -4.54461669921875, -4.289794921875, -4.03497314453125, -3.7801513671875, -3.52532958984375, -3.2705078125, -3.01568603515625, -2.7608642578125, -2.50604248046875, -2.251220703125, -1.99639892578125, -1.7415771484375, -1.48675537109375, -1.23193359375, -0.97711181640625, -0.7222900390625, -0.46746826171875, -0.212646484375, 0.04217529296875, 0.2969970703125, 0.55181884765625, 0.806640625, 1.06146240234375, 1.3162841796875, 1.57110595703125, 1.825927734375, 2.08074951171875, 2.3355712890625, 2.59039306640625, 2.84521484375, 3.10003662109375, 3.3548583984375, 3.60968017578125, 3.864501953125, 4.11932373046875, 4.3741455078125, 4.62896728515625, 4.8837890625, 5.13861083984375, 5.3934326171875, 5.64825439453125, 5.903076171875, 6.15789794921875, 6.4127197265625, 6.66754150390625, 6.92236328125, 7.17718505859375, 7.4320068359375, 7.68682861328125, 7.941650390625, 8.19647216796875, 8.4512939453125, 8.70611572265625, 8.9609375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 6.0, 9.0, 4.0, 12.0, 18.0, 21.0, 23.0, 36.0, 47.0, 66.0, 114.0, 123.0, 124.0, 118.0, 90.0, 52.0, 41.0, 31.0, 17.0, 11.0, 5.0, 12.0, 7.0, 2.0, 2.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0005536079406738281, -0.0005363672971725464, -0.0005191266536712646, -0.0005018860101699829, -0.00048464536666870117, -0.00046740472316741943, -0.0004501640796661377, -0.00043292343616485596, -0.0004156827926635742, -0.0003984421491622925, -0.00038120150566101074, -0.000363960862159729, -0.00034672021865844727, -0.00032947957515716553, -0.0003122389316558838, -0.00029499828815460205, -0.0002777576446533203, -0.0002605170011520386, -0.00024327635765075684, -0.0002260357141494751, -0.00020879507064819336, -0.00019155442714691162, -0.00017431378364562988, -0.00015707314014434814, -0.0001398324966430664, -0.00012259185314178467, -0.00010535120964050293, -8.811056613922119e-05, -7.086992263793945e-05, -5.3629279136657715e-05, -3.6388635635375977e-05, -1.9147992134094238e-05, -1.9073486328125e-06, 1.5333294868469238e-05, 3.2573938369750977e-05, 4.9814581871032715e-05, 6.705522537231445e-05, 8.429586887359619e-05, 0.00010153651237487793, 0.00011877715587615967, 0.0001360177993774414, 0.00015325844287872314, 0.00017049908638000488, 0.00018773972988128662, 0.00020498037338256836, 0.0002222210168838501, 0.00023946166038513184, 0.0002567023038864136, 0.0002739429473876953, 0.00029118359088897705, 0.0003084242343902588, 0.00032566487789154053, 0.00034290552139282227, 0.000360146164894104, 0.00037738680839538574, 0.0003946274518966675, 0.0004118680953979492, 0.00042910873889923096, 0.0004463493824005127, 0.00046359002590179443, 0.00048083066940307617, 0.0004980713129043579, 0.0005153119564056396, 0.0005325525999069214, 0.0005497932434082031]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 6.0, 0.0, 5.0, 8.0, 6.0, 15.0, 19.0, 26.0, 29.0, 56.0, 81.0, 117.0, 180.0, 315.0, 504.0, 901.0, 1703.0, 3509.0, 8474.0, 24045.0, 94829.0, 522370.0, 307272.0, 55444.0, 16466.0, 6181.0, 2695.0, 1377.0, 752.0, 385.0, 267.0, 163.0, 112.0, 68.0, 55.0, 33.0, 26.0, 17.0, 9.0, 8.0, 7.0, 7.0, 4.0, 1.0, 4.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-3.529296875, -3.421783447265625, -3.31427001953125, -3.206756591796875, -3.0992431640625, -2.991729736328125, -2.88421630859375, -2.776702880859375, -2.669189453125, -2.561676025390625, -2.45416259765625, -2.346649169921875, -2.2391357421875, -2.131622314453125, -2.02410888671875, -1.916595458984375, -1.80908203125, -1.701568603515625, -1.59405517578125, -1.486541748046875, -1.3790283203125, -1.271514892578125, -1.16400146484375, -1.056488037109375, -0.948974609375, -0.841461181640625, -0.73394775390625, -0.626434326171875, -0.5189208984375, -0.411407470703125, -0.30389404296875, -0.196380615234375, -0.0888671875, 0.018646240234375, 0.12615966796875, 0.233673095703125, 0.3411865234375, 0.448699951171875, 0.55621337890625, 0.663726806640625, 0.771240234375, 0.878753662109375, 0.98626708984375, 1.093780517578125, 1.2012939453125, 1.308807373046875, 1.41632080078125, 1.523834228515625, 1.63134765625, 1.738861083984375, 1.84637451171875, 1.953887939453125, 2.0614013671875, 2.168914794921875, 2.27642822265625, 2.383941650390625, 2.491455078125, 2.598968505859375, 2.70648193359375, 2.813995361328125, 2.9215087890625, 3.029022216796875, 3.13653564453125, 3.244049072265625, 3.3515625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 7.0, 6.0, 12.0, 7.0, 12.0, 21.0, 30.0, 20.0, 44.0, 55.0, 63.0, 91.0, 100.0, 110.0, 95.0, 73.0, 53.0, 48.0, 26.0, 29.0, 14.0, 16.0, 13.0, 14.0, 10.0, 6.0, 5.0, 3.0, 0.0, 2.0, 5.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.921875, -3.7911376953125, -3.660400390625, -3.5296630859375, -3.39892578125, -3.2681884765625, -3.137451171875, -3.0067138671875, -2.8759765625, -2.7452392578125, -2.614501953125, -2.4837646484375, -2.35302734375, -2.2222900390625, -2.091552734375, -1.9608154296875, -1.830078125, -1.6993408203125, -1.568603515625, -1.4378662109375, -1.30712890625, -1.1763916015625, -1.045654296875, -0.9149169921875, -0.7841796875, -0.6534423828125, -0.522705078125, -0.3919677734375, -0.26123046875, -0.1304931640625, 0.000244140625, 0.1309814453125, 0.26171875, 0.3924560546875, 0.523193359375, 0.6539306640625, 0.78466796875, 0.9154052734375, 1.046142578125, 1.1768798828125, 1.3076171875, 1.4383544921875, 1.569091796875, 1.6998291015625, 1.83056640625, 1.9613037109375, 2.092041015625, 2.2227783203125, 2.353515625, 2.4842529296875, 2.614990234375, 2.7457275390625, 2.87646484375, 3.0072021484375, 3.137939453125, 3.2686767578125, 3.3994140625, 3.5301513671875, 3.660888671875, 3.7916259765625, 3.92236328125, 4.0531005859375, 4.183837890625, 4.3145751953125, 4.4453125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 10.0, 7.0, 15.0, 15.0, 19.0, 18.0, 40.0, 55.0, 65.0, 99.0, 116.0, 122.0, 103.0, 91.0, 64.0, 47.0, 32.0, 14.0, 13.0, 15.0, 7.0, 4.0, 5.0, 5.0, 4.0, 7.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.342247009277344, -46.25959777832031, -44.17695236206055, -42.094303131103516, -40.011653900146484, -37.92900848388672, -35.84635925292969, -33.763710021972656, -31.681062698364258, -29.59841537475586, -27.515766143798828, -25.43311882019043, -23.35047149658203, -21.267822265625, -19.1851749420166, -17.102527618408203, -15.019878387451172, -12.937230110168457, -10.854581832885742, -8.771934509277344, -6.689286231994629, -4.606637954711914, -2.5239906311035156, -0.4413423538208008, 1.641305923461914, 3.72395396232605, 5.8066020011901855, 7.889249801635742, 9.971898078918457, 12.054546356201172, 14.13719367980957, 16.21984100341797, 18.302490234375, 20.3851375579834, 22.46778678894043, 24.550434112548828, 26.63308334350586, 28.715730667114258, 30.798377990722656, 32.88102722167969, 34.96367645263672, 37.04632568359375, 39.128971099853516, 41.21162033081055, 43.29426956176758, 45.376914978027344, 47.459564208984375, 49.542213439941406, 51.62485885620117, 53.7075080871582, 55.79015350341797, 57.872802734375, 59.95545196533203, 62.03810119628906, 64.12074279785156, 66.2033920288086, 68.28604125976562, 70.36869049072266, 72.45133972167969, 74.53398132324219, 76.61663055419922, 78.69927978515625, 80.78192901611328, 82.86457824707031, 84.94722747802734]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 2.0, 7.0, 9.0, 9.0, 4.0, 12.0, 11.0, 9.0, 17.0, 17.0, 27.0, 17.0, 29.0, 29.0, 24.0, 36.0, 39.0, 39.0, 42.0, 41.0, 57.0, 47.0, 51.0, 58.0, 39.0, 47.0, 39.0, 34.0, 31.0, 18.0, 23.0, 23.0, 23.0, 13.0, 15.0, 10.0, 10.0, 13.0, 9.0, 10.0, 4.0, 5.0, 1.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.44706344604492, -58.39943313598633, -56.351802825927734, -54.30417251586914, -52.25654220581055, -50.20891189575195, -48.16128158569336, -46.113651275634766, -44.06602096557617, -42.01839065551758, -39.970760345458984, -37.92313003540039, -35.8754997253418, -33.8278694152832, -31.78023910522461, -29.732608795166016, -27.684978485107422, -25.637348175048828, -23.589717864990234, -21.54208755493164, -19.494457244873047, -17.446826934814453, -15.39919662475586, -13.351566314697266, -11.303936004638672, -9.256305694580078, -7.208675384521484, -5.161045074462891, -3.113414764404297, -1.0657844543457031, 0.9818458557128906, 3.0294761657714844, 5.0771026611328125, 7.124732971191406, 9.17236328125, 11.219993591308594, 13.267623901367188, 15.315254211425781, 17.362884521484375, 19.41051483154297, 21.458145141601562, 23.505775451660156, 25.55340576171875, 27.601036071777344, 29.648666381835938, 31.69629669189453, 33.743927001953125, 35.79155731201172, 37.83918762207031, 39.886817932128906, 41.9344482421875, 43.982078552246094, 46.02970886230469, 48.07733917236328, 50.124969482421875, 52.17259979248047, 54.22023010253906, 56.267860412597656, 58.31549072265625, 60.363121032714844, 62.41075134277344, 64.45838165283203, 66.50601196289062, 68.55364227294922, 70.60127258300781]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 8.0, 7.0, 15.0, 18.0, 25.0, 24.0, 47.0, 57.0, 80.0, 119.0, 162.0, 247.0, 416.0, 659.0, 1262.0, 3001.0, 11132.0, 4136965.0, 31471.0, 4517.0, 1794.0, 802.0, 504.0, 305.0, 193.0, 130.0, 89.0, 67.0, 37.0, 46.0, 16.0, 22.0, 15.0, 9.0, 3.0, 6.0, 5.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.015625, -19.384033203125, -18.75244140625, -18.120849609375, -17.4892578125, -16.857666015625, -16.22607421875, -15.594482421875, -14.962890625, -14.331298828125, -13.69970703125, -13.068115234375, -12.4365234375, -11.804931640625, -11.17333984375, -10.541748046875, -9.91015625, -9.278564453125, -8.64697265625, -8.015380859375, -7.3837890625, -6.752197265625, -6.12060546875, -5.489013671875, -4.857421875, -4.225830078125, -3.59423828125, -2.962646484375, -2.3310546875, -1.699462890625, -1.06787109375, -0.436279296875, 0.1953125, 0.826904296875, 1.45849609375, 2.090087890625, 2.7216796875, 3.353271484375, 3.98486328125, 4.616455078125, 5.248046875, 5.879638671875, 6.51123046875, 7.142822265625, 7.7744140625, 8.406005859375, 9.03759765625, 9.669189453125, 10.30078125, 10.932373046875, 11.56396484375, 12.195556640625, 12.8271484375, 13.458740234375, 14.09033203125, 14.721923828125, 15.353515625, 15.985107421875, 16.61669921875, 17.248291015625, 17.8798828125, 18.511474609375, 19.14306640625, 19.774658203125, 20.40625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 8.0, 11.0, 15.0, 24.0, 22.0, 24.0, 38.0, 54.0, 45.0, 65.0, 73.0, 71.0, 78.0, 76.0, 64.0, 64.0, 43.0, 32.0, 33.0, 50.0, 22.0, 21.0, 12.0, 14.0, 10.0, 6.0, 9.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2109375, -3.09423828125, -2.9775390625, -2.86083984375, -2.744140625, -2.62744140625, -2.5107421875, -2.39404296875, -2.27734375, -2.16064453125, -2.0439453125, -1.92724609375, -1.810546875, -1.69384765625, -1.5771484375, -1.46044921875, -1.34375, -1.22705078125, -1.1103515625, -0.99365234375, -0.876953125, -0.76025390625, -0.6435546875, -0.52685546875, -0.41015625, -0.29345703125, -0.1767578125, -0.06005859375, 0.056640625, 0.17333984375, 0.2900390625, 0.40673828125, 0.5234375, 0.64013671875, 0.7568359375, 0.87353515625, 0.990234375, 1.10693359375, 1.2236328125, 1.34033203125, 1.45703125, 1.57373046875, 1.6904296875, 1.80712890625, 1.923828125, 2.04052734375, 2.1572265625, 2.27392578125, 2.390625, 2.50732421875, 2.6240234375, 2.74072265625, 2.857421875, 2.97412109375, 3.0908203125, 3.20751953125, 3.32421875, 3.44091796875, 3.5576171875, 3.67431640625, 3.791015625, 3.90771484375, 4.0244140625, 4.14111328125, 4.2578125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 6.0, 4.0, 8.0, 10.0, 5.0, 10.0, 17.0, 15.0, 32.0, 43.0, 48.0, 60.0, 100.0, 172.0, 322.0, 579.0, 1061.0, 2234.0, 6123.0, 55768.0, 4109783.0, 11512.0, 3253.0, 1406.0, 687.0, 388.0, 259.0, 139.0, 63.0, 46.0, 33.0, 25.0, 24.0, 16.0, 9.0, 7.0, 6.0, 3.0, 9.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-26.65625, -25.93994140625, -25.2236328125, -24.50732421875, -23.791015625, -23.07470703125, -22.3583984375, -21.64208984375, -20.92578125, -20.20947265625, -19.4931640625, -18.77685546875, -18.060546875, -17.34423828125, -16.6279296875, -15.91162109375, -15.1953125, -14.47900390625, -13.7626953125, -13.04638671875, -12.330078125, -11.61376953125, -10.8974609375, -10.18115234375, -9.46484375, -8.74853515625, -8.0322265625, -7.31591796875, -6.599609375, -5.88330078125, -5.1669921875, -4.45068359375, -3.734375, -3.01806640625, -2.3017578125, -1.58544921875, -0.869140625, -0.15283203125, 0.5634765625, 1.27978515625, 1.99609375, 2.71240234375, 3.4287109375, 4.14501953125, 4.861328125, 5.57763671875, 6.2939453125, 7.01025390625, 7.7265625, 8.44287109375, 9.1591796875, 9.87548828125, 10.591796875, 11.30810546875, 12.0244140625, 12.74072265625, 13.45703125, 14.17333984375, 14.8896484375, 15.60595703125, 16.322265625, 17.03857421875, 17.7548828125, 18.47119140625, 19.1875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 1.0, 6.0, 3.0, 8.0, 14.0, 40.0, 228.0, 3700.0, 36.0, 11.0, 10.0, 5.0, 1.0, 7.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-6.11328125, -5.983673095703125, -5.85406494140625, -5.724456787109375, -5.5948486328125, -5.465240478515625, -5.33563232421875, -5.206024169921875, -5.076416015625, -4.946807861328125, -4.81719970703125, -4.687591552734375, -4.5579833984375, -4.428375244140625, -4.29876708984375, -4.169158935546875, -4.03955078125, -3.909942626953125, -3.78033447265625, -3.650726318359375, -3.5211181640625, -3.391510009765625, -3.26190185546875, -3.132293701171875, -3.002685546875, -2.873077392578125, -2.74346923828125, -2.613861083984375, -2.4842529296875, -2.354644775390625, -2.22503662109375, -2.095428466796875, -1.9658203125, -1.836212158203125, -1.70660400390625, -1.576995849609375, -1.4473876953125, -1.317779541015625, -1.18817138671875, -1.058563232421875, -0.928955078125, -0.799346923828125, -0.66973876953125, -0.540130615234375, -0.4105224609375, -0.280914306640625, -0.15130615234375, -0.021697998046875, 0.10791015625, 0.237518310546875, 0.36712646484375, 0.496734619140625, 0.6263427734375, 0.755950927734375, 0.88555908203125, 1.015167236328125, 1.144775390625, 1.274383544921875, 1.40399169921875, 1.533599853515625, 1.6632080078125, 1.792816162109375, 1.92242431640625, 2.052032470703125, 2.181640625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 11.0, 25.0, 34.0, 55.0, 106.0, 176.0, 224.0, 202.0, 83.0, 53.0, 20.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.095752716064453, -23.56075096130371, -23.02574920654297, -22.49074935913086, -21.955747604370117, -21.420745849609375, -20.885744094848633, -20.35074234008789, -19.81574249267578, -19.28074073791504, -18.745738983154297, -18.210739135742188, -17.675737380981445, -17.140735626220703, -16.60573387145996, -16.07073211669922, -15.535731315612793, -15.00072956085205, -14.465728759765625, -13.930727005004883, -13.395726203918457, -12.860724449157715, -12.325723648071289, -11.790721893310547, -11.255720138549805, -10.720718383789062, -10.185717582702637, -9.650715827941895, -9.115715026855469, -8.580713272094727, -8.045711517333984, -7.510710716247559, -6.975710868835449, -6.440709590911865, -5.905708312988281, -5.370706558227539, -4.835705757141113, -4.300704002380371, -3.765702724456787, -3.230701446533203, -2.695700168609619, -2.160698890686035, -1.6256974935531616, -1.090696096420288, -0.5556948184967041, -0.020693540573120117, 0.514307975769043, 1.049309253692627, 1.584310531616211, 2.119311809539795, 2.654313087463379, 3.189314603805542, 3.724315881729126, 4.259317398071289, 4.794318675994873, 5.329319953918457, 5.864321231842041, 6.399322509765625, 6.934323787689209, 7.469325065612793, 8.004326820373535, 8.539327621459961, 9.074329376220703, 9.609331130981445, 10.144331932067871]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 12.0, 9.0, 7.0, 10.0, 20.0, 15.0, 24.0, 26.0, 27.0, 18.0, 31.0, 21.0, 45.0, 27.0, 41.0, 34.0, 35.0, 39.0, 45.0, 39.0, 34.0, 36.0, 44.0, 35.0, 34.0, 33.0, 22.0, 34.0, 26.0, 22.0, 20.0, 20.0, 26.0, 12.0, 10.0, 12.0, 10.0, 9.0, 10.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.5264129638671875, -5.336819171905518, -5.147225379943848, -4.957631587982178, -4.768037796020508, -4.578444480895996, -4.388850688934326, -4.199256896972656, -4.009663105010986, -3.8200693130493164, -3.6304755210876465, -3.4408819675445557, -3.2512881755828857, -3.061694383621216, -2.872100830078125, -2.682507038116455, -2.492913246154785, -2.3033194541931152, -2.1137256622314453, -1.9241321086883545, -1.7345383167266846, -1.5449445247650146, -1.3553508520126343, -1.165757179260254, -0.976163387298584, -0.7865696549415588, -0.5969759225845337, -0.40738219022750854, -0.2177884578704834, -0.028194725513458252, 0.1613990068435669, 0.35099267959594727, 0.5405864715576172, 0.7301802039146423, 0.9197739362716675, 1.1093676090240479, 1.2989614009857178, 1.4885551929473877, 1.678148865699768, 1.8677425384521484, 2.0573363304138184, 2.2469301223754883, 2.436523914337158, 2.626117467880249, 2.815711259841919, 3.005305051803589, 3.1948986053466797, 3.3844923973083496, 3.5740861892700195, 3.7636799812316895, 3.9532737731933594, 4.142867565155029, 4.332461357116699, 4.522054672241211, 4.711648464202881, 4.901242256164551, 5.090836048126221, 5.280429840087891, 5.4700236320495605, 5.6596174240112305, 5.849210739135742, 6.038804531097412, 6.228398323059082, 6.417992115020752, 6.607585906982422]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 0.0, 1.0, 3.0, 6.0, 9.0, 5.0, 15.0, 20.0, 26.0, 40.0, 54.0, 107.0, 133.0, 221.0, 419.0, 646.0, 1168.0, 2096.0, 3986.0, 7625.0, 16783.0, 39497.0, 110119.0, 354460.0, 337132.0, 103938.0, 37575.0, 16159.0, 7656.0, 3804.0, 2065.0, 1112.0, 635.0, 374.0, 243.0, 158.0, 99.0, 77.0, 35.0, 25.0, 14.0, 8.0, 4.0, 5.0, 1.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.89453125, -7.60186767578125, -7.3092041015625, -7.01654052734375, -6.723876953125, -6.43121337890625, -6.1385498046875, -5.84588623046875, -5.55322265625, -5.26055908203125, -4.9678955078125, -4.67523193359375, -4.382568359375, -4.08990478515625, -3.7972412109375, -3.50457763671875, -3.2119140625, -2.91925048828125, -2.6265869140625, -2.33392333984375, -2.041259765625, -1.74859619140625, -1.4559326171875, -1.16326904296875, -0.87060546875, -0.57794189453125, -0.2852783203125, 0.00738525390625, 0.300048828125, 0.59271240234375, 0.8853759765625, 1.17803955078125, 1.470703125, 1.76336669921875, 2.0560302734375, 2.34869384765625, 2.641357421875, 2.93402099609375, 3.2266845703125, 3.51934814453125, 3.81201171875, 4.10467529296875, 4.3973388671875, 4.69000244140625, 4.982666015625, 5.27532958984375, 5.5679931640625, 5.86065673828125, 6.1533203125, 6.44598388671875, 6.7386474609375, 7.03131103515625, 7.323974609375, 7.61663818359375, 7.9093017578125, 8.20196533203125, 8.49462890625, 8.78729248046875, 9.0799560546875, 9.37261962890625, 9.665283203125, 9.95794677734375, 10.2506103515625, 10.54327392578125, 10.8359375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 3.0, 5.0, 4.0, 4.0, 6.0, 8.0, 12.0, 13.0, 20.0, 25.0, 20.0, 39.0, 38.0, 66.0, 56.0, 77.0, 74.0, 72.0, 76.0, 66.0, 58.0, 47.0, 39.0, 42.0, 26.0, 34.0, 22.0, 13.0, 12.0, 10.0, 11.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.30078125, -3.18096923828125, -3.0611572265625, -2.94134521484375, -2.821533203125, -2.70172119140625, -2.5819091796875, -2.46209716796875, -2.34228515625, -2.22247314453125, -2.1026611328125, -1.98284912109375, -1.863037109375, -1.74322509765625, -1.6234130859375, -1.50360107421875, -1.3837890625, -1.26397705078125, -1.1441650390625, -1.02435302734375, -0.904541015625, -0.78472900390625, -0.6649169921875, -0.54510498046875, -0.42529296875, -0.30548095703125, -0.1856689453125, -0.06585693359375, 0.053955078125, 0.17376708984375, 0.2935791015625, 0.41339111328125, 0.533203125, 0.65301513671875, 0.7728271484375, 0.89263916015625, 1.012451171875, 1.13226318359375, 1.2520751953125, 1.37188720703125, 1.49169921875, 1.61151123046875, 1.7313232421875, 1.85113525390625, 1.970947265625, 2.09075927734375, 2.2105712890625, 2.33038330078125, 2.4501953125, 2.57000732421875, 2.6898193359375, 2.80963134765625, 2.929443359375, 3.04925537109375, 3.1690673828125, 3.28887939453125, 3.40869140625, 3.52850341796875, 3.6483154296875, 3.76812744140625, 3.887939453125, 4.00775146484375, 4.1275634765625, 4.24737548828125, 4.3671875]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 6.0, 6.0, 5.0, 7.0, 11.0, 18.0, 24.0, 45.0, 37.0, 67.0, 87.0, 124.0, 211.0, 355.0, 650.0, 1151.0, 2346.0, 5335.0, 13511.0, 40259.0, 188169.0, 612403.0, 131788.0, 31884.0, 10895.0, 4505.0, 2076.0, 1014.0, 563.0, 342.0, 205.0, 135.0, 88.0, 63.0, 49.0, 38.0, 27.0, 21.0, 5.0, 6.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.78125, -15.294189453125, -14.80712890625, -14.320068359375, -13.8330078125, -13.345947265625, -12.85888671875, -12.371826171875, -11.884765625, -11.397705078125, -10.91064453125, -10.423583984375, -9.9365234375, -9.449462890625, -8.96240234375, -8.475341796875, -7.98828125, -7.501220703125, -7.01416015625, -6.527099609375, -6.0400390625, -5.552978515625, -5.06591796875, -4.578857421875, -4.091796875, -3.604736328125, -3.11767578125, -2.630615234375, -2.1435546875, -1.656494140625, -1.16943359375, -0.682373046875, -0.1953125, 0.291748046875, 0.77880859375, 1.265869140625, 1.7529296875, 2.239990234375, 2.72705078125, 3.214111328125, 3.701171875, 4.188232421875, 4.67529296875, 5.162353515625, 5.6494140625, 6.136474609375, 6.62353515625, 7.110595703125, 7.59765625, 8.084716796875, 8.57177734375, 9.058837890625, 9.5458984375, 10.032958984375, 10.52001953125, 11.007080078125, 11.494140625, 11.981201171875, 12.46826171875, 12.955322265625, 13.4423828125, 13.929443359375, 14.41650390625, 14.903564453125, 15.390625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 1.0, 10.0, 10.0, 12.0, 13.0, 15.0, 21.0, 18.0, 22.0, 35.0, 20.0, 35.0, 46.0, 42.0, 56.0, 66.0, 42.0, 56.0, 54.0, 51.0, 45.0, 54.0, 33.0, 37.0, 36.0, 26.0, 21.0, 26.0, 18.0, 14.0, 8.0, 16.0, 15.0, 10.0, 4.0, 1.0, 1.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.09375, -17.50341796875, -16.9130859375, -16.32275390625, -15.732421875, -15.14208984375, -14.5517578125, -13.96142578125, -13.37109375, -12.78076171875, -12.1904296875, -11.60009765625, -11.009765625, -10.41943359375, -9.8291015625, -9.23876953125, -8.6484375, -8.05810546875, -7.4677734375, -6.87744140625, -6.287109375, -5.69677734375, -5.1064453125, -4.51611328125, -3.92578125, -3.33544921875, -2.7451171875, -2.15478515625, -1.564453125, -0.97412109375, -0.3837890625, 0.20654296875, 0.796875, 1.38720703125, 1.9775390625, 2.56787109375, 3.158203125, 3.74853515625, 4.3388671875, 4.92919921875, 5.51953125, 6.10986328125, 6.7001953125, 7.29052734375, 7.880859375, 8.47119140625, 9.0615234375, 9.65185546875, 10.2421875, 10.83251953125, 11.4228515625, 12.01318359375, 12.603515625, 13.19384765625, 13.7841796875, 14.37451171875, 14.96484375, 15.55517578125, 16.1455078125, 16.73583984375, 17.326171875, 17.91650390625, 18.5068359375, 19.09716796875, 19.6875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 6.0, 6.0, 20.0, 25.0, 36.0, 54.0, 84.0, 153.0, 206.0, 353.0, 752.0, 1568.0, 4050.0, 14806.0, 122324.0, 837333.0, 51955.0, 9307.0, 2943.0, 1210.0, 558.0, 330.0, 182.0, 100.0, 79.0, 35.0, 29.0, 20.0, 14.0, 9.0, 7.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.890625, -11.4853515625, -11.080078125, -10.6748046875, -10.26953125, -9.8642578125, -9.458984375, -9.0537109375, -8.6484375, -8.2431640625, -7.837890625, -7.4326171875, -7.02734375, -6.6220703125, -6.216796875, -5.8115234375, -5.40625, -5.0009765625, -4.595703125, -4.1904296875, -3.78515625, -3.3798828125, -2.974609375, -2.5693359375, -2.1640625, -1.7587890625, -1.353515625, -0.9482421875, -0.54296875, -0.1376953125, 0.267578125, 0.6728515625, 1.078125, 1.4833984375, 1.888671875, 2.2939453125, 2.69921875, 3.1044921875, 3.509765625, 3.9150390625, 4.3203125, 4.7255859375, 5.130859375, 5.5361328125, 5.94140625, 6.3466796875, 6.751953125, 7.1572265625, 7.5625, 7.9677734375, 8.373046875, 8.7783203125, 9.18359375, 9.5888671875, 9.994140625, 10.3994140625, 10.8046875, 11.2099609375, 11.615234375, 12.0205078125, 12.42578125, 12.8310546875, 13.236328125, 13.6416015625, 14.046875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 8.0, 5.0, 4.0, 7.0, 7.0, 15.0, 30.0, 37.0, 49.0, 90.0, 167.0, 170.0, 148.0, 96.0, 59.0, 37.0, 21.0, 12.0, 7.0, 12.0, 4.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001209259033203125, -0.0011729598045349121, -0.0011366605758666992, -0.0011003613471984863, -0.0010640621185302734, -0.0010277628898620605, -0.0009914636611938477, -0.0009551644325256348, -0.0009188652038574219, -0.000882565975189209, -0.0008462667465209961, -0.0008099675178527832, -0.0007736682891845703, -0.0007373690605163574, -0.0007010698318481445, -0.0006647706031799316, -0.0006284713745117188, -0.0005921721458435059, -0.000555872917175293, -0.0005195736885070801, -0.0004832744598388672, -0.0004469752311706543, -0.0004106760025024414, -0.0003743767738342285, -0.0003380775451660156, -0.00030177831649780273, -0.00026547908782958984, -0.00022917985916137695, -0.00019288063049316406, -0.00015658140182495117, -0.00012028217315673828, -8.398294448852539e-05, -4.76837158203125e-05, -1.138448715209961e-05, 2.491474151611328e-05, 6.121397018432617e-05, 9.751319885253906e-05, 0.00013381242752075195, 0.00017011165618896484, 0.00020641088485717773, 0.00024271011352539062, 0.0002790093421936035, 0.0003153085708618164, 0.0003516077995300293, 0.0003879070281982422, 0.0004242062568664551, 0.00046050548553466797, 0.0004968047142028809, 0.0005331039428710938, 0.0005694031715393066, 0.0006057024002075195, 0.0006420016288757324, 0.0006783008575439453, 0.0007146000862121582, 0.0007508993148803711, 0.000787198543548584, 0.0008234977722167969, 0.0008597970008850098, 0.0008960962295532227, 0.0009323954582214355, 0.0009686946868896484, 0.0010049939155578613, 0.0010412931442260742, 0.0010775923728942871, 0.0011138916015625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 6.0, 3.0, 7.0, 12.0, 16.0, 15.0, 25.0, 29.0, 46.0, 71.0, 140.0, 199.0, 363.0, 710.0, 1648.0, 4599.0, 16711.0, 150058.0, 800964.0, 57410.0, 9895.0, 3068.0, 1220.0, 545.0, 289.0, 187.0, 111.0, 53.0, 47.0, 28.0, 22.0, 24.0, 11.0, 8.0, 7.0, 7.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.671875, -10.3697509765625, -10.067626953125, -9.7655029296875, -9.46337890625, -9.1612548828125, -8.859130859375, -8.5570068359375, -8.2548828125, -7.9527587890625, -7.650634765625, -7.3485107421875, -7.04638671875, -6.7442626953125, -6.442138671875, -6.1400146484375, -5.837890625, -5.5357666015625, -5.233642578125, -4.9315185546875, -4.62939453125, -4.3272705078125, -4.025146484375, -3.7230224609375, -3.4208984375, -3.1187744140625, -2.816650390625, -2.5145263671875, -2.21240234375, -1.9102783203125, -1.608154296875, -1.3060302734375, -1.00390625, -0.7017822265625, -0.399658203125, -0.0975341796875, 0.20458984375, 0.5067138671875, 0.808837890625, 1.1109619140625, 1.4130859375, 1.7152099609375, 2.017333984375, 2.3194580078125, 2.62158203125, 2.9237060546875, 3.225830078125, 3.5279541015625, 3.830078125, 4.1322021484375, 4.434326171875, 4.7364501953125, 5.03857421875, 5.3406982421875, 5.642822265625, 5.9449462890625, 6.2470703125, 6.5491943359375, 6.851318359375, 7.1534423828125, 7.45556640625, 7.7576904296875, 8.059814453125, 8.3619384765625, 8.6640625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 9.0, 5.0, 8.0, 11.0, 19.0, 18.0, 31.0, 42.0, 66.0, 134.0, 159.0, 161.0, 119.0, 79.0, 45.0, 23.0, 16.0, 14.0, 8.0, 5.0, 5.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.4296875, -11.07080078125, -10.7119140625, -10.35302734375, -9.994140625, -9.63525390625, -9.2763671875, -8.91748046875, -8.55859375, -8.19970703125, -7.8408203125, -7.48193359375, -7.123046875, -6.76416015625, -6.4052734375, -6.04638671875, -5.6875, -5.32861328125, -4.9697265625, -4.61083984375, -4.251953125, -3.89306640625, -3.5341796875, -3.17529296875, -2.81640625, -2.45751953125, -2.0986328125, -1.73974609375, -1.380859375, -1.02197265625, -0.6630859375, -0.30419921875, 0.0546875, 0.41357421875, 0.7724609375, 1.13134765625, 1.490234375, 1.84912109375, 2.2080078125, 2.56689453125, 2.92578125, 3.28466796875, 3.6435546875, 4.00244140625, 4.361328125, 4.72021484375, 5.0791015625, 5.43798828125, 5.796875, 6.15576171875, 6.5146484375, 6.87353515625, 7.232421875, 7.59130859375, 7.9501953125, 8.30908203125, 8.66796875, 9.02685546875, 9.3857421875, 9.74462890625, 10.103515625, 10.46240234375, 10.8212890625, 11.18017578125, 11.5390625]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 4.0, 13.0, 12.0, 23.0, 28.0, 38.0, 72.0, 126.0, 171.0, 174.0, 125.0, 84.0, 61.0, 29.0, 14.0, 7.0, 8.0, 7.0, 3.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.21603393554688, -70.16384887695312, -65.11165618896484, -60.05946731567383, -55.00727844238281, -49.9550895690918, -44.90290069580078, -39.850711822509766, -34.79852294921875, -29.746334075927734, -24.69414520263672, -19.641956329345703, -14.589767456054688, -9.537578582763672, -4.485389709472656, 0.5667991638183594, 5.618988037109375, 10.67117691040039, 15.723365783691406, 20.775554656982422, 25.827743530273438, 30.879932403564453, 35.93212127685547, 40.984310150146484, 46.0364990234375, 51.088687896728516, 56.14087677001953, 61.19306564331055, 66.24525451660156, 71.29743957519531, 76.3496322631836, 81.40182495117188, 86.45399475097656, 91.50617980957031, 96.5583724975586, 101.61056518554688, 106.66275024414062, 111.71493530273438, 116.76712799072266, 121.81932067871094, 126.87150573730469, 131.92369079589844, 136.97589111328125, 142.028076171875, 147.08026123046875, 152.1324462890625, 157.18463134765625, 162.23683166503906, 167.2890167236328, 172.34120178222656, 177.39340209960938, 182.44558715820312, 187.49777221679688, 192.54995727539062, 197.60214233398438, 202.6543426513672, 207.70652770996094, 212.7587127685547, 217.8109130859375, 222.86309814453125, 227.915283203125, 232.96746826171875, 238.0196533203125, 243.0718536376953, 248.12403869628906]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 6.0, 9.0, 11.0, 6.0, 19.0, 5.0, 20.0, 21.0, 29.0, 29.0, 44.0, 57.0, 52.0, 57.0, 66.0, 79.0, 67.0, 77.0, 58.0, 49.0, 38.0, 35.0, 30.0, 30.0, 21.0, 17.0, 14.0, 12.0, 6.0, 10.0, 11.0, 8.0, 0.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-104.96003723144531, -101.78387451171875, -98.60770416259766, -95.43153381347656, -92.25537109375, -89.07920837402344, -85.90303802490234, -82.72686767578125, -79.55070495605469, -76.37454223632812, -73.19837188720703, -70.02220153808594, -66.84603881835938, -63.66987228393555, -60.49370574951172, -57.31753921508789, -54.14137268066406, -50.965206146240234, -47.789039611816406, -44.61287307739258, -41.43670654296875, -38.26054000854492, -35.084373474121094, -31.908206939697266, -28.732040405273438, -25.55587387084961, -22.37970733642578, -19.203540802001953, -16.027374267578125, -12.851207733154297, -9.675041198730469, -6.498874664306641, -3.3227005004882812, -0.14653396606445312, 3.029632568359375, 6.205799102783203, 9.381965637207031, 12.55813217163086, 15.734298706054688, 18.910465240478516, 22.086631774902344, 25.262798309326172, 28.43896484375, 31.615131378173828, 34.791297912597656, 37.967464447021484, 41.14363098144531, 44.31979751586914, 47.49596405029297, 50.6721305847168, 53.848297119140625, 57.02446365356445, 60.20063018798828, 63.37679672241211, 66.55296325683594, 69.7291259765625, 72.9052963256836, 76.08146667480469, 79.25762939453125, 82.43379211425781, 85.6099624633789, 88.7861328125, 91.96229553222656, 95.13845825195312, 98.31462860107422]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 2.0, 6.0, 4.0, 2.0, 3.0, 6.0, 6.0, 11.0, 16.0, 22.0, 24.0, 28.0, 21.0, 48.0, 67.0, 89.0, 147.0, 201.0, 318.0, 543.0, 877.0, 1721.0, 3927.0, 13676.0, 4106130.0, 53724.0, 7000.0, 2649.0, 1256.0, 683.0, 405.0, 230.0, 157.0, 90.0, 61.0, 36.0, 23.0, 25.0, 16.0, 9.0, 10.0, 6.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-32.5625, -31.72216796875, -30.8818359375, -30.04150390625, -29.201171875, -28.36083984375, -27.5205078125, -26.68017578125, -25.83984375, -24.99951171875, -24.1591796875, -23.31884765625, -22.478515625, -21.63818359375, -20.7978515625, -19.95751953125, -19.1171875, -18.27685546875, -17.4365234375, -16.59619140625, -15.755859375, -14.91552734375, -14.0751953125, -13.23486328125, -12.39453125, -11.55419921875, -10.7138671875, -9.87353515625, -9.033203125, -8.19287109375, -7.3525390625, -6.51220703125, -5.671875, -4.83154296875, -3.9912109375, -3.15087890625, -2.310546875, -1.47021484375, -0.6298828125, 0.21044921875, 1.05078125, 1.89111328125, 2.7314453125, 3.57177734375, 4.412109375, 5.25244140625, 6.0927734375, 6.93310546875, 7.7734375, 8.61376953125, 9.4541015625, 10.29443359375, 11.134765625, 11.97509765625, 12.8154296875, 13.65576171875, 14.49609375, 15.33642578125, 16.1767578125, 17.01708984375, 17.857421875, 18.69775390625, 19.5380859375, 20.37841796875, 21.21875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 4.0, 7.0, 4.0, 8.0, 10.0, 12.0, 12.0, 16.0, 26.0, 36.0, 46.0, 49.0, 52.0, 54.0, 82.0, 66.0, 70.0, 82.0, 58.0, 58.0, 38.0, 41.0, 35.0, 35.0, 17.0, 13.0, 16.0, 10.0, 8.0, 6.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.18359375, -4.048095703125, -3.91259765625, -3.777099609375, -3.6416015625, -3.506103515625, -3.37060546875, -3.235107421875, -3.099609375, -2.964111328125, -2.82861328125, -2.693115234375, -2.5576171875, -2.422119140625, -2.28662109375, -2.151123046875, -2.015625, -1.880126953125, -1.74462890625, -1.609130859375, -1.4736328125, -1.338134765625, -1.20263671875, -1.067138671875, -0.931640625, -0.796142578125, -0.66064453125, -0.525146484375, -0.3896484375, -0.254150390625, -0.11865234375, 0.016845703125, 0.15234375, 0.287841796875, 0.42333984375, 0.558837890625, 0.6943359375, 0.829833984375, 0.96533203125, 1.100830078125, 1.236328125, 1.371826171875, 1.50732421875, 1.642822265625, 1.7783203125, 1.913818359375, 2.04931640625, 2.184814453125, 2.3203125, 2.455810546875, 2.59130859375, 2.726806640625, 2.8623046875, 2.997802734375, 3.13330078125, 3.268798828125, 3.404296875, 3.539794921875, 3.67529296875, 3.810791015625, 3.9462890625, 4.081787109375, 4.21728515625, 4.352783203125, 4.48828125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 6.0, 6.0, 13.0, 7.0, 18.0, 18.0, 25.0, 40.0, 33.0, 58.0, 70.0, 60.0, 92.0, 148.0, 181.0, 234.0, 370.0, 466.0, 728.0, 1084.0, 1732.0, 2822.0, 5112.0, 10057.0, 24703.0, 3546364.0, 554011.0, 22768.0, 9845.0, 5097.0, 2885.0, 1658.0, 1040.0, 732.0, 501.0, 323.0, 229.0, 164.0, 127.0, 108.0, 74.0, 71.0, 55.0, 35.0, 37.0, 31.0, 15.0, 15.0, 5.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-20.265625, -19.6318359375, -18.998046875, -18.3642578125, -17.73046875, -17.0966796875, -16.462890625, -15.8291015625, -15.1953125, -14.5615234375, -13.927734375, -13.2939453125, -12.66015625, -12.0263671875, -11.392578125, -10.7587890625, -10.125, -9.4912109375, -8.857421875, -8.2236328125, -7.58984375, -6.9560546875, -6.322265625, -5.6884765625, -5.0546875, -4.4208984375, -3.787109375, -3.1533203125, -2.51953125, -1.8857421875, -1.251953125, -0.6181640625, 0.015625, 0.6494140625, 1.283203125, 1.9169921875, 2.55078125, 3.1845703125, 3.818359375, 4.4521484375, 5.0859375, 5.7197265625, 6.353515625, 6.9873046875, 7.62109375, 8.2548828125, 8.888671875, 9.5224609375, 10.15625, 10.7900390625, 11.423828125, 12.0576171875, 12.69140625, 13.3251953125, 13.958984375, 14.5927734375, 15.2265625, 15.8603515625, 16.494140625, 17.1279296875, 17.76171875, 18.3955078125, 19.029296875, 19.6630859375, 20.296875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 3.0, 5.0, 8.0, 5.0, 5.0, 16.0, 6.0, 12.0, 45.0, 223.0, 3526.0, 116.0, 28.0, 17.0, 9.0, 15.0, 8.0, 7.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.31640625, -7.1036376953125, -6.890869140625, -6.6781005859375, -6.46533203125, -6.2525634765625, -6.039794921875, -5.8270263671875, -5.6142578125, -5.4014892578125, -5.188720703125, -4.9759521484375, -4.76318359375, -4.5504150390625, -4.337646484375, -4.1248779296875, -3.912109375, -3.6993408203125, -3.486572265625, -3.2738037109375, -3.06103515625, -2.8482666015625, -2.635498046875, -2.4227294921875, -2.2099609375, -1.9971923828125, -1.784423828125, -1.5716552734375, -1.35888671875, -1.1461181640625, -0.933349609375, -0.7205810546875, -0.5078125, -0.2950439453125, -0.082275390625, 0.1304931640625, 0.34326171875, 0.5560302734375, 0.768798828125, 0.9815673828125, 1.1943359375, 1.4071044921875, 1.619873046875, 1.8326416015625, 2.04541015625, 2.2581787109375, 2.470947265625, 2.6837158203125, 2.896484375, 3.1092529296875, 3.322021484375, 3.5347900390625, 3.74755859375, 3.9603271484375, 4.173095703125, 4.3858642578125, 4.5986328125, 4.8114013671875, 5.024169921875, 5.2369384765625, 5.44970703125, 5.6624755859375, 5.875244140625, 6.0880126953125, 6.30078125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 6.0, 2.0, 5.0, 11.0, 11.0, 13.0, 29.0, 62.0, 84.0, 118.0, 167.0, 151.0, 145.0, 71.0, 60.0, 34.0, 21.0, 12.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.697967529296875, -42.713932037353516, -41.72990036010742, -40.74586486816406, -39.7618293762207, -38.77779769897461, -37.79376220703125, -36.809730529785156, -35.8256950378418, -34.84165954589844, -33.857627868652344, -32.873592376708984, -31.889558792114258, -30.90552520751953, -29.921489715576172, -28.937456130981445, -27.95342254638672, -26.969388961791992, -25.985353469848633, -25.001319885253906, -24.01728630065918, -23.033252716064453, -22.049217224121094, -21.065183639526367, -20.081148147583008, -19.09711456298828, -18.113079071044922, -17.129045486450195, -16.14501190185547, -15.160977363586426, -14.176942825317383, -13.192909240722656, -12.20887565612793, -11.224841117858887, -10.24080753326416, -9.256772994995117, -8.27273941040039, -7.288704872131348, -6.304670810699463, -5.320636749267578, -4.336602687835693, -3.3525686264038086, -2.368534564971924, -1.38450026512146, -0.4004662036895752, 0.5835680961608887, 1.5676021575927734, 2.551636219024658, 3.535670280456543, 4.519704341888428, 5.5037384033203125, 6.4877729415893555, 7.471806526184082, 8.455841064453125, 9.439874649047852, 10.423909187316895, 11.407943725585938, 12.39197826385498, 13.376011848449707, 14.36004638671875, 15.344079971313477, 16.328113555908203, 17.312149047851562, 18.29618263244629, 19.280216217041016]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 4.0, 5.0, 2.0, 9.0, 10.0, 11.0, 14.0, 18.0, 14.0, 13.0, 30.0, 22.0, 26.0, 21.0, 34.0, 36.0, 32.0, 40.0, 46.0, 51.0, 38.0, 55.0, 42.0, 51.0, 53.0, 38.0, 28.0, 26.0, 36.0, 25.0, 33.0, 22.0, 14.0, 22.0, 13.0, 10.0, 9.0, 12.0, 4.0, 6.0, 9.0, 5.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-14.77127742767334, -14.33841323852539, -13.905550003051758, -13.472685813903809, -13.03982162475586, -12.606958389282227, -12.174094200134277, -11.741230010986328, -11.308366775512695, -10.875502586364746, -10.442639350891113, -10.009775161743164, -9.576910972595215, -9.144046783447266, -8.711183547973633, -8.278319358825684, -7.845455169677734, -7.412591457366943, -6.979727268218994, -6.546863555908203, -6.113999366760254, -5.681135654449463, -5.248271942138672, -4.815407752990723, -4.382544040679932, -3.9496800899505615, -3.5168161392211914, -3.0839524269104004, -2.6510884761810303, -2.21822452545166, -1.7853608131408691, -1.352496862411499, -0.9196319580078125, -0.48676806688308716, -0.053904175758361816, 0.37895965576171875, 0.8118236064910889, 1.244687557220459, 1.67755126953125, 2.11041522026062, 2.5432791709899902, 2.9761431217193604, 3.4090070724487305, 3.8418707847595215, 4.2747344970703125, 4.707598686218262, 5.140462398529053, 5.573326110839844, 6.006190299987793, 6.439054012298584, 6.871918201446533, 7.304781913757324, 7.737646102905273, 8.170509338378906, 8.603373527526855, 9.036237716674805, 9.469100952148438, 9.901965141296387, 10.33482837677002, 10.767692565917969, 11.200556755065918, 11.633420944213867, 12.0662841796875, 12.49914836883545, 12.932012557983398]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 5.0, 1.0, 4.0, 10.0, 14.0, 23.0, 36.0, 46.0, 68.0, 102.0, 109.0, 138.0, 218.0, 273.0, 432.0, 640.0, 1065.0, 1800.0, 3115.0, 5864.0, 11952.0, 27123.0, 71720.0, 226178.0, 419859.0, 176193.0, 57022.0, 22134.0, 10208.0, 5064.0, 2709.0, 1528.0, 954.0, 629.0, 392.0, 287.0, 191.0, 122.0, 92.0, 59.0, 49.0, 31.0, 19.0, 23.0, 20.0, 10.0, 8.0, 9.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.30078125, -7.01324462890625, -6.7257080078125, -6.43817138671875, -6.150634765625, -5.86309814453125, -5.5755615234375, -5.28802490234375, -5.00048828125, -4.71295166015625, -4.4254150390625, -4.13787841796875, -3.850341796875, -3.56280517578125, -3.2752685546875, -2.98773193359375, -2.7001953125, -2.41265869140625, -2.1251220703125, -1.83758544921875, -1.550048828125, -1.26251220703125, -0.9749755859375, -0.68743896484375, -0.39990234375, -0.11236572265625, 0.1751708984375, 0.46270751953125, 0.750244140625, 1.03778076171875, 1.3253173828125, 1.61285400390625, 1.900390625, 2.18792724609375, 2.4754638671875, 2.76300048828125, 3.050537109375, 3.33807373046875, 3.6256103515625, 3.91314697265625, 4.20068359375, 4.48822021484375, 4.7757568359375, 5.06329345703125, 5.350830078125, 5.63836669921875, 5.9259033203125, 6.21343994140625, 6.5009765625, 6.78851318359375, 7.0760498046875, 7.36358642578125, 7.651123046875, 7.93865966796875, 8.2261962890625, 8.51373291015625, 8.80126953125, 9.08880615234375, 9.3763427734375, 9.66387939453125, 9.951416015625, 10.23895263671875, 10.5264892578125, 10.81402587890625, 11.1015625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 1.0, 5.0, 6.0, 4.0, 1.0, 2.0, 4.0, 7.0, 9.0, 10.0, 16.0, 19.0, 11.0, 28.0, 33.0, 39.0, 44.0, 60.0, 46.0, 50.0, 49.0, 56.0, 65.0, 48.0, 50.0, 64.0, 46.0, 44.0, 44.0, 21.0, 27.0, 17.0, 11.0, 7.0, 10.0, 13.0, 7.0, 8.0, 3.0, 3.0, 6.0, 2.0, 1.0, 3.0, 1.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.83984375, -3.71075439453125, -3.5816650390625, -3.45257568359375, -3.323486328125, -3.19439697265625, -3.0653076171875, -2.93621826171875, -2.80712890625, -2.67803955078125, -2.5489501953125, -2.41986083984375, -2.290771484375, -2.16168212890625, -2.0325927734375, -1.90350341796875, -1.7744140625, -1.64532470703125, -1.5162353515625, -1.38714599609375, -1.258056640625, -1.12896728515625, -0.9998779296875, -0.87078857421875, -0.74169921875, -0.61260986328125, -0.4835205078125, -0.35443115234375, -0.225341796875, -0.09625244140625, 0.0328369140625, 0.16192626953125, 0.291015625, 0.42010498046875, 0.5491943359375, 0.67828369140625, 0.807373046875, 0.93646240234375, 1.0655517578125, 1.19464111328125, 1.32373046875, 1.45281982421875, 1.5819091796875, 1.71099853515625, 1.840087890625, 1.96917724609375, 2.0982666015625, 2.22735595703125, 2.3564453125, 2.48553466796875, 2.6146240234375, 2.74371337890625, 2.872802734375, 3.00189208984375, 3.1309814453125, 3.26007080078125, 3.38916015625, 3.51824951171875, 3.6473388671875, 3.77642822265625, 3.905517578125, 4.03460693359375, 4.1636962890625, 4.29278564453125, 4.421875]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 2.0, 8.0, 1.0, 7.0, 10.0, 18.0, 23.0, 34.0, 62.0, 93.0, 218.0, 416.0, 1122.0, 3464.0, 19165.0, 366662.0, 624335.0, 26346.0, 4336.0, 1207.0, 499.0, 217.0, 123.0, 64.0, 37.0, 21.0, 21.0, 21.0, 8.0, 5.0, 6.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.015625, -26.941162109375, -25.86669921875, -24.792236328125, -23.7177734375, -22.643310546875, -21.56884765625, -20.494384765625, -19.419921875, -18.345458984375, -17.27099609375, -16.196533203125, -15.1220703125, -14.047607421875, -12.97314453125, -11.898681640625, -10.82421875, -9.749755859375, -8.67529296875, -7.600830078125, -6.5263671875, -5.451904296875, -4.37744140625, -3.302978515625, -2.228515625, -1.154052734375, -0.07958984375, 0.994873046875, 2.0693359375, 3.143798828125, 4.21826171875, 5.292724609375, 6.3671875, 7.441650390625, 8.51611328125, 9.590576171875, 10.6650390625, 11.739501953125, 12.81396484375, 13.888427734375, 14.962890625, 16.037353515625, 17.11181640625, 18.186279296875, 19.2607421875, 20.335205078125, 21.40966796875, 22.484130859375, 23.55859375, 24.633056640625, 25.70751953125, 26.781982421875, 27.8564453125, 28.930908203125, 30.00537109375, 31.079833984375, 32.154296875, 33.228759765625, 34.30322265625, 35.377685546875, 36.4521484375, 37.526611328125, 38.60107421875, 39.675537109375, 40.75]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 6.0, 0.0, 4.0, 6.0, 6.0, 4.0, 12.0, 8.0, 10.0, 17.0, 20.0, 13.0, 40.0, 50.0, 44.0, 48.0, 54.0, 64.0, 63.0, 62.0, 45.0, 69.0, 58.0, 41.0, 54.0, 41.0, 35.0, 23.0, 21.0, 16.0, 17.0, 18.0, 10.0, 6.0, 8.0, 9.0, 0.0, 3.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.6875, -21.8388671875, -20.990234375, -20.1416015625, -19.29296875, -18.4443359375, -17.595703125, -16.7470703125, -15.8984375, -15.0498046875, -14.201171875, -13.3525390625, -12.50390625, -11.6552734375, -10.806640625, -9.9580078125, -9.109375, -8.2607421875, -7.412109375, -6.5634765625, -5.71484375, -4.8662109375, -4.017578125, -3.1689453125, -2.3203125, -1.4716796875, -0.623046875, 0.2255859375, 1.07421875, 1.9228515625, 2.771484375, 3.6201171875, 4.46875, 5.3173828125, 6.166015625, 7.0146484375, 7.86328125, 8.7119140625, 9.560546875, 10.4091796875, 11.2578125, 12.1064453125, 12.955078125, 13.8037109375, 14.65234375, 15.5009765625, 16.349609375, 17.1982421875, 18.046875, 18.8955078125, 19.744140625, 20.5927734375, 21.44140625, 22.2900390625, 23.138671875, 23.9873046875, 24.8359375, 25.6845703125, 26.533203125, 27.3818359375, 28.23046875, 29.0791015625, 29.927734375, 30.7763671875, 31.625]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 7.0, 1.0, 4.0, 4.0, 7.0, 9.0, 13.0, 9.0, 20.0, 25.0, 44.0, 61.0, 92.0, 174.0, 308.0, 690.0, 1977.0, 8953.0, 110569.0, 889094.0, 29881.0, 4290.0, 1211.0, 489.0, 238.0, 131.0, 55.0, 47.0, 38.0, 26.0, 30.0, 12.0, 6.0, 9.0, 10.0, 7.0, 3.0, 4.0, 2.0, 5.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-28.125, -27.3046875, -26.484375, -25.6640625, -24.84375, -24.0234375, -23.203125, -22.3828125, -21.5625, -20.7421875, -19.921875, -19.1015625, -18.28125, -17.4609375, -16.640625, -15.8203125, -15.0, -14.1796875, -13.359375, -12.5390625, -11.71875, -10.8984375, -10.078125, -9.2578125, -8.4375, -7.6171875, -6.796875, -5.9765625, -5.15625, -4.3359375, -3.515625, -2.6953125, -1.875, -1.0546875, -0.234375, 0.5859375, 1.40625, 2.2265625, 3.046875, 3.8671875, 4.6875, 5.5078125, 6.328125, 7.1484375, 7.96875, 8.7890625, 9.609375, 10.4296875, 11.25, 12.0703125, 12.890625, 13.7109375, 14.53125, 15.3515625, 16.171875, 16.9921875, 17.8125, 18.6328125, 19.453125, 20.2734375, 21.09375, 21.9140625, 22.734375, 23.5546875, 24.375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 5.0, 7.0, 6.0, 6.0, 9.0, 17.0, 20.0, 29.0, 44.0, 72.0, 114.0, 156.0, 191.0, 121.0, 65.0, 52.0, 22.0, 13.0, 15.0, 9.0, 7.0, 4.0, 3.0, 3.0, 6.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0023288726806640625, -0.002264544367790222, -0.002200216054916382, -0.0021358877420425415, -0.002071559429168701, -0.002007231116294861, -0.0019429028034210205, -0.0018785744905471802, -0.0018142461776733398, -0.0017499178647994995, -0.0016855895519256592, -0.0016212612390518188, -0.0015569329261779785, -0.0014926046133041382, -0.0014282763004302979, -0.0013639479875564575, -0.0012996196746826172, -0.0012352913618087769, -0.0011709630489349365, -0.0011066347360610962, -0.0010423064231872559, -0.0009779781103134155, -0.0009136497974395752, -0.0008493214845657349, -0.0007849931716918945, -0.0007206648588180542, -0.0006563365459442139, -0.0005920082330703735, -0.0005276799201965332, -0.00046335160732269287, -0.00039902329444885254, -0.0003346949815750122, -0.0002703666687011719, -0.00020603835582733154, -0.0001417100429534912, -7.738173007965088e-05, -1.3053417205810547e-05, 5.1274895668029785e-05, 0.00011560320854187012, 0.00017993152141571045, 0.0002442598342895508, 0.0003085881471633911, 0.00037291646003723145, 0.0004372447729110718, 0.0005015730857849121, 0.0005659013986587524, 0.0006302297115325928, 0.0006945580244064331, 0.0007588863372802734, 0.0008232146501541138, 0.0008875429630279541, 0.0009518712759017944, 0.0010161995887756348, 0.001080527901649475, 0.0011448562145233154, 0.0012091845273971558, 0.001273512840270996, 0.0013378411531448364, 0.0014021694660186768, 0.001466497778892517, 0.0015308260917663574, 0.0015951544046401978, 0.001659482717514038, 0.0017238110303878784, 0.0017881393432617188]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 6.0, 7.0, 10.0, 16.0, 29.0, 35.0, 40.0, 63.0, 82.0, 197.0, 629.0, 3830.0, 97136.0, 929900.0, 14573.0, 1335.0, 318.0, 112.0, 62.0, 52.0, 35.0, 30.0, 13.0, 15.0, 5.0, 11.0, 8.0, 3.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.53125, -34.2734375, -33.015625, -31.7578125, -30.5, -29.2421875, -27.984375, -26.7265625, -25.46875, -24.2109375, -22.953125, -21.6953125, -20.4375, -19.1796875, -17.921875, -16.6640625, -15.40625, -14.1484375, -12.890625, -11.6328125, -10.375, -9.1171875, -7.859375, -6.6015625, -5.34375, -4.0859375, -2.828125, -1.5703125, -0.3125, 0.9453125, 2.203125, 3.4609375, 4.71875, 5.9765625, 7.234375, 8.4921875, 9.75, 11.0078125, 12.265625, 13.5234375, 14.78125, 16.0390625, 17.296875, 18.5546875, 19.8125, 21.0703125, 22.328125, 23.5859375, 24.84375, 26.1015625, 27.359375, 28.6171875, 29.875, 31.1328125, 32.390625, 33.6484375, 34.90625, 36.1640625, 37.421875, 38.6796875, 39.9375, 41.1953125, 42.453125, 43.7109375, 44.96875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 3.0, 9.0, 4.0, 6.0, 17.0, 16.0, 26.0, 38.0, 65.0, 98.0, 154.0, 159.0, 151.0, 63.0, 67.0, 46.0, 28.0, 20.0, 9.0, 11.0, 7.0, 5.0, 3.0, 1.0, 0.0, 2.0, 3.0], "bins": [-25.359375, -24.835693359375, -24.31201171875, -23.788330078125, -23.2646484375, -22.740966796875, -22.21728515625, -21.693603515625, -21.169921875, -20.646240234375, -20.12255859375, -19.598876953125, -19.0751953125, -18.551513671875, -18.02783203125, -17.504150390625, -16.98046875, -16.456787109375, -15.93310546875, -15.409423828125, -14.8857421875, -14.362060546875, -13.83837890625, -13.314697265625, -12.791015625, -12.267333984375, -11.74365234375, -11.219970703125, -10.6962890625, -10.172607421875, -9.64892578125, -9.125244140625, -8.6015625, -8.077880859375, -7.55419921875, -7.030517578125, -6.5068359375, -5.983154296875, -5.45947265625, -4.935791015625, -4.412109375, -3.888427734375, -3.36474609375, -2.841064453125, -2.3173828125, -1.793701171875, -1.27001953125, -0.746337890625, -0.22265625, 0.301025390625, 0.82470703125, 1.348388671875, 1.8720703125, 2.395751953125, 2.91943359375, 3.443115234375, 3.966796875, 4.490478515625, 5.01416015625, 5.537841796875, 6.0615234375, 6.585205078125, 7.10888671875, 7.632568359375, 8.15625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 11.0, 4.0, 19.0, 27.0, 39.0, 76.0, 123.0, 181.0, 175.0, 155.0, 94.0, 45.0, 26.0, 18.0, 9.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-308.2944030761719, -300.6241455078125, -292.9538879394531, -285.2835998535156, -277.61334228515625, -269.9430847167969, -262.2728271484375, -254.60255432128906, -246.93228149414062, -239.26202392578125, -231.5917510986328, -223.92149353027344, -216.251220703125, -208.58096313476562, -200.9106903076172, -193.2404327392578, -185.57015991210938, -177.89990234375, -170.22962951660156, -162.5593719482422, -154.88909912109375, -147.21884155273438, -139.54856872558594, -131.87831115722656, -124.20805358886719, -116.53778839111328, -108.86752319335938, -101.19725799560547, -93.52699279785156, -85.85673522949219, -78.18646240234375, -70.51620483398438, -62.84593200683594, -55.17566680908203, -47.505401611328125, -39.83513641357422, -32.16487121582031, -24.494609832763672, -16.824344635009766, -9.15407943725586, -1.4838142395019531, 6.186450481414795, 13.856715202331543, 21.526979446411133, 29.19724464416504, 36.86750793457031, 44.53777313232422, 52.208038330078125, 59.87830352783203, 67.54856872558594, 75.21883392333984, 82.88909912109375, 90.55936431884766, 98.22962951660156, 105.89988708496094, 113.57015991210938, 121.24041748046875, 128.91067504882812, 136.58094787597656, 144.25120544433594, 151.92147827148438, 159.59173583984375, 167.2620086669922, 174.93226623535156, 182.6025390625]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 9.0, 11.0, 11.0, 11.0, 13.0, 22.0, 28.0, 30.0, 23.0, 29.0, 41.0, 36.0, 46.0, 47.0, 56.0, 56.0, 64.0, 48.0, 46.0, 37.0, 49.0, 31.0, 34.0, 31.0, 31.0, 27.0, 22.0, 13.0, 16.0, 8.0, 6.0, 8.0, 9.0, 9.0, 7.0, 6.0, 7.0, 1.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-109.64665222167969, -106.50016021728516, -103.35367584228516, -100.20718383789062, -97.06069946289062, -93.9142074584961, -90.7677230834961, -87.62123107910156, -84.47474670410156, -81.32825469970703, -78.18177032470703, -75.0352783203125, -71.8887939453125, -68.74230194091797, -65.59581756591797, -62.44932556152344, -59.30283737182617, -56.156349182128906, -53.00986099243164, -49.863372802734375, -46.71688461303711, -43.570396423339844, -40.42390441894531, -37.27742004394531, -34.13092803955078, -30.984439849853516, -27.83795166015625, -24.691463470458984, -21.54497528076172, -18.398487091064453, -15.251996994018555, -12.105508804321289, -8.959022521972656, -5.812534332275391, -2.666045665740967, 0.48044300079345703, 3.6269311904907227, 6.773419380187988, 9.91990852355957, 13.066396713256836, 16.2128849029541, 19.359373092651367, 22.505861282348633, 25.65235137939453, 28.798839569091797, 31.945327758789062, 35.09181594848633, 38.238304138183594, 41.38479232788086, 44.531280517578125, 47.67776870727539, 50.824256896972656, 53.97074508666992, 57.11723327636719, 60.26372528076172, 63.41020965576172, 66.55670166015625, 69.70319366455078, 72.84967803955078, 75.99617004394531, 79.14265441894531, 82.28914642333984, 85.43563079833984, 88.58212280273438, 91.72860717773438]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 10.0, 5.0, 11.0, 9.0, 12.0, 19.0, 27.0, 28.0, 56.0, 75.0, 108.0, 237.0, 415.0, 1121.0, 7294.0, 4178126.0, 4788.0, 1020.0, 378.0, 209.0, 118.0, 76.0, 38.0, 28.0, 23.0, 17.0, 11.0, 7.0, 8.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-93.625, -91.46875, -89.3125, -87.15625, -85.0, -82.84375, -80.6875, -78.53125, -76.375, -74.21875, -72.0625, -69.90625, -67.75, -65.59375, -63.4375, -61.28125, -59.125, -56.96875, -54.8125, -52.65625, -50.5, -48.34375, -46.1875, -44.03125, -41.875, -39.71875, -37.5625, -35.40625, -33.25, -31.09375, -28.9375, -26.78125, -24.625, -22.46875, -20.3125, -18.15625, -16.0, -13.84375, -11.6875, -9.53125, -7.375, -5.21875, -3.0625, -0.90625, 1.25, 3.40625, 5.5625, 7.71875, 9.875, 12.03125, 14.1875, 16.34375, 18.5, 20.65625, 22.8125, 24.96875, 27.125, 29.28125, 31.4375, 33.59375, 35.75, 37.90625, 40.0625, 42.21875, 44.375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 6.0, 12.0, 9.0, 10.0, 21.0, 33.0, 41.0, 52.0, 55.0, 68.0, 87.0, 92.0, 77.0, 87.0, 83.0, 62.0, 60.0, 38.0, 22.0, 19.0, 17.0, 10.0, 10.0, 4.0, 2.0, 11.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.6953125, -7.4923095703125, -7.289306640625, -7.0863037109375, -6.88330078125, -6.6802978515625, -6.477294921875, -6.2742919921875, -6.0712890625, -5.8682861328125, -5.665283203125, -5.4622802734375, -5.25927734375, -5.0562744140625, -4.853271484375, -4.6502685546875, -4.447265625, -4.2442626953125, -4.041259765625, -3.8382568359375, -3.63525390625, -3.4322509765625, -3.229248046875, -3.0262451171875, -2.8232421875, -2.6202392578125, -2.417236328125, -2.2142333984375, -2.01123046875, -1.8082275390625, -1.605224609375, -1.4022216796875, -1.19921875, -0.9962158203125, -0.793212890625, -0.5902099609375, -0.38720703125, -0.1842041015625, 0.018798828125, 0.2218017578125, 0.4248046875, 0.6278076171875, 0.830810546875, 1.0338134765625, 1.23681640625, 1.4398193359375, 1.642822265625, 1.8458251953125, 2.048828125, 2.2518310546875, 2.454833984375, 2.6578369140625, 2.86083984375, 3.0638427734375, 3.266845703125, 3.4698486328125, 3.6728515625, 3.8758544921875, 4.078857421875, 4.2818603515625, 4.48486328125, 4.6878662109375, 4.890869140625, 5.0938720703125, 5.296875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 8.0, 9.0, 8.0, 8.0, 24.0, 25.0, 32.0, 36.0, 52.0, 52.0, 103.0, 167.0, 220.0, 382.0, 733.0, 1641.0, 5734.0, 4160723.0, 19232.0, 2675.0, 1023.0, 520.0, 297.0, 160.0, 107.0, 82.0, 48.0, 35.0, 28.0, 20.0, 19.0, 12.0, 17.0, 8.0, 10.0, 10.0, 3.0, 5.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.4375, -56.330078125, -54.22265625, -52.115234375, -50.0078125, -47.900390625, -45.79296875, -43.685546875, -41.578125, -39.470703125, -37.36328125, -35.255859375, -33.1484375, -31.041015625, -28.93359375, -26.826171875, -24.71875, -22.611328125, -20.50390625, -18.396484375, -16.2890625, -14.181640625, -12.07421875, -9.966796875, -7.859375, -5.751953125, -3.64453125, -1.537109375, 0.5703125, 2.677734375, 4.78515625, 6.892578125, 9.0, 11.107421875, 13.21484375, 15.322265625, 17.4296875, 19.537109375, 21.64453125, 23.751953125, 25.859375, 27.966796875, 30.07421875, 32.181640625, 34.2890625, 36.396484375, 38.50390625, 40.611328125, 42.71875, 44.826171875, 46.93359375, 49.041015625, 51.1484375, 53.255859375, 55.36328125, 57.470703125, 59.578125, 61.685546875, 63.79296875, 65.900390625, 68.0078125, 70.115234375, 72.22265625, 74.330078125, 76.4375]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 4.0, 14.0, 35.0, 3900.0, 97.0, 14.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.453125, -17.053955078125, -16.65478515625, -16.255615234375, -15.8564453125, -15.457275390625, -15.05810546875, -14.658935546875, -14.259765625, -13.860595703125, -13.46142578125, -13.062255859375, -12.6630859375, -12.263916015625, -11.86474609375, -11.465576171875, -11.06640625, -10.667236328125, -10.26806640625, -9.868896484375, -9.4697265625, -9.070556640625, -8.67138671875, -8.272216796875, -7.873046875, -7.473876953125, -7.07470703125, -6.675537109375, -6.2763671875, -5.877197265625, -5.47802734375, -5.078857421875, -4.6796875, -4.280517578125, -3.88134765625, -3.482177734375, -3.0830078125, -2.683837890625, -2.28466796875, -1.885498046875, -1.486328125, -1.087158203125, -0.68798828125, -0.288818359375, 0.1103515625, 0.509521484375, 0.90869140625, 1.307861328125, 1.70703125, 2.106201171875, 2.50537109375, 2.904541015625, 3.3037109375, 3.702880859375, 4.10205078125, 4.501220703125, 4.900390625, 5.299560546875, 5.69873046875, 6.097900390625, 6.4970703125, 6.896240234375, 7.29541015625, 7.694580078125, 8.09375]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 6.0, 6.0, 8.0, 9.0, 14.0, 17.0, 21.0, 24.0, 30.0, 48.0, 64.0, 65.0, 94.0, 104.0, 109.0, 88.0, 73.0, 56.0, 40.0, 33.0, 22.0, 13.0, 12.0, 10.0, 7.0, 4.0, 6.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.995750427246094, -16.414566040039062, -15.833379745483398, -15.252195358276367, -14.67101001739502, -14.089824676513672, -13.50864028930664, -12.927454948425293, -12.346269607543945, -11.765084266662598, -11.18389892578125, -10.602714538574219, -10.021529197692871, -9.440343856811523, -8.859159469604492, -8.277974128723145, -7.696788787841797, -7.115603446960449, -6.53441858291626, -5.95323371887207, -5.372048377990723, -4.790863037109375, -4.2096781730651855, -3.628493309020996, -3.0473079681396484, -2.46612286567688, -1.8849377632141113, -1.3037526607513428, -0.7225675582885742, -0.14138245582580566, 0.4398026466369629, 1.0209875106811523, 1.6021728515625, 2.1833579540252686, 2.764543056488037, 3.3457281589508057, 3.926913261413574, 4.508098602294922, 5.089283466339111, 5.670468330383301, 6.251653671264648, 6.832839012145996, 7.4140238761901855, 7.995208740234375, 8.576394081115723, 9.15757942199707, 9.738763809204102, 10.31994915008545, 10.901134490966797, 11.482319831848145, 12.063505172729492, 12.644689559936523, 13.225874900817871, 13.807060241699219, 14.38824462890625, 14.969429969787598, 15.550615310668945, 16.131799697875977, 16.71298599243164, 17.294170379638672, 17.875354766845703, 18.456541061401367, 19.0377254486084, 19.618911743164062, 20.200096130371094]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 9.0, 16.0, 13.0, 10.0, 18.0, 19.0, 15.0, 39.0, 37.0, 39.0, 41.0, 37.0, 49.0, 66.0, 58.0, 49.0, 52.0, 54.0, 48.0, 47.0, 49.0, 47.0, 31.0, 32.0, 29.0, 23.0, 20.0, 11.0, 14.0, 9.0, 8.0, 3.0, 7.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-19.9779052734375, -19.417823791503906, -18.85774040222168, -18.297658920288086, -17.737577438354492, -17.177494049072266, -16.617412567138672, -16.057331085205078, -15.497248649597168, -14.937166213989258, -14.377084732055664, -13.817002296447754, -13.256919860839844, -12.69683837890625, -12.13675594329834, -11.57667350769043, -11.016592025756836, -10.456509590148926, -9.896428108215332, -9.336345672607422, -8.776264190673828, -8.216181755065918, -7.656099319458008, -7.096017360687256, -6.535935401916504, -5.975853443145752, -5.415771484375, -4.85568904876709, -4.295607089996338, -3.735525131225586, -3.175442934036255, -2.615360736846924, -2.0552806854248047, -1.4951986074447632, -0.9351165294647217, -0.3750344514846802, 0.18504762649536133, 0.7451295852661133, 1.3052117824554443, 1.8652939796447754, 2.4253759384155273, 2.9854578971862793, 3.5455400943756104, 4.105622291564941, 4.665704250335693, 5.225786209106445, 5.7858686447143555, 6.345950603485107, 6.906032562255859, 7.466114521026611, 8.026196479797363, 8.586278915405273, 9.146360397338867, 9.706442832946777, 10.266525268554688, 10.826606750488281, 11.386689186096191, 11.946771621704102, 12.506853103637695, 13.066935539245605, 13.627017974853516, 14.18709945678711, 14.74718189239502, 15.30726432800293, 15.867345809936523]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 5.0, 6.0, 7.0, 17.0, 27.0, 24.0, 32.0, 63.0, 76.0, 135.0, 199.0, 298.0, 606.0, 1121.0, 2248.0, 4866.0, 13002.0, 41640.0, 179553.0, 575664.0, 167660.0, 39306.0, 12591.0, 4739.0, 2115.0, 1056.0, 564.0, 327.0, 211.0, 129.0, 81.0, 58.0, 45.0, 31.0, 14.0, 17.0, 8.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6171875, -14.15283203125, -13.6884765625, -13.22412109375, -12.759765625, -12.29541015625, -11.8310546875, -11.36669921875, -10.90234375, -10.43798828125, -9.9736328125, -9.50927734375, -9.044921875, -8.58056640625, -8.1162109375, -7.65185546875, -7.1875, -6.72314453125, -6.2587890625, -5.79443359375, -5.330078125, -4.86572265625, -4.4013671875, -3.93701171875, -3.47265625, -3.00830078125, -2.5439453125, -2.07958984375, -1.615234375, -1.15087890625, -0.6865234375, -0.22216796875, 0.2421875, 0.70654296875, 1.1708984375, 1.63525390625, 2.099609375, 2.56396484375, 3.0283203125, 3.49267578125, 3.95703125, 4.42138671875, 4.8857421875, 5.35009765625, 5.814453125, 6.27880859375, 6.7431640625, 7.20751953125, 7.671875, 8.13623046875, 8.6005859375, 9.06494140625, 9.529296875, 9.99365234375, 10.4580078125, 10.92236328125, 11.38671875, 11.85107421875, 12.3154296875, 12.77978515625, 13.244140625, 13.70849609375, 14.1728515625, 14.63720703125, 15.1015625]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 6.0, 9.0, 10.0, 4.0, 9.0, 16.0, 20.0, 33.0, 37.0, 48.0, 49.0, 61.0, 64.0, 52.0, 71.0, 78.0, 72.0, 53.0, 50.0, 56.0, 38.0, 34.0, 35.0, 26.0, 15.0, 12.0, 3.0, 8.0, 7.0, 5.0, 2.0, 9.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.578125, -5.3780517578125, -5.177978515625, -4.9779052734375, -4.77783203125, -4.5777587890625, -4.377685546875, -4.1776123046875, -3.9775390625, -3.7774658203125, -3.577392578125, -3.3773193359375, -3.17724609375, -2.9771728515625, -2.777099609375, -2.5770263671875, -2.376953125, -2.1768798828125, -1.976806640625, -1.7767333984375, -1.57666015625, -1.3765869140625, -1.176513671875, -0.9764404296875, -0.7763671875, -0.5762939453125, -0.376220703125, -0.1761474609375, 0.02392578125, 0.2239990234375, 0.424072265625, 0.6241455078125, 0.82421875, 1.0242919921875, 1.224365234375, 1.4244384765625, 1.62451171875, 1.8245849609375, 2.024658203125, 2.2247314453125, 2.4248046875, 2.6248779296875, 2.824951171875, 3.0250244140625, 3.22509765625, 3.4251708984375, 3.625244140625, 3.8253173828125, 4.025390625, 4.2254638671875, 4.425537109375, 4.6256103515625, 4.82568359375, 5.0257568359375, 5.225830078125, 5.4259033203125, 5.6259765625, 5.8260498046875, 6.026123046875, 6.2261962890625, 6.42626953125, 6.6263427734375, 6.826416015625, 7.0264892578125, 7.2265625]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 8.0, 8.0, 8.0, 12.0, 13.0, 13.0, 23.0, 47.0, 55.0, 94.0, 150.0, 206.0, 335.0, 619.0, 1195.0, 3170.0, 11152.0, 63258.0, 704314.0, 227953.0, 25942.0, 5892.0, 1984.0, 817.0, 464.0, 268.0, 175.0, 125.0, 85.0, 39.0, 44.0, 20.0, 14.0, 14.0, 7.0, 6.0, 10.0, 9.0, 1.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-22.03125, -21.265380859375, -20.49951171875, -19.733642578125, -18.9677734375, -18.201904296875, -17.43603515625, -16.670166015625, -15.904296875, -15.138427734375, -14.37255859375, -13.606689453125, -12.8408203125, -12.074951171875, -11.30908203125, -10.543212890625, -9.77734375, -9.011474609375, -8.24560546875, -7.479736328125, -6.7138671875, -5.947998046875, -5.18212890625, -4.416259765625, -3.650390625, -2.884521484375, -2.11865234375, -1.352783203125, -0.5869140625, 0.178955078125, 0.94482421875, 1.710693359375, 2.4765625, 3.242431640625, 4.00830078125, 4.774169921875, 5.5400390625, 6.305908203125, 7.07177734375, 7.837646484375, 8.603515625, 9.369384765625, 10.13525390625, 10.901123046875, 11.6669921875, 12.432861328125, 13.19873046875, 13.964599609375, 14.73046875, 15.496337890625, 16.26220703125, 17.028076171875, 17.7939453125, 18.559814453125, 19.32568359375, 20.091552734375, 20.857421875, 21.623291015625, 22.38916015625, 23.155029296875, 23.9208984375, 24.686767578125, 25.45263671875, 26.218505859375, 26.984375]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 7.0, 4.0, 10.0, 16.0, 15.0, 21.0, 27.0, 34.0, 35.0, 49.0, 53.0, 70.0, 75.0, 66.0, 61.0, 80.0, 66.0, 56.0, 45.0, 43.0, 32.0, 40.0, 31.0, 28.0, 13.0, 11.0, 6.0, 6.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.390625, -23.256591796875, -22.12255859375, -20.988525390625, -19.8544921875, -18.720458984375, -17.58642578125, -16.452392578125, -15.318359375, -14.184326171875, -13.05029296875, -11.916259765625, -10.7822265625, -9.648193359375, -8.51416015625, -7.380126953125, -6.24609375, -5.112060546875, -3.97802734375, -2.843994140625, -1.7099609375, -0.575927734375, 0.55810546875, 1.692138671875, 2.826171875, 3.960205078125, 5.09423828125, 6.228271484375, 7.3623046875, 8.496337890625, 9.63037109375, 10.764404296875, 11.8984375, 13.032470703125, 14.16650390625, 15.300537109375, 16.4345703125, 17.568603515625, 18.70263671875, 19.836669921875, 20.970703125, 22.104736328125, 23.23876953125, 24.372802734375, 25.5068359375, 26.640869140625, 27.77490234375, 28.908935546875, 30.04296875, 31.177001953125, 32.31103515625, 33.445068359375, 34.5791015625, 35.713134765625, 36.84716796875, 37.981201171875, 39.115234375, 40.249267578125, 41.38330078125, 42.517333984375, 43.6513671875, 44.785400390625, 45.91943359375, 47.053466796875, 48.1875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 5.0, 10.0, 9.0, 14.0, 22.0, 35.0, 78.0, 149.0, 353.0, 996.0, 3632.0, 35996.0, 978331.0, 24359.0, 3083.0, 856.0, 302.0, 160.0, 69.0, 35.0, 26.0, 15.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.1875, -23.30615234375, -22.4248046875, -21.54345703125, -20.662109375, -19.78076171875, -18.8994140625, -18.01806640625, -17.13671875, -16.25537109375, -15.3740234375, -14.49267578125, -13.611328125, -12.72998046875, -11.8486328125, -10.96728515625, -10.0859375, -9.20458984375, -8.3232421875, -7.44189453125, -6.560546875, -5.67919921875, -4.7978515625, -3.91650390625, -3.03515625, -2.15380859375, -1.2724609375, -0.39111328125, 0.490234375, 1.37158203125, 2.2529296875, 3.13427734375, 4.015625, 4.89697265625, 5.7783203125, 6.65966796875, 7.541015625, 8.42236328125, 9.3037109375, 10.18505859375, 11.06640625, 11.94775390625, 12.8291015625, 13.71044921875, 14.591796875, 15.47314453125, 16.3544921875, 17.23583984375, 18.1171875, 18.99853515625, 19.8798828125, 20.76123046875, 21.642578125, 22.52392578125, 23.4052734375, 24.28662109375, 25.16796875, 26.04931640625, 26.9306640625, 27.81201171875, 28.693359375, 29.57470703125, 30.4560546875, 31.33740234375, 32.21875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 4.0, 5.0, 4.0, 2.0, 9.0, 14.0, 19.0, 32.0, 32.0, 49.0, 72.0, 128.0, 164.0, 158.0, 101.0, 71.0, 42.0, 18.0, 28.0, 10.0, 8.0, 12.0, 7.0, 3.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0018835067749023438, -0.0018277913331985474, -0.001772075891494751, -0.0017163604497909546, -0.0016606450080871582, -0.0016049295663833618, -0.0015492141246795654, -0.001493498682975769, -0.0014377832412719727, -0.0013820677995681763, -0.0013263523578643799, -0.0012706369161605835, -0.0012149214744567871, -0.0011592060327529907, -0.0011034905910491943, -0.001047775149345398, -0.0009920597076416016, -0.0009363442659378052, -0.0008806288242340088, -0.0008249133825302124, -0.000769197940826416, -0.0007134824991226196, -0.0006577670574188232, -0.0006020516157150269, -0.0005463361740112305, -0.0004906207323074341, -0.0004349052906036377, -0.0003791898488998413, -0.0003234744071960449, -0.00026775896549224854, -0.00021204352378845215, -0.00015632808208465576, -0.00010061264038085938, -4.489719867706299e-05, 1.0818243026733398e-05, 6.653368473052979e-05, 0.00012224912643432617, 0.00017796456813812256, 0.00023368000984191895, 0.00028939545154571533, 0.0003451108932495117, 0.0004008263349533081, 0.0004565417766571045, 0.0005122572183609009, 0.0005679726600646973, 0.0006236881017684937, 0.00067940354347229, 0.0007351189851760864, 0.0007908344268798828, 0.0008465498685836792, 0.0009022653102874756, 0.000957980751991272, 0.0010136961936950684, 0.0010694116353988647, 0.0011251270771026611, 0.0011808425188064575, 0.001236557960510254, 0.0012922734022140503, 0.0013479888439178467, 0.001403704285621643, 0.0014594197273254395, 0.0015151351690292358, 0.0015708506107330322, 0.0016265660524368286, 0.001682281494140625]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 7.0, 6.0, 1.0, 7.0, 11.0, 14.0, 9.0, 22.0, 41.0, 74.0, 112.0, 230.0, 476.0, 1127.0, 3137.0, 17472.0, 935932.0, 81137.0, 5649.0, 1688.0, 691.0, 290.0, 167.0, 83.0, 63.0, 38.0, 16.0, 20.0, 8.0, 11.0, 6.0, 4.0, 3.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.21875, -34.30908203125, -33.3994140625, -32.48974609375, -31.580078125, -30.67041015625, -29.7607421875, -28.85107421875, -27.94140625, -27.03173828125, -26.1220703125, -25.21240234375, -24.302734375, -23.39306640625, -22.4833984375, -21.57373046875, -20.6640625, -19.75439453125, -18.8447265625, -17.93505859375, -17.025390625, -16.11572265625, -15.2060546875, -14.29638671875, -13.38671875, -12.47705078125, -11.5673828125, -10.65771484375, -9.748046875, -8.83837890625, -7.9287109375, -7.01904296875, -6.109375, -5.19970703125, -4.2900390625, -3.38037109375, -2.470703125, -1.56103515625, -0.6513671875, 0.25830078125, 1.16796875, 2.07763671875, 2.9873046875, 3.89697265625, 4.806640625, 5.71630859375, 6.6259765625, 7.53564453125, 8.4453125, 9.35498046875, 10.2646484375, 11.17431640625, 12.083984375, 12.99365234375, 13.9033203125, 14.81298828125, 15.72265625, 16.63232421875, 17.5419921875, 18.45166015625, 19.361328125, 20.27099609375, 21.1806640625, 22.09033203125, 23.0]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 10.0, 17.0, 49.0, 127.0, 222.0, 310.0, 133.0, 57.0, 34.0, 14.0, 7.0, 3.0, 2.0, 2.0, 6.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-36.71875, -35.886962890625, -35.05517578125, -34.223388671875, -33.3916015625, -32.559814453125, -31.72802734375, -30.896240234375, -30.064453125, -29.232666015625, -28.40087890625, -27.569091796875, -26.7373046875, -25.905517578125, -25.07373046875, -24.241943359375, -23.41015625, -22.578369140625, -21.74658203125, -20.914794921875, -20.0830078125, -19.251220703125, -18.41943359375, -17.587646484375, -16.755859375, -15.924072265625, -15.09228515625, -14.260498046875, -13.4287109375, -12.596923828125, -11.76513671875, -10.933349609375, -10.1015625, -9.269775390625, -8.43798828125, -7.606201171875, -6.7744140625, -5.942626953125, -5.11083984375, -4.279052734375, -3.447265625, -2.615478515625, -1.78369140625, -0.951904296875, -0.1201171875, 0.711669921875, 1.54345703125, 2.375244140625, 3.20703125, 4.038818359375, 4.87060546875, 5.702392578125, 6.5341796875, 7.365966796875, 8.19775390625, 9.029541015625, 9.861328125, 10.693115234375, 11.52490234375, 12.356689453125, 13.1884765625, 14.020263671875, 14.85205078125, 15.683837890625, 16.515625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 4.0, 15.0, 25.0, 38.0, 54.0, 86.0, 144.0, 203.0, 147.0, 104.0, 75.0, 40.0, 23.0, 15.0, 12.0, 6.0, 9.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-265.5213623046875, -258.6152648925781, -251.70919799804688, -244.80311584472656, -237.89703369140625, -230.99093627929688, -224.08486938476562, -217.17877197265625, -210.27268981933594, -203.36660766601562, -196.4605255126953, -189.554443359375, -182.6483612060547, -175.74227905273438, -168.836181640625, -161.9300994873047, -155.02401733398438, -148.11793518066406, -141.21185302734375, -134.30577087402344, -127.3996810913086, -120.49359893798828, -113.58751678466797, -106.68142700195312, -99.77536010742188, -92.86927795410156, -85.96319580078125, -79.05711364746094, -72.1510238647461, -65.24494171142578, -58.33885955810547, -51.43277359008789, -44.52668762207031, -37.62060546875, -30.714519500732422, -23.80843734741211, -16.902353286743164, -9.996269226074219, -3.0901870727539062, 3.815898895263672, 10.721981048583984, 17.62806510925293, 24.534149169921875, 31.440231323242188, 38.3463134765625, 45.25239944458008, 52.15848159790039, 59.06456756591797, 65.97064971923828, 72.8767318725586, 79.7828140258789, 86.68890380859375, 93.59498596191406, 100.50106811523438, 107.40715026855469, 114.313232421875, 121.21931457519531, 128.12539672851562, 135.03147888183594, 141.93756103515625, 148.84364318847656, 155.74972534179688, 162.65582275390625, 169.56190490722656, 176.46798706054688]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 8.0, 8.0, 10.0, 14.0, 14.0, 7.0, 14.0, 8.0, 18.0, 29.0, 27.0, 40.0, 45.0, 31.0, 54.0, 42.0, 64.0, 70.0, 66.0, 50.0, 59.0, 42.0, 42.0, 35.0, 30.0, 37.0, 31.0, 18.0, 21.0, 18.0, 14.0, 9.0, 7.0, 7.0, 3.0, 6.0, 5.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-143.69024658203125, -139.3070526123047, -134.92384338378906, -130.5406494140625, -126.1574478149414, -121.77424621582031, -117.39105224609375, -113.00785064697266, -108.62464904785156, -104.24144744873047, -99.85824584960938, -95.47505187988281, -91.09185028076172, -86.70864868164062, -82.32545471191406, -77.94225311279297, -73.55905151367188, -69.17584991455078, -64.79264831542969, -60.409454345703125, -56.02625274658203, -51.64305114746094, -47.25985336303711, -42.87665557861328, -38.49345397949219, -34.110252380371094, -29.727054595947266, -25.343854904174805, -20.960655212402344, -16.577455520629883, -12.194255828857422, -7.811056137084961, -3.4278411865234375, 0.9553585052490234, 5.338558197021484, 9.721757888793945, 14.104957580566406, 18.488157272338867, 22.871356964111328, 27.25455665588379, 31.63775634765625, 36.020957946777344, 40.40415573120117, 44.787353515625, 49.170555114746094, 53.55375671386719, 57.936954498291016, 62.320152282714844, 66.70335388183594, 71.08655548095703, 75.46975708007812, 79.85295104980469, 84.23615264892578, 88.61935424804688, 93.00254821777344, 97.38574981689453, 101.76895141601562, 106.15215301513672, 110.53535461425781, 114.91854858398438, 119.30175018310547, 123.68495178222656, 128.06814575195312, 132.45135498046875, 136.8345489501953]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 4.0, 3.0, 3.0, 7.0, 6.0, 10.0, 9.0, 14.0, 22.0, 31.0, 43.0, 61.0, 79.0, 121.0, 170.0, 353.0, 618.0, 1320.0, 4245.0, 90417.0, 4087750.0, 5651.0, 1608.0, 732.0, 352.0, 237.0, 141.0, 90.0, 55.0, 41.0, 24.0, 19.0, 11.0, 15.0, 5.0, 5.0, 1.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-52.65625, -51.19677734375, -49.7373046875, -48.27783203125, -46.818359375, -45.35888671875, -43.8994140625, -42.43994140625, -40.98046875, -39.52099609375, -38.0615234375, -36.60205078125, -35.142578125, -33.68310546875, -32.2236328125, -30.76416015625, -29.3046875, -27.84521484375, -26.3857421875, -24.92626953125, -23.466796875, -22.00732421875, -20.5478515625, -19.08837890625, -17.62890625, -16.16943359375, -14.7099609375, -13.25048828125, -11.791015625, -10.33154296875, -8.8720703125, -7.41259765625, -5.953125, -4.49365234375, -3.0341796875, -1.57470703125, -0.115234375, 1.34423828125, 2.8037109375, 4.26318359375, 5.72265625, 7.18212890625, 8.6416015625, 10.10107421875, 11.560546875, 13.02001953125, 14.4794921875, 15.93896484375, 17.3984375, 18.85791015625, 20.3173828125, 21.77685546875, 23.236328125, 24.69580078125, 26.1552734375, 27.61474609375, 29.07421875, 30.53369140625, 31.9931640625, 33.45263671875, 34.912109375, 36.37158203125, 37.8310546875, 39.29052734375, 40.75]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 8.0, 6.0, 18.0, 17.0, 24.0, 32.0, 63.0, 84.0, 89.0, 109.0, 105.0, 102.0, 75.0, 64.0, 49.0, 50.0, 29.0, 28.0, 10.0, 13.0, 3.0, 3.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.21875, -8.950927734375, -8.68310546875, -8.415283203125, -8.1474609375, -7.879638671875, -7.61181640625, -7.343994140625, -7.076171875, -6.808349609375, -6.54052734375, -6.272705078125, -6.0048828125, -5.737060546875, -5.46923828125, -5.201416015625, -4.93359375, -4.665771484375, -4.39794921875, -4.130126953125, -3.8623046875, -3.594482421875, -3.32666015625, -3.058837890625, -2.791015625, -2.523193359375, -2.25537109375, -1.987548828125, -1.7197265625, -1.451904296875, -1.18408203125, -0.916259765625, -0.6484375, -0.380615234375, -0.11279296875, 0.155029296875, 0.4228515625, 0.690673828125, 0.95849609375, 1.226318359375, 1.494140625, 1.761962890625, 2.02978515625, 2.297607421875, 2.5654296875, 2.833251953125, 3.10107421875, 3.368896484375, 3.63671875, 3.904541015625, 4.17236328125, 4.440185546875, 4.7080078125, 4.975830078125, 5.24365234375, 5.511474609375, 5.779296875, 6.047119140625, 6.31494140625, 6.582763671875, 6.8505859375, 7.118408203125, 7.38623046875, 7.654052734375, 7.921875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 8.0, 15.0, 10.0, 22.0, 27.0, 34.0, 44.0, 60.0, 71.0, 105.0, 153.0, 235.0, 345.0, 516.0, 841.0, 1326.0, 2641.0, 5967.0, 23169.0, 4097367.0, 45575.0, 8015.0, 3295.0, 1616.0, 916.0, 605.0, 379.0, 263.0, 189.0, 130.0, 83.0, 78.0, 44.0, 37.0, 16.0, 20.0, 12.0, 17.0, 5.0, 9.0, 6.0, 1.0, 3.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.703125, -28.733642578125, -27.76416015625, -26.794677734375, -25.8251953125, -24.855712890625, -23.88623046875, -22.916748046875, -21.947265625, -20.977783203125, -20.00830078125, -19.038818359375, -18.0693359375, -17.099853515625, -16.13037109375, -15.160888671875, -14.19140625, -13.221923828125, -12.25244140625, -11.282958984375, -10.3134765625, -9.343994140625, -8.37451171875, -7.405029296875, -6.435546875, -5.466064453125, -4.49658203125, -3.527099609375, -2.5576171875, -1.588134765625, -0.61865234375, 0.350830078125, 1.3203125, 2.289794921875, 3.25927734375, 4.228759765625, 5.1982421875, 6.167724609375, 7.13720703125, 8.106689453125, 9.076171875, 10.045654296875, 11.01513671875, 11.984619140625, 12.9541015625, 13.923583984375, 14.89306640625, 15.862548828125, 16.83203125, 17.801513671875, 18.77099609375, 19.740478515625, 20.7099609375, 21.679443359375, 22.64892578125, 23.618408203125, 24.587890625, 25.557373046875, 26.52685546875, 27.496337890625, 28.4658203125, 29.435302734375, 30.40478515625, 31.374267578125, 32.34375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 6.0, 15.0, 18.0, 91.0, 3646.0, 191.0, 43.0, 19.0, 11.0, 9.0, 4.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.75, -15.2679443359375, -14.785888671875, -14.3038330078125, -13.82177734375, -13.3397216796875, -12.857666015625, -12.3756103515625, -11.8935546875, -11.4114990234375, -10.929443359375, -10.4473876953125, -9.96533203125, -9.4832763671875, -9.001220703125, -8.5191650390625, -8.037109375, -7.5550537109375, -7.072998046875, -6.5909423828125, -6.10888671875, -5.6268310546875, -5.144775390625, -4.6627197265625, -4.1806640625, -3.6986083984375, -3.216552734375, -2.7344970703125, -2.25244140625, -1.7703857421875, -1.288330078125, -0.8062744140625, -0.32421875, 0.1578369140625, 0.639892578125, 1.1219482421875, 1.60400390625, 2.0860595703125, 2.568115234375, 3.0501708984375, 3.5322265625, 4.0142822265625, 4.496337890625, 4.9783935546875, 5.46044921875, 5.9425048828125, 6.424560546875, 6.9066162109375, 7.388671875, 7.8707275390625, 8.352783203125, 8.8348388671875, 9.31689453125, 9.7989501953125, 10.281005859375, 10.7630615234375, 11.2451171875, 11.7271728515625, 12.209228515625, 12.6912841796875, 13.17333984375, 13.6553955078125, 14.137451171875, 14.6195068359375, 15.1015625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 8.0, 10.0, 28.0, 62.0, 126.0, 214.0, 201.0, 149.0, 82.0, 43.0, 26.0, 13.0, 12.0, 13.0, 7.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.55660629272461, -35.55962371826172, -33.56264114379883, -31.56566047668457, -29.56867790222168, -27.57169532775879, -25.57471466064453, -23.57773208618164, -21.58074951171875, -19.58376693725586, -17.58678436279297, -15.589803695678711, -13.59282112121582, -11.59583854675293, -9.598856925964355, -7.601875305175781, -5.604892730712891, -3.607910633087158, -1.6109285354614258, 0.38605356216430664, 2.383035659790039, 4.38001823425293, 6.376999855041504, 8.373981475830078, 10.370964050292969, 12.36794662475586, 14.364928245544434, 16.361909866333008, 18.3588924407959, 20.35587501525879, 22.352855682373047, 24.349838256835938, 26.346817016601562, 28.343799591064453, 30.340782165527344, 32.337764739990234, 34.334747314453125, 36.33172607421875, 38.32870864868164, 40.32569122314453, 42.32267379760742, 44.31965637207031, 46.3166389465332, 48.313621520996094, 50.31060028076172, 52.307586669921875, 54.3045654296875, 56.30154800415039, 58.29853057861328, 60.29551315307617, 62.29249572753906, 64.28947448730469, 66.28646087646484, 68.28343963623047, 70.28042602539062, 72.27740478515625, 74.27438354492188, 76.2713623046875, 78.26834869384766, 80.26532745361328, 82.26231384277344, 84.25929260253906, 86.25627899169922, 88.25325775146484, 90.250244140625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 6.0, 7.0, 4.0, 2.0, 6.0, 7.0, 14.0, 19.0, 15.0, 18.0, 19.0, 22.0, 21.0, 31.0, 23.0, 33.0, 35.0, 48.0, 37.0, 50.0, 32.0, 50.0, 36.0, 37.0, 38.0, 29.0, 40.0, 37.0, 30.0, 40.0, 31.0, 23.0, 29.0, 24.0, 20.0, 16.0, 14.0, 11.0, 12.0, 9.0, 10.0, 4.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-24.404634475708008, -23.700088500976562, -22.995542526245117, -22.290996551513672, -21.58645248413086, -20.881906509399414, -20.17736053466797, -19.472814559936523, -18.768268585205078, -18.063722610473633, -17.359176635742188, -16.654630661010742, -15.950085639953613, -15.245539665222168, -14.540994644165039, -13.836448669433594, -13.131902694702148, -12.427356719970703, -11.722810745239258, -11.018265724182129, -10.313719749450684, -9.609173774719238, -8.90462875366211, -8.200082778930664, -7.495536804199219, -6.790990829467773, -6.086445331573486, -5.381899833679199, -4.677353858947754, -3.9728081226348877, -3.2682623863220215, -2.5637168884277344, -1.8591728210449219, -1.1546270847320557, -0.45008134841918945, 0.25446438789367676, 0.959010124206543, 1.6635558605194092, 2.3681015968322754, 3.0726470947265625, 3.777193069458008, 4.481739044189453, 5.18628454208374, 5.890830039978027, 6.595376014709473, 7.299921989440918, 8.004467010498047, 8.709012985229492, 9.413558959960938, 10.118104934692383, 10.822650909423828, 11.527195930480957, 12.231741905212402, 12.936287879943848, 13.640832901000977, 14.345378875732422, 15.049924850463867, 15.754470825195312, 16.459016799926758, 17.163562774658203, 17.868106842041016, 18.57265281677246, 19.277198791503906, 19.98174476623535, 20.686290740966797]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 6.0, 7.0, 17.0, 23.0, 36.0, 77.0, 149.0, 262.0, 535.0, 1116.0, 2816.0, 8535.0, 34441.0, 240255.0, 647535.0, 87678.0, 16869.0, 4805.0, 1803.0, 756.0, 374.0, 194.0, 96.0, 76.0, 35.0, 25.0, 10.0, 8.0, 6.0, 2.0, 3.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.515625, -23.648193359375, -22.78076171875, -21.913330078125, -21.0458984375, -20.178466796875, -19.31103515625, -18.443603515625, -17.576171875, -16.708740234375, -15.84130859375, -14.973876953125, -14.1064453125, -13.239013671875, -12.37158203125, -11.504150390625, -10.63671875, -9.769287109375, -8.90185546875, -8.034423828125, -7.1669921875, -6.299560546875, -5.43212890625, -4.564697265625, -3.697265625, -2.829833984375, -1.96240234375, -1.094970703125, -0.2275390625, 0.639892578125, 1.50732421875, 2.374755859375, 3.2421875, 4.109619140625, 4.97705078125, 5.844482421875, 6.7119140625, 7.579345703125, 8.44677734375, 9.314208984375, 10.181640625, 11.049072265625, 11.91650390625, 12.783935546875, 13.6513671875, 14.518798828125, 15.38623046875, 16.253662109375, 17.12109375, 17.988525390625, 18.85595703125, 19.723388671875, 20.5908203125, 21.458251953125, 22.32568359375, 23.193115234375, 24.060546875, 24.927978515625, 25.79541015625, 26.662841796875, 27.5302734375, 28.397705078125, 29.26513671875, 30.132568359375, 31.0]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 4.0, 8.0, 14.0, 10.0, 8.0, 16.0, 27.0, 28.0, 48.0, 62.0, 52.0, 72.0, 75.0, 106.0, 86.0, 79.0, 71.0, 45.0, 48.0, 37.0, 28.0, 24.0, 13.0, 9.0, 7.0, 10.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.2578125, -8.00439453125, -7.7509765625, -7.49755859375, -7.244140625, -6.99072265625, -6.7373046875, -6.48388671875, -6.23046875, -5.97705078125, -5.7236328125, -5.47021484375, -5.216796875, -4.96337890625, -4.7099609375, -4.45654296875, -4.203125, -3.94970703125, -3.6962890625, -3.44287109375, -3.189453125, -2.93603515625, -2.6826171875, -2.42919921875, -2.17578125, -1.92236328125, -1.6689453125, -1.41552734375, -1.162109375, -0.90869140625, -0.6552734375, -0.40185546875, -0.1484375, 0.10498046875, 0.3583984375, 0.61181640625, 0.865234375, 1.11865234375, 1.3720703125, 1.62548828125, 1.87890625, 2.13232421875, 2.3857421875, 2.63916015625, 2.892578125, 3.14599609375, 3.3994140625, 3.65283203125, 3.90625, 4.15966796875, 4.4130859375, 4.66650390625, 4.919921875, 5.17333984375, 5.4267578125, 5.68017578125, 5.93359375, 6.18701171875, 6.4404296875, 6.69384765625, 6.947265625, 7.20068359375, 7.4541015625, 7.70751953125, 7.9609375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 9.0, 12.0, 13.0, 32.0, 39.0, 46.0, 78.0, 134.0, 220.0, 456.0, 894.0, 2364.0, 8110.0, 47372.0, 635730.0, 315899.0, 27946.0, 5710.0, 1829.0, 702.0, 374.0, 212.0, 127.0, 76.0, 44.0, 29.0, 25.0, 15.0, 12.0, 12.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.171875, -21.202392578125, -20.23291015625, -19.263427734375, -18.2939453125, -17.324462890625, -16.35498046875, -15.385498046875, -14.416015625, -13.446533203125, -12.47705078125, -11.507568359375, -10.5380859375, -9.568603515625, -8.59912109375, -7.629638671875, -6.66015625, -5.690673828125, -4.72119140625, -3.751708984375, -2.7822265625, -1.812744140625, -0.84326171875, 0.126220703125, 1.095703125, 2.065185546875, 3.03466796875, 4.004150390625, 4.9736328125, 5.943115234375, 6.91259765625, 7.882080078125, 8.8515625, 9.821044921875, 10.79052734375, 11.760009765625, 12.7294921875, 13.698974609375, 14.66845703125, 15.637939453125, 16.607421875, 17.576904296875, 18.54638671875, 19.515869140625, 20.4853515625, 21.454833984375, 22.42431640625, 23.393798828125, 24.36328125, 25.332763671875, 26.30224609375, 27.271728515625, 28.2412109375, 29.210693359375, 30.18017578125, 31.149658203125, 32.119140625, 33.088623046875, 34.05810546875, 35.027587890625, 35.9970703125, 36.966552734375, 37.93603515625, 38.905517578125, 39.875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 7.0, 5.0, 6.0, 9.0, 13.0, 8.0, 9.0, 12.0, 21.0, 26.0, 28.0, 25.0, 28.0, 34.0, 38.0, 31.0, 38.0, 35.0, 38.0, 45.0, 44.0, 34.0, 40.0, 39.0, 48.0, 41.0, 38.0, 34.0, 32.0, 27.0, 24.0, 24.0, 16.0, 15.0, 13.0, 15.0, 11.0, 7.0, 6.0, 4.0, 7.0, 4.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-18.578125, -17.9267578125, -17.275390625, -16.6240234375, -15.97265625, -15.3212890625, -14.669921875, -14.0185546875, -13.3671875, -12.7158203125, -12.064453125, -11.4130859375, -10.76171875, -10.1103515625, -9.458984375, -8.8076171875, -8.15625, -7.5048828125, -6.853515625, -6.2021484375, -5.55078125, -4.8994140625, -4.248046875, -3.5966796875, -2.9453125, -2.2939453125, -1.642578125, -0.9912109375, -0.33984375, 0.3115234375, 0.962890625, 1.6142578125, 2.265625, 2.9169921875, 3.568359375, 4.2197265625, 4.87109375, 5.5224609375, 6.173828125, 6.8251953125, 7.4765625, 8.1279296875, 8.779296875, 9.4306640625, 10.08203125, 10.7333984375, 11.384765625, 12.0361328125, 12.6875, 13.3388671875, 13.990234375, 14.6416015625, 15.29296875, 15.9443359375, 16.595703125, 17.2470703125, 17.8984375, 18.5498046875, 19.201171875, 19.8525390625, 20.50390625, 21.1552734375, 21.806640625, 22.4580078125, 23.109375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 2.0, 5.0, 6.0, 16.0, 13.0, 13.0, 21.0, 29.0, 49.0, 65.0, 102.0, 214.0, 406.0, 987.0, 2993.0, 13089.0, 151561.0, 806377.0, 61336.0, 7768.0, 1992.0, 734.0, 354.0, 145.0, 99.0, 67.0, 28.0, 26.0, 10.0, 14.0, 7.0, 7.0, 1.0, 7.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.87109375, -7.57232666015625, -7.2735595703125, -6.97479248046875, -6.676025390625, -6.37725830078125, -6.0784912109375, -5.77972412109375, -5.48095703125, -5.18218994140625, -4.8834228515625, -4.58465576171875, -4.285888671875, -3.98712158203125, -3.6883544921875, -3.38958740234375, -3.0908203125, -2.79205322265625, -2.4932861328125, -2.19451904296875, -1.895751953125, -1.59698486328125, -1.2982177734375, -0.99945068359375, -0.70068359375, -0.40191650390625, -0.1031494140625, 0.19561767578125, 0.494384765625, 0.79315185546875, 1.0919189453125, 1.39068603515625, 1.689453125, 1.98822021484375, 2.2869873046875, 2.58575439453125, 2.884521484375, 3.18328857421875, 3.4820556640625, 3.78082275390625, 4.07958984375, 4.37835693359375, 4.6771240234375, 4.97589111328125, 5.274658203125, 5.57342529296875, 5.8721923828125, 6.17095947265625, 6.4697265625, 6.76849365234375, 7.0672607421875, 7.36602783203125, 7.664794921875, 7.96356201171875, 8.2623291015625, 8.56109619140625, 8.85986328125, 9.15863037109375, 9.4573974609375, 9.75616455078125, 10.054931640625, 10.35369873046875, 10.6524658203125, 10.95123291015625, 11.25]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 1.0, 4.0, 3.0, 3.0, 7.0, 3.0, 12.0, 10.0, 13.0, 10.0, 15.0, 24.0, 24.0, 49.0, 43.0, 45.0, 86.0, 75.0, 82.0, 88.0, 67.0, 64.0, 66.0, 47.0, 34.0, 22.0, 19.0, 14.0, 13.0, 13.0, 10.0, 9.0, 6.0, 5.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 4.0], "bins": [-0.0009570121765136719, -0.0009287819266319275, -0.0009005516767501831, -0.0008723214268684387, -0.0008440911769866943, -0.00081586092710495, -0.0007876306772232056, -0.0007594004273414612, -0.0007311701774597168, -0.0007029399275779724, -0.000674709677696228, -0.0006464794278144836, -0.0006182491779327393, -0.0005900189280509949, -0.0005617886781692505, -0.0005335584282875061, -0.0005053281784057617, -0.00047709792852401733, -0.00044886767864227295, -0.00042063742876052856, -0.0003924071788787842, -0.0003641769289970398, -0.0003359466791152954, -0.000307716429233551, -0.00027948617935180664, -0.00025125592947006226, -0.00022302567958831787, -0.00019479542970657349, -0.0001665651798248291, -0.00013833492994308472, -0.00011010468006134033, -8.187443017959595e-05, -5.364418029785156e-05, -2.5413930416107178e-05, 2.816319465637207e-06, 3.104656934738159e-05, 5.9276819229125977e-05, 8.750706911087036e-05, 0.00011573731899261475, 0.00014396756887435913, 0.00017219781875610352, 0.0002004280686378479, 0.00022865831851959229, 0.00025688856840133667, 0.00028511881828308105, 0.00031334906816482544, 0.0003415793180465698, 0.0003698095679283142, 0.0003980398178100586, 0.000426270067691803, 0.00045450031757354736, 0.00048273056745529175, 0.0005109608173370361, 0.0005391910672187805, 0.0005674213171005249, 0.0005956515669822693, 0.0006238818168640137, 0.0006521120667457581, 0.0006803423166275024, 0.0007085725665092468, 0.0007368028163909912, 0.0007650330662727356, 0.00079326331615448, 0.0008214935660362244, 0.0008497238159179688]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 4.0, 6.0, 8.0, 13.0, 30.0, 47.0, 119.0, 201.0, 544.0, 2076.0, 17988.0, 875212.0, 145020.0, 5560.0, 1049.0, 327.0, 154.0, 90.0, 39.0, 27.0, 19.0, 10.0, 5.0, 3.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.4765625, -9.9466552734375, -9.416748046875, -8.8868408203125, -8.35693359375, -7.8270263671875, -7.297119140625, -6.7672119140625, -6.2373046875, -5.7073974609375, -5.177490234375, -4.6475830078125, -4.11767578125, -3.5877685546875, -3.057861328125, -2.5279541015625, -1.998046875, -1.4681396484375, -0.938232421875, -0.4083251953125, 0.12158203125, 0.6514892578125, 1.181396484375, 1.7113037109375, 2.2412109375, 2.7711181640625, 3.301025390625, 3.8309326171875, 4.36083984375, 4.8907470703125, 5.420654296875, 5.9505615234375, 6.48046875, 7.0103759765625, 7.540283203125, 8.0701904296875, 8.60009765625, 9.1300048828125, 9.659912109375, 10.1898193359375, 10.7197265625, 11.2496337890625, 11.779541015625, 12.3094482421875, 12.83935546875, 13.3692626953125, 13.899169921875, 14.4290771484375, 14.958984375, 15.4888916015625, 16.018798828125, 16.5487060546875, 17.07861328125, 17.6085205078125, 18.138427734375, 18.6683349609375, 19.1982421875, 19.7281494140625, 20.258056640625, 20.7879638671875, 21.31787109375, 21.8477783203125, 22.377685546875, 22.9075927734375, 23.4375]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 11.0, 9.0, 18.0, 24.0, 34.0, 69.0, 79.0, 106.0, 132.0, 131.0, 125.0, 86.0, 56.0, 39.0, 29.0, 20.0, 18.0, 4.0, 7.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.09375, -7.7703857421875, -7.447021484375, -7.1236572265625, -6.80029296875, -6.4769287109375, -6.153564453125, -5.8302001953125, -5.5068359375, -5.1834716796875, -4.860107421875, -4.5367431640625, -4.21337890625, -3.8900146484375, -3.566650390625, -3.2432861328125, -2.919921875, -2.5965576171875, -2.273193359375, -1.9498291015625, -1.62646484375, -1.3031005859375, -0.979736328125, -0.6563720703125, -0.3330078125, -0.0096435546875, 0.313720703125, 0.6370849609375, 0.96044921875, 1.2838134765625, 1.607177734375, 1.9305419921875, 2.25390625, 2.5772705078125, 2.900634765625, 3.2239990234375, 3.54736328125, 3.8707275390625, 4.194091796875, 4.5174560546875, 4.8408203125, 5.1641845703125, 5.487548828125, 5.8109130859375, 6.13427734375, 6.4576416015625, 6.781005859375, 7.1043701171875, 7.427734375, 7.7510986328125, 8.074462890625, 8.3978271484375, 8.72119140625, 9.0445556640625, 9.367919921875, 9.6912841796875, 10.0146484375, 10.3380126953125, 10.661376953125, 10.9847412109375, 11.30810546875, 11.6314697265625, 11.954833984375, 12.2781982421875, 12.6015625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 9.0, 15.0, 53.0, 106.0, 207.0, 299.0, 202.0, 74.0, 21.0, 7.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-368.8743896484375, -358.4471740722656, -348.01995849609375, -337.59271240234375, -327.1654968261719, -316.73828125, -306.31103515625, -295.8838195800781, -285.45660400390625, -275.0293884277344, -264.6021728515625, -254.1749267578125, -243.74771118164062, -233.32049560546875, -222.8932647705078, -212.46603393554688, -202.038818359375, -191.61160278320312, -181.1843719482422, -170.75714111328125, -160.32992553710938, -149.9027099609375, -139.47547912597656, -129.04824829101562, -118.62103271484375, -108.19380950927734, -97.76658630371094, -87.33936309814453, -76.91213989257812, -66.48491668701172, -56.05769348144531, -45.630470275878906, -35.203216552734375, -24.77599334716797, -14.348770141601562, -3.9215469360351562, 6.50567626953125, 16.932899475097656, 27.360122680664062, 37.78734588623047, 48.214569091796875, 58.64179229736328, 69.06901550292969, 79.4962387084961, 89.9234619140625, 100.3506851196289, 110.77790832519531, 121.20513153076172, 131.63235473632812, 142.0595703125, 152.48680114746094, 162.91403198242188, 173.34124755859375, 183.76846313476562, 194.19569396972656, 204.6229248046875, 215.05014038085938, 225.47735595703125, 235.9045867919922, 246.33181762695312, 256.759033203125, 267.1862487792969, 277.61346435546875, 288.04071044921875, 298.4679260253906]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 4.0, 1.0, 2.0, 9.0, 6.0, 9.0, 8.0, 12.0, 8.0, 9.0, 15.0, 20.0, 22.0, 26.0, 29.0, 37.0, 34.0, 42.0, 40.0, 45.0, 47.0, 44.0, 51.0, 59.0, 45.0, 40.0, 32.0, 40.0, 42.0, 39.0, 30.0, 22.0, 18.0, 24.0, 17.0, 23.0, 9.0, 8.0, 3.0, 8.0, 3.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-106.68327331542969, -103.49650573730469, -100.30973052978516, -97.12296295166016, -93.93618774414062, -90.74942016601562, -87.56265258789062, -84.3758773803711, -81.1891098022461, -78.0023422241211, -74.81556701660156, -71.62879943847656, -68.44202423095703, -65.25525665283203, -62.068485260009766, -58.8817138671875, -55.694942474365234, -52.50817108154297, -49.3213996887207, -46.13462829589844, -42.94786071777344, -39.76108932495117, -36.574317932128906, -33.387550354003906, -30.200777053833008, -27.014005661010742, -23.82723617553711, -20.640464782714844, -17.453693389892578, -14.266923904418945, -11.08015251159668, -7.893383026123047, -4.706611633300781, -1.519840955734253, 1.6669297218322754, 4.853700637817383, 8.040471076965332, 11.227241516113281, 14.414012908935547, 17.60078239440918, 20.787553787231445, 23.97432518005371, 27.161094665527344, 30.34786605834961, 33.534637451171875, 36.721405029296875, 39.908180236816406, 43.094947814941406, 46.28171920776367, 49.46849060058594, 52.6552619934082, 55.84203338623047, 59.02880096435547, 62.215572357177734, 65.40234375, 68.589111328125, 71.77588653564453, 74.96265411376953, 78.14942932128906, 81.33619689941406, 84.5229721069336, 87.7097396850586, 90.89651489257812, 94.08328247070312, 97.27005004882812]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 16.0, 22.0, 33.0, 62.0, 89.0, 132.0, 203.0, 345.0, 588.0, 925.0, 1791.0, 3531.0, 7863.0, 21478.0, 97236.0, 3593024.0, 406738.0, 37408.0, 12195.0, 5113.0, 2503.0, 1245.0, 677.0, 412.0, 252.0, 146.0, 85.0, 58.0, 31.0, 27.0, 16.0, 3.0, 7.0, 6.0, 4.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2109375, -13.7327880859375, -13.254638671875, -12.7764892578125, -12.29833984375, -11.8201904296875, -11.342041015625, -10.8638916015625, -10.3857421875, -9.9075927734375, -9.429443359375, -8.9512939453125, -8.47314453125, -7.9949951171875, -7.516845703125, -7.0386962890625, -6.560546875, -6.0823974609375, -5.604248046875, -5.1260986328125, -4.64794921875, -4.1697998046875, -3.691650390625, -3.2135009765625, -2.7353515625, -2.2572021484375, -1.779052734375, -1.3009033203125, -0.82275390625, -0.3446044921875, 0.133544921875, 0.6116943359375, 1.08984375, 1.5679931640625, 2.046142578125, 2.5242919921875, 3.00244140625, 3.4805908203125, 3.958740234375, 4.4368896484375, 4.9150390625, 5.3931884765625, 5.871337890625, 6.3494873046875, 6.82763671875, 7.3057861328125, 7.783935546875, 8.2620849609375, 8.740234375, 9.2183837890625, 9.696533203125, 10.1746826171875, 10.65283203125, 11.1309814453125, 11.609130859375, 12.0872802734375, 12.5654296875, 13.0435791015625, 13.521728515625, 13.9998779296875, 14.47802734375, 14.9561767578125, 15.434326171875, 15.9124755859375, 16.390625]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 10.0, 10.0, 15.0, 25.0, 28.0, 34.0, 51.0, 50.0, 73.0, 62.0, 57.0, 75.0, 66.0, 70.0, 70.0, 54.0, 49.0, 41.0, 28.0, 26.0, 23.0, 17.0, 16.0, 10.0, 12.0, 7.0, 6.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.6953125, -6.49884033203125, -6.3023681640625, -6.10589599609375, -5.909423828125, -5.71295166015625, -5.5164794921875, -5.32000732421875, -5.12353515625, -4.92706298828125, -4.7305908203125, -4.53411865234375, -4.337646484375, -4.14117431640625, -3.9447021484375, -3.74822998046875, -3.5517578125, -3.35528564453125, -3.1588134765625, -2.96234130859375, -2.765869140625, -2.56939697265625, -2.3729248046875, -2.17645263671875, -1.97998046875, -1.78350830078125, -1.5870361328125, -1.39056396484375, -1.194091796875, -0.99761962890625, -0.8011474609375, -0.60467529296875, -0.408203125, -0.21173095703125, -0.0152587890625, 0.18121337890625, 0.377685546875, 0.57415771484375, 0.7706298828125, 0.96710205078125, 1.16357421875, 1.36004638671875, 1.5565185546875, 1.75299072265625, 1.949462890625, 2.14593505859375, 2.3424072265625, 2.53887939453125, 2.7353515625, 2.93182373046875, 3.1282958984375, 3.32476806640625, 3.521240234375, 3.71771240234375, 3.9141845703125, 4.11065673828125, 4.30712890625, 4.50360107421875, 4.7000732421875, 4.89654541015625, 5.093017578125, 5.28948974609375, 5.4859619140625, 5.68243408203125, 5.87890625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 18.0, 19.0, 25.0, 27.0, 39.0, 47.0, 80.0, 115.0, 225.0, 322.0, 613.0, 1142.0, 2011.0, 4016.0, 8066.0, 18718.0, 55971.0, 355818.0, 3504023.0, 175654.0, 39531.0, 14345.0, 6205.0, 3238.0, 1681.0, 895.0, 572.0, 278.0, 197.0, 117.0, 88.0, 51.0, 36.0, 22.0, 21.0, 15.0, 6.0, 10.0, 7.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.8203125, -12.4114990234375, -12.002685546875, -11.5938720703125, -11.18505859375, -10.7762451171875, -10.367431640625, -9.9586181640625, -9.5498046875, -9.1409912109375, -8.732177734375, -8.3233642578125, -7.91455078125, -7.5057373046875, -7.096923828125, -6.6881103515625, -6.279296875, -5.8704833984375, -5.461669921875, -5.0528564453125, -4.64404296875, -4.2352294921875, -3.826416015625, -3.4176025390625, -3.0087890625, -2.5999755859375, -2.191162109375, -1.7823486328125, -1.37353515625, -0.9647216796875, -0.555908203125, -0.1470947265625, 0.26171875, 0.6705322265625, 1.079345703125, 1.4881591796875, 1.89697265625, 2.3057861328125, 2.714599609375, 3.1234130859375, 3.5322265625, 3.9410400390625, 4.349853515625, 4.7586669921875, 5.16748046875, 5.5762939453125, 5.985107421875, 6.3939208984375, 6.802734375, 7.2115478515625, 7.620361328125, 8.0291748046875, 8.43798828125, 8.8468017578125, 9.255615234375, 9.6644287109375, 10.0732421875, 10.4820556640625, 10.890869140625, 11.2996826171875, 11.70849609375, 12.1173095703125, 12.526123046875, 12.9349365234375, 13.34375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 7.0, 2.0, 4.0, 4.0, 7.0, 3.0, 15.0, 7.0, 17.0, 19.0, 25.0, 41.0, 52.0, 93.0, 117.0, 271.0, 761.0, 1416.0, 603.0, 241.0, 104.0, 59.0, 60.0, 29.0, 27.0, 20.0, 17.0, 9.0, 11.0, 4.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.703125, -13.20263671875, -12.7021484375, -12.20166015625, -11.701171875, -11.20068359375, -10.7001953125, -10.19970703125, -9.69921875, -9.19873046875, -8.6982421875, -8.19775390625, -7.697265625, -7.19677734375, -6.6962890625, -6.19580078125, -5.6953125, -5.19482421875, -4.6943359375, -4.19384765625, -3.693359375, -3.19287109375, -2.6923828125, -2.19189453125, -1.69140625, -1.19091796875, -0.6904296875, -0.18994140625, 0.310546875, 0.81103515625, 1.3115234375, 1.81201171875, 2.3125, 2.81298828125, 3.3134765625, 3.81396484375, 4.314453125, 4.81494140625, 5.3154296875, 5.81591796875, 6.31640625, 6.81689453125, 7.3173828125, 7.81787109375, 8.318359375, 8.81884765625, 9.3193359375, 9.81982421875, 10.3203125, 10.82080078125, 11.3212890625, 11.82177734375, 12.322265625, 12.82275390625, 13.3232421875, 13.82373046875, 14.32421875, 14.82470703125, 15.3251953125, 15.82568359375, 16.326171875, 16.82666015625, 17.3271484375, 17.82763671875, 18.328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 3.0, 7.0, 11.0, 21.0, 43.0, 154.0, 282.0, 272.0, 125.0, 44.0, 20.0, 7.0, 5.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-323.97894287109375, -317.2300720214844, -310.481201171875, -303.7322998046875, -296.9834289550781, -290.23455810546875, -283.4856872558594, -276.73681640625, -269.9879455566406, -263.23907470703125, -256.4902038574219, -249.74131774902344, -242.99244689941406, -236.24356079101562, -229.49468994140625, -222.74581909179688, -215.99691772460938, -209.248046875, -202.49916076660156, -195.7502899169922, -189.0014190673828, -182.25253295898438, -175.503662109375, -168.75479125976562, -162.00592041015625, -155.25704956054688, -148.50816345214844, -141.75929260253906, -135.0104217529297, -128.26153564453125, -121.51266479492188, -114.76378631591797, -108.01490783691406, -101.26602935791016, -94.51715850830078, -87.76828002929688, -81.01940155029297, -74.27052307128906, -67.52165222167969, -60.77277374267578, -54.02389907836914, -47.2750244140625, -40.526145935058594, -33.77727127075195, -27.02839469909668, -20.279518127441406, -13.530643463134766, -6.781764984130859, -0.03289031982421875, 6.7159857749938965, 13.464861869812012, 20.21373748779297, 26.962614059448242, 33.711490631103516, 40.460365295410156, 47.20924377441406, 53.9581184387207, 60.706993103027344, 67.45587158203125, 74.20474243164062, 80.95362091064453, 87.70249938964844, 94.45137023925781, 101.20025634765625, 107.94912719726562]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 3.0, 3.0, 7.0, 11.0, 14.0, 15.0, 23.0, 34.0, 22.0, 30.0, 40.0, 46.0, 46.0, 50.0, 44.0, 53.0, 58.0, 57.0, 53.0, 53.0, 47.0, 42.0, 38.0, 32.0, 33.0, 34.0, 23.0, 21.0, 8.0, 14.0, 10.0, 8.0, 3.0, 5.0, 7.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.70966339111328, -71.57650756835938, -69.443359375, -67.3102035522461, -65.17705535888672, -63.04389953613281, -60.91074752807617, -58.77759552001953, -56.644439697265625, -54.511287689208984, -52.378135681152344, -50.24497985839844, -48.1118278503418, -45.978675842285156, -43.845523834228516, -41.712371826171875, -39.579219818115234, -37.446067810058594, -35.31291580200195, -33.17976379394531, -31.046607971191406, -28.913455963134766, -26.780303955078125, -24.647151947021484, -22.51399803161621, -20.38084602355957, -18.247692108154297, -16.114540100097656, -13.9813871383667, -11.848234176635742, -9.715082168579102, -7.5819292068481445, -5.4487762451171875, -3.3156235218048096, -1.1824707984924316, 0.9506816864013672, 3.083834648132324, 5.216987609863281, 7.350139617919922, 9.483292579650879, 11.616445541381836, 13.749598503112793, 15.88275146484375, 18.01590347290039, 20.14905548095703, 22.282209396362305, 24.415361404418945, 26.54851531982422, 28.68166732788086, 30.8148193359375, 32.94797134399414, 35.08112335205078, 37.21427917480469, 39.34743118286133, 41.48058319091797, 43.61373519897461, 45.74688720703125, 47.88003921508789, 50.01319122314453, 52.14634704589844, 54.27949905395508, 56.41265106201172, 58.54580307006836, 60.678955078125, 62.812110900878906]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 1.0, 3.0, 4.0, 4.0, 6.0, 5.0, 16.0, 15.0, 17.0, 37.0, 48.0, 85.0, 76.0, 147.0, 238.0, 336.0, 501.0, 745.0, 1242.0, 1971.0, 3649.0, 7057.0, 14776.0, 34832.0, 88901.0, 253111.0, 387278.0, 152252.0, 55972.0, 22783.0, 10280.0, 4995.0, 2783.0, 1562.0, 975.0, 630.0, 388.0, 263.0, 185.0, 112.0, 90.0, 63.0, 44.0, 23.0, 26.0, 12.0, 8.0, 5.0, 1.0, 7.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.6622314453125, -8.355712890625, -8.0491943359375, -7.74267578125, -7.4361572265625, -7.129638671875, -6.8231201171875, -6.5166015625, -6.2100830078125, -5.903564453125, -5.5970458984375, -5.29052734375, -4.9840087890625, -4.677490234375, -4.3709716796875, -4.064453125, -3.7579345703125, -3.451416015625, -3.1448974609375, -2.83837890625, -2.5318603515625, -2.225341796875, -1.9188232421875, -1.6123046875, -1.3057861328125, -0.999267578125, -0.6927490234375, -0.38623046875, -0.0797119140625, 0.226806640625, 0.5333251953125, 0.83984375, 1.1463623046875, 1.452880859375, 1.7593994140625, 2.06591796875, 2.3724365234375, 2.678955078125, 2.9854736328125, 3.2919921875, 3.5985107421875, 3.905029296875, 4.2115478515625, 4.51806640625, 4.8245849609375, 5.131103515625, 5.4376220703125, 5.744140625, 6.0506591796875, 6.357177734375, 6.6636962890625, 6.97021484375, 7.2767333984375, 7.583251953125, 7.8897705078125, 8.1962890625, 8.5028076171875, 8.809326171875, 9.1158447265625, 9.42236328125, 9.7288818359375, 10.035400390625, 10.3419189453125, 10.6484375]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 0.0, 7.0, 15.0, 13.0, 21.0, 23.0, 21.0, 35.0, 46.0, 46.0, 55.0, 49.0, 50.0, 53.0, 51.0, 59.0, 74.0, 57.0, 41.0, 45.0, 34.0, 40.0, 30.0, 21.0, 17.0, 24.0, 13.0, 17.0, 7.0, 10.0, 10.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.09375, -3.9298095703125, -3.765869140625, -3.6019287109375, -3.43798828125, -3.2740478515625, -3.110107421875, -2.9461669921875, -2.7822265625, -2.6182861328125, -2.454345703125, -2.2904052734375, -2.12646484375, -1.9625244140625, -1.798583984375, -1.6346435546875, -1.470703125, -1.3067626953125, -1.142822265625, -0.9788818359375, -0.81494140625, -0.6510009765625, -0.487060546875, -0.3231201171875, -0.1591796875, 0.0047607421875, 0.168701171875, 0.3326416015625, 0.49658203125, 0.6605224609375, 0.824462890625, 0.9884033203125, 1.15234375, 1.3162841796875, 1.480224609375, 1.6441650390625, 1.80810546875, 1.9720458984375, 2.135986328125, 2.2999267578125, 2.4638671875, 2.6278076171875, 2.791748046875, 2.9556884765625, 3.11962890625, 3.2835693359375, 3.447509765625, 3.6114501953125, 3.775390625, 3.9393310546875, 4.103271484375, 4.2672119140625, 4.43115234375, 4.5950927734375, 4.759033203125, 4.9229736328125, 5.0869140625, 5.2508544921875, 5.414794921875, 5.5787353515625, 5.74267578125, 5.9066162109375, 6.070556640625, 6.2344970703125, 6.3984375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 10.0, 12.0, 13.0, 14.0, 25.0, 31.0, 63.0, 86.0, 128.0, 231.0, 403.0, 819.0, 2017.0, 6475.0, 39311.0, 649931.0, 316538.0, 24226.0, 4852.0, 1627.0, 765.0, 387.0, 213.0, 128.0, 82.0, 58.0, 33.0, 22.0, 12.0, 11.0, 11.0, 6.0, 4.0, 1.0, 0.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.765625, -20.02099609375, -19.2763671875, -18.53173828125, -17.787109375, -17.04248046875, -16.2978515625, -15.55322265625, -14.80859375, -14.06396484375, -13.3193359375, -12.57470703125, -11.830078125, -11.08544921875, -10.3408203125, -9.59619140625, -8.8515625, -8.10693359375, -7.3623046875, -6.61767578125, -5.873046875, -5.12841796875, -4.3837890625, -3.63916015625, -2.89453125, -2.14990234375, -1.4052734375, -0.66064453125, 0.083984375, 0.82861328125, 1.5732421875, 2.31787109375, 3.0625, 3.80712890625, 4.5517578125, 5.29638671875, 6.041015625, 6.78564453125, 7.5302734375, 8.27490234375, 9.01953125, 9.76416015625, 10.5087890625, 11.25341796875, 11.998046875, 12.74267578125, 13.4873046875, 14.23193359375, 14.9765625, 15.72119140625, 16.4658203125, 17.21044921875, 17.955078125, 18.69970703125, 19.4443359375, 20.18896484375, 20.93359375, 21.67822265625, 22.4228515625, 23.16748046875, 23.912109375, 24.65673828125, 25.4013671875, 26.14599609375, 26.890625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 6.0, 6.0, 6.0, 14.0, 9.0, 8.0, 12.0, 15.0, 16.0, 20.0, 21.0, 35.0, 37.0, 35.0, 38.0, 57.0, 61.0, 58.0, 60.0, 59.0, 54.0, 46.0, 56.0, 52.0, 33.0, 26.0, 33.0, 25.0, 22.0, 20.0, 18.0, 15.0, 12.0, 8.0, 5.0, 4.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.640625, -18.953125, -18.265625, -17.578125, -16.890625, -16.203125, -15.515625, -14.828125, -14.140625, -13.453125, -12.765625, -12.078125, -11.390625, -10.703125, -10.015625, -9.328125, -8.640625, -7.953125, -7.265625, -6.578125, -5.890625, -5.203125, -4.515625, -3.828125, -3.140625, -2.453125, -1.765625, -1.078125, -0.390625, 0.296875, 0.984375, 1.671875, 2.359375, 3.046875, 3.734375, 4.421875, 5.109375, 5.796875, 6.484375, 7.171875, 7.859375, 8.546875, 9.234375, 9.921875, 10.609375, 11.296875, 11.984375, 12.671875, 13.359375, 14.046875, 14.734375, 15.421875, 16.109375, 16.796875, 17.484375, 18.171875, 18.859375, 19.546875, 20.234375, 20.921875, 21.609375, 22.296875, 22.984375, 23.671875, 24.359375]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 4.0, 6.0, 6.0, 12.0, 16.0, 31.0, 40.0, 77.0, 137.0, 272.0, 585.0, 1412.0, 4773.0, 24360.0, 398572.0, 581404.0, 28568.0, 5431.0, 1610.0, 603.0, 265.0, 150.0, 85.0, 46.0, 33.0, 23.0, 14.0, 8.0, 5.0, 2.0, 3.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.6796875, -10.4129638671875, -10.146240234375, -9.8795166015625, -9.61279296875, -9.3460693359375, -9.079345703125, -8.8126220703125, -8.5458984375, -8.2791748046875, -8.012451171875, -7.7457275390625, -7.47900390625, -7.2122802734375, -6.945556640625, -6.6788330078125, -6.412109375, -6.1453857421875, -5.878662109375, -5.6119384765625, -5.34521484375, -5.0784912109375, -4.811767578125, -4.5450439453125, -4.2783203125, -4.0115966796875, -3.744873046875, -3.4781494140625, -3.21142578125, -2.9447021484375, -2.677978515625, -2.4112548828125, -2.14453125, -1.8778076171875, -1.611083984375, -1.3443603515625, -1.07763671875, -0.8109130859375, -0.544189453125, -0.2774658203125, -0.0107421875, 0.2559814453125, 0.522705078125, 0.7894287109375, 1.05615234375, 1.3228759765625, 1.589599609375, 1.8563232421875, 2.123046875, 2.3897705078125, 2.656494140625, 2.9232177734375, 3.18994140625, 3.4566650390625, 3.723388671875, 3.9901123046875, 4.2568359375, 4.5235595703125, 4.790283203125, 5.0570068359375, 5.32373046875, 5.5904541015625, 5.857177734375, 6.1239013671875, 6.390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 6.0, 5.0, 4.0, 7.0, 7.0, 9.0, 15.0, 17.0, 16.0, 27.0, 45.0, 58.0, 69.0, 109.0, 131.0, 128.0, 90.0, 66.0, 59.0, 33.0, 35.0, 19.0, 8.0, 7.0, 8.0, 7.0, 6.0, 6.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001041412353515625, -0.0010052919387817383, -0.0009691715240478516, -0.0009330511093139648, -0.0008969306945800781, -0.0008608102798461914, -0.0008246898651123047, -0.000788569450378418, -0.0007524490356445312, -0.0007163286209106445, -0.0006802082061767578, -0.0006440877914428711, -0.0006079673767089844, -0.0005718469619750977, -0.0005357265472412109, -0.0004996061325073242, -0.0004634857177734375, -0.0004273653030395508, -0.00039124488830566406, -0.00035512447357177734, -0.0003190040588378906, -0.0002828836441040039, -0.0002467632293701172, -0.00021064281463623047, -0.00017452239990234375, -0.00013840198516845703, -0.00010228157043457031, -6.61611557006836e-05, -3.0040740966796875e-05, 6.079673767089844e-06, 4.220008850097656e-05, 7.832050323486328e-05, 0.00011444091796875, 0.00015056133270263672, 0.00018668174743652344, 0.00022280216217041016, 0.0002589225769042969, 0.0002950429916381836, 0.0003311634063720703, 0.00036728382110595703, 0.00040340423583984375, 0.00043952465057373047, 0.0004756450653076172, 0.0005117654800415039, 0.0005478858947753906, 0.0005840063095092773, 0.0006201267242431641, 0.0006562471389770508, 0.0006923675537109375, 0.0007284879684448242, 0.0007646083831787109, 0.0008007287979125977, 0.0008368492126464844, 0.0008729696273803711, 0.0009090900421142578, 0.0009452104568481445, 0.0009813308715820312, 0.001017451286315918, 0.0010535717010498047, 0.0010896921157836914, 0.0011258125305175781, 0.0011619329452514648, 0.0011980533599853516, 0.0012341737747192383, 0.001270294189453125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 5.0, 4.0, 3.0, 2.0, 8.0, 5.0, 9.0, 17.0, 13.0, 31.0, 59.0, 63.0, 69.0, 97.0, 178.0, 308.0, 546.0, 1081.0, 2134.0, 6084.0, 23758.0, 171669.0, 727649.0, 91078.0, 15430.0, 4560.0, 1693.0, 786.0, 424.0, 241.0, 166.0, 110.0, 72.0, 54.0, 47.0, 27.0, 20.0, 16.0, 14.0, 9.0, 6.0, 3.0, 4.0, 4.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.21484375, -5.00921630859375, -4.8035888671875, -4.59796142578125, -4.392333984375, -4.18670654296875, -3.9810791015625, -3.77545166015625, -3.56982421875, -3.36419677734375, -3.1585693359375, -2.95294189453125, -2.747314453125, -2.54168701171875, -2.3360595703125, -2.13043212890625, -1.9248046875, -1.71917724609375, -1.5135498046875, -1.30792236328125, -1.102294921875, -0.89666748046875, -0.6910400390625, -0.48541259765625, -0.27978515625, -0.07415771484375, 0.1314697265625, 0.33709716796875, 0.542724609375, 0.74835205078125, 0.9539794921875, 1.15960693359375, 1.365234375, 1.57086181640625, 1.7764892578125, 1.98211669921875, 2.187744140625, 2.39337158203125, 2.5989990234375, 2.80462646484375, 3.01025390625, 3.21588134765625, 3.4215087890625, 3.62713623046875, 3.832763671875, 4.03839111328125, 4.2440185546875, 4.44964599609375, 4.6552734375, 4.86090087890625, 5.0665283203125, 5.27215576171875, 5.477783203125, 5.68341064453125, 5.8890380859375, 6.09466552734375, 6.30029296875, 6.50592041015625, 6.7115478515625, 6.91717529296875, 7.122802734375, 7.32843017578125, 7.5340576171875, 7.73968505859375, 7.9453125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 3.0, 10.0, 10.0, 10.0, 16.0, 22.0, 19.0, 28.0, 34.0, 55.0, 51.0, 63.0, 85.0, 91.0, 88.0, 76.0, 78.0, 35.0, 36.0, 35.0, 26.0, 23.0, 24.0, 25.0, 12.0, 12.0, 10.0, 5.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.43359375, -5.245361328125, -5.05712890625, -4.868896484375, -4.6806640625, -4.492431640625, -4.30419921875, -4.115966796875, -3.927734375, -3.739501953125, -3.55126953125, -3.363037109375, -3.1748046875, -2.986572265625, -2.79833984375, -2.610107421875, -2.421875, -2.233642578125, -2.04541015625, -1.857177734375, -1.6689453125, -1.480712890625, -1.29248046875, -1.104248046875, -0.916015625, -0.727783203125, -0.53955078125, -0.351318359375, -0.1630859375, 0.025146484375, 0.21337890625, 0.401611328125, 0.58984375, 0.778076171875, 0.96630859375, 1.154541015625, 1.3427734375, 1.531005859375, 1.71923828125, 1.907470703125, 2.095703125, 2.283935546875, 2.47216796875, 2.660400390625, 2.8486328125, 3.036865234375, 3.22509765625, 3.413330078125, 3.6015625, 3.789794921875, 3.97802734375, 4.166259765625, 4.3544921875, 4.542724609375, 4.73095703125, 4.919189453125, 5.107421875, 5.295654296875, 5.48388671875, 5.672119140625, 5.8603515625, 6.048583984375, 6.23681640625, 6.425048828125, 6.61328125]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 6.0, 2.0, 7.0, 11.0, 11.0, 29.0, 47.0, 97.0, 130.0, 207.0, 184.0, 134.0, 52.0, 39.0, 22.0, 9.0, 7.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.02127075195312, -166.4908447265625, -161.96041870117188, -157.42999267578125, -152.89956665039062, -148.369140625, -143.83871459960938, -139.30828857421875, -134.77786254882812, -130.2474365234375, -125.71701049804688, -121.18658447265625, -116.65615844726562, -112.125732421875, -107.5953140258789, -103.06488800048828, -98.53446960449219, -94.00404357910156, -89.47361755371094, -84.94319152832031, -80.41276550292969, -75.88233947753906, -71.35192108154297, -66.82149505615234, -62.29106903076172, -57.760643005371094, -53.23021697998047, -48.69979476928711, -44.169368743896484, -39.63894271850586, -35.1085205078125, -30.578094482421875, -26.047653198242188, -21.517227172851562, -16.98680305480957, -12.456377983093262, -7.925952911376953, -3.395526885986328, 1.134897232055664, 5.665321350097656, 10.195747375488281, 14.72617244720459, 19.2565975189209, 23.78702163696289, 28.317447662353516, 32.84787368774414, 37.3782958984375, 41.908721923828125, 46.43914794921875, 50.969573974609375, 55.5, 60.03042221069336, 64.56085205078125, 69.09127807617188, 73.62169647216797, 78.1521224975586, 82.68254852294922, 87.21297454833984, 91.74340057373047, 96.2738265991211, 100.80424499511719, 105.33467102050781, 109.86509704589844, 114.39552307128906, 118.92594909667969]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 5.0, 2.0, 7.0, 5.0, 15.0, 13.0, 17.0, 15.0, 27.0, 20.0, 26.0, 30.0, 24.0, 41.0, 31.0, 50.0, 44.0, 67.0, 65.0, 52.0, 65.0, 58.0, 35.0, 43.0, 32.0, 41.0, 31.0, 24.0, 16.0, 23.0, 18.0, 15.0, 11.0, 8.0, 3.0, 9.0, 5.0, 6.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-89.40168762207031, -86.83890533447266, -84.27611541748047, -81.71333312988281, -79.15055084228516, -76.5877685546875, -74.02497863769531, -71.46219635009766, -68.8994140625, -66.33663177490234, -63.77384567260742, -61.2110595703125, -58.648277282714844, -56.08549118041992, -53.522705078125, -50.959922790527344, -48.39713668823242, -45.8343505859375, -43.271568298339844, -40.70878219604492, -38.145999908447266, -35.583213806152344, -33.02043151855469, -30.457645416259766, -27.894861221313477, -25.332077026367188, -22.7692928314209, -20.20650863647461, -17.643722534179688, -15.080939292907715, -12.51815414428711, -9.95536994934082, -7.392585754394531, -4.829801559448242, -2.267016887664795, 0.29576778411865234, 2.8585519790649414, 5.4213361740112305, 7.984121322631836, 10.546905517578125, 13.109689712524414, 15.672473907470703, 18.235258102416992, 20.79804229736328, 23.360828399658203, 25.92361068725586, 28.48639678955078, 31.04918098449707, 33.61196517944336, 36.17475128173828, 38.73753356933594, 41.30031967163086, 43.863101959228516, 46.42588806152344, 48.988670349121094, 51.551456451416016, 54.11424255371094, 56.67702865600586, 59.239810943603516, 61.80259704589844, 64.3653793334961, 66.92816162109375, 69.49095153808594, 72.0537338256836, 74.61651611328125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 4.0, 2.0, 14.0, 13.0, 19.0, 33.0, 51.0, 83.0, 178.0, 494.0, 3460.0, 3793231.0, 393432.0, 2491.0, 407.0, 148.0, 76.0, 43.0, 30.0, 20.0, 15.0, 8.0, 6.0, 2.0, 6.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.375, -63.69580078125, -62.0166015625, -60.33740234375, -58.658203125, -56.97900390625, -55.2998046875, -53.62060546875, -51.94140625, -50.26220703125, -48.5830078125, -46.90380859375, -45.224609375, -43.54541015625, -41.8662109375, -40.18701171875, -38.5078125, -36.82861328125, -35.1494140625, -33.47021484375, -31.791015625, -30.11181640625, -28.4326171875, -26.75341796875, -25.07421875, -23.39501953125, -21.7158203125, -20.03662109375, -18.357421875, -16.67822265625, -14.9990234375, -13.31982421875, -11.640625, -9.96142578125, -8.2822265625, -6.60302734375, -4.923828125, -3.24462890625, -1.5654296875, 0.11376953125, 1.79296875, 3.47216796875, 5.1513671875, 6.83056640625, 8.509765625, 10.18896484375, 11.8681640625, 13.54736328125, 15.2265625, 16.90576171875, 18.5849609375, 20.26416015625, 21.943359375, 23.62255859375, 25.3017578125, 26.98095703125, 28.66015625, 30.33935546875, 32.0185546875, 33.69775390625, 35.376953125, 37.05615234375, 38.7353515625, 40.41455078125, 42.09375]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 7.0, 17.0, 22.0, 22.0, 44.0, 52.0, 69.0, 86.0, 84.0, 86.0, 104.0, 82.0, 85.0, 55.0, 57.0, 31.0, 35.0, 26.0, 19.0, 13.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.0078125, -9.75823974609375, -9.5086669921875, -9.25909423828125, -9.009521484375, -8.75994873046875, -8.5103759765625, -8.26080322265625, -8.01123046875, -7.76165771484375, -7.5120849609375, -7.26251220703125, -7.012939453125, -6.76336669921875, -6.5137939453125, -6.26422119140625, -6.0146484375, -5.76507568359375, -5.5155029296875, -5.26593017578125, -5.016357421875, -4.76678466796875, -4.5172119140625, -4.26763916015625, -4.01806640625, -3.76849365234375, -3.5189208984375, -3.26934814453125, -3.019775390625, -2.77020263671875, -2.5206298828125, -2.27105712890625, -2.021484375, -1.77191162109375, -1.5223388671875, -1.27276611328125, -1.023193359375, -0.77362060546875, -0.5240478515625, -0.27447509765625, -0.02490234375, 0.22467041015625, 0.4742431640625, 0.72381591796875, 0.973388671875, 1.22296142578125, 1.4725341796875, 1.72210693359375, 1.9716796875, 2.22125244140625, 2.4708251953125, 2.72039794921875, 2.969970703125, 3.21954345703125, 3.4691162109375, 3.71868896484375, 3.96826171875, 4.21783447265625, 4.4674072265625, 4.71697998046875, 4.966552734375, 5.21612548828125, 5.4656982421875, 5.71527099609375, 5.96484375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 8.0, 6.0, 15.0, 16.0, 25.0, 34.0, 60.0, 64.0, 128.0, 195.0, 379.0, 677.0, 1309.0, 2739.0, 6917.0, 20299.0, 85019.0, 2219743.0, 1741078.0, 81150.0, 20670.0, 7291.0, 3142.0, 1461.0, 740.0, 410.0, 251.0, 133.0, 100.0, 64.0, 51.0, 29.0, 29.0, 14.0, 17.0, 5.0, 9.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.3046875, -10.951171875, -10.59765625, -10.244140625, -9.890625, -9.537109375, -9.18359375, -8.830078125, -8.4765625, -8.123046875, -7.76953125, -7.416015625, -7.0625, -6.708984375, -6.35546875, -6.001953125, -5.6484375, -5.294921875, -4.94140625, -4.587890625, -4.234375, -3.880859375, -3.52734375, -3.173828125, -2.8203125, -2.466796875, -2.11328125, -1.759765625, -1.40625, -1.052734375, -0.69921875, -0.345703125, 0.0078125, 0.361328125, 0.71484375, 1.068359375, 1.421875, 1.775390625, 2.12890625, 2.482421875, 2.8359375, 3.189453125, 3.54296875, 3.896484375, 4.25, 4.603515625, 4.95703125, 5.310546875, 5.6640625, 6.017578125, 6.37109375, 6.724609375, 7.078125, 7.431640625, 7.78515625, 8.138671875, 8.4921875, 8.845703125, 9.19921875, 9.552734375, 9.90625, 10.259765625, 10.61328125, 10.966796875, 11.3203125]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 9.0, 7.0, 16.0, 17.0, 32.0, 36.0, 67.0, 110.0, 327.0, 902.0, 1487.0, 575.0, 196.0, 82.0, 62.0, 48.0, 30.0, 14.0, 19.0, 8.0, 11.0, 6.0, 4.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.9921875, -13.530029296875, -13.06787109375, -12.605712890625, -12.1435546875, -11.681396484375, -11.21923828125, -10.757080078125, -10.294921875, -9.832763671875, -9.37060546875, -8.908447265625, -8.4462890625, -7.984130859375, -7.52197265625, -7.059814453125, -6.59765625, -6.135498046875, -5.67333984375, -5.211181640625, -4.7490234375, -4.286865234375, -3.82470703125, -3.362548828125, -2.900390625, -2.438232421875, -1.97607421875, -1.513916015625, -1.0517578125, -0.589599609375, -0.12744140625, 0.334716796875, 0.796875, 1.259033203125, 1.72119140625, 2.183349609375, 2.6455078125, 3.107666015625, 3.56982421875, 4.031982421875, 4.494140625, 4.956298828125, 5.41845703125, 5.880615234375, 6.3427734375, 6.804931640625, 7.26708984375, 7.729248046875, 8.19140625, 8.653564453125, 9.11572265625, 9.577880859375, 10.0400390625, 10.502197265625, 10.96435546875, 11.426513671875, 11.888671875, 12.350830078125, 12.81298828125, 13.275146484375, 13.7373046875, 14.199462890625, 14.66162109375, 15.123779296875, 15.5859375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 17.0, 54.0, 273.0, 391.0, 174.0, 39.0, 22.0, 8.0, 5.0, 3.0, 3.0, 2.0, 6.0, 4.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.26020812988281, -61.57416534423828, -54.88812255859375, -48.202083587646484, -41.51604080200195, -34.82999801635742, -28.143959045410156, -21.457916259765625, -14.771873474121094, -8.085831642150879, -1.399789810180664, 5.286251068115234, 11.972293853759766, 18.658336639404297, 25.344375610351562, 32.030418395996094, 38.716461181640625, 45.402503967285156, 52.08854675292969, 58.77458572387695, 65.46063232421875, 72.14666748046875, 78.83271026611328, 85.51875305175781, 92.20479583740234, 98.89083862304688, 105.5768814086914, 112.26292419433594, 118.94895935058594, 125.635009765625, 132.321044921875, 139.007080078125, 145.69314575195312, 152.37918090820312, 159.0652313232422, 165.7512664794922, 172.43731689453125, 179.12335205078125, 185.80938720703125, 192.4954376220703, 199.18148803710938, 205.86752319335938, 212.55357360839844, 219.23960876464844, 225.9256591796875, 232.6116943359375, 239.2977294921875, 245.98377990722656, 252.66981506347656, 259.3558654785156, 266.0419006347656, 272.7279357910156, 279.4139709472656, 286.10003662109375, 292.78607177734375, 299.47210693359375, 306.15814208984375, 312.84417724609375, 319.53021240234375, 326.2162780761719, 332.9023132324219, 339.5883483886719, 346.2743835449219, 352.96044921875, 359.646484375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 3.0, 4.0, 7.0, 9.0, 17.0, 17.0, 25.0, 41.0, 32.0, 44.0, 41.0, 52.0, 78.0, 62.0, 58.0, 62.0, 57.0, 41.0, 58.0, 54.0, 49.0, 40.0, 35.0, 30.0, 21.0, 16.0, 14.0, 16.0, 6.0, 7.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.45680236816406, -48.3878173828125, -46.3188362121582, -44.24985122680664, -42.180870056152344, -40.11188507080078, -38.04290008544922, -35.973915100097656, -33.90493392944336, -31.83595085144043, -29.7669677734375, -27.697982788085938, -25.628999710083008, -23.560016632080078, -21.491031646728516, -19.422048568725586, -17.353065490722656, -15.284082412719727, -13.21509838104248, -11.146114349365234, -9.077131271362305, -7.008148193359375, -4.939164161682129, -2.870180130004883, -0.8011970520019531, 1.2677865028381348, 3.3367700576782227, 5.4057536125183105, 7.474737167358398, 9.543720245361328, 11.612704277038574, 13.68168830871582, 15.75067138671875, 17.81965446472168, 19.88863754272461, 21.957622528076172, 24.0266056060791, 26.09558868408203, 28.164573669433594, 30.233556747436523, 32.30253982543945, 34.371524810791016, 36.44050598144531, 38.509490966796875, 40.57847595214844, 42.647457122802734, 44.7164421081543, 46.785423278808594, 48.854408264160156, 50.92339324951172, 52.992374420166016, 55.06135940551758, 57.130340576171875, 59.19932556152344, 61.268310546875, 63.33729553222656, 65.40628051757812, 67.47526550292969, 69.54425048828125, 71.61322784423828, 73.68221282958984, 75.7511978149414, 77.82018280029297, 79.88916778564453, 81.95814514160156]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 9.0, 10.0, 7.0, 21.0, 26.0, 20.0, 27.0, 63.0, 66.0, 108.0, 155.0, 214.0, 355.0, 631.0, 1005.0, 1784.0, 3622.0, 7951.0, 19529.0, 54320.0, 168365.0, 445453.0, 228857.0, 71076.0, 25298.0, 9821.0, 4516.0, 2157.0, 1185.0, 683.0, 400.0, 278.0, 173.0, 120.0, 87.0, 43.0, 32.0, 21.0, 28.0, 13.0, 6.0, 5.0, 4.0, 11.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-10.25, -9.9451904296875, -9.640380859375, -9.3355712890625, -9.03076171875, -8.7259521484375, -8.421142578125, -8.1163330078125, -7.8115234375, -7.5067138671875, -7.201904296875, -6.8970947265625, -6.59228515625, -6.2874755859375, -5.982666015625, -5.6778564453125, -5.373046875, -5.0682373046875, -4.763427734375, -4.4586181640625, -4.15380859375, -3.8489990234375, -3.544189453125, -3.2393798828125, -2.9345703125, -2.6297607421875, -2.324951171875, -2.0201416015625, -1.71533203125, -1.4105224609375, -1.105712890625, -0.8009033203125, -0.49609375, -0.1912841796875, 0.113525390625, 0.4183349609375, 0.72314453125, 1.0279541015625, 1.332763671875, 1.6375732421875, 1.9423828125, 2.2471923828125, 2.552001953125, 2.8568115234375, 3.16162109375, 3.4664306640625, 3.771240234375, 4.0760498046875, 4.380859375, 4.6856689453125, 4.990478515625, 5.2952880859375, 5.60009765625, 5.9049072265625, 6.209716796875, 6.5145263671875, 6.8193359375, 7.1241455078125, 7.428955078125, 7.7337646484375, 8.03857421875, 8.3433837890625, 8.648193359375, 8.9530029296875, 9.2578125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [5.0, 0.0, 0.0, 1.0, 2.0, 7.0, 5.0, 8.0, 10.0, 11.0, 13.0, 15.0, 25.0, 27.0, 26.0, 34.0, 40.0, 37.0, 38.0, 41.0, 52.0, 58.0, 55.0, 54.0, 52.0, 56.0, 55.0, 30.0, 40.0, 40.0, 35.0, 22.0, 29.0, 26.0, 17.0, 14.0, 7.0, 8.0, 8.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.408203125, -3.260223388671875, -3.11224365234375, -2.964263916015625, -2.8162841796875, -2.668304443359375, -2.52032470703125, -2.372344970703125, -2.224365234375, -2.076385498046875, -1.92840576171875, -1.780426025390625, -1.6324462890625, -1.484466552734375, -1.33648681640625, -1.188507080078125, -1.04052734375, -0.892547607421875, -0.74456787109375, -0.596588134765625, -0.4486083984375, -0.300628662109375, -0.15264892578125, -0.004669189453125, 0.143310546875, 0.291290283203125, 0.43927001953125, 0.587249755859375, 0.7352294921875, 0.883209228515625, 1.03118896484375, 1.179168701171875, 1.3271484375, 1.475128173828125, 1.62310791015625, 1.771087646484375, 1.9190673828125, 2.067047119140625, 2.21502685546875, 2.363006591796875, 2.510986328125, 2.658966064453125, 2.80694580078125, 2.954925537109375, 3.1029052734375, 3.250885009765625, 3.39886474609375, 3.546844482421875, 3.69482421875, 3.842803955078125, 3.99078369140625, 4.138763427734375, 4.2867431640625, 4.434722900390625, 4.58270263671875, 4.730682373046875, 4.878662109375, 5.026641845703125, 5.17462158203125, 5.322601318359375, 5.4705810546875, 5.618560791015625, 5.76654052734375, 5.914520263671875, 6.0625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 8.0, 13.0, 19.0, 39.0, 36.0, 47.0, 101.0, 170.0, 259.0, 524.0, 1001.0, 2405.0, 7045.0, 31429.0, 233871.0, 672907.0, 77990.0, 13779.0, 3884.0, 1423.0, 639.0, 370.0, 196.0, 132.0, 70.0, 52.0, 39.0, 27.0, 10.0, 17.0, 11.0, 12.0, 3.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-16.6875, -16.1357421875, -15.583984375, -15.0322265625, -14.48046875, -13.9287109375, -13.376953125, -12.8251953125, -12.2734375, -11.7216796875, -11.169921875, -10.6181640625, -10.06640625, -9.5146484375, -8.962890625, -8.4111328125, -7.859375, -7.3076171875, -6.755859375, -6.2041015625, -5.65234375, -5.1005859375, -4.548828125, -3.9970703125, -3.4453125, -2.8935546875, -2.341796875, -1.7900390625, -1.23828125, -0.6865234375, -0.134765625, 0.4169921875, 0.96875, 1.5205078125, 2.072265625, 2.6240234375, 3.17578125, 3.7275390625, 4.279296875, 4.8310546875, 5.3828125, 5.9345703125, 6.486328125, 7.0380859375, 7.58984375, 8.1416015625, 8.693359375, 9.2451171875, 9.796875, 10.3486328125, 10.900390625, 11.4521484375, 12.00390625, 12.5556640625, 13.107421875, 13.6591796875, 14.2109375, 14.7626953125, 15.314453125, 15.8662109375, 16.41796875, 16.9697265625, 17.521484375, 18.0732421875, 18.625]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 6.0, 10.0, 6.0, 17.0, 12.0, 17.0, 29.0, 23.0, 34.0, 33.0, 37.0, 45.0, 38.0, 50.0, 44.0, 40.0, 52.0, 46.0, 45.0, 31.0, 44.0, 49.0, 35.0, 30.0, 43.0, 33.0, 25.0, 22.0, 14.0, 8.0, 12.0, 11.0, 11.0, 8.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0], "bins": [-15.046875, -14.549560546875, -14.05224609375, -13.554931640625, -13.0576171875, -12.560302734375, -12.06298828125, -11.565673828125, -11.068359375, -10.571044921875, -10.07373046875, -9.576416015625, -9.0791015625, -8.581787109375, -8.08447265625, -7.587158203125, -7.08984375, -6.592529296875, -6.09521484375, -5.597900390625, -5.1005859375, -4.603271484375, -4.10595703125, -3.608642578125, -3.111328125, -2.614013671875, -2.11669921875, -1.619384765625, -1.1220703125, -0.624755859375, -0.12744140625, 0.369873046875, 0.8671875, 1.364501953125, 1.86181640625, 2.359130859375, 2.8564453125, 3.353759765625, 3.85107421875, 4.348388671875, 4.845703125, 5.343017578125, 5.84033203125, 6.337646484375, 6.8349609375, 7.332275390625, 7.82958984375, 8.326904296875, 8.82421875, 9.321533203125, 9.81884765625, 10.316162109375, 10.8134765625, 11.310791015625, 11.80810546875, 12.305419921875, 12.802734375, 13.300048828125, 13.79736328125, 14.294677734375, 14.7919921875, 15.289306640625, 15.78662109375, 16.283935546875, 16.78125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 4.0, 5.0, 15.0, 21.0, 22.0, 26.0, 43.0, 87.0, 144.0, 362.0, 999.0, 4004.0, 29955.0, 794061.0, 204478.0, 11049.0, 2086.0, 599.0, 262.0, 137.0, 66.0, 39.0, 31.0, 16.0, 9.0, 6.0, 11.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0], "bins": [-7.7578125, -7.505859375, -7.25390625, -7.001953125, -6.75, -6.498046875, -6.24609375, -5.994140625, -5.7421875, -5.490234375, -5.23828125, -4.986328125, -4.734375, -4.482421875, -4.23046875, -3.978515625, -3.7265625, -3.474609375, -3.22265625, -2.970703125, -2.71875, -2.466796875, -2.21484375, -1.962890625, -1.7109375, -1.458984375, -1.20703125, -0.955078125, -0.703125, -0.451171875, -0.19921875, 0.052734375, 0.3046875, 0.556640625, 0.80859375, 1.060546875, 1.3125, 1.564453125, 1.81640625, 2.068359375, 2.3203125, 2.572265625, 2.82421875, 3.076171875, 3.328125, 3.580078125, 3.83203125, 4.083984375, 4.3359375, 4.587890625, 4.83984375, 5.091796875, 5.34375, 5.595703125, 5.84765625, 6.099609375, 6.3515625, 6.603515625, 6.85546875, 7.107421875, 7.359375, 7.611328125, 7.86328125, 8.115234375, 8.3671875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 3.0, 4.0, 12.0, 6.0, 9.0, 19.0, 29.0, 50.0, 62.0, 87.0, 150.0, 134.0, 145.0, 106.0, 84.0, 26.0, 26.0, 25.0, 9.0, 10.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.002086639404296875, -0.002041757106781006, -0.0019968748092651367, -0.0019519925117492676, -0.0019071102142333984, -0.0018622279167175293, -0.0018173456192016602, -0.001772463321685791, -0.0017275810241699219, -0.0016826987266540527, -0.0016378164291381836, -0.0015929341316223145, -0.0015480518341064453, -0.0015031695365905762, -0.001458287239074707, -0.0014134049415588379, -0.0013685226440429688, -0.0013236403465270996, -0.0012787580490112305, -0.0012338757514953613, -0.0011889934539794922, -0.001144111156463623, -0.001099228858947754, -0.0010543465614318848, -0.0010094642639160156, -0.0009645819664001465, -0.0009196996688842773, -0.0008748173713684082, -0.0008299350738525391, -0.0007850527763366699, -0.0007401704788208008, -0.0006952881813049316, -0.0006504058837890625, -0.0006055235862731934, -0.0005606412887573242, -0.0005157589912414551, -0.00047087669372558594, -0.0004259943962097168, -0.00038111209869384766, -0.0003362298011779785, -0.0002913475036621094, -0.00024646520614624023, -0.0002015829086303711, -0.00015670061111450195, -0.00011181831359863281, -6.693601608276367e-05, -2.205371856689453e-05, 2.282857894897461e-05, 6.771087646484375e-05, 0.00011259317398071289, 0.00015747547149658203, 0.00020235776901245117, 0.0002472400665283203, 0.00029212236404418945, 0.0003370046615600586, 0.00038188695907592773, 0.0004267692565917969, 0.000471651554107666, 0.0005165338516235352, 0.0005614161491394043, 0.0006062984466552734, 0.0006511807441711426, 0.0006960630416870117, 0.0007409453392028809, 0.00078582763671875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 6.0, 2.0, 3.0, 7.0, 8.0, 11.0, 18.0, 18.0, 36.0, 63.0, 89.0, 153.0, 333.0, 825.0, 2465.0, 12026.0, 147405.0, 827352.0, 48874.0, 6090.0, 1576.0, 583.0, 263.0, 129.0, 83.0, 54.0, 32.0, 20.0, 12.0, 7.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.72265625, -7.49761962890625, -7.2725830078125, -7.04754638671875, -6.822509765625, -6.59747314453125, -6.3724365234375, -6.14739990234375, -5.92236328125, -5.69732666015625, -5.4722900390625, -5.24725341796875, -5.022216796875, -4.79718017578125, -4.5721435546875, -4.34710693359375, -4.1220703125, -3.89703369140625, -3.6719970703125, -3.44696044921875, -3.221923828125, -2.99688720703125, -2.7718505859375, -2.54681396484375, -2.32177734375, -2.09674072265625, -1.8717041015625, -1.64666748046875, -1.421630859375, -1.19659423828125, -0.9715576171875, -0.74652099609375, -0.521484375, -0.29644775390625, -0.0714111328125, 0.15362548828125, 0.378662109375, 0.60369873046875, 0.8287353515625, 1.05377197265625, 1.27880859375, 1.50384521484375, 1.7288818359375, 1.95391845703125, 2.178955078125, 2.40399169921875, 2.6290283203125, 2.85406494140625, 3.0791015625, 3.30413818359375, 3.5291748046875, 3.75421142578125, 3.979248046875, 4.20428466796875, 4.4293212890625, 4.65435791015625, 4.87939453125, 5.10443115234375, 5.3294677734375, 5.55450439453125, 5.779541015625, 6.00457763671875, 6.2296142578125, 6.45465087890625, 6.6796875]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 6.0, 3.0, 5.0, 7.0, 15.0, 11.0, 13.0, 21.0, 21.0, 38.0, 59.0, 51.0, 88.0, 73.0, 96.0, 89.0, 81.0, 65.0, 41.0, 47.0, 41.0, 24.0, 26.0, 12.0, 16.0, 11.0, 8.0, 10.0, 5.0, 5.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-4.43359375, -4.2994384765625, -4.165283203125, -4.0311279296875, -3.89697265625, -3.7628173828125, -3.628662109375, -3.4945068359375, -3.3603515625, -3.2261962890625, -3.092041015625, -2.9578857421875, -2.82373046875, -2.6895751953125, -2.555419921875, -2.4212646484375, -2.287109375, -2.1529541015625, -2.018798828125, -1.8846435546875, -1.75048828125, -1.6163330078125, -1.482177734375, -1.3480224609375, -1.2138671875, -1.0797119140625, -0.945556640625, -0.8114013671875, -0.67724609375, -0.5430908203125, -0.408935546875, -0.2747802734375, -0.140625, -0.0064697265625, 0.127685546875, 0.2618408203125, 0.39599609375, 0.5301513671875, 0.664306640625, 0.7984619140625, 0.9326171875, 1.0667724609375, 1.200927734375, 1.3350830078125, 1.46923828125, 1.6033935546875, 1.737548828125, 1.8717041015625, 2.005859375, 2.1400146484375, 2.274169921875, 2.4083251953125, 2.54248046875, 2.6766357421875, 2.810791015625, 2.9449462890625, 3.0791015625, 3.2132568359375, 3.347412109375, 3.4815673828125, 3.61572265625, 3.7498779296875, 3.884033203125, 4.0181884765625, 4.15234375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 13.0, 34.0, 83.0, 250.0, 362.0, 166.0, 54.0, 21.0, 10.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-200.30690002441406, -194.11257934570312, -187.9182586669922, -181.72393798828125, -175.5296173095703, -169.33529663085938, -163.1409912109375, -156.9466552734375, -150.75234985351562, -144.5580291748047, -138.36370849609375, -132.1693878173828, -125.97506713867188, -119.78074645996094, -113.58643341064453, -107.3921127319336, -101.19778442382812, -95.00346374511719, -88.80914306640625, -82.61482238769531, -76.42050170898438, -70.22618103027344, -64.03186798095703, -57.837547302246094, -51.643226623535156, -45.44890594482422, -39.25458526611328, -33.06026840209961, -26.865947723388672, -20.671627044677734, -14.477310180664062, -8.282989501953125, -2.08868408203125, 4.105635643005371, 10.299955368041992, 16.494274139404297, 22.688594818115234, 28.882915496826172, 35.077232360839844, 41.27155303955078, 47.46587371826172, 53.660194396972656, 59.854515075683594, 66.048828125, 72.24314880371094, 78.43746948242188, 84.63179016113281, 90.82611083984375, 97.02043151855469, 103.21475219726562, 109.40907287597656, 115.6033935546875, 121.79771423339844, 127.99203491210938, 134.18634033203125, 140.38067626953125, 146.57498168945312, 152.76930236816406, 158.963623046875, 165.15794372558594, 171.35226440429688, 177.5465850830078, 183.74090576171875, 189.93521118164062, 196.12954711914062]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 1.0, 2.0, 5.0, 3.0, 8.0, 6.0, 10.0, 7.0, 13.0, 13.0, 10.0, 11.0, 19.0, 19.0, 20.0, 26.0, 24.0, 26.0, 35.0, 21.0, 44.0, 44.0, 51.0, 54.0, 47.0, 53.0, 43.0, 35.0, 44.0, 37.0, 33.0, 21.0, 36.0, 32.0, 18.0, 22.0, 24.0, 12.0, 13.0, 8.0, 10.0, 9.0, 5.0, 8.0, 2.0, 4.0, 4.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0], "bins": [-57.63092041015625, -55.8527717590332, -54.07462692260742, -52.296478271484375, -50.51832962036133, -48.74018096923828, -46.9620361328125, -45.18388748168945, -43.405738830566406, -41.62759017944336, -39.84944534301758, -38.07129669189453, -36.293148040771484, -34.51499938964844, -32.736854553222656, -30.95870590209961, -29.180559158325195, -27.40241241455078, -25.624263763427734, -23.84611701965332, -22.067968368530273, -20.28982162475586, -18.511672973632812, -16.7335262298584, -14.955378532409668, -13.177230834960938, -11.399083137512207, -9.620935440063477, -7.842788219451904, -6.064640998840332, -4.286493301391602, -2.508345603942871, -0.7301979064941406, 1.0479496717453003, 2.826097249984741, 4.604244709014893, 6.382392406463623, 8.160539627075195, 9.938687324523926, 11.716835021972656, 13.494982719421387, 15.273130416870117, 17.05127716064453, 18.829425811767578, 20.607572555541992, 22.385719299316406, 24.163867950439453, 25.9420166015625, 27.720163345336914, 29.498310089111328, 31.276458740234375, 33.05460739135742, 34.8327522277832, 36.61090087890625, 38.3890495300293, 40.167198181152344, 41.945343017578125, 43.72349166870117, 45.50163650512695, 47.27978515625, 49.05793380737305, 50.836082458496094, 52.614227294921875, 54.39237594604492, 56.17052459716797]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 9.0, 7.0, 11.0, 5.0, 9.0, 13.0, 12.0, 36.0, 53.0, 76.0, 121.0, 192.0, 285.0, 397.0, 677.0, 1142.0, 2128.0, 3796.0, 7970.0, 18394.0, 58882.0, 329741.0, 2413627.0, 1148182.0, 148708.0, 34141.0, 12719.0, 5903.0, 2937.0, 1662.0, 911.0, 538.0, 354.0, 206.0, 134.0, 109.0, 77.0, 47.0, 21.0, 19.0, 13.0, 6.0, 7.0, 7.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.578125, -4.429443359375, -4.28076171875, -4.132080078125, -3.9833984375, -3.834716796875, -3.68603515625, -3.537353515625, -3.388671875, -3.239990234375, -3.09130859375, -2.942626953125, -2.7939453125, -2.645263671875, -2.49658203125, -2.347900390625, -2.19921875, -2.050537109375, -1.90185546875, -1.753173828125, -1.6044921875, -1.455810546875, -1.30712890625, -1.158447265625, -1.009765625, -0.861083984375, -0.71240234375, -0.563720703125, -0.4150390625, -0.266357421875, -0.11767578125, 0.031005859375, 0.1796875, 0.328369140625, 0.47705078125, 0.625732421875, 0.7744140625, 0.923095703125, 1.07177734375, 1.220458984375, 1.369140625, 1.517822265625, 1.66650390625, 1.815185546875, 1.9638671875, 2.112548828125, 2.26123046875, 2.409912109375, 2.55859375, 2.707275390625, 2.85595703125, 3.004638671875, 3.1533203125, 3.302001953125, 3.45068359375, 3.599365234375, 3.748046875, 3.896728515625, 4.04541015625, 4.194091796875, 4.3427734375, 4.491455078125, 4.64013671875, 4.788818359375, 4.9375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 7.0, 4.0, 6.0, 12.0, 8.0, 15.0, 20.0, 38.0, 45.0, 39.0, 39.0, 41.0, 46.0, 60.0, 61.0, 60.0, 54.0, 59.0, 64.0, 51.0, 57.0, 35.0, 46.0, 34.0, 23.0, 18.0, 19.0, 18.0, 4.0, 8.0, 9.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.41796875, -3.26953125, -3.12109375, -2.97265625, -2.82421875, -2.67578125, -2.52734375, -2.37890625, -2.23046875, -2.08203125, -1.93359375, -1.78515625, -1.63671875, -1.48828125, -1.33984375, -1.19140625, -1.04296875, -0.89453125, -0.74609375, -0.59765625, -0.44921875, -0.30078125, -0.15234375, -0.00390625, 0.14453125, 0.29296875, 0.44140625, 0.58984375, 0.73828125, 0.88671875, 1.03515625, 1.18359375, 1.33203125, 1.48046875, 1.62890625, 1.77734375, 1.92578125, 2.07421875, 2.22265625, 2.37109375, 2.51953125, 2.66796875, 2.81640625, 2.96484375, 3.11328125, 3.26171875, 3.41015625, 3.55859375, 3.70703125, 3.85546875, 4.00390625, 4.15234375, 4.30078125, 4.44921875, 4.59765625, 4.74609375, 4.89453125, 5.04296875, 5.19140625, 5.33984375, 5.48828125, 5.63671875, 5.78515625, 5.93359375, 6.08203125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 3.0, 3.0, 0.0, 2.0, 3.0, 9.0, 6.0, 12.0, 19.0, 23.0, 29.0, 40.0, 68.0, 101.0, 159.0, 262.0, 485.0, 890.0, 1756.0, 3827.0, 9148.0, 27427.0, 117659.0, 2225243.0, 1667582.0, 99855.0, 24875.0, 8317.0, 3246.0, 1529.0, 723.0, 398.0, 218.0, 113.0, 76.0, 49.0, 29.0, 31.0, 17.0, 16.0, 5.0, 7.0, 11.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.87890625, -7.62445068359375, -7.3699951171875, -7.11553955078125, -6.861083984375, -6.60662841796875, -6.3521728515625, -6.09771728515625, -5.84326171875, -5.58880615234375, -5.3343505859375, -5.07989501953125, -4.825439453125, -4.57098388671875, -4.3165283203125, -4.06207275390625, -3.8076171875, -3.55316162109375, -3.2987060546875, -3.04425048828125, -2.789794921875, -2.53533935546875, -2.2808837890625, -2.02642822265625, -1.77197265625, -1.51751708984375, -1.2630615234375, -1.00860595703125, -0.754150390625, -0.49969482421875, -0.2452392578125, 0.00921630859375, 0.263671875, 0.51812744140625, 0.7725830078125, 1.02703857421875, 1.281494140625, 1.53594970703125, 1.7904052734375, 2.04486083984375, 2.29931640625, 2.55377197265625, 2.8082275390625, 3.06268310546875, 3.317138671875, 3.57159423828125, 3.8260498046875, 4.08050537109375, 4.3349609375, 4.58941650390625, 4.8438720703125, 5.09832763671875, 5.352783203125, 5.60723876953125, 5.8616943359375, 6.11614990234375, 6.37060546875, 6.62506103515625, 6.8795166015625, 7.13397216796875, 7.388427734375, 7.64288330078125, 7.8973388671875, 8.15179443359375, 8.40625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 7.0, 6.0, 6.0, 10.0, 15.0, 18.0, 24.0, 48.0, 57.0, 91.0, 125.0, 278.0, 583.0, 984.0, 871.0, 411.0, 200.0, 106.0, 60.0, 37.0, 37.0, 22.0, 16.0, 9.0, 15.0, 8.0, 8.0, 4.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13.7734375, -13.43603515625, -13.0986328125, -12.76123046875, -12.423828125, -12.08642578125, -11.7490234375, -11.41162109375, -11.07421875, -10.73681640625, -10.3994140625, -10.06201171875, -9.724609375, -9.38720703125, -9.0498046875, -8.71240234375, -8.375, -8.03759765625, -7.7001953125, -7.36279296875, -7.025390625, -6.68798828125, -6.3505859375, -6.01318359375, -5.67578125, -5.33837890625, -5.0009765625, -4.66357421875, -4.326171875, -3.98876953125, -3.6513671875, -3.31396484375, -2.9765625, -2.63916015625, -2.3017578125, -1.96435546875, -1.626953125, -1.28955078125, -0.9521484375, -0.61474609375, -0.27734375, 0.06005859375, 0.3974609375, 0.73486328125, 1.072265625, 1.40966796875, 1.7470703125, 2.08447265625, 2.421875, 2.75927734375, 3.0966796875, 3.43408203125, 3.771484375, 4.10888671875, 4.4462890625, 4.78369140625, 5.12109375, 5.45849609375, 5.7958984375, 6.13330078125, 6.470703125, 6.80810546875, 7.1455078125, 7.48291015625, 7.8203125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 4.0, 1.0, 4.0, 3.0, 5.0, 12.0, 31.0, 102.0, 258.0, 297.0, 184.0, 64.0, 16.0, 12.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-106.27273559570312, -101.88432312011719, -97.49591827392578, -93.10751342773438, -88.71910095214844, -84.3306884765625, -79.9422836303711, -75.55387878417969, -71.16546630859375, -66.77705383300781, -62.388648986816406, -58.000240325927734, -53.61183166503906, -49.22342300415039, -44.83501434326172, -40.44660568237305, -36.058197021484375, -31.669788360595703, -27.28137969970703, -22.89297103881836, -18.504562377929688, -14.116153717041016, -9.727745056152344, -5.339336395263672, -0.950927734375, 3.437480926513672, 7.825889587402344, 12.214298248291016, 16.602706909179688, 20.99111557006836, 25.37952423095703, 29.767932891845703, 34.15635681152344, 38.54476547241211, 42.93317413330078, 47.32158279418945, 51.709991455078125, 56.0984001159668, 60.48680877685547, 64.87521362304688, 69.26362609863281, 73.65203857421875, 78.04044342041016, 82.42884826660156, 86.8172607421875, 91.20567321777344, 95.59407806396484, 99.98248291015625, 104.37089538574219, 108.75930786132812, 113.14771270751953, 117.53611755371094, 121.92453002929688, 126.31294250488281, 130.70135498046875, 135.08975219726562, 139.47816467285156, 143.8665771484375, 148.25497436523438, 152.6433868408203, 157.03179931640625, 161.4202117919922, 165.80862426757812, 170.197021484375, 174.58543395996094]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 7.0, 10.0, 16.0, 13.0, 9.0, 7.0, 15.0, 27.0, 24.0, 22.0, 41.0, 38.0, 32.0, 41.0, 35.0, 50.0, 49.0, 59.0, 56.0, 52.0, 48.0, 47.0, 48.0, 38.0, 45.0, 21.0, 37.0, 24.0, 17.0, 9.0, 16.0, 3.0, 15.0, 13.0, 7.0, 2.0, 3.0, 2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.043025970458984, -42.64542007446289, -41.24781799316406, -39.85021209716797, -38.452606201171875, -37.05500411987305, -35.65739822387695, -34.259796142578125, -32.86219024658203, -31.46458625793457, -30.06698226928711, -28.669376373291016, -27.271772384643555, -25.874168395996094, -24.4765625, -23.07895851135254, -21.681354522705078, -20.283750534057617, -18.886146545410156, -17.488540649414062, -16.0909366607666, -14.69333267211914, -13.295727729797363, -11.898122787475586, -10.500518798828125, -9.102914810180664, -7.705309867858887, -6.307705402374268, -4.910100936889648, -3.5124964714050293, -2.11489200592041, -0.7172870635986328, 0.6803131103515625, 2.0779175758361816, 3.475522041320801, 4.87312650680542, 6.270730972290039, 7.668335437774658, 9.065939903259277, 10.463544845581055, 11.861148834228516, 13.258752822875977, 14.656357765197754, 16.05396270751953, 17.451566696166992, 18.849170684814453, 20.246776580810547, 21.644380569458008, 23.04198455810547, 24.43958854675293, 25.83719253540039, 27.234798431396484, 28.632402420043945, 30.030006408691406, 31.4276123046875, 32.825218200683594, 34.22282028198242, 35.620426177978516, 37.018028259277344, 38.41563415527344, 39.81324005126953, 41.21084213256836, 42.60844802856445, 44.00605010986328, 45.403656005859375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 6.0, 6.0, 7.0, 14.0, 16.0, 20.0, 25.0, 26.0, 49.0, 70.0, 97.0, 170.0, 266.0, 482.0, 975.0, 1803.0, 4049.0, 9232.0, 23951.0, 65819.0, 185850.0, 404627.0, 222924.0, 79324.0, 28678.0, 11078.0, 4576.0, 2007.0, 1034.0, 525.0, 285.0, 179.0, 115.0, 69.0, 65.0, 37.0, 22.0, 21.0, 10.0, 11.0, 8.0, 6.0, 12.0, 7.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.71875, -7.4578857421875, -7.197021484375, -6.9361572265625, -6.67529296875, -6.4144287109375, -6.153564453125, -5.8927001953125, -5.6318359375, -5.3709716796875, -5.110107421875, -4.8492431640625, -4.58837890625, -4.3275146484375, -4.066650390625, -3.8057861328125, -3.544921875, -3.2840576171875, -3.023193359375, -2.7623291015625, -2.50146484375, -2.2406005859375, -1.979736328125, -1.7188720703125, -1.4580078125, -1.1971435546875, -0.936279296875, -0.6754150390625, -0.41455078125, -0.1536865234375, 0.107177734375, 0.3680419921875, 0.62890625, 0.8897705078125, 1.150634765625, 1.4114990234375, 1.67236328125, 1.9332275390625, 2.194091796875, 2.4549560546875, 2.7158203125, 2.9766845703125, 3.237548828125, 3.4984130859375, 3.75927734375, 4.0201416015625, 4.281005859375, 4.5418701171875, 4.802734375, 5.0635986328125, 5.324462890625, 5.5853271484375, 5.84619140625, 6.1070556640625, 6.367919921875, 6.6287841796875, 6.8896484375, 7.1505126953125, 7.411376953125, 7.6722412109375, 7.93310546875, 8.1939697265625, 8.454833984375, 8.7156982421875, 8.9765625]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 6.0, 6.0, 9.0, 9.0, 10.0, 21.0, 27.0, 22.0, 39.0, 36.0, 49.0, 60.0, 78.0, 62.0, 56.0, 61.0, 65.0, 64.0, 58.0, 62.0, 43.0, 37.0, 23.0, 28.0, 21.0, 20.0, 11.0, 11.0, 5.0, 4.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.8671875, -3.71368408203125, -3.5601806640625, -3.40667724609375, -3.253173828125, -3.09967041015625, -2.9461669921875, -2.79266357421875, -2.63916015625, -2.48565673828125, -2.3321533203125, -2.17864990234375, -2.025146484375, -1.87164306640625, -1.7181396484375, -1.56463623046875, -1.4111328125, -1.25762939453125, -1.1041259765625, -0.95062255859375, -0.797119140625, -0.64361572265625, -0.4901123046875, -0.33660888671875, -0.18310546875, -0.02960205078125, 0.1239013671875, 0.27740478515625, 0.430908203125, 0.58441162109375, 0.7379150390625, 0.89141845703125, 1.044921875, 1.19842529296875, 1.3519287109375, 1.50543212890625, 1.658935546875, 1.81243896484375, 1.9659423828125, 2.11944580078125, 2.27294921875, 2.42645263671875, 2.5799560546875, 2.73345947265625, 2.886962890625, 3.04046630859375, 3.1939697265625, 3.34747314453125, 3.5009765625, 3.65447998046875, 3.8079833984375, 3.96148681640625, 4.114990234375, 4.26849365234375, 4.4219970703125, 4.57550048828125, 4.72900390625, 4.88250732421875, 5.0360107421875, 5.18951416015625, 5.343017578125, 5.49652099609375, 5.6500244140625, 5.80352783203125, 5.95703125]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 6.0, 4.0, 3.0, 5.0, 3.0, 4.0, 6.0, 14.0, 13.0, 17.0, 23.0, 34.0, 53.0, 80.0, 95.0, 146.0, 188.0, 246.0, 322.0, 479.0, 744.0, 1230.0, 2182.0, 4448.0, 11747.0, 45063.0, 228653.0, 606220.0, 107417.0, 23808.0, 7355.0, 3126.0, 1712.0, 1008.0, 661.0, 409.0, 266.0, 225.0, 145.0, 122.0, 73.0, 52.0, 49.0, 29.0, 23.0, 20.0, 10.0, 10.0, 7.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-9.3671875, -9.035888671875, -8.70458984375, -8.373291015625, -8.0419921875, -7.710693359375, -7.37939453125, -7.048095703125, -6.716796875, -6.385498046875, -6.05419921875, -5.722900390625, -5.3916015625, -5.060302734375, -4.72900390625, -4.397705078125, -4.06640625, -3.735107421875, -3.40380859375, -3.072509765625, -2.7412109375, -2.409912109375, -2.07861328125, -1.747314453125, -1.416015625, -1.084716796875, -0.75341796875, -0.422119140625, -0.0908203125, 0.240478515625, 0.57177734375, 0.903076171875, 1.234375, 1.565673828125, 1.89697265625, 2.228271484375, 2.5595703125, 2.890869140625, 3.22216796875, 3.553466796875, 3.884765625, 4.216064453125, 4.54736328125, 4.878662109375, 5.2099609375, 5.541259765625, 5.87255859375, 6.203857421875, 6.53515625, 6.866455078125, 7.19775390625, 7.529052734375, 7.8603515625, 8.191650390625, 8.52294921875, 8.854248046875, 9.185546875, 9.516845703125, 9.84814453125, 10.179443359375, 10.5107421875, 10.842041015625, 11.17333984375, 11.504638671875, 11.8359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 9.0, 6.0, 7.0, 6.0, 10.0, 6.0, 11.0, 19.0, 11.0, 9.0, 21.0, 17.0, 21.0, 21.0, 23.0, 28.0, 33.0, 33.0, 30.0, 34.0, 33.0, 32.0, 34.0, 32.0, 39.0, 47.0, 34.0, 31.0, 38.0, 34.0, 39.0, 27.0, 33.0, 30.0, 25.0, 30.0, 16.0, 17.0, 8.0, 13.0, 11.0, 11.0, 7.0, 7.0, 3.0, 7.0, 1.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-12.6171875, -12.2425537109375, -11.867919921875, -11.4932861328125, -11.11865234375, -10.7440185546875, -10.369384765625, -9.9947509765625, -9.6201171875, -9.2454833984375, -8.870849609375, -8.4962158203125, -8.12158203125, -7.7469482421875, -7.372314453125, -6.9976806640625, -6.623046875, -6.2484130859375, -5.873779296875, -5.4991455078125, -5.12451171875, -4.7498779296875, -4.375244140625, -4.0006103515625, -3.6259765625, -3.2513427734375, -2.876708984375, -2.5020751953125, -2.12744140625, -1.7528076171875, -1.378173828125, -1.0035400390625, -0.62890625, -0.2542724609375, 0.120361328125, 0.4949951171875, 0.86962890625, 1.2442626953125, 1.618896484375, 1.9935302734375, 2.3681640625, 2.7427978515625, 3.117431640625, 3.4920654296875, 3.86669921875, 4.2413330078125, 4.615966796875, 4.9906005859375, 5.365234375, 5.7398681640625, 6.114501953125, 6.4891357421875, 6.86376953125, 7.2384033203125, 7.613037109375, 7.9876708984375, 8.3623046875, 8.7369384765625, 9.111572265625, 9.4862060546875, 9.86083984375, 10.2354736328125, 10.610107421875, 10.9847412109375, 11.359375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 5.0, 9.0, 8.0, 19.0, 15.0, 36.0, 47.0, 44.0, 71.0, 129.0, 226.0, 380.0, 806.0, 2167.0, 8019.0, 57290.0, 807187.0, 152048.0, 14558.0, 3094.0, 1099.0, 506.0, 261.0, 183.0, 113.0, 71.0, 36.0, 43.0, 21.0, 20.0, 12.0, 3.0, 10.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-5.51171875, -5.352783203125, -5.19384765625, -5.034912109375, -4.8759765625, -4.717041015625, -4.55810546875, -4.399169921875, -4.240234375, -4.081298828125, -3.92236328125, -3.763427734375, -3.6044921875, -3.445556640625, -3.28662109375, -3.127685546875, -2.96875, -2.809814453125, -2.65087890625, -2.491943359375, -2.3330078125, -2.174072265625, -2.01513671875, -1.856201171875, -1.697265625, -1.538330078125, -1.37939453125, -1.220458984375, -1.0615234375, -0.902587890625, -0.74365234375, -0.584716796875, -0.42578125, -0.266845703125, -0.10791015625, 0.051025390625, 0.2099609375, 0.368896484375, 0.52783203125, 0.686767578125, 0.845703125, 1.004638671875, 1.16357421875, 1.322509765625, 1.4814453125, 1.640380859375, 1.79931640625, 1.958251953125, 2.1171875, 2.276123046875, 2.43505859375, 2.593994140625, 2.7529296875, 2.911865234375, 3.07080078125, 3.229736328125, 3.388671875, 3.547607421875, 3.70654296875, 3.865478515625, 4.0244140625, 4.183349609375, 4.34228515625, 4.501220703125, 4.66015625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 2.0, 3.0, 4.0, 7.0, 6.0, 10.0, 19.0, 12.0, 20.0, 23.0, 29.0, 40.0, 46.0, 48.0, 69.0, 95.0, 100.0, 83.0, 63.0, 62.0, 44.0, 49.0, 32.0, 28.0, 16.0, 16.0, 7.0, 11.0, 12.0, 10.0, 6.0, 11.0, 5.0, 4.0, 5.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.0007886886596679688, -0.0007663518190383911, -0.0007440149784088135, -0.0007216781377792358, -0.0006993412971496582, -0.0006770044565200806, -0.0006546676158905029, -0.0006323307752609253, -0.0006099939346313477, -0.00058765709400177, -0.0005653202533721924, -0.0005429834127426147, -0.0005206465721130371, -0.0004983097314834595, -0.00047597289085388184, -0.0004536360502243042, -0.00043129920959472656, -0.0004089623689651489, -0.0003866255283355713, -0.00036428868770599365, -0.000341951847076416, -0.0003196150064468384, -0.00029727816581726074, -0.0002749413251876831, -0.00025260448455810547, -0.00023026764392852783, -0.0002079308032989502, -0.00018559396266937256, -0.00016325712203979492, -0.00014092028141021729, -0.00011858344078063965, -9.624660015106201e-05, -7.390975952148438e-05, -5.157291889190674e-05, -2.92360782623291e-05, -6.899237632751465e-06, 1.5437602996826172e-05, 3.777444362640381e-05, 6.0111284255981445e-05, 8.244812488555908e-05, 0.00010478496551513672, 0.00012712180614471436, 0.000149458646774292, 0.00017179548740386963, 0.00019413232803344727, 0.0002164691686630249, 0.00023880600929260254, 0.0002611428499221802, 0.0002834796905517578, 0.00030581653118133545, 0.0003281533718109131, 0.0003504902124404907, 0.00037282705307006836, 0.000395163893699646, 0.00041750073432922363, 0.00043983757495880127, 0.0004621744155883789, 0.00048451125621795654, 0.0005068480968475342, 0.0005291849374771118, 0.0005515217781066895, 0.0005738586187362671, 0.0005961954593658447, 0.0006185322999954224, 0.000640869140625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 5.0, 6.0, 3.0, 11.0, 19.0, 28.0, 53.0, 72.0, 189.0, 376.0, 822.0, 2901.0, 18373.0, 704497.0, 304702.0, 12549.0, 2382.0, 827.0, 346.0, 158.0, 90.0, 59.0, 26.0, 20.0, 19.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.92578125, -6.7017822265625, -6.477783203125, -6.2537841796875, -6.02978515625, -5.8057861328125, -5.581787109375, -5.3577880859375, -5.1337890625, -4.9097900390625, -4.685791015625, -4.4617919921875, -4.23779296875, -4.0137939453125, -3.789794921875, -3.5657958984375, -3.341796875, -3.1177978515625, -2.893798828125, -2.6697998046875, -2.44580078125, -2.2218017578125, -1.997802734375, -1.7738037109375, -1.5498046875, -1.3258056640625, -1.101806640625, -0.8778076171875, -0.65380859375, -0.4298095703125, -0.205810546875, 0.0181884765625, 0.2421875, 0.4661865234375, 0.690185546875, 0.9141845703125, 1.13818359375, 1.3621826171875, 1.586181640625, 1.8101806640625, 2.0341796875, 2.2581787109375, 2.482177734375, 2.7061767578125, 2.93017578125, 3.1541748046875, 3.378173828125, 3.6021728515625, 3.826171875, 4.0501708984375, 4.274169921875, 4.4981689453125, 4.72216796875, 4.9461669921875, 5.170166015625, 5.3941650390625, 5.6181640625, 5.8421630859375, 6.066162109375, 6.2901611328125, 6.51416015625, 6.7381591796875, 6.962158203125, 7.1861572265625, 7.41015625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 11.0, 4.0, 3.0, 8.0, 11.0, 15.0, 23.0, 28.0, 41.0, 46.0, 58.0, 69.0, 100.0, 124.0, 97.0, 67.0, 64.0, 48.0, 36.0, 25.0, 21.0, 24.0, 21.0, 12.0, 15.0, 7.0, 9.0, 6.0, 3.0, 0.0, 5.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.375, -3.2427978515625, -3.110595703125, -2.9783935546875, -2.84619140625, -2.7139892578125, -2.581787109375, -2.4495849609375, -2.3173828125, -2.1851806640625, -2.052978515625, -1.9207763671875, -1.78857421875, -1.6563720703125, -1.524169921875, -1.3919677734375, -1.259765625, -1.1275634765625, -0.995361328125, -0.8631591796875, -0.73095703125, -0.5987548828125, -0.466552734375, -0.3343505859375, -0.2021484375, -0.0699462890625, 0.062255859375, 0.1944580078125, 0.32666015625, 0.4588623046875, 0.591064453125, 0.7232666015625, 0.85546875, 0.9876708984375, 1.119873046875, 1.2520751953125, 1.38427734375, 1.5164794921875, 1.648681640625, 1.7808837890625, 1.9130859375, 2.0452880859375, 2.177490234375, 2.3096923828125, 2.44189453125, 2.5740966796875, 2.706298828125, 2.8385009765625, 2.970703125, 3.1029052734375, 3.235107421875, 3.3673095703125, 3.49951171875, 3.6317138671875, 3.763916015625, 3.8961181640625, 4.0283203125, 4.1605224609375, 4.292724609375, 4.4249267578125, 4.55712890625, 4.6893310546875, 4.821533203125, 4.9537353515625, 5.0859375]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 6.0, 3.0, 6.0, 18.0, 40.0, 93.0, 215.0, 309.0, 172.0, 76.0, 34.0, 18.0, 6.0, 2.0, 3.0, 3.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.42596435546875, -160.3578338623047, -156.2897186279297, -152.22158813476562, -148.15347290039062, -144.08534240722656, -140.0172119140625, -135.9490966796875, -131.88096618652344, -127.8128433227539, -123.74472045898438, -119.67658996582031, -115.60846710205078, -111.54034423828125, -107.47221374511719, -103.40409088134766, -99.33596801757812, -95.2678451538086, -91.19972229003906, -87.131591796875, -83.06346893310547, -78.99534606933594, -74.92721557617188, -70.85909271240234, -66.79096984863281, -62.72284698486328, -58.654720306396484, -54.58659362792969, -50.518470764160156, -46.450347900390625, -42.38222122192383, -38.31409454345703, -34.24598693847656, -30.1778621673584, -26.109737396240234, -22.04161262512207, -17.973487854003906, -13.905363082885742, -9.837238311767578, -5.769113540649414, -1.70098876953125, 2.367136001586914, 6.435260772705078, 10.503385543823242, 14.571510314941406, 18.63963508605957, 22.707759857177734, 26.7758846282959, 30.844009399414062, 34.912132263183594, 38.98025894165039, 43.04838562011719, 47.11650848388672, 51.18463134765625, 55.25275802612305, 59.320884704589844, 63.389007568359375, 67.4571304321289, 71.52525329589844, 75.5933837890625, 79.66150665283203, 83.72962951660156, 87.79776000976562, 91.86588287353516, 95.93400573730469]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 2.0, 5.0, 10.0, 11.0, 13.0, 18.0, 17.0, 20.0, 14.0, 21.0, 27.0, 23.0, 34.0, 32.0, 33.0, 47.0, 41.0, 52.0, 53.0, 57.0, 80.0, 49.0, 40.0, 41.0, 33.0, 33.0, 28.0, 25.0, 20.0, 24.0, 18.0, 16.0, 14.0, 9.0, 6.0, 2.0, 11.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-51.095027923583984, -49.467533111572266, -47.84003829956055, -46.21254348754883, -44.58504867553711, -42.957550048828125, -41.330055236816406, -39.70256042480469, -38.07506561279297, -36.44757080078125, -34.82007598876953, -33.19258117675781, -31.56508445739746, -29.937589645385742, -28.310094833374023, -26.682598114013672, -25.055105209350586, -23.427610397338867, -21.80011558532715, -20.172618865966797, -18.545124053955078, -16.91762924194336, -15.29013442993164, -13.662638664245605, -12.035143852233887, -10.407649040222168, -8.780153274536133, -7.152658462524414, -5.525163173675537, -3.89766788482666, -2.2701730728149414, -0.6426773071289062, 0.9848175048828125, 2.6123127937316895, 4.239808082580566, 5.867302894592285, 7.494798183441162, 9.122293472290039, 10.749788284301758, 12.377284049987793, 14.004778861999512, 15.63227367401123, 17.259769439697266, 18.887264251708984, 20.514759063720703, 22.142253875732422, 23.76974868774414, 25.397245407104492, 27.02474021911621, 28.65223503112793, 30.27972984313965, 31.9072265625, 33.53472137451172, 35.16221618652344, 36.789710998535156, 38.417205810546875, 40.044700622558594, 41.67219543457031, 43.29969024658203, 44.92718505859375, 46.55467987060547, 48.18217468261719, 49.809669494628906, 51.43716812133789, 53.06466293334961]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 8.0, 9.0, 11.0, 21.0, 41.0, 30.0, 83.0, 88.0, 187.0, 399.0, 1000.0, 2802.0, 9391.0, 40388.0, 425983.0, 3365041.0, 302893.0, 33149.0, 8289.0, 2760.0, 973.0, 367.0, 167.0, 77.0, 41.0, 26.0, 19.0, 8.0, 9.0, 10.0, 6.0, 1.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.4375, -6.211181640625, -5.98486328125, -5.758544921875, -5.5322265625, -5.305908203125, -5.07958984375, -4.853271484375, -4.626953125, -4.400634765625, -4.17431640625, -3.947998046875, -3.7216796875, -3.495361328125, -3.26904296875, -3.042724609375, -2.81640625, -2.590087890625, -2.36376953125, -2.137451171875, -1.9111328125, -1.684814453125, -1.45849609375, -1.232177734375, -1.005859375, -0.779541015625, -0.55322265625, -0.326904296875, -0.1005859375, 0.125732421875, 0.35205078125, 0.578369140625, 0.8046875, 1.031005859375, 1.25732421875, 1.483642578125, 1.7099609375, 1.936279296875, 2.16259765625, 2.388916015625, 2.615234375, 2.841552734375, 3.06787109375, 3.294189453125, 3.5205078125, 3.746826171875, 3.97314453125, 4.199462890625, 4.42578125, 4.652099609375, 4.87841796875, 5.104736328125, 5.3310546875, 5.557373046875, 5.78369140625, 6.010009765625, 6.236328125, 6.462646484375, 6.68896484375, 6.915283203125, 7.1416015625, 7.367919921875, 7.59423828125, 7.820556640625, 8.046875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 4.0, 3.0, 2.0, 9.0, 8.0, 12.0, 11.0, 14.0, 21.0, 22.0, 36.0, 36.0, 40.0, 55.0, 50.0, 59.0, 63.0, 63.0, 58.0, 71.0, 68.0, 58.0, 48.0, 47.0, 29.0, 30.0, 25.0, 17.0, 18.0, 12.0, 4.0, 9.0, 3.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.935546875, -2.795440673828125, -2.65533447265625, -2.515228271484375, -2.3751220703125, -2.235015869140625, -2.09490966796875, -1.954803466796875, -1.814697265625, -1.674591064453125, -1.53448486328125, -1.394378662109375, -1.2542724609375, -1.114166259765625, -0.97406005859375, -0.833953857421875, -0.69384765625, -0.553741455078125, -0.41363525390625, -0.273529052734375, -0.1334228515625, 0.006683349609375, 0.14678955078125, 0.286895751953125, 0.427001953125, 0.567108154296875, 0.70721435546875, 0.847320556640625, 0.9874267578125, 1.127532958984375, 1.26763916015625, 1.407745361328125, 1.5478515625, 1.687957763671875, 1.82806396484375, 1.968170166015625, 2.1082763671875, 2.248382568359375, 2.38848876953125, 2.528594970703125, 2.668701171875, 2.808807373046875, 2.94891357421875, 3.089019775390625, 3.2291259765625, 3.369232177734375, 3.50933837890625, 3.649444580078125, 3.78955078125, 3.929656982421875, 4.06976318359375, 4.209869384765625, 4.3499755859375, 4.490081787109375, 4.63018798828125, 4.770294189453125, 4.910400390625, 5.050506591796875, 5.19061279296875, 5.330718994140625, 5.4708251953125, 5.610931396484375, 5.75103759765625, 5.891143798828125, 6.03125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 5.0, 3.0, 4.0, 4.0, 6.0, 4.0, 15.0, 21.0, 26.0, 34.0, 63.0, 77.0, 146.0, 280.0, 564.0, 1180.0, 2822.0, 8534.0, 29941.0, 156047.0, 3286413.0, 623352.0, 61675.0, 14704.0, 4743.0, 1819.0, 842.0, 420.0, 205.0, 115.0, 71.0, 50.0, 25.0, 23.0, 23.0, 6.0, 8.0, 13.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-9.4609375, -9.216796875, -8.97265625, -8.728515625, -8.484375, -8.240234375, -7.99609375, -7.751953125, -7.5078125, -7.263671875, -7.01953125, -6.775390625, -6.53125, -6.287109375, -6.04296875, -5.798828125, -5.5546875, -5.310546875, -5.06640625, -4.822265625, -4.578125, -4.333984375, -4.08984375, -3.845703125, -3.6015625, -3.357421875, -3.11328125, -2.869140625, -2.625, -2.380859375, -2.13671875, -1.892578125, -1.6484375, -1.404296875, -1.16015625, -0.916015625, -0.671875, -0.427734375, -0.18359375, 0.060546875, 0.3046875, 0.548828125, 0.79296875, 1.037109375, 1.28125, 1.525390625, 1.76953125, 2.013671875, 2.2578125, 2.501953125, 2.74609375, 2.990234375, 3.234375, 3.478515625, 3.72265625, 3.966796875, 4.2109375, 4.455078125, 4.69921875, 4.943359375, 5.1875, 5.431640625, 5.67578125, 5.919921875, 6.1640625]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 4.0, 6.0, 8.0, 5.0, 12.0, 14.0, 21.0, 27.0, 31.0, 41.0, 48.0, 72.0, 116.0, 210.0, 409.0, 729.0, 962.0, 608.0, 278.0, 163.0, 79.0, 59.0, 33.0, 33.0, 24.0, 20.0, 19.0, 13.0, 6.0, 8.0, 4.0, 4.0, 4.0, 3.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.87109375, -6.61004638671875, -6.3489990234375, -6.08795166015625, -5.826904296875, -5.56585693359375, -5.3048095703125, -5.04376220703125, -4.78271484375, -4.52166748046875, -4.2606201171875, -3.99957275390625, -3.738525390625, -3.47747802734375, -3.2164306640625, -2.95538330078125, -2.6943359375, -2.43328857421875, -2.1722412109375, -1.91119384765625, -1.650146484375, -1.38909912109375, -1.1280517578125, -0.86700439453125, -0.60595703125, -0.34490966796875, -0.0838623046875, 0.17718505859375, 0.438232421875, 0.69927978515625, 0.9603271484375, 1.22137451171875, 1.482421875, 1.74346923828125, 2.0045166015625, 2.26556396484375, 2.526611328125, 2.78765869140625, 3.0487060546875, 3.30975341796875, 3.57080078125, 3.83184814453125, 4.0928955078125, 4.35394287109375, 4.614990234375, 4.87603759765625, 5.1370849609375, 5.39813232421875, 5.6591796875, 5.92022705078125, 6.1812744140625, 6.44232177734375, 6.703369140625, 6.96441650390625, 7.2254638671875, 7.48651123046875, 7.74755859375, 8.00860595703125, 8.2696533203125, 8.53070068359375, 8.791748046875, 9.05279541015625, 9.3138427734375, 9.57489013671875, 9.8359375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 3.0, 1.0, 4.0, 5.0, 14.0, 21.0, 70.0, 176.0, 298.0, 262.0, 95.0, 29.0, 15.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-130.84140014648438, -127.27920532226562, -123.71701049804688, -120.15481567382812, -116.59262084960938, -113.03042602539062, -109.46823120117188, -105.90603637695312, -102.34384155273438, -98.78164672851562, -95.21945190429688, -91.65725708007812, -88.09506225585938, -84.53286743164062, -80.97067260742188, -77.40847778320312, -73.84628295898438, -70.28408813476562, -66.72189331054688, -63.159698486328125, -59.597503662109375, -56.035308837890625, -52.473114013671875, -48.910919189453125, -45.348716735839844, -41.786521911621094, -38.224327087402344, -34.662132263183594, -31.099937438964844, -27.53774070739746, -23.97554588317871, -20.41335105895996, -16.851158142089844, -13.288963317871094, -9.726768493652344, -6.164572715759277, -2.6023778915405273, 0.9598178863525391, 4.522012710571289, 8.084207534790039, 11.646402359008789, 15.208597183227539, 18.77079200744629, 22.332988739013672, 25.895183563232422, 29.457378387451172, 33.01957321166992, 36.58176803588867, 40.14396286010742, 43.70615768432617, 47.26835250854492, 50.83054733276367, 54.39274215698242, 57.95494079589844, 61.51713562011719, 65.07933044433594, 68.64152526855469, 72.20372009277344, 75.76591491699219, 79.32810974121094, 82.89030456542969, 86.45249938964844, 90.01469421386719, 93.57688903808594, 97.13908386230469]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 3.0, 5.0, 4.0, 7.0, 11.0, 5.0, 8.0, 8.0, 4.0, 9.0, 13.0, 19.0, 16.0, 18.0, 36.0, 31.0, 28.0, 37.0, 31.0, 35.0, 36.0, 39.0, 37.0, 33.0, 30.0, 36.0, 35.0, 60.0, 45.0, 37.0, 32.0, 31.0, 24.0, 39.0, 41.0, 23.0, 25.0, 11.0, 9.0, 9.0, 19.0, 3.0, 7.0, 5.0, 3.0, 5.0, 2.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-26.71070098876953, -25.708580017089844, -24.706457138061523, -23.704334259033203, -22.702213287353516, -21.700092315673828, -20.697969436645508, -19.695846557617188, -18.6937255859375, -17.691604614257812, -16.689481735229492, -15.687359809875488, -14.685237884521484, -13.68311595916748, -12.680994033813477, -11.678872108459473, -10.676750183105469, -9.674628257751465, -8.672506332397461, -7.670384407043457, -6.668262481689453, -5.666140556335449, -4.664018630981445, -3.6618967056274414, -2.6597747802734375, -1.6576528549194336, -0.6555309295654297, 0.3465909957885742, 1.3487129211425781, 2.350834846496582, 3.352956771850586, 4.35507869720459, 5.357204437255859, 6.359326362609863, 7.361448287963867, 8.363570213317871, 9.365692138671875, 10.367814064025879, 11.369935989379883, 12.372057914733887, 13.37417984008789, 14.376301765441895, 15.378423690795898, 16.38054656982422, 17.382667541503906, 18.384788513183594, 19.386911392211914, 20.389034271240234, 21.391155242919922, 22.39327621459961, 23.39539909362793, 24.39752197265625, 25.399642944335938, 26.401763916015625, 27.403886795043945, 28.406009674072266, 29.408130645751953, 30.41025161743164, 31.41237449645996, 32.41449737548828, 33.41661834716797, 34.418739318847656, 35.420860290527344, 36.4229850769043, 37.425106048583984]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 9.0, 16.0, 13.0, 28.0, 43.0, 69.0, 96.0, 152.0, 194.0, 340.0, 513.0, 840.0, 1408.0, 2483.0, 4651.0, 9277.0, 19484.0, 44672.0, 108266.0, 265571.0, 329507.0, 149408.0, 60336.0, 25833.0, 11961.0, 5860.0, 3069.0, 1679.0, 1074.0, 621.0, 404.0, 216.0, 163.0, 98.0, 64.0, 37.0, 32.0, 18.0, 17.0, 10.0, 9.0, 4.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.80859375, -5.6160888671875, -5.423583984375, -5.2310791015625, -5.03857421875, -4.8460693359375, -4.653564453125, -4.4610595703125, -4.2685546875, -4.0760498046875, -3.883544921875, -3.6910400390625, -3.49853515625, -3.3060302734375, -3.113525390625, -2.9210205078125, -2.728515625, -2.5360107421875, -2.343505859375, -2.1510009765625, -1.95849609375, -1.7659912109375, -1.573486328125, -1.3809814453125, -1.1884765625, -0.9959716796875, -0.803466796875, -0.6109619140625, -0.41845703125, -0.2259521484375, -0.033447265625, 0.1590576171875, 0.3515625, 0.5440673828125, 0.736572265625, 0.9290771484375, 1.12158203125, 1.3140869140625, 1.506591796875, 1.6990966796875, 1.8916015625, 2.0841064453125, 2.276611328125, 2.4691162109375, 2.66162109375, 2.8541259765625, 3.046630859375, 3.2391357421875, 3.431640625, 3.6241455078125, 3.816650390625, 4.0091552734375, 4.20166015625, 4.3941650390625, 4.586669921875, 4.7791748046875, 4.9716796875, 5.1641845703125, 5.356689453125, 5.5491943359375, 5.74169921875, 5.9342041015625, 6.126708984375, 6.3192138671875, 6.51171875]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 9.0, 7.0, 9.0, 12.0, 9.0, 18.0, 24.0, 34.0, 25.0, 38.0, 39.0, 57.0, 57.0, 66.0, 81.0, 62.0, 66.0, 52.0, 54.0, 57.0, 58.0, 27.0, 37.0, 23.0, 27.0, 14.0, 8.0, 9.0, 10.0, 11.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.083984375, -2.946319580078125, -2.80865478515625, -2.670989990234375, -2.5333251953125, -2.395660400390625, -2.25799560546875, -2.120330810546875, -1.982666015625, -1.845001220703125, -1.70733642578125, -1.569671630859375, -1.4320068359375, -1.294342041015625, -1.15667724609375, -1.019012451171875, -0.88134765625, -0.743682861328125, -0.60601806640625, -0.468353271484375, -0.3306884765625, -0.193023681640625, -0.05535888671875, 0.082305908203125, 0.219970703125, 0.357635498046875, 0.49530029296875, 0.632965087890625, 0.7706298828125, 0.908294677734375, 1.04595947265625, 1.183624267578125, 1.3212890625, 1.458953857421875, 1.59661865234375, 1.734283447265625, 1.8719482421875, 2.009613037109375, 2.14727783203125, 2.284942626953125, 2.422607421875, 2.560272216796875, 2.69793701171875, 2.835601806640625, 2.9732666015625, 3.110931396484375, 3.24859619140625, 3.386260986328125, 3.52392578125, 3.661590576171875, 3.79925537109375, 3.936920166015625, 4.0745849609375, 4.212249755859375, 4.34991455078125, 4.487579345703125, 4.625244140625, 4.762908935546875, 4.90057373046875, 5.038238525390625, 5.1759033203125, 5.313568115234375, 5.45123291015625, 5.588897705078125, 5.7265625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 4.0, 4.0, 3.0, 5.0, 6.0, 14.0, 11.0, 15.0, 15.0, 22.0, 39.0, 43.0, 78.0, 115.0, 155.0, 257.0, 427.0, 685.0, 1328.0, 3038.0, 9083.0, 45794.0, 376058.0, 543750.0, 51319.0, 9773.0, 3191.0, 1369.0, 739.0, 397.0, 247.0, 184.0, 108.0, 82.0, 56.0, 43.0, 28.0, 25.0, 11.0, 13.0, 7.0, 7.0, 6.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.90625, -12.5032958984375, -12.100341796875, -11.6973876953125, -11.29443359375, -10.8914794921875, -10.488525390625, -10.0855712890625, -9.6826171875, -9.2796630859375, -8.876708984375, -8.4737548828125, -8.07080078125, -7.6678466796875, -7.264892578125, -6.8619384765625, -6.458984375, -6.0560302734375, -5.653076171875, -5.2501220703125, -4.84716796875, -4.4442138671875, -4.041259765625, -3.6383056640625, -3.2353515625, -2.8323974609375, -2.429443359375, -2.0264892578125, -1.62353515625, -1.2205810546875, -0.817626953125, -0.4146728515625, -0.01171875, 0.3912353515625, 0.794189453125, 1.1971435546875, 1.60009765625, 2.0030517578125, 2.406005859375, 2.8089599609375, 3.2119140625, 3.6148681640625, 4.017822265625, 4.4207763671875, 4.82373046875, 5.2266845703125, 5.629638671875, 6.0325927734375, 6.435546875, 6.8385009765625, 7.241455078125, 7.6444091796875, 8.04736328125, 8.4503173828125, 8.853271484375, 9.2562255859375, 9.6591796875, 10.0621337890625, 10.465087890625, 10.8680419921875, 11.27099609375, 11.6739501953125, 12.076904296875, 12.4798583984375, 12.8828125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 12.0, 11.0, 10.0, 10.0, 17.0, 13.0, 13.0, 19.0, 27.0, 27.0, 40.0, 43.0, 45.0, 49.0, 35.0, 40.0, 57.0, 48.0, 52.0, 46.0, 47.0, 40.0, 50.0, 19.0, 37.0, 40.0, 21.0, 21.0, 20.0, 20.0, 9.0, 11.0, 7.0, 12.0, 6.0, 5.0, 6.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.9921875, -13.5985107421875, -13.204833984375, -12.8111572265625, -12.41748046875, -12.0238037109375, -11.630126953125, -11.2364501953125, -10.8427734375, -10.4490966796875, -10.055419921875, -9.6617431640625, -9.26806640625, -8.8743896484375, -8.480712890625, -8.0870361328125, -7.693359375, -7.2996826171875, -6.906005859375, -6.5123291015625, -6.11865234375, -5.7249755859375, -5.331298828125, -4.9376220703125, -4.5439453125, -4.1502685546875, -3.756591796875, -3.3629150390625, -2.96923828125, -2.5755615234375, -2.181884765625, -1.7882080078125, -1.39453125, -1.0008544921875, -0.607177734375, -0.2135009765625, 0.18017578125, 0.5738525390625, 0.967529296875, 1.3612060546875, 1.7548828125, 2.1485595703125, 2.542236328125, 2.9359130859375, 3.32958984375, 3.7232666015625, 4.116943359375, 4.5106201171875, 4.904296875, 5.2979736328125, 5.691650390625, 6.0853271484375, 6.47900390625, 6.8726806640625, 7.266357421875, 7.6600341796875, 8.0537109375, 8.4473876953125, 8.841064453125, 9.2347412109375, 9.62841796875, 10.0220947265625, 10.415771484375, 10.8094482421875, 11.203125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 11.0, 10.0, 13.0, 21.0, 17.0, 36.0, 48.0, 65.0, 108.0, 215.0, 423.0, 942.0, 2788.0, 12015.0, 85845.0, 744002.0, 175159.0, 20197.0, 4127.0, 1297.0, 558.0, 240.0, 142.0, 86.0, 49.0, 29.0, 30.0, 23.0, 10.0, 14.0, 9.0, 8.0, 5.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0], "bins": [-3.85546875, -3.74420166015625, -3.6329345703125, -3.52166748046875, -3.410400390625, -3.29913330078125, -3.1878662109375, -3.07659912109375, -2.96533203125, -2.85406494140625, -2.7427978515625, -2.63153076171875, -2.520263671875, -2.40899658203125, -2.2977294921875, -2.18646240234375, -2.0751953125, -1.96392822265625, -1.8526611328125, -1.74139404296875, -1.630126953125, -1.51885986328125, -1.4075927734375, -1.29632568359375, -1.18505859375, -1.07379150390625, -0.9625244140625, -0.85125732421875, -0.739990234375, -0.62872314453125, -0.5174560546875, -0.40618896484375, -0.294921875, -0.18365478515625, -0.0723876953125, 0.03887939453125, 0.150146484375, 0.26141357421875, 0.3726806640625, 0.48394775390625, 0.59521484375, 0.70648193359375, 0.8177490234375, 0.92901611328125, 1.040283203125, 1.15155029296875, 1.2628173828125, 1.37408447265625, 1.4853515625, 1.59661865234375, 1.7078857421875, 1.81915283203125, 1.930419921875, 2.04168701171875, 2.1529541015625, 2.26422119140625, 2.37548828125, 2.48675537109375, 2.5980224609375, 2.70928955078125, 2.820556640625, 2.93182373046875, 3.0430908203125, 3.15435791015625, 3.265625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 4.0, 5.0, 5.0, 6.0, 10.0, 10.0, 7.0, 18.0, 15.0, 18.0, 23.0, 26.0, 35.0, 39.0, 45.0, 60.0, 68.0, 64.0, 85.0, 69.0, 71.0, 70.0, 51.0, 38.0, 31.0, 30.0, 22.0, 15.0, 16.0, 11.0, 6.0, 11.0, 5.0, 5.0, 4.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006175041198730469, -0.0005973353981971741, -0.0005771666765213013, -0.0005569979548454285, -0.0005368292331695557, -0.0005166605114936829, -0.0004964917898178101, -0.00047632306814193726, -0.00045615434646606445, -0.00043598562479019165, -0.00041581690311431885, -0.00039564818143844604, -0.00037547945976257324, -0.00035531073808670044, -0.00033514201641082764, -0.00031497329473495483, -0.00029480457305908203, -0.00027463585138320923, -0.0002544671297073364, -0.00023429840803146362, -0.00021412968635559082, -0.00019396096467971802, -0.00017379224300384521, -0.0001536235213279724, -0.0001334547996520996, -0.0001132860779762268, -9.3117356300354e-05, -7.29486346244812e-05, -5.27799129486084e-05, -3.2611191272735596e-05, -1.2442469596862793e-05, 7.72625207901001e-06, 2.7894973754882812e-05, 4.8063695430755615e-05, 6.823241710662842e-05, 8.840113878250122e-05, 0.00010856986045837402, 0.00012873858213424683, 0.00014890730381011963, 0.00016907602548599243, 0.00018924474716186523, 0.00020941346883773804, 0.00022958219051361084, 0.00024975091218948364, 0.00026991963386535645, 0.00029008835554122925, 0.00031025707721710205, 0.00033042579889297485, 0.00035059452056884766, 0.00037076324224472046, 0.00039093196392059326, 0.00041110068559646606, 0.00043126940727233887, 0.00045143812894821167, 0.00047160685062408447, 0.0004917755722999573, 0.0005119442939758301, 0.0005321130156517029, 0.0005522817373275757, 0.0005724504590034485, 0.0005926191806793213, 0.0006127879023551941, 0.0006329566240310669, 0.0006531253457069397, 0.0006732940673828125]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 5.0, 7.0, 15.0, 22.0, 40.0, 52.0, 96.0, 165.0, 324.0, 710.0, 1872.0, 6575.0, 42854.0, 708164.0, 260546.0, 20444.0, 4110.0, 1395.0, 534.0, 266.0, 162.0, 78.0, 53.0, 14.0, 31.0, 15.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.07421875, -4.949951171875, -4.82568359375, -4.701416015625, -4.5771484375, -4.452880859375, -4.32861328125, -4.204345703125, -4.080078125, -3.955810546875, -3.83154296875, -3.707275390625, -3.5830078125, -3.458740234375, -3.33447265625, -3.210205078125, -3.0859375, -2.961669921875, -2.83740234375, -2.713134765625, -2.5888671875, -2.464599609375, -2.34033203125, -2.216064453125, -2.091796875, -1.967529296875, -1.84326171875, -1.718994140625, -1.5947265625, -1.470458984375, -1.34619140625, -1.221923828125, -1.09765625, -0.973388671875, -0.84912109375, -0.724853515625, -0.6005859375, -0.476318359375, -0.35205078125, -0.227783203125, -0.103515625, 0.020751953125, 0.14501953125, 0.269287109375, 0.3935546875, 0.517822265625, 0.64208984375, 0.766357421875, 0.890625, 1.014892578125, 1.13916015625, 1.263427734375, 1.3876953125, 1.511962890625, 1.63623046875, 1.760498046875, 1.884765625, 2.009033203125, 2.13330078125, 2.257568359375, 2.3818359375, 2.506103515625, 2.63037109375, 2.754638671875, 2.87890625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 7.0, 13.0, 12.0, 13.0, 22.0, 25.0, 17.0, 44.0, 53.0, 67.0, 76.0, 65.0, 70.0, 75.0, 72.0, 73.0, 57.0, 50.0, 33.0, 19.0, 22.0, 24.0, 26.0, 11.0, 8.0, 7.0, 11.0, 6.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.673828125, -2.5875244140625, -2.501220703125, -2.4149169921875, -2.32861328125, -2.2423095703125, -2.156005859375, -2.0697021484375, -1.9833984375, -1.8970947265625, -1.810791015625, -1.7244873046875, -1.63818359375, -1.5518798828125, -1.465576171875, -1.3792724609375, -1.29296875, -1.2066650390625, -1.120361328125, -1.0340576171875, -0.94775390625, -0.8614501953125, -0.775146484375, -0.6888427734375, -0.6025390625, -0.5162353515625, -0.429931640625, -0.3436279296875, -0.25732421875, -0.1710205078125, -0.084716796875, 0.0015869140625, 0.087890625, 0.1741943359375, 0.260498046875, 0.3468017578125, 0.43310546875, 0.5194091796875, 0.605712890625, 0.6920166015625, 0.7783203125, 0.8646240234375, 0.950927734375, 1.0372314453125, 1.12353515625, 1.2098388671875, 1.296142578125, 1.3824462890625, 1.46875, 1.5550537109375, 1.641357421875, 1.7276611328125, 1.81396484375, 1.9002685546875, 1.986572265625, 2.0728759765625, 2.1591796875, 2.2454833984375, 2.331787109375, 2.4180908203125, 2.50439453125, 2.5906982421875, 2.677001953125, 2.7633056640625, 2.849609375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 6.0, 9.0, 27.0, 33.0, 67.0, 97.0, 189.0, 216.0, 141.0, 97.0, 52.0, 16.0, 16.0, 10.0, 3.0, 2.0, 7.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.8323974609375, -93.44868469238281, -91.06497955322266, -88.68126678466797, -86.29756164550781, -83.91384887695312, -81.53013610839844, -79.14642333984375, -76.7627182006836, -74.3790054321289, -71.99530029296875, -69.61158752441406, -67.22787475585938, -64.84416961669922, -62.46045684814453, -60.07674789428711, -57.69303894042969, -55.309329986572266, -52.925621032714844, -50.541908264160156, -48.158199310302734, -45.77449035644531, -43.390777587890625, -41.0070686340332, -38.62335968017578, -36.23965072631836, -33.85594177246094, -31.47222900390625, -29.088520050048828, -26.704811096191406, -24.32110023498535, -21.937389373779297, -19.55368423461914, -17.16997528076172, -14.786264419555664, -12.402554512023926, -10.018844604492188, -7.635134696960449, -5.251424789428711, -2.8677139282226562, -0.4840049743652344, 1.899704933166504, 4.283414840698242, 6.6671247482299805, 9.050834655761719, 11.434544563293457, 13.818254470825195, 16.20196533203125, 18.585674285888672, 20.969383239746094, 23.35309410095215, 25.736804962158203, 28.120513916015625, 30.504222869873047, 32.88793182373047, 35.271644592285156, 37.65535354614258, 40.0390625, 42.42277526855469, 44.80648422241211, 47.19019317626953, 49.57390213012695, 51.957611083984375, 54.34132385253906, 56.725032806396484]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 5.0, 4.0, 10.0, 10.0, 8.0, 10.0, 12.0, 12.0, 16.0, 14.0, 23.0, 31.0, 34.0, 28.0, 28.0, 36.0, 46.0, 45.0, 74.0, 80.0, 77.0, 61.0, 57.0, 41.0, 36.0, 30.0, 36.0, 30.0, 24.0, 14.0, 9.0, 16.0, 10.0, 10.0, 7.0, 2.0, 6.0, 6.0, 3.0, 2.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.941307067871094, -39.22537612915039, -37.50944519042969, -35.79351043701172, -34.077579498291016, -32.36164855957031, -30.64571762084961, -28.929784774780273, -27.213851928710938, -25.497920989990234, -23.7819881439209, -22.066057205200195, -20.35012435913086, -18.634193420410156, -16.918262481689453, -15.202329635620117, -13.486398696899414, -11.770466804504395, -10.054534912109375, -8.338603973388672, -6.622671604156494, -4.906740188598633, -3.1908082962036133, -1.4748764038085938, 0.24105548858642578, 1.9569872617721558, 3.6729190349578857, 5.388850688934326, 7.104782581329346, 8.820713996887207, 10.536645889282227, 12.252577781677246, 13.968509674072266, 15.684441566467285, 17.400373458862305, 19.116304397583008, 20.832237243652344, 22.548168182373047, 24.26409912109375, 25.980031967163086, 27.695964813232422, 29.411895751953125, 31.12782859802246, 32.8437614440918, 34.5596923828125, 36.2756233215332, 37.991554260253906, 39.707489013671875, 41.42341613769531, 43.139347076416016, 44.85527801513672, 46.57121276855469, 48.28714370727539, 50.003074645996094, 51.7190055847168, 53.4349365234375, 55.15087127685547, 56.86680221557617, 58.582733154296875, 60.298667907714844, 62.01459884643555, 63.73052978515625, 65.44646453857422, 67.16239166259766, 68.87832641601562]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 4.0, 10.0, 12.0, 23.0, 32.0, 54.0, 76.0, 131.0, 252.0, 562.0, 1283.0, 3990.0, 16042.0, 137193.0, 3246178.0, 739393.0, 37186.0, 7750.0, 2389.0, 900.0, 399.0, 186.0, 95.0, 50.0, 41.0, 22.0, 14.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.0390625, -8.8057861328125, -8.572509765625, -8.3392333984375, -8.10595703125, -7.8726806640625, -7.639404296875, -7.4061279296875, -7.1728515625, -6.9395751953125, -6.706298828125, -6.4730224609375, -6.23974609375, -6.0064697265625, -5.773193359375, -5.5399169921875, -5.306640625, -5.0733642578125, -4.840087890625, -4.6068115234375, -4.37353515625, -4.1402587890625, -3.906982421875, -3.6737060546875, -3.4404296875, -3.2071533203125, -2.973876953125, -2.7406005859375, -2.50732421875, -2.2740478515625, -2.040771484375, -1.8074951171875, -1.57421875, -1.3409423828125, -1.107666015625, -0.8743896484375, -0.64111328125, -0.4078369140625, -0.174560546875, 0.0587158203125, 0.2919921875, 0.5252685546875, 0.758544921875, 0.9918212890625, 1.22509765625, 1.4583740234375, 1.691650390625, 1.9249267578125, 2.158203125, 2.3914794921875, 2.624755859375, 2.8580322265625, 3.09130859375, 3.3245849609375, 3.557861328125, 3.7911376953125, 4.0244140625, 4.2576904296875, 4.490966796875, 4.7242431640625, 4.95751953125, 5.1907958984375, 5.424072265625, 5.6573486328125, 5.890625]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 6.0, 8.0, 8.0, 13.0, 9.0, 8.0, 27.0, 34.0, 28.0, 41.0, 35.0, 61.0, 82.0, 70.0, 79.0, 57.0, 77.0, 61.0, 60.0, 35.0, 31.0, 33.0, 37.0, 24.0, 25.0, 23.0, 8.0, 8.0, 5.0, 4.0, 3.0, 7.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.030120849609375, -2.89422607421875, -2.758331298828125, -2.6224365234375, -2.486541748046875, -2.35064697265625, -2.214752197265625, -2.078857421875, -1.942962646484375, -1.80706787109375, -1.671173095703125, -1.5352783203125, -1.399383544921875, -1.26348876953125, -1.127593994140625, -0.99169921875, -0.855804443359375, -0.71990966796875, -0.584014892578125, -0.4481201171875, -0.312225341796875, -0.17633056640625, -0.040435791015625, 0.095458984375, 0.231353759765625, 0.36724853515625, 0.503143310546875, 0.6390380859375, 0.774932861328125, 0.91082763671875, 1.046722412109375, 1.1826171875, 1.318511962890625, 1.45440673828125, 1.590301513671875, 1.7261962890625, 1.862091064453125, 1.99798583984375, 2.133880615234375, 2.269775390625, 2.405670166015625, 2.54156494140625, 2.677459716796875, 2.8133544921875, 2.949249267578125, 3.08514404296875, 3.221038818359375, 3.35693359375, 3.492828369140625, 3.62872314453125, 3.764617919921875, 3.9005126953125, 4.036407470703125, 4.17230224609375, 4.308197021484375, 4.444091796875, 4.579986572265625, 4.71588134765625, 4.851776123046875, 4.9876708984375, 5.123565673828125, 5.25946044921875, 5.395355224609375, 5.53125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 4.0, 1.0, 4.0, 4.0, 7.0, 18.0, 23.0, 50.0, 59.0, 108.0, 178.0, 335.0, 984.0, 3388.0, 15285.0, 141868.0, 3818038.0, 186903.0, 20206.0, 4357.0, 1292.0, 552.0, 269.0, 127.0, 68.0, 53.0, 21.0, 20.0, 20.0, 7.0, 9.0, 8.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.46875, -9.15869140625, -8.8486328125, -8.53857421875, -8.228515625, -7.91845703125, -7.6083984375, -7.29833984375, -6.98828125, -6.67822265625, -6.3681640625, -6.05810546875, -5.748046875, -5.43798828125, -5.1279296875, -4.81787109375, -4.5078125, -4.19775390625, -3.8876953125, -3.57763671875, -3.267578125, -2.95751953125, -2.6474609375, -2.33740234375, -2.02734375, -1.71728515625, -1.4072265625, -1.09716796875, -0.787109375, -0.47705078125, -0.1669921875, 0.14306640625, 0.453125, 0.76318359375, 1.0732421875, 1.38330078125, 1.693359375, 2.00341796875, 2.3134765625, 2.62353515625, 2.93359375, 3.24365234375, 3.5537109375, 3.86376953125, 4.173828125, 4.48388671875, 4.7939453125, 5.10400390625, 5.4140625, 5.72412109375, 6.0341796875, 6.34423828125, 6.654296875, 6.96435546875, 7.2744140625, 7.58447265625, 7.89453125, 8.20458984375, 8.5146484375, 8.82470703125, 9.134765625, 9.44482421875, 9.7548828125, 10.06494140625, 10.375]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 4.0, 0.0, 4.0, 3.0, 5.0, 6.0, 15.0, 14.0, 28.0, 34.0, 50.0, 77.0, 177.0, 368.0, 811.0, 1154.0, 645.0, 267.0, 128.0, 79.0, 51.0, 49.0, 26.0, 26.0, 17.0, 9.0, 12.0, 6.0, 6.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.01171875, -6.74591064453125, -6.4801025390625, -6.21429443359375, -5.948486328125, -5.68267822265625, -5.4168701171875, -5.15106201171875, -4.88525390625, -4.61944580078125, -4.3536376953125, -4.08782958984375, -3.822021484375, -3.55621337890625, -3.2904052734375, -3.02459716796875, -2.7587890625, -2.49298095703125, -2.2271728515625, -1.96136474609375, -1.695556640625, -1.42974853515625, -1.1639404296875, -0.89813232421875, -0.63232421875, -0.36651611328125, -0.1007080078125, 0.16510009765625, 0.430908203125, 0.69671630859375, 0.9625244140625, 1.22833251953125, 1.494140625, 1.75994873046875, 2.0257568359375, 2.29156494140625, 2.557373046875, 2.82318115234375, 3.0889892578125, 3.35479736328125, 3.62060546875, 3.88641357421875, 4.1522216796875, 4.41802978515625, 4.683837890625, 4.94964599609375, 5.2154541015625, 5.48126220703125, 5.7470703125, 6.01287841796875, 6.2786865234375, 6.54449462890625, 6.810302734375, 7.07611083984375, 7.3419189453125, 7.60772705078125, 7.87353515625, 8.13934326171875, 8.4051513671875, 8.67095947265625, 8.936767578125, 9.20257568359375, 9.4683837890625, 9.73419189453125, 10.0]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 8.0, 18.0, 43.0, 236.0, 435.0, 187.0, 48.0, 21.0, 6.0, 2.0, 3.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.50337982177734, -111.28587341308594, -107.06836700439453, -102.85086059570312, -98.63335418701172, -94.41584777832031, -90.19834899902344, -85.9808349609375, -81.76333618164062, -77.54582977294922, -73.32832336425781, -69.1108169555664, -64.893310546875, -60.675804138183594, -56.45830154418945, -52.24079513549805, -48.023284912109375, -43.80577850341797, -39.58827209472656, -35.370765686035156, -31.153261184692383, -26.935754776000977, -22.718250274658203, -18.500743865966797, -14.28323745727539, -10.065731048583984, -5.8482255935668945, -1.6307201385498047, 2.5867862701416016, 6.804292678833008, 11.021797180175781, 15.239303588867188, 19.456802368164062, 23.67430877685547, 27.891815185546875, 32.10932159423828, 36.32682800292969, 40.544334411621094, 44.761837005615234, 48.97934341430664, 53.19684982299805, 57.41435623168945, 61.63186264038086, 65.849365234375, 70.0668716430664, 74.28437805175781, 78.50188446044922, 82.71939086914062, 86.93689727783203, 91.15440368652344, 95.37191009521484, 99.58941650390625, 103.80692291259766, 108.02442932128906, 112.24192810058594, 116.45944213867188, 120.67694091796875, 124.89444732666016, 129.11195373535156, 133.32945251464844, 137.54696655273438, 141.76446533203125, 145.9819793701172, 150.19947814941406, 154.4169921875]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 5.0, 5.0, 5.0, 12.0, 8.0, 12.0, 18.0, 18.0, 23.0, 20.0, 32.0, 28.0, 35.0, 36.0, 36.0, 49.0, 50.0, 41.0, 57.0, 55.0, 50.0, 48.0, 54.0, 50.0, 42.0, 24.0, 30.0, 28.0, 32.0, 29.0, 15.0, 17.0, 8.0, 15.0, 9.0, 5.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.07742691040039, -29.08233642578125, -28.087244033813477, -27.092153549194336, -26.097061157226562, -25.101970672607422, -24.10688018798828, -23.11178970336914, -22.116697311401367, -21.121606826782227, -20.126514434814453, -19.131423950195312, -18.136333465576172, -17.1412410736084, -16.146150588989258, -15.1510591506958, -14.155967712402344, -13.160876274108887, -12.16578483581543, -11.170694351196289, -10.175602912902832, -9.180511474609375, -8.185420989990234, -7.190329551696777, -6.19523811340332, -5.200146675109863, -4.2050557136535645, -3.2099645137786865, -2.2148733139038086, -1.2197818756103516, -0.22469091415405273, 0.7704000473022461, 1.7654914855957031, 2.760582685470581, 3.755673885345459, 4.750764846801758, 5.745856285095215, 6.740947723388672, 7.736038684844971, 8.73112964630127, 9.726221084594727, 10.721312522888184, 11.71640396118164, 12.711494445800781, 13.706585884094238, 14.701677322387695, 15.696767807006836, 16.69186019897461, 17.68695068359375, 18.68204116821289, 19.677133560180664, 20.672224044799805, 21.667316436767578, 22.66240692138672, 23.65749740600586, 24.652587890625, 25.647680282592773, 26.642770767211914, 27.637863159179688, 28.632953643798828, 29.62804412841797, 30.623136520385742, 31.618227005004883, 32.613319396972656, 33.6084098815918]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 7.0, 12.0, 15.0, 35.0, 38.0, 75.0, 154.0, 255.0, 451.0, 844.0, 1967.0, 5257.0, 16404.0, 66648.0, 302156.0, 481431.0, 129521.0, 29593.0, 8268.0, 2897.0, 1201.0, 563.0, 331.0, 169.0, 92.0, 49.0, 32.0, 27.0, 18.0, 12.0, 13.0, 7.0, 3.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.34375, -6.0582275390625, -5.772705078125, -5.4871826171875, -5.20166015625, -4.9161376953125, -4.630615234375, -4.3450927734375, -4.0595703125, -3.7740478515625, -3.488525390625, -3.2030029296875, -2.91748046875, -2.6319580078125, -2.346435546875, -2.0609130859375, -1.775390625, -1.4898681640625, -1.204345703125, -0.9188232421875, -0.63330078125, -0.3477783203125, -0.062255859375, 0.2232666015625, 0.5087890625, 0.7943115234375, 1.079833984375, 1.3653564453125, 1.65087890625, 1.9364013671875, 2.221923828125, 2.5074462890625, 2.79296875, 3.0784912109375, 3.364013671875, 3.6495361328125, 3.93505859375, 4.2205810546875, 4.506103515625, 4.7916259765625, 5.0771484375, 5.3626708984375, 5.648193359375, 5.9337158203125, 6.21923828125, 6.5047607421875, 6.790283203125, 7.0758056640625, 7.361328125, 7.6468505859375, 7.932373046875, 8.2178955078125, 8.50341796875, 8.7889404296875, 9.074462890625, 9.3599853515625, 9.6455078125, 9.9310302734375, 10.216552734375, 10.5020751953125, 10.78759765625, 11.0731201171875, 11.358642578125, 11.6441650390625, 11.9296875]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 8.0, 11.0, 12.0, 11.0, 18.0, 19.0, 30.0, 39.0, 39.0, 41.0, 54.0, 62.0, 71.0, 76.0, 66.0, 54.0, 65.0, 62.0, 45.0, 37.0, 38.0, 26.0, 21.0, 25.0, 21.0, 16.0, 10.0, 5.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2109375, -3.0794677734375, -2.947998046875, -2.8165283203125, -2.68505859375, -2.5535888671875, -2.422119140625, -2.2906494140625, -2.1591796875, -2.0277099609375, -1.896240234375, -1.7647705078125, -1.63330078125, -1.5018310546875, -1.370361328125, -1.2388916015625, -1.107421875, -0.9759521484375, -0.844482421875, -0.7130126953125, -0.58154296875, -0.4500732421875, -0.318603515625, -0.1871337890625, -0.0556640625, 0.0758056640625, 0.207275390625, 0.3387451171875, 0.47021484375, 0.6016845703125, 0.733154296875, 0.8646240234375, 0.99609375, 1.1275634765625, 1.259033203125, 1.3905029296875, 1.52197265625, 1.6534423828125, 1.784912109375, 1.9163818359375, 2.0478515625, 2.1793212890625, 2.310791015625, 2.4422607421875, 2.57373046875, 2.7052001953125, 2.836669921875, 2.9681396484375, 3.099609375, 3.2310791015625, 3.362548828125, 3.4940185546875, 3.62548828125, 3.7569580078125, 3.888427734375, 4.0198974609375, 4.1513671875, 4.2828369140625, 4.414306640625, 4.5457763671875, 4.67724609375, 4.8087158203125, 4.940185546875, 5.0716552734375, 5.203125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 10.0, 9.0, 13.0, 20.0, 28.0, 28.0, 38.0, 63.0, 78.0, 137.0, 311.0, 710.0, 2326.0, 9989.0, 57557.0, 575968.0, 343345.0, 46332.0, 8250.0, 2006.0, 624.0, 263.0, 148.0, 97.0, 59.0, 40.0, 33.0, 17.0, 17.0, 8.0, 8.0, 5.0, 4.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.7421875, -10.4058837890625, -10.069580078125, -9.7332763671875, -9.39697265625, -9.0606689453125, -8.724365234375, -8.3880615234375, -8.0517578125, -7.7154541015625, -7.379150390625, -7.0428466796875, -6.70654296875, -6.3702392578125, -6.033935546875, -5.6976318359375, -5.361328125, -5.0250244140625, -4.688720703125, -4.3524169921875, -4.01611328125, -3.6798095703125, -3.343505859375, -3.0072021484375, -2.6708984375, -2.3345947265625, -1.998291015625, -1.6619873046875, -1.32568359375, -0.9893798828125, -0.653076171875, -0.3167724609375, 0.01953125, 0.3558349609375, 0.692138671875, 1.0284423828125, 1.36474609375, 1.7010498046875, 2.037353515625, 2.3736572265625, 2.7099609375, 3.0462646484375, 3.382568359375, 3.7188720703125, 4.05517578125, 4.3914794921875, 4.727783203125, 5.0640869140625, 5.400390625, 5.7366943359375, 6.072998046875, 6.4093017578125, 6.74560546875, 7.0819091796875, 7.418212890625, 7.7545166015625, 8.0908203125, 8.4271240234375, 8.763427734375, 9.0997314453125, 9.43603515625, 9.7723388671875, 10.108642578125, 10.4449462890625, 10.78125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 6.0, 6.0, 5.0, 8.0, 12.0, 21.0, 19.0, 22.0, 28.0, 34.0, 28.0, 32.0, 37.0, 38.0, 41.0, 49.0, 53.0, 49.0, 44.0, 54.0, 43.0, 60.0, 44.0, 22.0, 32.0, 32.0, 31.0, 27.0, 29.0, 22.0, 9.0, 11.0, 14.0, 4.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-11.046875, -10.7127685546875, -10.378662109375, -10.0445556640625, -9.71044921875, -9.3763427734375, -9.042236328125, -8.7081298828125, -8.3740234375, -8.0399169921875, -7.705810546875, -7.3717041015625, -7.03759765625, -6.7034912109375, -6.369384765625, -6.0352783203125, -5.701171875, -5.3670654296875, -5.032958984375, -4.6988525390625, -4.36474609375, -4.0306396484375, -3.696533203125, -3.3624267578125, -3.0283203125, -2.6942138671875, -2.360107421875, -2.0260009765625, -1.69189453125, -1.3577880859375, -1.023681640625, -0.6895751953125, -0.35546875, -0.0213623046875, 0.312744140625, 0.6468505859375, 0.98095703125, 1.3150634765625, 1.649169921875, 1.9832763671875, 2.3173828125, 2.6514892578125, 2.985595703125, 3.3197021484375, 3.65380859375, 3.9879150390625, 4.322021484375, 4.6561279296875, 4.990234375, 5.3243408203125, 5.658447265625, 5.9925537109375, 6.32666015625, 6.6607666015625, 6.994873046875, 7.3289794921875, 7.6630859375, 7.9971923828125, 8.331298828125, 8.6654052734375, 8.99951171875, 9.3336181640625, 9.667724609375, 10.0018310546875, 10.3359375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 2.0, 3.0, 7.0, 15.0, 12.0, 32.0, 24.0, 33.0, 53.0, 101.0, 218.0, 401.0, 873.0, 2374.0, 7634.0, 31454.0, 166415.0, 658059.0, 142798.0, 27318.0, 6855.0, 2204.0, 857.0, 355.0, 190.0, 103.0, 59.0, 31.0, 16.0, 12.0, 11.0, 5.0, 11.0, 6.0, 8.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.671875, -2.6005401611328125, -2.529205322265625, -2.4578704833984375, -2.38653564453125, -2.3152008056640625, -2.243865966796875, -2.1725311279296875, -2.1011962890625, -2.0298614501953125, -1.958526611328125, -1.8871917724609375, -1.81585693359375, -1.7445220947265625, -1.673187255859375, -1.6018524169921875, -1.530517578125, -1.4591827392578125, -1.387847900390625, -1.3165130615234375, -1.24517822265625, -1.1738433837890625, -1.102508544921875, -1.0311737060546875, -0.9598388671875, -0.8885040283203125, -0.817169189453125, -0.7458343505859375, -0.67449951171875, -0.6031646728515625, -0.531829833984375, -0.4604949951171875, -0.38916015625, -0.3178253173828125, -0.246490478515625, -0.1751556396484375, -0.10382080078125, -0.0324859619140625, 0.038848876953125, 0.1101837158203125, 0.1815185546875, 0.2528533935546875, 0.324188232421875, 0.3955230712890625, 0.46685791015625, 0.5381927490234375, 0.609527587890625, 0.6808624267578125, 0.752197265625, 0.8235321044921875, 0.894866943359375, 0.9662017822265625, 1.03753662109375, 1.1088714599609375, 1.180206298828125, 1.2515411376953125, 1.3228759765625, 1.3942108154296875, 1.465545654296875, 1.5368804931640625, 1.60821533203125, 1.6795501708984375, 1.750885009765625, 1.8222198486328125, 1.8935546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 5.0, 2.0, 7.0, 3.0, 8.0, 12.0, 15.0, 27.0, 43.0, 39.0, 72.0, 57.0, 87.0, 125.0, 114.0, 95.0, 81.0, 40.0, 61.0, 27.0, 18.0, 20.0, 16.0, 10.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007195472717285156, -0.0006956607103347778, -0.00067177414894104, -0.0006478875875473022, -0.0006240010261535645, -0.0006001144647598267, -0.0005762279033660889, -0.0005523413419723511, -0.0005284547805786133, -0.0005045682191848755, -0.0004806816577911377, -0.0004567950963973999, -0.0004329085350036621, -0.0004090219736099243, -0.0003851354122161865, -0.00036124885082244873, -0.00033736228942871094, -0.00031347572803497314, -0.00028958916664123535, -0.00026570260524749756, -0.00024181604385375977, -0.00021792948246002197, -0.00019404292106628418, -0.0001701563596725464, -0.0001462697982788086, -0.0001223832368850708, -9.849667549133301e-05, -7.461011409759521e-05, -5.072355270385742e-05, -2.683699131011963e-05, -2.950429916381836e-06, 2.0936131477355957e-05, 4.482269287109375e-05, 6.870925426483154e-05, 9.259581565856934e-05, 0.00011648237705230713, 0.00014036893844604492, 0.00016425549983978271, 0.0001881420612335205, 0.0002120286226272583, 0.0002359151840209961, 0.0002598017454147339, 0.0002836883068084717, 0.00030757486820220947, 0.00033146142959594727, 0.00035534799098968506, 0.00037923455238342285, 0.00040312111377716064, 0.00042700767517089844, 0.00045089423656463623, 0.000474780797958374, 0.0004986673593521118, 0.0005225539207458496, 0.0005464404821395874, 0.0005703270435333252, 0.000594213604927063, 0.0006181001663208008, 0.0006419867277145386, 0.0006658732891082764, 0.0006897598505020142, 0.000713646411895752, 0.0007375329732894897, 0.0007614195346832275, 0.0007853060960769653, 0.0008091926574707031]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 4.0, 3.0, 2.0, 4.0, 3.0, 10.0, 5.0, 10.0, 12.0, 13.0, 26.0, 28.0, 46.0, 99.0, 163.0, 283.0, 607.0, 1380.0, 3802.0, 13584.0, 70420.0, 581732.0, 311907.0, 48908.0, 10218.0, 3002.0, 1148.0, 513.0, 251.0, 119.0, 86.0, 50.0, 37.0, 24.0, 15.0, 16.0, 6.0, 9.0, 3.0, 3.0, 4.0, 2.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0234375, -1.9453125, -1.8671875, -1.7890625, -1.7109375, -1.6328125, -1.5546875, -1.4765625, -1.3984375, -1.3203125, -1.2421875, -1.1640625, -1.0859375, -1.0078125, -0.9296875, -0.8515625, -0.7734375, -0.6953125, -0.6171875, -0.5390625, -0.4609375, -0.3828125, -0.3046875, -0.2265625, -0.1484375, -0.0703125, 0.0078125, 0.0859375, 0.1640625, 0.2421875, 0.3203125, 0.3984375, 0.4765625, 0.5546875, 0.6328125, 0.7109375, 0.7890625, 0.8671875, 0.9453125, 1.0234375, 1.1015625, 1.1796875, 1.2578125, 1.3359375, 1.4140625, 1.4921875, 1.5703125, 1.6484375, 1.7265625, 1.8046875, 1.8828125, 1.9609375, 2.0390625, 2.1171875, 2.1953125, 2.2734375, 2.3515625, 2.4296875, 2.5078125, 2.5859375, 2.6640625, 2.7421875, 2.8203125, 2.8984375, 2.9765625]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 5.0, 2.0, 8.0, 8.0, 14.0, 8.0, 31.0, 33.0, 40.0, 38.0, 72.0, 70.0, 76.0, 89.0, 110.0, 98.0, 70.0, 54.0, 38.0, 45.0, 30.0, 16.0, 12.0, 9.0, 9.0, 10.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.029296875, -1.94378662109375, -1.8582763671875, -1.77276611328125, -1.687255859375, -1.60174560546875, -1.5162353515625, -1.43072509765625, -1.34521484375, -1.25970458984375, -1.1741943359375, -1.08868408203125, -1.003173828125, -0.91766357421875, -0.8321533203125, -0.74664306640625, -0.6611328125, -0.57562255859375, -0.4901123046875, -0.40460205078125, -0.319091796875, -0.23358154296875, -0.1480712890625, -0.06256103515625, 0.02294921875, 0.10845947265625, 0.1939697265625, 0.27947998046875, 0.364990234375, 0.45050048828125, 0.5360107421875, 0.62152099609375, 0.70703125, 0.79254150390625, 0.8780517578125, 0.96356201171875, 1.049072265625, 1.13458251953125, 1.2200927734375, 1.30560302734375, 1.39111328125, 1.47662353515625, 1.5621337890625, 1.64764404296875, 1.733154296875, 1.81866455078125, 1.9041748046875, 1.98968505859375, 2.0751953125, 2.16070556640625, 2.2462158203125, 2.33172607421875, 2.417236328125, 2.50274658203125, 2.5882568359375, 2.67376708984375, 2.75927734375, 2.84478759765625, 2.9302978515625, 3.01580810546875, 3.101318359375, 3.18682861328125, 3.2723388671875, 3.35784912109375, 3.443359375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 6.0, 5.0, 7.0, 10.0, 22.0, 32.0, 78.0, 111.0, 269.0, 210.0, 130.0, 56.0, 30.0, 16.0, 9.0, 5.0, 5.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.42835235595703, -76.17144775390625, -73.91454315185547, -71.65763854980469, -69.4007339477539, -67.14382934570312, -64.88692474365234, -62.63002395629883, -60.37311935424805, -58.116214752197266, -55.859310150146484, -53.6024055480957, -51.34550476074219, -49.088600158691406, -46.831695556640625, -44.574790954589844, -42.31788635253906, -40.06098175048828, -37.8040771484375, -35.54717254638672, -33.29026794433594, -31.03336524963379, -28.77646255493164, -26.51955795288086, -24.262653350830078, -22.005748748779297, -19.748844146728516, -17.491941452026367, -15.235036849975586, -12.978132247924805, -10.72122859954834, -8.464324951171875, -6.2074127197265625, -3.9505085945129395, -1.6936044692993164, 0.5632996559143066, 2.8202037811279297, 5.077108383178711, 7.334012031555176, 9.59091567993164, 11.847820281982422, 14.104724884033203, 16.361629486083984, 18.618532180786133, 20.875436782836914, 23.132341384887695, 25.389244079589844, 27.646148681640625, 29.903053283691406, 32.15995788574219, 34.41686248779297, 36.67376708984375, 38.93067169189453, 41.18757629394531, 43.44447708129883, 45.70138168334961, 47.95828628540039, 50.21519088745117, 52.47209548950195, 54.729000091552734, 56.98590087890625, 59.24280548095703, 61.49971008300781, 63.756614685058594, 66.01351928710938]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 4.0, 12.0, 8.0, 9.0, 11.0, 7.0, 24.0, 19.0, 25.0, 12.0, 27.0, 28.0, 38.0, 29.0, 31.0, 40.0, 46.0, 61.0, 64.0, 90.0, 65.0, 51.0, 33.0, 26.0, 42.0, 22.0, 28.0, 31.0, 25.0, 18.0, 12.0, 11.0, 9.0, 9.0, 8.0, 8.0, 4.0, 5.0, 8.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-41.709571838378906, -40.51557159423828, -39.321571350097656, -38.12757110595703, -36.933570861816406, -35.73957061767578, -34.545570373535156, -33.35157012939453, -32.157569885253906, -30.96356964111328, -29.769569396972656, -28.57556915283203, -27.381568908691406, -26.18756866455078, -24.993568420410156, -23.79956817626953, -22.605566024780273, -21.41156578063965, -20.217565536499023, -19.0235652923584, -17.829565048217773, -16.63556480407715, -15.441563606262207, -14.247563362121582, -13.053563117980957, -11.859562873840332, -10.665562629699707, -9.471561431884766, -8.27756118774414, -7.083561420440674, -5.889560699462891, -4.695560455322266, -3.5015602111816406, -2.3075599670410156, -1.1135594844818115, 0.08044099807739258, 1.2744412422180176, 2.4684414863586426, 3.662442207336426, 4.856442451477051, 6.050442695617676, 7.244442939758301, 8.438443183898926, 9.632444381713867, 10.826444625854492, 12.020444869995117, 13.214445114135742, 14.408445358276367, 15.602445602416992, 16.796445846557617, 17.990446090698242, 19.184446334838867, 20.378446578979492, 21.572446823120117, 22.766448974609375, 23.96044921875, 25.154449462890625, 26.34844970703125, 27.542449951171875, 28.7364501953125, 29.930450439453125, 31.12445068359375, 32.318450927734375, 33.512451171875, 34.706451416015625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 1.0, 4.0, 3.0, 10.0, 17.0, 30.0, 25.0, 49.0, 94.0, 149.0, 270.0, 468.0, 880.0, 2055.0, 5785.0, 24010.0, 240099.0, 3051608.0, 797516.0, 55876.0, 9560.0, 3043.0, 1306.0, 645.0, 315.0, 190.0, 121.0, 61.0, 41.0, 25.0, 13.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.37890625, -6.21826171875, -6.0576171875, -5.89697265625, -5.736328125, -5.57568359375, -5.4150390625, -5.25439453125, -5.09375, -4.93310546875, -4.7724609375, -4.61181640625, -4.451171875, -4.29052734375, -4.1298828125, -3.96923828125, -3.80859375, -3.64794921875, -3.4873046875, -3.32666015625, -3.166015625, -3.00537109375, -2.8447265625, -2.68408203125, -2.5234375, -2.36279296875, -2.2021484375, -2.04150390625, -1.880859375, -1.72021484375, -1.5595703125, -1.39892578125, -1.23828125, -1.07763671875, -0.9169921875, -0.75634765625, -0.595703125, -0.43505859375, -0.2744140625, -0.11376953125, 0.046875, 0.20751953125, 0.3681640625, 0.52880859375, 0.689453125, 0.85009765625, 1.0107421875, 1.17138671875, 1.33203125, 1.49267578125, 1.6533203125, 1.81396484375, 1.974609375, 2.13525390625, 2.2958984375, 2.45654296875, 2.6171875, 2.77783203125, 2.9384765625, 3.09912109375, 3.259765625, 3.42041015625, 3.5810546875, 3.74169921875, 3.90234375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 6.0, 3.0, 4.0, 2.0, 6.0, 10.0, 13.0, 19.0, 18.0, 21.0, 30.0, 45.0, 45.0, 47.0, 47.0, 59.0, 67.0, 64.0, 62.0, 77.0, 58.0, 40.0, 44.0, 44.0, 39.0, 27.0, 31.0, 22.0, 14.0, 13.0, 8.0, 7.0, 8.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.814453125, -2.692230224609375, -2.57000732421875, -2.447784423828125, -2.3255615234375, -2.203338623046875, -2.08111572265625, -1.958892822265625, -1.836669921875, -1.714447021484375, -1.59222412109375, -1.470001220703125, -1.3477783203125, -1.225555419921875, -1.10333251953125, -0.981109619140625, -0.85888671875, -0.736663818359375, -0.61444091796875, -0.492218017578125, -0.3699951171875, -0.247772216796875, -0.12554931640625, -0.003326416015625, 0.118896484375, 0.241119384765625, 0.36334228515625, 0.485565185546875, 0.6077880859375, 0.730010986328125, 0.85223388671875, 0.974456787109375, 1.0966796875, 1.218902587890625, 1.34112548828125, 1.463348388671875, 1.5855712890625, 1.707794189453125, 1.83001708984375, 1.952239990234375, 2.074462890625, 2.196685791015625, 2.31890869140625, 2.441131591796875, 2.5633544921875, 2.685577392578125, 2.80780029296875, 2.930023193359375, 3.05224609375, 3.174468994140625, 3.29669189453125, 3.418914794921875, 3.5411376953125, 3.663360595703125, 3.78558349609375, 3.907806396484375, 4.030029296875, 4.152252197265625, 4.27447509765625, 4.396697998046875, 4.5189208984375, 4.641143798828125, 4.76336669921875, 4.885589599609375, 5.0078125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 4.0, 5.0, 11.0, 14.0, 29.0, 39.0, 77.0, 131.0, 343.0, 926.0, 3490.0, 24366.0, 3194503.0, 949630.0, 16621.0, 2692.0, 802.0, 294.0, 121.0, 46.0, 48.0, 29.0, 18.0, 9.0, 7.0, 2.0, 1.0, 3.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.4765625, -12.0975341796875, -11.718505859375, -11.3394775390625, -10.96044921875, -10.5814208984375, -10.202392578125, -9.8233642578125, -9.4443359375, -9.0653076171875, -8.686279296875, -8.3072509765625, -7.92822265625, -7.5491943359375, -7.170166015625, -6.7911376953125, -6.412109375, -6.0330810546875, -5.654052734375, -5.2750244140625, -4.89599609375, -4.5169677734375, -4.137939453125, -3.7589111328125, -3.3798828125, -3.0008544921875, -2.621826171875, -2.2427978515625, -1.86376953125, -1.4847412109375, -1.105712890625, -0.7266845703125, -0.34765625, 0.0313720703125, 0.410400390625, 0.7894287109375, 1.16845703125, 1.5474853515625, 1.926513671875, 2.3055419921875, 2.6845703125, 3.0635986328125, 3.442626953125, 3.8216552734375, 4.20068359375, 4.5797119140625, 4.958740234375, 5.3377685546875, 5.716796875, 6.0958251953125, 6.474853515625, 6.8538818359375, 7.23291015625, 7.6119384765625, 7.990966796875, 8.3699951171875, 8.7490234375, 9.1280517578125, 9.507080078125, 9.8861083984375, 10.26513671875, 10.6441650390625, 11.023193359375, 11.4022216796875, 11.78125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 8.0, 11.0, 11.0, 17.0, 26.0, 41.0, 67.0, 149.0, 330.0, 842.0, 1311.0, 673.0, 282.0, 118.0, 77.0, 27.0, 21.0, 17.0, 13.0, 11.0, 7.0, 3.0, 4.0, 3.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-10.0390625, -9.77032470703125, -9.5015869140625, -9.23284912109375, -8.964111328125, -8.69537353515625, -8.4266357421875, -8.15789794921875, -7.88916015625, -7.62042236328125, -7.3516845703125, -7.08294677734375, -6.814208984375, -6.54547119140625, -6.2767333984375, -6.00799560546875, -5.7392578125, -5.47052001953125, -5.2017822265625, -4.93304443359375, -4.664306640625, -4.39556884765625, -4.1268310546875, -3.85809326171875, -3.58935546875, -3.32061767578125, -3.0518798828125, -2.78314208984375, -2.514404296875, -2.24566650390625, -1.9769287109375, -1.70819091796875, -1.439453125, -1.17071533203125, -0.9019775390625, -0.63323974609375, -0.364501953125, -0.09576416015625, 0.1729736328125, 0.44171142578125, 0.71044921875, 0.97918701171875, 1.2479248046875, 1.51666259765625, 1.785400390625, 2.05413818359375, 2.3228759765625, 2.59161376953125, 2.8603515625, 3.12908935546875, 3.3978271484375, 3.66656494140625, 3.935302734375, 4.20404052734375, 4.4727783203125, 4.74151611328125, 5.01025390625, 5.27899169921875, 5.5477294921875, 5.81646728515625, 6.085205078125, 6.35394287109375, 6.6226806640625, 6.89141845703125, 7.16015625]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 7.0, 23.0, 54.0, 142.0, 220.0, 225.0, 169.0, 65.0, 53.0, 19.0, 11.0, 4.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.946502685546875, -23.998870849609375, -22.051239013671875, -20.103609085083008, -18.155977249145508, -16.208345413208008, -14.260714530944824, -12.31308364868164, -10.36545181274414, -8.41781997680664, -6.470189094543457, -4.522557735443115, -2.5749263763427734, -0.6272945404052734, 1.3203363418579102, 3.2679672241210938, 5.215599060058594, 7.1632304191589355, 9.110861778259277, 11.058492660522461, 13.006124496459961, 14.953756332397461, 16.901386260986328, 18.849018096923828, 20.796649932861328, 22.744281768798828, 24.691913604736328, 26.639543533325195, 28.587175369262695, 30.534807205200195, 32.48243713378906, 34.43006896972656, 36.37770080566406, 38.32533264160156, 40.27296447753906, 42.22059631347656, 44.16822814941406, 46.11585998535156, 48.0634880065918, 50.0111198425293, 51.9587516784668, 53.9063835144043, 55.8540153503418, 57.8016471862793, 59.74927520751953, 61.69690704345703, 63.64453887939453, 65.59217071533203, 67.53980255126953, 69.48743438720703, 71.43506622314453, 73.38269805908203, 75.33032989501953, 77.27796173095703, 79.22559356689453, 81.1732177734375, 83.120849609375, 85.0684814453125, 87.01611328125, 88.9637451171875, 90.911376953125, 92.8590087890625, 94.806640625, 96.7542724609375, 98.701904296875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 4.0, 9.0, 15.0, 8.0, 21.0, 12.0, 21.0, 23.0, 32.0, 32.0, 31.0, 39.0, 43.0, 47.0, 48.0, 55.0, 55.0, 40.0, 57.0, 55.0, 49.0, 35.0, 37.0, 38.0, 29.0, 32.0, 16.0, 20.0, 19.0, 16.0, 9.0, 10.0, 10.0, 7.0, 6.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.020801544189453, -25.223102569580078, -24.425405502319336, -23.62770652770996, -22.83000946044922, -22.032310485839844, -21.23461151123047, -20.436912536621094, -19.63921546936035, -18.841516494750977, -18.043819427490234, -17.24612045288086, -16.448421478271484, -15.650724411010742, -14.853025436401367, -14.055327415466309, -13.25762939453125, -12.459931373596191, -11.662233352661133, -10.864534378051758, -10.0668363571167, -9.26913833618164, -8.471439361572266, -7.673741340637207, -6.876043319702148, -6.07834529876709, -5.280646800994873, -4.482948303222656, -3.6852502822875977, -2.88755202293396, -2.0898537635803223, -1.2921552658081055, -0.4944572448730469, 0.3032410144805908, 1.1009392738342285, 1.8986375331878662, 2.696335792541504, 3.4940340518951416, 4.291732311248779, 5.089430809020996, 5.887128829956055, 6.684826850891113, 7.48252534866333, 8.280223846435547, 9.077921867370605, 9.875619888305664, 10.673318862915039, 11.471016883850098, 12.268714904785156, 13.066412925720215, 13.864110946655273, 14.661809921264648, 15.459507942199707, 16.257205963134766, 17.05490493774414, 17.852603912353516, 18.650300979614258, 19.447999954223633, 20.245697021484375, 21.04339599609375, 21.841094970703125, 22.638792037963867, 23.436491012573242, 24.234188079833984, 25.03188705444336]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 4.0, 5.0, 4.0, 6.0, 12.0, 13.0, 20.0, 48.0, 65.0, 85.0, 152.0, 247.0, 429.0, 868.0, 1642.0, 3408.0, 7548.0, 17427.0, 44776.0, 129635.0, 360961.0, 311307.0, 105381.0, 37199.0, 14877.0, 6269.0, 2977.0, 1466.0, 747.0, 414.0, 213.0, 134.0, 66.0, 53.0, 26.0, 24.0, 11.0, 13.0, 12.0, 5.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-4.06640625, -3.90313720703125, -3.7398681640625, -3.57659912109375, -3.413330078125, -3.25006103515625, -3.0867919921875, -2.92352294921875, -2.76025390625, -2.59698486328125, -2.4337158203125, -2.27044677734375, -2.107177734375, -1.94390869140625, -1.7806396484375, -1.61737060546875, -1.4541015625, -1.29083251953125, -1.1275634765625, -0.96429443359375, -0.801025390625, -0.63775634765625, -0.4744873046875, -0.31121826171875, -0.14794921875, 0.01531982421875, 0.1785888671875, 0.34185791015625, 0.505126953125, 0.66839599609375, 0.8316650390625, 0.99493408203125, 1.158203125, 1.32147216796875, 1.4847412109375, 1.64801025390625, 1.811279296875, 1.97454833984375, 2.1378173828125, 2.30108642578125, 2.46435546875, 2.62762451171875, 2.7908935546875, 2.95416259765625, 3.117431640625, 3.28070068359375, 3.4439697265625, 3.60723876953125, 3.7705078125, 3.93377685546875, 4.0970458984375, 4.26031494140625, 4.423583984375, 4.58685302734375, 4.7501220703125, 4.91339111328125, 5.07666015625, 5.23992919921875, 5.4031982421875, 5.56646728515625, 5.729736328125, 5.89300537109375, 6.0562744140625, 6.21954345703125, 6.3828125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 5.0, 7.0, 8.0, 8.0, 8.0, 22.0, 26.0, 24.0, 26.0, 42.0, 48.0, 60.0, 59.0, 68.0, 62.0, 56.0, 71.0, 63.0, 44.0, 53.0, 40.0, 35.0, 32.0, 33.0, 30.0, 22.0, 9.0, 10.0, 10.0, 5.0, 3.0, 8.0, 6.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.28125, -3.15777587890625, -3.0343017578125, -2.91082763671875, -2.787353515625, -2.66387939453125, -2.5404052734375, -2.41693115234375, -2.29345703125, -2.16998291015625, -2.0465087890625, -1.92303466796875, -1.799560546875, -1.67608642578125, -1.5526123046875, -1.42913818359375, -1.3056640625, -1.18218994140625, -1.0587158203125, -0.93524169921875, -0.811767578125, -0.68829345703125, -0.5648193359375, -0.44134521484375, -0.31787109375, -0.19439697265625, -0.0709228515625, 0.05255126953125, 0.176025390625, 0.29949951171875, 0.4229736328125, 0.54644775390625, 0.669921875, 0.79339599609375, 0.9168701171875, 1.04034423828125, 1.163818359375, 1.28729248046875, 1.4107666015625, 1.53424072265625, 1.65771484375, 1.78118896484375, 1.9046630859375, 2.02813720703125, 2.151611328125, 2.27508544921875, 2.3985595703125, 2.52203369140625, 2.6455078125, 2.76898193359375, 2.8924560546875, 3.01593017578125, 3.139404296875, 3.26287841796875, 3.3863525390625, 3.50982666015625, 3.63330078125, 3.75677490234375, 3.8802490234375, 4.00372314453125, 4.127197265625, 4.25067138671875, 4.3741455078125, 4.49761962890625, 4.62109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 10.0, 11.0, 17.0, 18.0, 23.0, 36.0, 44.0, 71.0, 91.0, 151.0, 255.0, 385.0, 686.0, 1436.0, 3280.0, 9254.0, 33470.0, 164231.0, 679783.0, 116711.0, 25451.0, 7490.0, 2742.0, 1240.0, 672.0, 339.0, 207.0, 134.0, 72.0, 73.0, 38.0, 26.0, 36.0, 20.0, 12.0, 9.0, 10.0, 6.0, 10.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8203125, -5.5911865234375, -5.362060546875, -5.1329345703125, -4.90380859375, -4.6746826171875, -4.445556640625, -4.2164306640625, -3.9873046875, -3.7581787109375, -3.529052734375, -3.2999267578125, -3.07080078125, -2.8416748046875, -2.612548828125, -2.3834228515625, -2.154296875, -1.9251708984375, -1.696044921875, -1.4669189453125, -1.23779296875, -1.0086669921875, -0.779541015625, -0.5504150390625, -0.3212890625, -0.0921630859375, 0.136962890625, 0.3660888671875, 0.59521484375, 0.8243408203125, 1.053466796875, 1.2825927734375, 1.51171875, 1.7408447265625, 1.969970703125, 2.1990966796875, 2.42822265625, 2.6573486328125, 2.886474609375, 3.1156005859375, 3.3447265625, 3.5738525390625, 3.802978515625, 4.0321044921875, 4.26123046875, 4.4903564453125, 4.719482421875, 4.9486083984375, 5.177734375, 5.4068603515625, 5.635986328125, 5.8651123046875, 6.09423828125, 6.3233642578125, 6.552490234375, 6.7816162109375, 7.0107421875, 7.2398681640625, 7.468994140625, 7.6981201171875, 7.92724609375, 8.1563720703125, 8.385498046875, 8.6146240234375, 8.84375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 7.0, 3.0, 6.0, 9.0, 4.0, 15.0, 10.0, 8.0, 14.0, 24.0, 31.0, 37.0, 39.0, 47.0, 45.0, 66.0, 68.0, 74.0, 73.0, 56.0, 68.0, 51.0, 47.0, 39.0, 32.0, 36.0, 16.0, 19.0, 12.0, 14.0, 15.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0], "bins": [-14.5078125, -14.104736328125, -13.70166015625, -13.298583984375, -12.8955078125, -12.492431640625, -12.08935546875, -11.686279296875, -11.283203125, -10.880126953125, -10.47705078125, -10.073974609375, -9.6708984375, -9.267822265625, -8.86474609375, -8.461669921875, -8.05859375, -7.655517578125, -7.25244140625, -6.849365234375, -6.4462890625, -6.043212890625, -5.64013671875, -5.237060546875, -4.833984375, -4.430908203125, -4.02783203125, -3.624755859375, -3.2216796875, -2.818603515625, -2.41552734375, -2.012451171875, -1.609375, -1.206298828125, -0.80322265625, -0.400146484375, 0.0029296875, 0.406005859375, 0.80908203125, 1.212158203125, 1.615234375, 2.018310546875, 2.42138671875, 2.824462890625, 3.2275390625, 3.630615234375, 4.03369140625, 4.436767578125, 4.83984375, 5.242919921875, 5.64599609375, 6.049072265625, 6.4521484375, 6.855224609375, 7.25830078125, 7.661376953125, 8.064453125, 8.467529296875, 8.87060546875, 9.273681640625, 9.6767578125, 10.079833984375, 10.48291015625, 10.885986328125, 11.2890625]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 9.0, 8.0, 14.0, 15.0, 22.0, 19.0, 36.0, 61.0, 85.0, 147.0, 243.0, 406.0, 788.0, 1623.0, 3881.0, 11133.0, 39075.0, 187065.0, 668095.0, 98998.0, 23931.0, 7349.0, 2834.0, 1227.0, 638.0, 325.0, 204.0, 99.0, 67.0, 35.0, 32.0, 29.0, 11.0, 11.0, 8.0, 8.0, 9.0, 5.0, 4.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.12890625, -2.0718536376953125, -2.014801025390625, -1.9577484130859375, -1.90069580078125, -1.8436431884765625, -1.786590576171875, -1.7295379638671875, -1.6724853515625, -1.6154327392578125, -1.558380126953125, -1.5013275146484375, -1.44427490234375, -1.3872222900390625, -1.330169677734375, -1.2731170654296875, -1.216064453125, -1.1590118408203125, -1.101959228515625, -1.0449066162109375, -0.98785400390625, -0.9308013916015625, -0.873748779296875, -0.8166961669921875, -0.7596435546875, -0.7025909423828125, -0.645538330078125, -0.5884857177734375, -0.53143310546875, -0.4743804931640625, -0.417327880859375, -0.3602752685546875, -0.30322265625, -0.2461700439453125, -0.189117431640625, -0.1320648193359375, -0.07501220703125, -0.0179595947265625, 0.039093017578125, 0.0961456298828125, 0.1531982421875, 0.2102508544921875, 0.267303466796875, 0.3243560791015625, 0.38140869140625, 0.4384613037109375, 0.495513916015625, 0.5525665283203125, 0.609619140625, 0.6666717529296875, 0.723724365234375, 0.7807769775390625, 0.83782958984375, 0.8948822021484375, 0.951934814453125, 1.0089874267578125, 1.0660400390625, 1.1230926513671875, 1.180145263671875, 1.2371978759765625, 1.29425048828125, 1.3513031005859375, 1.408355712890625, 1.4654083251953125, 1.5224609375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 5.0, 4.0, 8.0, 9.0, 17.0, 18.0, 16.0, 31.0, 32.0, 33.0, 55.0, 61.0, 76.0, 75.0, 79.0, 109.0, 73.0, 60.0, 46.0, 36.0, 36.0, 23.0, 22.0, 11.0, 16.0, 11.0, 3.0, 5.0, 4.0, 5.0, 6.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0003807544708251953, -0.0003657899796962738, -0.0003508254885673523, -0.0003358609974384308, -0.0003208965063095093, -0.00030593201518058777, -0.00029096752405166626, -0.00027600303292274475, -0.00026103854179382324, -0.00024607405066490173, -0.00023110955953598022, -0.00021614506840705872, -0.0002011805772781372, -0.0001862160861492157, -0.0001712515950202942, -0.00015628710389137268, -0.00014132261276245117, -0.00012635812163352966, -0.00011139363050460815, -9.642913937568665e-05, -8.146464824676514e-05, -6.650015711784363e-05, -5.153566598892212e-05, -3.657117486000061e-05, -2.16066837310791e-05, -6.642192602157593e-06, 8.322298526763916e-06, 2.3286789655685425e-05, 3.8251280784606934e-05, 5.321577191352844e-05, 6.818026304244995e-05, 8.314475417137146e-05, 9.810924530029297e-05, 0.00011307373642921448, 0.00012803822755813599, 0.0001430027186870575, 0.000157967209815979, 0.0001729317009449005, 0.00018789619207382202, 0.00020286068320274353, 0.00021782517433166504, 0.00023278966546058655, 0.00024775415658950806, 0.00026271864771842957, 0.0002776831388473511, 0.0002926476299762726, 0.0003076121211051941, 0.0003225766122341156, 0.0003375411033630371, 0.0003525055944919586, 0.0003674700856208801, 0.00038243457674980164, 0.00039739906787872314, 0.00041236355900764465, 0.00042732805013656616, 0.00044229254126548767, 0.0004572570323944092, 0.0004722215235233307, 0.0004871860146522522, 0.0005021505057811737, 0.0005171149969100952, 0.0005320794880390167, 0.0005470439791679382, 0.0005620084702968597, 0.0005769729614257812]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 7.0, 5.0, 15.0, 13.0, 17.0, 23.0, 44.0, 60.0, 76.0, 106.0, 155.0, 263.0, 419.0, 666.0, 1273.0, 2602.0, 5349.0, 12760.0, 35274.0, 122521.0, 611377.0, 177724.0, 47963.0, 16508.0, 6574.0, 3054.0, 1499.0, 873.0, 438.0, 288.0, 178.0, 130.0, 82.0, 53.0, 54.0, 21.0, 26.0, 16.0, 7.0, 9.0, 12.0, 2.0, 5.0, 2.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0], "bins": [-1.4892578125, -1.444976806640625, -1.40069580078125, -1.356414794921875, -1.3121337890625, -1.267852783203125, -1.22357177734375, -1.179290771484375, -1.135009765625, -1.090728759765625, -1.04644775390625, -1.002166748046875, -0.9578857421875, -0.913604736328125, -0.86932373046875, -0.825042724609375, -0.78076171875, -0.736480712890625, -0.69219970703125, -0.647918701171875, -0.6036376953125, -0.559356689453125, -0.51507568359375, -0.470794677734375, -0.426513671875, -0.382232666015625, -0.33795166015625, -0.293670654296875, -0.2493896484375, -0.205108642578125, -0.16082763671875, -0.116546630859375, -0.072265625, -0.027984619140625, 0.01629638671875, 0.060577392578125, 0.1048583984375, 0.149139404296875, 0.19342041015625, 0.237701416015625, 0.281982421875, 0.326263427734375, 0.37054443359375, 0.414825439453125, 0.4591064453125, 0.503387451171875, 0.54766845703125, 0.591949462890625, 0.63623046875, 0.680511474609375, 0.72479248046875, 0.769073486328125, 0.8133544921875, 0.857635498046875, 0.90191650390625, 0.946197509765625, 0.990478515625, 1.034759521484375, 1.07904052734375, 1.123321533203125, 1.1676025390625, 1.211883544921875, 1.25616455078125, 1.300445556640625, 1.3447265625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 3.0, 9.0, 6.0, 5.0, 15.0, 15.0, 15.0, 26.0, 22.0, 28.0, 44.0, 41.0, 89.0, 73.0, 77.0, 78.0, 72.0, 63.0, 44.0, 47.0, 37.0, 43.0, 23.0, 20.0, 12.0, 13.0, 8.0, 11.0, 6.0, 9.0, 2.0, 5.0, 2.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-1.79296875, -1.7374420166015625, -1.681915283203125, -1.6263885498046875, -1.57086181640625, -1.5153350830078125, -1.459808349609375, -1.4042816162109375, -1.3487548828125, -1.2932281494140625, -1.237701416015625, -1.1821746826171875, -1.12664794921875, -1.0711212158203125, -1.015594482421875, -0.9600677490234375, -0.904541015625, -0.8490142822265625, -0.793487548828125, -0.7379608154296875, -0.68243408203125, -0.6269073486328125, -0.571380615234375, -0.5158538818359375, -0.4603271484375, -0.4048004150390625, -0.349273681640625, -0.2937469482421875, -0.23822021484375, -0.1826934814453125, -0.127166748046875, -0.0716400146484375, -0.01611328125, 0.0394134521484375, 0.094940185546875, 0.1504669189453125, 0.20599365234375, 0.2615203857421875, 0.317047119140625, 0.3725738525390625, 0.4281005859375, 0.4836273193359375, 0.539154052734375, 0.5946807861328125, 0.65020751953125, 0.7057342529296875, 0.761260986328125, 0.8167877197265625, 0.872314453125, 0.9278411865234375, 0.983367919921875, 1.0388946533203125, 1.09442138671875, 1.1499481201171875, 1.205474853515625, 1.2610015869140625, 1.3165283203125, 1.3720550537109375, 1.427581787109375, 1.4831085205078125, 1.53863525390625, 1.5941619873046875, 1.649688720703125, 1.7052154541015625, 1.7607421875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 7.0, 9.0, 17.0, 28.0, 42.0, 91.0, 173.0, 327.0, 143.0, 78.0, 39.0, 16.0, 13.0, 9.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.86172485351562, -66.86456298828125, -64.86739349365234, -62.87023162841797, -60.87306594848633, -58.87590026855469, -56.87873840332031, -54.88157272338867, -52.88440704345703, -50.88724136352539, -48.89007568359375, -46.892913818359375, -44.895748138427734, -42.898582458496094, -40.90142059326172, -38.90425491333008, -36.90708923339844, -34.9099235534668, -32.912757873535156, -30.91559600830078, -28.91843032836914, -26.9212646484375, -24.924100875854492, -22.926937103271484, -20.929771423339844, -18.932605743408203, -16.935441970825195, -14.938277244567871, -12.941112518310547, -10.943947792053223, -8.946783065795898, -6.949618339538574, -4.95245361328125, -2.955288887023926, -0.9581241607666016, 1.0390405654907227, 3.036205291748047, 5.033370018005371, 7.030534744262695, 9.02769947052002, 11.024864196777344, 13.022028923034668, 15.019193649291992, 17.016357421875, 19.01352310180664, 21.01068878173828, 23.00785255432129, 25.005016326904297, 27.002182006835938, 28.999347686767578, 30.996511459350586, 32.993675231933594, 34.990840911865234, 36.988006591796875, 38.98516845703125, 40.98233413696289, 42.97949981689453, 44.97666549682617, 46.97383117675781, 48.97099304199219, 50.96815872192383, 52.96532440185547, 54.962486267089844, 56.959651947021484, 58.956817626953125]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 6.0, 5.0, 8.0, 7.0, 8.0, 10.0, 6.0, 18.0, 28.0, 6.0, 19.0, 23.0, 22.0, 30.0, 32.0, 38.0, 32.0, 49.0, 77.0, 108.0, 81.0, 68.0, 41.0, 35.0, 20.0, 31.0, 17.0, 22.0, 21.0, 23.0, 11.0, 12.0, 13.0, 20.0, 8.0, 6.0, 7.0, 7.0, 6.0, 8.0, 1.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0], "bins": [-37.4849853515625, -36.410030364990234, -35.33507537841797, -34.26012420654297, -33.1851692199707, -32.11021423339844, -31.035259246826172, -29.960304260253906, -28.885351181030273, -27.810396194458008, -26.735443115234375, -25.66048812866211, -24.585533142089844, -23.51058006286621, -22.435625076293945, -21.360671997070312, -20.285717010498047, -19.21076202392578, -18.13580894470215, -17.060853958129883, -15.985899925231934, -14.910945892333984, -13.835990905761719, -12.76103687286377, -11.68608283996582, -10.611128807067871, -9.536174774169922, -8.461219787597656, -7.386265754699707, -6.311311721801758, -5.23635721206665, -4.161402702331543, -3.086444854736328, -2.0114905834198, -0.9365363121032715, 0.13841795921325684, 1.2133722305297852, 2.2883262634277344, 3.363280773162842, 4.438235282897949, 5.513189315795898, 6.588143348693848, 7.663097858428955, 8.738052368164062, 9.813006401062012, 10.887960433959961, 11.962915420532227, 13.037869453430176, 14.112823486328125, 15.187777519226074, 16.262731552124023, 17.33768653869629, 18.412639617919922, 19.487594604492188, 20.562549591064453, 21.63750457763672, 22.71245765686035, 23.787412643432617, 24.86236572265625, 25.937320709228516, 27.01227569580078, 28.087228775024414, 29.16218376159668, 30.237136840820312, 31.312091827392578]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 6.0, 10.0, 9.0, 9.0, 15.0, 22.0, 45.0, 53.0, 83.0, 141.0, 247.0, 439.0, 941.0, 2212.0, 7312.0, 39327.0, 517621.0, 3177604.0, 403807.0, 33849.0, 6387.0, 2163.0, 961.0, 431.0, 237.0, 134.0, 63.0, 57.0, 32.0, 17.0, 10.0, 13.0, 6.0, 4.0, 3.0, 2.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0], "bins": [-6.8828125, -6.7083740234375, -6.533935546875, -6.3594970703125, -6.18505859375, -6.0106201171875, -5.836181640625, -5.6617431640625, -5.4873046875, -5.3128662109375, -5.138427734375, -4.9639892578125, -4.78955078125, -4.6151123046875, -4.440673828125, -4.2662353515625, -4.091796875, -3.9173583984375, -3.742919921875, -3.5684814453125, -3.39404296875, -3.2196044921875, -3.045166015625, -2.8707275390625, -2.6962890625, -2.5218505859375, -2.347412109375, -2.1729736328125, -1.99853515625, -1.8240966796875, -1.649658203125, -1.4752197265625, -1.30078125, -1.1263427734375, -0.951904296875, -0.7774658203125, -0.60302734375, -0.4285888671875, -0.254150390625, -0.0797119140625, 0.0947265625, 0.2691650390625, 0.443603515625, 0.6180419921875, 0.79248046875, 0.9669189453125, 1.141357421875, 1.3157958984375, 1.490234375, 1.6646728515625, 1.839111328125, 2.0135498046875, 2.18798828125, 2.3624267578125, 2.536865234375, 2.7113037109375, 2.8857421875, 3.0601806640625, 3.234619140625, 3.4090576171875, 3.58349609375, 3.7579345703125, 3.932373046875, 4.1068115234375, 4.28125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 2.0, 6.0, 5.0, 5.0, 5.0, 6.0, 16.0, 23.0, 25.0, 23.0, 33.0, 28.0, 59.0, 52.0, 62.0, 61.0, 47.0, 71.0, 63.0, 48.0, 54.0, 50.0, 47.0, 29.0, 37.0, 30.0, 35.0, 22.0, 16.0, 12.0, 5.0, 5.0, 8.0, 5.0, 3.0, 8.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.908203125, -2.790435791015625, -2.67266845703125, -2.554901123046875, -2.4371337890625, -2.319366455078125, -2.20159912109375, -2.083831787109375, -1.966064453125, -1.848297119140625, -1.73052978515625, -1.612762451171875, -1.4949951171875, -1.377227783203125, -1.25946044921875, -1.141693115234375, -1.02392578125, -0.906158447265625, -0.78839111328125, -0.670623779296875, -0.5528564453125, -0.435089111328125, -0.31732177734375, -0.199554443359375, -0.081787109375, 0.035980224609375, 0.15374755859375, 0.271514892578125, 0.3892822265625, 0.507049560546875, 0.62481689453125, 0.742584228515625, 0.8603515625, 0.978118896484375, 1.09588623046875, 1.213653564453125, 1.3314208984375, 1.449188232421875, 1.56695556640625, 1.684722900390625, 1.802490234375, 1.920257568359375, 2.03802490234375, 2.155792236328125, 2.2735595703125, 2.391326904296875, 2.50909423828125, 2.626861572265625, 2.74462890625, 2.862396240234375, 2.98016357421875, 3.097930908203125, 3.2156982421875, 3.333465576171875, 3.45123291015625, 3.569000244140625, 3.686767578125, 3.804534912109375, 3.92230224609375, 4.040069580078125, 4.1578369140625, 4.275604248046875, 4.39337158203125, 4.511138916015625, 4.62890625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 7.0, 9.0, 12.0, 18.0, 19.0, 30.0, 63.0, 146.0, 341.0, 995.0, 5011.0, 96898.0, 4044440.0, 41735.0, 3290.0, 736.0, 267.0, 140.0, 49.0, 29.0, 21.0, 12.0, 6.0, 1.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-16.921875, -16.44384765625, -15.9658203125, -15.48779296875, -15.009765625, -14.53173828125, -14.0537109375, -13.57568359375, -13.09765625, -12.61962890625, -12.1416015625, -11.66357421875, -11.185546875, -10.70751953125, -10.2294921875, -9.75146484375, -9.2734375, -8.79541015625, -8.3173828125, -7.83935546875, -7.361328125, -6.88330078125, -6.4052734375, -5.92724609375, -5.44921875, -4.97119140625, -4.4931640625, -4.01513671875, -3.537109375, -3.05908203125, -2.5810546875, -2.10302734375, -1.625, -1.14697265625, -0.6689453125, -0.19091796875, 0.287109375, 0.76513671875, 1.2431640625, 1.72119140625, 2.19921875, 2.67724609375, 3.1552734375, 3.63330078125, 4.111328125, 4.58935546875, 5.0673828125, 5.54541015625, 6.0234375, 6.50146484375, 6.9794921875, 7.45751953125, 7.935546875, 8.41357421875, 8.8916015625, 9.36962890625, 9.84765625, 10.32568359375, 10.8037109375, 11.28173828125, 11.759765625, 12.23779296875, 12.7158203125, 13.19384765625, 13.671875]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 4.0, 4.0, 4.0, 11.0, 23.0, 16.0, 41.0, 88.0, 136.0, 418.0, 1032.0, 1305.0, 567.0, 220.0, 93.0, 41.0, 28.0, 13.0, 14.0, 9.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.921875, -13.5755615234375, -13.229248046875, -12.8829345703125, -12.53662109375, -12.1903076171875, -11.843994140625, -11.4976806640625, -11.1513671875, -10.8050537109375, -10.458740234375, -10.1124267578125, -9.76611328125, -9.4197998046875, -9.073486328125, -8.7271728515625, -8.380859375, -8.0345458984375, -7.688232421875, -7.3419189453125, -6.99560546875, -6.6492919921875, -6.302978515625, -5.9566650390625, -5.6103515625, -5.2640380859375, -4.917724609375, -4.5714111328125, -4.22509765625, -3.8787841796875, -3.532470703125, -3.1861572265625, -2.83984375, -2.4935302734375, -2.147216796875, -1.8009033203125, -1.45458984375, -1.1082763671875, -0.761962890625, -0.4156494140625, -0.0693359375, 0.2769775390625, 0.623291015625, 0.9696044921875, 1.31591796875, 1.6622314453125, 2.008544921875, 2.3548583984375, 2.701171875, 3.0474853515625, 3.393798828125, 3.7401123046875, 4.08642578125, 4.4327392578125, 4.779052734375, 5.1253662109375, 5.4716796875, 5.8179931640625, 6.164306640625, 6.5106201171875, 6.85693359375, 7.2032470703125, 7.549560546875, 7.8958740234375, 8.2421875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 2.0, 2.0, 5.0, 8.0, 14.0, 22.0, 18.0, 43.0, 53.0, 86.0, 115.0, 137.0, 180.0, 128.0, 75.0, 47.0, 28.0, 13.0, 9.0, 5.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-57.12649154663086, -55.70967483520508, -54.29285430908203, -52.87603759765625, -51.45922088623047, -50.04240417480469, -48.62558364868164, -47.20876693725586, -45.79194641113281, -44.37512969970703, -42.958309173583984, -41.5414924621582, -40.12467575073242, -38.707855224609375, -37.291038513183594, -35.87422180175781, -34.45740509033203, -33.04058837890625, -31.623769760131836, -30.206951141357422, -28.79013442993164, -27.373315811157227, -25.956497192382812, -24.53968048095703, -23.122861862182617, -21.706043243408203, -20.289226531982422, -18.872407913208008, -17.455589294433594, -16.038772583007812, -14.621953964233398, -13.2051362991333, -11.788314819335938, -10.37149715423584, -8.954679489135742, -7.537860870361328, -6.1210432052612305, -4.704225540161133, -3.2874069213867188, -1.870589256286621, -0.45377159118652344, 0.9630463123321533, 2.37986421585083, 3.796682357788086, 5.213500022888184, 6.630317687988281, 8.047136306762695, 9.463953971862793, 10.88077163696289, 12.297589302062988, 13.714406967163086, 15.1312255859375, 16.54804229736328, 17.964860916137695, 19.38167953491211, 20.79849624633789, 22.215314865112305, 23.63213348388672, 25.0489501953125, 26.465768814086914, 27.882587432861328, 29.29940414428711, 30.716222763061523, 32.13304138183594, 33.54985809326172]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 8.0, 10.0, 9.0, 10.0, 13.0, 12.0, 23.0, 17.0, 19.0, 20.0, 23.0, 23.0, 24.0, 31.0, 40.0, 39.0, 30.0, 34.0, 38.0, 41.0, 42.0, 40.0, 46.0, 54.0, 37.0, 33.0, 36.0, 32.0, 24.0, 27.0, 18.0, 17.0, 18.0, 15.0, 18.0, 14.0, 17.0, 11.0, 12.0, 8.0, 6.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-27.05431365966797, -26.233734130859375, -25.41315269470215, -24.592573165893555, -23.77199363708496, -22.951412200927734, -22.13083267211914, -21.310253143310547, -20.48967170715332, -19.669092178344727, -18.8485107421875, -18.027931213378906, -17.207351684570312, -16.386770248413086, -15.566190719604492, -14.745610237121582, -13.925030708312988, -13.104450225830078, -12.283870697021484, -11.463290214538574, -10.642709732055664, -9.82213020324707, -9.00154972076416, -8.18096923828125, -7.360389232635498, -6.539809226989746, -5.719228744506836, -4.898648738861084, -4.078068733215332, -3.257488250732422, -2.43690824508667, -1.6163277626037598, -0.7957477569580078, 0.024832427501678467, 0.8454126119613647, 1.6659927368164062, 2.4865729808807373, 3.3071532249450684, 4.12773323059082, 4.9483137130737305, 5.768893718719482, 6.589473724365234, 7.4100542068481445, 8.230634689331055, 9.051214218139648, 9.871794700622559, 10.692375183105469, 11.512954711914062, 12.333535194396973, 13.154115676879883, 13.974695205688477, 14.795275688171387, 15.615856170654297, 16.43643569946289, 17.257015228271484, 18.07759666442871, 18.898176193237305, 19.7187557220459, 20.539337158203125, 21.35991668701172, 22.180496215820312, 23.00107765197754, 23.821657180786133, 24.64223861694336, 25.462818145751953]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 6.0, 11.0, 10.0, 18.0, 27.0, 42.0, 69.0, 133.0, 212.0, 329.0, 674.0, 1221.0, 2262.0, 4624.0, 9992.0, 23085.0, 63817.0, 217312.0, 473976.0, 164647.0, 50186.0, 19214.0, 8275.0, 3957.0, 2029.0, 1093.0, 565.0, 313.0, 182.0, 106.0, 52.0, 42.0, 32.0, 14.0, 13.0, 10.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-7.80078125, -7.5921630859375, -7.383544921875, -7.1749267578125, -6.96630859375, -6.7576904296875, -6.549072265625, -6.3404541015625, -6.1318359375, -5.9232177734375, -5.714599609375, -5.5059814453125, -5.29736328125, -5.0887451171875, -4.880126953125, -4.6715087890625, -4.462890625, -4.2542724609375, -4.045654296875, -3.8370361328125, -3.62841796875, -3.4197998046875, -3.211181640625, -3.0025634765625, -2.7939453125, -2.5853271484375, -2.376708984375, -2.1680908203125, -1.95947265625, -1.7508544921875, -1.542236328125, -1.3336181640625, -1.125, -0.9163818359375, -0.707763671875, -0.4991455078125, -0.29052734375, -0.0819091796875, 0.126708984375, 0.3353271484375, 0.5439453125, 0.7525634765625, 0.961181640625, 1.1697998046875, 1.37841796875, 1.5870361328125, 1.795654296875, 2.0042724609375, 2.212890625, 2.4215087890625, 2.630126953125, 2.8387451171875, 3.04736328125, 3.2559814453125, 3.464599609375, 3.6732177734375, 3.8818359375, 4.0904541015625, 4.299072265625, 4.5076904296875, 4.71630859375, 4.9249267578125, 5.133544921875, 5.3421630859375, 5.55078125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 7.0, 7.0, 5.0, 8.0, 7.0, 16.0, 24.0, 21.0, 21.0, 26.0, 35.0, 36.0, 50.0, 53.0, 63.0, 65.0, 59.0, 56.0, 43.0, 51.0, 57.0, 50.0, 43.0, 36.0, 28.0, 31.0, 21.0, 22.0, 13.0, 10.0, 20.0, 7.0, 7.0, 5.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.236328125, -3.117767333984375, -2.99920654296875, -2.880645751953125, -2.7620849609375, -2.643524169921875, -2.52496337890625, -2.406402587890625, -2.287841796875, -2.169281005859375, -2.05072021484375, -1.932159423828125, -1.8135986328125, -1.695037841796875, -1.57647705078125, -1.457916259765625, -1.33935546875, -1.220794677734375, -1.10223388671875, -0.983673095703125, -0.8651123046875, -0.746551513671875, -0.62799072265625, -0.509429931640625, -0.390869140625, -0.272308349609375, -0.15374755859375, -0.035186767578125, 0.0833740234375, 0.201934814453125, 0.32049560546875, 0.439056396484375, 0.5576171875, 0.676177978515625, 0.79473876953125, 0.913299560546875, 1.0318603515625, 1.150421142578125, 1.26898193359375, 1.387542724609375, 1.506103515625, 1.624664306640625, 1.74322509765625, 1.861785888671875, 1.9803466796875, 2.098907470703125, 2.21746826171875, 2.336029052734375, 2.45458984375, 2.573150634765625, 2.69171142578125, 2.810272216796875, 2.9288330078125, 3.047393798828125, 3.16595458984375, 3.284515380859375, 3.403076171875, 3.521636962890625, 3.64019775390625, 3.758758544921875, 3.8773193359375, 3.995880126953125, 4.11444091796875, 4.233001708984375, 4.3515625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 0.0, 4.0, 4.0, 4.0, 10.0, 16.0, 17.0, 23.0, 51.0, 61.0, 127.0, 182.0, 323.0, 642.0, 1321.0, 3552.0, 16770.0, 220225.0, 766802.0, 29886.0, 5220.0, 1649.0, 716.0, 380.0, 221.0, 122.0, 93.0, 52.0, 28.0, 19.0, 14.0, 8.0, 7.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0, -10.5792236328125, -10.158447265625, -9.7376708984375, -9.31689453125, -8.8961181640625, -8.475341796875, -8.0545654296875, -7.6337890625, -7.2130126953125, -6.792236328125, -6.3714599609375, -5.95068359375, -5.5299072265625, -5.109130859375, -4.6883544921875, -4.267578125, -3.8468017578125, -3.426025390625, -3.0052490234375, -2.58447265625, -2.1636962890625, -1.742919921875, -1.3221435546875, -0.9013671875, -0.4805908203125, -0.059814453125, 0.3609619140625, 0.78173828125, 1.2025146484375, 1.623291015625, 2.0440673828125, 2.46484375, 2.8856201171875, 3.306396484375, 3.7271728515625, 4.14794921875, 4.5687255859375, 4.989501953125, 5.4102783203125, 5.8310546875, 6.2518310546875, 6.672607421875, 7.0933837890625, 7.51416015625, 7.9349365234375, 8.355712890625, 8.7764892578125, 9.197265625, 9.6180419921875, 10.038818359375, 10.4595947265625, 10.88037109375, 11.3011474609375, 11.721923828125, 12.1427001953125, 12.5634765625, 12.9842529296875, 13.405029296875, 13.8258056640625, 14.24658203125, 14.6673583984375, 15.088134765625, 15.5089111328125, 15.9296875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 8.0, 4.0, 8.0, 2.0, 7.0, 7.0, 12.0, 22.0, 26.0, 26.0, 34.0, 44.0, 54.0, 73.0, 93.0, 82.0, 82.0, 85.0, 69.0, 60.0, 59.0, 39.0, 23.0, 24.0, 12.0, 11.0, 6.0, 10.0, 5.0, 6.0, 3.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0], "bins": [-19.46875, -18.97119140625, -18.4736328125, -17.97607421875, -17.478515625, -16.98095703125, -16.4833984375, -15.98583984375, -15.48828125, -14.99072265625, -14.4931640625, -13.99560546875, -13.498046875, -13.00048828125, -12.5029296875, -12.00537109375, -11.5078125, -11.01025390625, -10.5126953125, -10.01513671875, -9.517578125, -9.02001953125, -8.5224609375, -8.02490234375, -7.52734375, -7.02978515625, -6.5322265625, -6.03466796875, -5.537109375, -5.03955078125, -4.5419921875, -4.04443359375, -3.546875, -3.04931640625, -2.5517578125, -2.05419921875, -1.556640625, -1.05908203125, -0.5615234375, -0.06396484375, 0.43359375, 0.93115234375, 1.4287109375, 1.92626953125, 2.423828125, 2.92138671875, 3.4189453125, 3.91650390625, 4.4140625, 4.91162109375, 5.4091796875, 5.90673828125, 6.404296875, 6.90185546875, 7.3994140625, 7.89697265625, 8.39453125, 8.89208984375, 9.3896484375, 9.88720703125, 10.384765625, 10.88232421875, 11.3798828125, 11.87744140625, 12.375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 7.0, 5.0, 9.0, 12.0, 14.0, 17.0, 26.0, 32.0, 46.0, 52.0, 81.0, 127.0, 200.0, 285.0, 530.0, 890.0, 1873.0, 4759.0, 15161.0, 65905.0, 659554.0, 239317.0, 41909.0, 10576.0, 3614.0, 1542.0, 797.0, 367.0, 268.0, 164.0, 124.0, 63.0, 58.0, 45.0, 33.0, 25.0, 22.0, 12.0, 10.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 3.0, 3.0, 2.0, 0.0, 0.0, 2.0, 2.0], "bins": [-1.9091796875, -1.85107421875, -1.79296875, -1.73486328125, -1.6767578125, -1.61865234375, -1.560546875, -1.50244140625, -1.4443359375, -1.38623046875, -1.328125, -1.27001953125, -1.2119140625, -1.15380859375, -1.095703125, -1.03759765625, -0.9794921875, -0.92138671875, -0.86328125, -0.80517578125, -0.7470703125, -0.68896484375, -0.630859375, -0.57275390625, -0.5146484375, -0.45654296875, -0.3984375, -0.34033203125, -0.2822265625, -0.22412109375, -0.166015625, -0.10791015625, -0.0498046875, 0.00830078125, 0.06640625, 0.12451171875, 0.1826171875, 0.24072265625, 0.298828125, 0.35693359375, 0.4150390625, 0.47314453125, 0.53125, 0.58935546875, 0.6474609375, 0.70556640625, 0.763671875, 0.82177734375, 0.8798828125, 0.93798828125, 0.99609375, 1.05419921875, 1.1123046875, 1.17041015625, 1.228515625, 1.28662109375, 1.3447265625, 1.40283203125, 1.4609375, 1.51904296875, 1.5771484375, 1.63525390625, 1.693359375, 1.75146484375, 1.8095703125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 3.0, 5.0, 5.0, 6.0, 4.0, 13.0, 10.0, 10.0, 11.0, 17.0, 19.0, 25.0, 30.0, 51.0, 54.0, 92.0, 103.0, 104.0, 107.0, 75.0, 73.0, 44.0, 38.0, 19.0, 20.0, 17.0, 14.0, 15.0, 4.0, 2.0, 3.0, 4.0, 6.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0006914138793945312, -0.0006729662418365479, -0.0006545186042785645, -0.0006360709667205811, -0.0006176233291625977, -0.0005991756916046143, -0.0005807280540466309, -0.0005622804164886475, -0.0005438327789306641, -0.0005253851413726807, -0.0005069375038146973, -0.0004884898662567139, -0.00047004222869873047, -0.00045159459114074707, -0.00043314695358276367, -0.0004146993160247803, -0.0003962516784667969, -0.0003778040409088135, -0.0003593564033508301, -0.0003409087657928467, -0.0003224611282348633, -0.0003040134906768799, -0.0002855658531188965, -0.0002671182155609131, -0.0002486705780029297, -0.0002302229404449463, -0.0002117753028869629, -0.0001933276653289795, -0.0001748800277709961, -0.0001564323902130127, -0.0001379847526550293, -0.0001195371150970459, -0.0001010894775390625, -8.26418399810791e-05, -6.41942024230957e-05, -4.5746564865112305e-05, -2.7298927307128906e-05, -8.851289749145508e-06, 9.59634780883789e-06, 2.804398536682129e-05, 4.649162292480469e-05, 6.493926048278809e-05, 8.338689804077148e-05, 0.00010183453559875488, 0.00012028217315673828, 0.00013872981071472168, 0.00015717744827270508, 0.00017562508583068848, 0.00019407272338867188, 0.00021252036094665527, 0.00023096799850463867, 0.00024941563606262207, 0.00026786327362060547, 0.00028631091117858887, 0.00030475854873657227, 0.00032320618629455566, 0.00034165382385253906, 0.00036010146141052246, 0.00037854909896850586, 0.00039699673652648926, 0.00041544437408447266, 0.00043389201164245605, 0.00045233964920043945, 0.00047078728675842285, 0.0004892349243164062]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 1.0, 0.0, 4.0, 4.0, 10.0, 15.0, 22.0, 47.0, 77.0, 127.0, 223.0, 498.0, 1051.0, 2964.0, 10951.0, 81139.0, 847685.0, 86914.0, 11443.0, 3177.0, 1164.0, 468.0, 243.0, 124.0, 77.0, 50.0, 21.0, 19.0, 10.0, 11.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-3.2890625, -3.201385498046875, -3.11370849609375, -3.026031494140625, -2.9383544921875, -2.850677490234375, -2.76300048828125, -2.675323486328125, -2.587646484375, -2.499969482421875, -2.41229248046875, -2.324615478515625, -2.2369384765625, -2.149261474609375, -2.06158447265625, -1.973907470703125, -1.88623046875, -1.798553466796875, -1.71087646484375, -1.623199462890625, -1.5355224609375, -1.447845458984375, -1.36016845703125, -1.272491455078125, -1.184814453125, -1.097137451171875, -1.00946044921875, -0.921783447265625, -0.8341064453125, -0.746429443359375, -0.65875244140625, -0.571075439453125, -0.4833984375, -0.395721435546875, -0.30804443359375, -0.220367431640625, -0.1326904296875, -0.045013427734375, 0.04266357421875, 0.130340576171875, 0.218017578125, 0.305694580078125, 0.39337158203125, 0.481048583984375, 0.5687255859375, 0.656402587890625, 0.74407958984375, 0.831756591796875, 0.91943359375, 1.007110595703125, 1.09478759765625, 1.182464599609375, 1.2701416015625, 1.357818603515625, 1.44549560546875, 1.533172607421875, 1.620849609375, 1.708526611328125, 1.79620361328125, 1.883880615234375, 1.9715576171875, 2.059234619140625, 2.14691162109375, 2.234588623046875, 2.322265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 1.0, 3.0, 10.0, 6.0, 6.0, 19.0, 22.0, 22.0, 36.0, 42.0, 76.0, 91.0, 129.0, 128.0, 109.0, 81.0, 51.0, 55.0, 37.0, 29.0, 21.0, 11.0, 9.0, 3.0, 6.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0625, -2.975555419921875, -2.88861083984375, -2.801666259765625, -2.7147216796875, -2.627777099609375, -2.54083251953125, -2.453887939453125, -2.366943359375, -2.279998779296875, -2.19305419921875, -2.106109619140625, -2.0191650390625, -1.932220458984375, -1.84527587890625, -1.758331298828125, -1.67138671875, -1.584442138671875, -1.49749755859375, -1.410552978515625, -1.3236083984375, -1.236663818359375, -1.14971923828125, -1.062774658203125, -0.975830078125, -0.888885498046875, -0.80194091796875, -0.714996337890625, -0.6280517578125, -0.541107177734375, -0.45416259765625, -0.367218017578125, -0.2802734375, -0.193328857421875, -0.10638427734375, -0.019439697265625, 0.0675048828125, 0.154449462890625, 0.24139404296875, 0.328338623046875, 0.415283203125, 0.502227783203125, 0.58917236328125, 0.676116943359375, 0.7630615234375, 0.850006103515625, 0.93695068359375, 1.023895263671875, 1.11083984375, 1.197784423828125, 1.28472900390625, 1.371673583984375, 1.4586181640625, 1.545562744140625, 1.63250732421875, 1.719451904296875, 1.806396484375, 1.893341064453125, 1.98028564453125, 2.067230224609375, 2.1541748046875, 2.241119384765625, 2.32806396484375, 2.415008544921875, 2.501953125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 7.0, 20.0, 43.0, 101.0, 280.0, 298.0, 118.0, 65.0, 32.0, 7.0, 7.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.96814727783203, -79.55622863769531, -77.1443099975586, -74.7323989868164, -72.32048034667969, -69.90856170654297, -67.49664306640625, -65.08473205566406, -62.672813415527344, -60.260894775390625, -57.84897994995117, -55.43706130981445, -53.025146484375, -50.61322784423828, -48.20130920410156, -45.78939437866211, -43.37747573852539, -40.96555709838867, -38.55364227294922, -36.1417236328125, -33.72980880737305, -31.317890167236328, -28.905973434448242, -26.494056701660156, -24.08213996887207, -21.670223236083984, -19.2583065032959, -16.846389770507812, -14.43447208404541, -12.022555351257324, -9.610637664794922, -7.198720932006836, -4.78680419921875, -2.374887228012085, 0.03702974319458008, 2.448946952819824, 4.86086368560791, 7.272780418395996, 9.684698104858398, 12.096614837646484, 14.50853157043457, 16.920448303222656, 19.332365036010742, 21.744281768798828, 24.156200408935547, 26.568115234375, 28.98003387451172, 31.391950607299805, 33.80386734008789, 36.21578598022461, 38.62770080566406, 41.03961944580078, 43.451534271240234, 45.86345291137695, 48.275367736816406, 50.687286376953125, 53.099205017089844, 55.51112365722656, 57.923038482666016, 60.334957122802734, 62.74687194824219, 65.1587905883789, 67.57070922851562, 69.98262023925781, 72.39453887939453]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 6.0, 7.0, 5.0, 13.0, 10.0, 12.0, 14.0, 16.0, 10.0, 23.0, 25.0, 22.0, 19.0, 25.0, 39.0, 33.0, 46.0, 93.0, 128.0, 111.0, 51.0, 42.0, 31.0, 30.0, 17.0, 22.0, 22.0, 15.0, 23.0, 8.0, 21.0, 15.0, 7.0, 2.0, 8.0, 8.0, 5.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.72791290283203, -37.50796127319336, -36.28800582885742, -35.06805419921875, -33.84809875488281, -32.62814712524414, -31.408191680908203, -30.18824005126953, -28.968284606933594, -27.74833106994629, -26.528377532958984, -25.30842399597168, -24.088470458984375, -22.86851692199707, -21.648563385009766, -20.428611755371094, -19.20865821838379, -17.988704681396484, -16.76875114440918, -15.548797607421875, -14.32884407043457, -13.108890533447266, -11.888937950134277, -10.668984413146973, -9.449030876159668, -8.229077339172363, -7.009123802185059, -5.789170742034912, -4.569217205047607, -3.3492636680603027, -2.1293106079101562, -0.9093570709228516, 0.3105964660644531, 1.5305498838424683, 2.7505033016204834, 3.970456600189209, 5.190410137176514, 6.410363674163818, 7.630316734313965, 8.85027027130127, 10.070223808288574, 11.290177345275879, 12.510130882263184, 13.730083465576172, 14.950037002563477, 16.16999053955078, 17.389944076538086, 18.60989761352539, 19.829851150512695, 21.0498046875, 22.269758224487305, 23.48971176147461, 24.709665298461914, 25.92961883544922, 27.14957046508789, 28.369525909423828, 29.5894775390625, 30.809431076049805, 32.02938461303711, 33.24933624267578, 34.46929168701172, 35.68924331665039, 36.90919876098633, 38.129150390625, 39.34910583496094]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 6.0, 6.0, 10.0, 6.0, 18.0, 23.0, 56.0, 78.0, 138.0, 301.0, 602.0, 1692.0, 5366.0, 29384.0, 672991.0, 3288345.0, 175650.0, 14293.0, 3361.0, 1103.0, 451.0, 205.0, 76.0, 54.0, 31.0, 25.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3046875, -11.9749755859375, -11.645263671875, -11.3155517578125, -10.98583984375, -10.6561279296875, -10.326416015625, -9.9967041015625, -9.6669921875, -9.3372802734375, -9.007568359375, -8.6778564453125, -8.34814453125, -8.0184326171875, -7.688720703125, -7.3590087890625, -7.029296875, -6.6995849609375, -6.369873046875, -6.0401611328125, -5.71044921875, -5.3807373046875, -5.051025390625, -4.7213134765625, -4.3916015625, -4.0618896484375, -3.732177734375, -3.4024658203125, -3.07275390625, -2.7430419921875, -2.413330078125, -2.0836181640625, -1.75390625, -1.4241943359375, -1.094482421875, -0.7647705078125, -0.43505859375, -0.1053466796875, 0.224365234375, 0.5540771484375, 0.8837890625, 1.2135009765625, 1.543212890625, 1.8729248046875, 2.20263671875, 2.5323486328125, 2.862060546875, 3.1917724609375, 3.521484375, 3.8511962890625, 4.180908203125, 4.5106201171875, 4.84033203125, 5.1700439453125, 5.499755859375, 5.8294677734375, 6.1591796875, 6.4888916015625, 6.818603515625, 7.1483154296875, 7.47802734375, 7.8077392578125, 8.137451171875, 8.4671630859375, 8.796875]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 13.0, 17.0, 20.0, 17.0, 16.0, 29.0, 35.0, 45.0, 47.0, 46.0, 52.0, 51.0, 62.0, 68.0, 61.0, 48.0, 58.0, 52.0, 54.0, 31.0, 39.0, 32.0, 20.0, 16.0, 15.0, 11.0, 12.0, 8.0, 7.0, 5.0, 4.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2109375, -3.09423828125, -2.9775390625, -2.86083984375, -2.744140625, -2.62744140625, -2.5107421875, -2.39404296875, -2.27734375, -2.16064453125, -2.0439453125, -1.92724609375, -1.810546875, -1.69384765625, -1.5771484375, -1.46044921875, -1.34375, -1.22705078125, -1.1103515625, -0.99365234375, -0.876953125, -0.76025390625, -0.6435546875, -0.52685546875, -0.41015625, -0.29345703125, -0.1767578125, -0.06005859375, 0.056640625, 0.17333984375, 0.2900390625, 0.40673828125, 0.5234375, 0.64013671875, 0.7568359375, 0.87353515625, 0.990234375, 1.10693359375, 1.2236328125, 1.34033203125, 1.45703125, 1.57373046875, 1.6904296875, 1.80712890625, 1.923828125, 2.04052734375, 2.1572265625, 2.27392578125, 2.390625, 2.50732421875, 2.6240234375, 2.74072265625, 2.857421875, 2.97412109375, 3.0908203125, 3.20751953125, 3.32421875, 3.44091796875, 3.5576171875, 3.67431640625, 3.791015625, 3.90771484375, 4.0244140625, 4.14111328125, 4.2578125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 3.0, 10.0, 7.0, 8.0, 12.0, 19.0, 26.0, 50.0, 104.0, 166.0, 368.0, 816.0, 2005.0, 6926.0, 80892.0, 4015915.0, 77049.0, 6406.0, 1920.0, 726.0, 367.0, 197.0, 107.0, 68.0, 35.0, 21.0, 17.0, 15.0, 9.0, 5.0, 6.0, 5.0, 4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.0625, -13.510986328125, -12.95947265625, -12.407958984375, -11.8564453125, -11.304931640625, -10.75341796875, -10.201904296875, -9.650390625, -9.098876953125, -8.54736328125, -7.995849609375, -7.4443359375, -6.892822265625, -6.34130859375, -5.789794921875, -5.23828125, -4.686767578125, -4.13525390625, -3.583740234375, -3.0322265625, -2.480712890625, -1.92919921875, -1.377685546875, -0.826171875, -0.274658203125, 0.27685546875, 0.828369140625, 1.3798828125, 1.931396484375, 2.48291015625, 3.034423828125, 3.5859375, 4.137451171875, 4.68896484375, 5.240478515625, 5.7919921875, 6.343505859375, 6.89501953125, 7.446533203125, 7.998046875, 8.549560546875, 9.10107421875, 9.652587890625, 10.2041015625, 10.755615234375, 11.30712890625, 11.858642578125, 12.41015625, 12.961669921875, 13.51318359375, 14.064697265625, 14.6162109375, 15.167724609375, 15.71923828125, 16.270751953125, 16.822265625, 17.373779296875, 17.92529296875, 18.476806640625, 19.0283203125, 19.579833984375, 20.13134765625, 20.682861328125, 21.234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 1.0, 8.0, 14.0, 11.0, 26.0, 28.0, 48.0, 73.0, 96.0, 156.0, 298.0, 516.0, 813.0, 849.0, 492.0, 233.0, 167.0, 85.0, 59.0, 34.0, 20.0, 16.0, 15.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.5546875, -14.181884765625, -13.80908203125, -13.436279296875, -13.0634765625, -12.690673828125, -12.31787109375, -11.945068359375, -11.572265625, -11.199462890625, -10.82666015625, -10.453857421875, -10.0810546875, -9.708251953125, -9.33544921875, -8.962646484375, -8.58984375, -8.217041015625, -7.84423828125, -7.471435546875, -7.0986328125, -6.725830078125, -6.35302734375, -5.980224609375, -5.607421875, -5.234619140625, -4.86181640625, -4.489013671875, -4.1162109375, -3.743408203125, -3.37060546875, -2.997802734375, -2.625, -2.252197265625, -1.87939453125, -1.506591796875, -1.1337890625, -0.760986328125, -0.38818359375, -0.015380859375, 0.357421875, 0.730224609375, 1.10302734375, 1.475830078125, 1.8486328125, 2.221435546875, 2.59423828125, 2.967041015625, 3.33984375, 3.712646484375, 4.08544921875, 4.458251953125, 4.8310546875, 5.203857421875, 5.57666015625, 5.949462890625, 6.322265625, 6.695068359375, 7.06787109375, 7.440673828125, 7.8134765625, 8.186279296875, 8.55908203125, 8.931884765625, 9.3046875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 2.0, 9.0, 14.0, 21.0, 45.0, 80.0, 167.0, 243.0, 192.0, 108.0, 49.0, 25.0, 15.0, 7.0, 10.0, 3.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.19721984863281, -110.23877716064453, -106.28034210205078, -102.3218994140625, -98.36346435546875, -94.40502166748047, -90.44657897949219, -86.48814392089844, -82.52970886230469, -78.5712661743164, -74.61283111572266, -70.65438842773438, -66.69595336914062, -62.737510681152344, -58.77907180786133, -54.82063293457031, -50.86219024658203, -46.903751373291016, -42.9453125, -38.98686981201172, -35.02843475341797, -31.06999397277832, -27.111553192138672, -23.153114318847656, -19.19467544555664, -15.236236572265625, -11.277796745300293, -7.319356918334961, -3.3609180450439453, 0.5975208282470703, 4.555961608886719, 8.514400482177734, 12.47283935546875, 16.431278228759766, 20.38971710205078, 24.34815788269043, 28.306596755981445, 32.265037536621094, 36.22347640991211, 40.181915283203125, 44.14035415649414, 48.098793029785156, 52.05723190307617, 56.01567077636719, 59.97411346435547, 63.93254852294922, 67.8909912109375, 71.84942626953125, 75.80786895751953, 79.76631164550781, 83.72474670410156, 87.68318939208984, 91.6416244506836, 95.60006713867188, 99.55850219726562, 103.5169448852539, 107.47538757324219, 111.43383026123047, 115.39226531982422, 119.3507080078125, 123.30914306640625, 127.26758575439453, 131.2260284423828, 135.18446350097656, 139.1428985595703]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 7.0, 7.0, 6.0, 15.0, 11.0, 23.0, 19.0, 20.0, 21.0, 31.0, 27.0, 39.0, 42.0, 40.0, 60.0, 60.0, 57.0, 60.0, 41.0, 45.0, 29.0, 46.0, 43.0, 39.0, 36.0, 38.0, 32.0, 24.0, 19.0, 15.0, 14.0, 12.0, 8.0, 5.0, 5.0, 4.0, 1.0, 5.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-44.96317672729492, -43.280418395996094, -41.59765625, -39.91489791870117, -38.232139587402344, -36.54937744140625, -34.86661911010742, -33.183860778808594, -31.5010986328125, -29.81833839416504, -28.135578155517578, -26.45281982421875, -24.77005958557129, -23.087299346923828, -21.404541015625, -19.72178077697754, -18.039020538330078, -16.356260299682617, -14.673501014709473, -12.990741729736328, -11.307981491088867, -9.625221252441406, -7.942461967468262, -6.259702682495117, -4.576942443847656, -2.8941826820373535, -1.2114229202270508, 0.47133684158325195, 2.1540966033935547, 3.8368568420410156, 5.51961612701416, 7.202375411987305, 8.885139465332031, 10.567899703979492, 12.250658988952637, 13.933418273925781, 15.616178512573242, 17.298938751220703, 18.98169708251953, 20.664457321166992, 22.347217559814453, 24.029977798461914, 25.712738037109375, 27.395496368408203, 29.078256607055664, 30.761016845703125, 32.44377517700195, 34.12653350830078, 35.809295654296875, 37.4920539855957, 39.1748161315918, 40.857574462890625, 42.54033660888672, 44.22309494018555, 45.905853271484375, 47.58861541748047, 49.2713737487793, 50.954132080078125, 52.63689422607422, 54.31965255737305, 56.002410888671875, 57.68517303466797, 59.3679313659668, 61.050689697265625, 62.73345184326172]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 4.0, 6.0, 12.0, 11.0, 8.0, 22.0, 35.0, 36.0, 53.0, 69.0, 105.0, 150.0, 229.0, 345.0, 545.0, 895.0, 1334.0, 2320.0, 4357.0, 8130.0, 16160.0, 37479.0, 104100.0, 515827.0, 239263.0, 64865.0, 25819.0, 12023.0, 5974.0, 3381.0, 1860.0, 1065.0, 703.0, 440.0, 280.0, 189.0, 121.0, 99.0, 72.0, 44.0, 33.0, 26.0, 20.0, 9.0, 8.0, 7.0, 4.0, 8.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-5.14453125, -4.9774169921875, -4.810302734375, -4.6431884765625, -4.47607421875, -4.3089599609375, -4.141845703125, -3.9747314453125, -3.8076171875, -3.6405029296875, -3.473388671875, -3.3062744140625, -3.13916015625, -2.9720458984375, -2.804931640625, -2.6378173828125, -2.470703125, -2.3035888671875, -2.136474609375, -1.9693603515625, -1.80224609375, -1.6351318359375, -1.468017578125, -1.3009033203125, -1.1337890625, -0.9666748046875, -0.799560546875, -0.6324462890625, -0.46533203125, -0.2982177734375, -0.131103515625, 0.0360107421875, 0.203125, 0.3702392578125, 0.537353515625, 0.7044677734375, 0.87158203125, 1.0386962890625, 1.205810546875, 1.3729248046875, 1.5400390625, 1.7071533203125, 1.874267578125, 2.0413818359375, 2.20849609375, 2.3756103515625, 2.542724609375, 2.7098388671875, 2.876953125, 3.0440673828125, 3.211181640625, 3.3782958984375, 3.54541015625, 3.7125244140625, 3.879638671875, 4.0467529296875, 4.2138671875, 4.3809814453125, 4.548095703125, 4.7152099609375, 4.88232421875, 5.0494384765625, 5.216552734375, 5.3836669921875, 5.55078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 2.0, 4.0, 5.0, 8.0, 8.0, 11.0, 18.0, 21.0, 22.0, 41.0, 31.0, 45.0, 54.0, 52.0, 68.0, 50.0, 67.0, 60.0, 64.0, 56.0, 47.0, 53.0, 42.0, 33.0, 40.0, 23.0, 14.0, 17.0, 14.0, 7.0, 10.0, 7.0, 7.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.72265625, -4.58331298828125, -4.4439697265625, -4.30462646484375, -4.165283203125, -4.02593994140625, -3.8865966796875, -3.74725341796875, -3.60791015625, -3.46856689453125, -3.3292236328125, -3.18988037109375, -3.050537109375, -2.91119384765625, -2.7718505859375, -2.63250732421875, -2.4931640625, -2.35382080078125, -2.2144775390625, -2.07513427734375, -1.935791015625, -1.79644775390625, -1.6571044921875, -1.51776123046875, -1.37841796875, -1.23907470703125, -1.0997314453125, -0.96038818359375, -0.821044921875, -0.68170166015625, -0.5423583984375, -0.40301513671875, -0.263671875, -0.12432861328125, 0.0150146484375, 0.15435791015625, 0.293701171875, 0.43304443359375, 0.5723876953125, 0.71173095703125, 0.85107421875, 0.99041748046875, 1.1297607421875, 1.26910400390625, 1.408447265625, 1.54779052734375, 1.6871337890625, 1.82647705078125, 1.9658203125, 2.10516357421875, 2.2445068359375, 2.38385009765625, 2.523193359375, 2.66253662109375, 2.8018798828125, 2.94122314453125, 3.08056640625, 3.21990966796875, 3.3592529296875, 3.49859619140625, 3.637939453125, 3.77728271484375, 3.9166259765625, 4.05596923828125, 4.1953125]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 9.0, 6.0, 14.0, 12.0, 21.0, 32.0, 50.0, 98.0, 120.0, 160.0, 304.0, 528.0, 1068.0, 2493.0, 8873.0, 59851.0, 910397.0, 51697.0, 8202.0, 2373.0, 986.0, 474.0, 276.0, 171.0, 103.0, 65.0, 42.0, 34.0, 28.0, 13.0, 13.0, 9.0, 9.0, 5.0, 5.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-13.6328125, -13.2784423828125, -12.924072265625, -12.5697021484375, -12.21533203125, -11.8609619140625, -11.506591796875, -11.1522216796875, -10.7978515625, -10.4434814453125, -10.089111328125, -9.7347412109375, -9.38037109375, -9.0260009765625, -8.671630859375, -8.3172607421875, -7.962890625, -7.6085205078125, -7.254150390625, -6.8997802734375, -6.54541015625, -6.1910400390625, -5.836669921875, -5.4822998046875, -5.1279296875, -4.7735595703125, -4.419189453125, -4.0648193359375, -3.71044921875, -3.3560791015625, -3.001708984375, -2.6473388671875, -2.29296875, -1.9385986328125, -1.584228515625, -1.2298583984375, -0.87548828125, -0.5211181640625, -0.166748046875, 0.1876220703125, 0.5419921875, 0.8963623046875, 1.250732421875, 1.6051025390625, 1.95947265625, 2.3138427734375, 2.668212890625, 3.0225830078125, 3.376953125, 3.7313232421875, 4.085693359375, 4.4400634765625, 4.79443359375, 5.1488037109375, 5.503173828125, 5.8575439453125, 6.2119140625, 6.5662841796875, 6.920654296875, 7.2750244140625, 7.62939453125, 7.9837646484375, 8.338134765625, 8.6925048828125, 9.046875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 0.0, 4.0, 1.0, 2.0, 6.0, 2.0, 4.0, 5.0, 7.0, 9.0, 9.0, 13.0, 17.0, 14.0, 14.0, 17.0, 20.0, 25.0, 36.0, 44.0, 49.0, 57.0, 69.0, 75.0, 75.0, 80.0, 53.0, 57.0, 39.0, 33.0, 26.0, 22.0, 15.0, 17.0, 16.0, 13.0, 15.0, 5.0, 6.0, 8.0, 7.0, 4.0, 5.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.21875, -14.72998046875, -14.2412109375, -13.75244140625, -13.263671875, -12.77490234375, -12.2861328125, -11.79736328125, -11.30859375, -10.81982421875, -10.3310546875, -9.84228515625, -9.353515625, -8.86474609375, -8.3759765625, -7.88720703125, -7.3984375, -6.90966796875, -6.4208984375, -5.93212890625, -5.443359375, -4.95458984375, -4.4658203125, -3.97705078125, -3.48828125, -2.99951171875, -2.5107421875, -2.02197265625, -1.533203125, -1.04443359375, -0.5556640625, -0.06689453125, 0.421875, 0.91064453125, 1.3994140625, 1.88818359375, 2.376953125, 2.86572265625, 3.3544921875, 3.84326171875, 4.33203125, 4.82080078125, 5.3095703125, 5.79833984375, 6.287109375, 6.77587890625, 7.2646484375, 7.75341796875, 8.2421875, 8.73095703125, 9.2197265625, 9.70849609375, 10.197265625, 10.68603515625, 11.1748046875, 11.66357421875, 12.15234375, 12.64111328125, 13.1298828125, 13.61865234375, 14.107421875, 14.59619140625, 15.0849609375, 15.57373046875, 16.0625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 3.0, 4.0, 3.0, 6.0, 2.0, 6.0, 8.0, 18.0, 19.0, 25.0, 40.0, 54.0, 69.0, 107.0, 156.0, 257.0, 398.0, 598.0, 1169.0, 2352.0, 5536.0, 14720.0, 52654.0, 767057.0, 154516.0, 30807.0, 9843.0, 3954.0, 1730.0, 886.0, 539.0, 339.0, 207.0, 152.0, 90.0, 54.0, 58.0, 29.0, 19.0, 22.0, 9.0, 14.0, 4.0, 3.0, 3.0, 4.0, 5.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-1.6689453125, -1.618072509765625, -1.56719970703125, -1.516326904296875, -1.4654541015625, -1.414581298828125, -1.36370849609375, -1.312835693359375, -1.261962890625, -1.211090087890625, -1.16021728515625, -1.109344482421875, -1.0584716796875, -1.007598876953125, -0.95672607421875, -0.905853271484375, -0.85498046875, -0.804107666015625, -0.75323486328125, -0.702362060546875, -0.6514892578125, -0.600616455078125, -0.54974365234375, -0.498870849609375, -0.447998046875, -0.397125244140625, -0.34625244140625, -0.295379638671875, -0.2445068359375, -0.193634033203125, -0.14276123046875, -0.091888427734375, -0.041015625, 0.009857177734375, 0.06072998046875, 0.111602783203125, 0.1624755859375, 0.213348388671875, 0.26422119140625, 0.315093994140625, 0.365966796875, 0.416839599609375, 0.46771240234375, 0.518585205078125, 0.5694580078125, 0.620330810546875, 0.67120361328125, 0.722076416015625, 0.77294921875, 0.823822021484375, 0.87469482421875, 0.925567626953125, 0.9764404296875, 1.027313232421875, 1.07818603515625, 1.129058837890625, 1.179931640625, 1.230804443359375, 1.28167724609375, 1.332550048828125, 1.3834228515625, 1.434295654296875, 1.48516845703125, 1.536041259765625, 1.5869140625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 9.0, 7.0, 6.0, 12.0, 11.0, 21.0, 26.0, 18.0, 39.0, 41.0, 79.0, 98.0, 123.0, 130.0, 98.0, 69.0, 65.0, 28.0, 29.0, 24.0, 18.0, 8.0, 5.0, 5.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005211830139160156, -0.0005010738968849182, -0.0004809647798538208, -0.0004608556628227234, -0.000440746545791626, -0.00042063742876052856, -0.00040052831172943115, -0.00038041919469833374, -0.00036031007766723633, -0.0003402009606361389, -0.0003200918436050415, -0.0002999827265739441, -0.0002798736095428467, -0.00025976449251174927, -0.00023965537548065186, -0.00021954625844955444, -0.00019943714141845703, -0.00017932802438735962, -0.0001592189073562622, -0.0001391097903251648, -0.00011900067329406738, -9.889155626296997e-05, -7.878243923187256e-05, -5.8673322200775146e-05, -3.8564205169677734e-05, -1.8455088138580322e-05, 1.6540288925170898e-06, 2.1763145923614502e-05, 4.1872262954711914e-05, 6.198137998580933e-05, 8.209049701690674e-05, 0.00010219961404800415, 0.00012230873107910156, 0.00014241784811019897, 0.0001625269651412964, 0.0001826360821723938, 0.0002027451992034912, 0.00022285431623458862, 0.00024296343326568604, 0.00026307255029678345, 0.00028318166732788086, 0.00030329078435897827, 0.0003233999013900757, 0.0003435090184211731, 0.0003636181354522705, 0.0003837272524833679, 0.00040383636951446533, 0.00042394548654556274, 0.00044405460357666016, 0.00046416372060775757, 0.000484272837638855, 0.0005043819546699524, 0.0005244910717010498, 0.0005446001887321472, 0.0005647093057632446, 0.000584818422794342, 0.0006049275398254395, 0.0006250366568565369, 0.0006451457738876343, 0.0006652548909187317, 0.0006853640079498291, 0.0007054731249809265, 0.0007255822420120239, 0.0007456913590431213, 0.0007658004760742188]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 10.0, 18.0, 8.0, 36.0, 40.0, 51.0, 85.0, 125.0, 234.0, 396.0, 724.0, 1492.0, 3424.0, 9933.0, 38180.0, 728788.0, 219597.0, 30842.0, 8574.0, 3045.0, 1331.0, 680.0, 356.0, 215.0, 128.0, 66.0, 49.0, 35.0, 28.0, 24.0, 15.0, 4.0, 5.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05859375, -1.0143585205078125, -0.970123291015625, -0.9258880615234375, -0.88165283203125, -0.8374176025390625, -0.793182373046875, -0.7489471435546875, -0.7047119140625, -0.6604766845703125, -0.616241455078125, -0.5720062255859375, -0.52777099609375, -0.4835357666015625, -0.439300537109375, -0.3950653076171875, -0.350830078125, -0.3065948486328125, -0.262359619140625, -0.2181243896484375, -0.17388916015625, -0.1296539306640625, -0.085418701171875, -0.0411834716796875, 0.0030517578125, 0.0472869873046875, 0.091522216796875, 0.1357574462890625, 0.17999267578125, 0.2242279052734375, 0.268463134765625, 0.3126983642578125, 0.35693359375, 0.4011688232421875, 0.445404052734375, 0.4896392822265625, 0.53387451171875, 0.5781097412109375, 0.622344970703125, 0.6665802001953125, 0.7108154296875, 0.7550506591796875, 0.799285888671875, 0.8435211181640625, 0.88775634765625, 0.9319915771484375, 0.976226806640625, 1.0204620361328125, 1.064697265625, 1.1089324951171875, 1.153167724609375, 1.1974029541015625, 1.24163818359375, 1.2858734130859375, 1.330108642578125, 1.3743438720703125, 1.4185791015625, 1.4628143310546875, 1.507049560546875, 1.5512847900390625, 1.59552001953125, 1.6397552490234375, 1.683990478515625, 1.7282257080078125, 1.7724609375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 3.0, 1.0, 0.0, 3.0, 7.0, 10.0, 8.0, 5.0, 7.0, 9.0, 12.0, 17.0, 17.0, 16.0, 18.0, 30.0, 34.0, 43.0, 41.0, 55.0, 67.0, 76.0, 66.0, 77.0, 78.0, 55.0, 41.0, 36.0, 28.0, 38.0, 24.0, 19.0, 13.0, 7.0, 10.0, 4.0, 7.0, 6.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3603515625, -1.3066253662109375, -1.252899169921875, -1.1991729736328125, -1.14544677734375, -1.0917205810546875, -1.037994384765625, -0.9842681884765625, -0.9305419921875, -0.8768157958984375, -0.823089599609375, -0.7693634033203125, -0.71563720703125, -0.6619110107421875, -0.608184814453125, -0.5544586181640625, -0.500732421875, -0.4470062255859375, -0.393280029296875, -0.3395538330078125, -0.28582763671875, -0.2321014404296875, -0.178375244140625, -0.1246490478515625, -0.0709228515625, -0.0171966552734375, 0.036529541015625, 0.0902557373046875, 0.14398193359375, 0.1977081298828125, 0.251434326171875, 0.3051605224609375, 0.35888671875, 0.4126129150390625, 0.466339111328125, 0.5200653076171875, 0.57379150390625, 0.6275177001953125, 0.681243896484375, 0.7349700927734375, 0.7886962890625, 0.8424224853515625, 0.896148681640625, 0.9498748779296875, 1.00360107421875, 1.0573272705078125, 1.111053466796875, 1.1647796630859375, 1.218505859375, 1.2722320556640625, 1.325958251953125, 1.3796844482421875, 1.43341064453125, 1.4871368408203125, 1.540863037109375, 1.5945892333984375, 1.6483154296875, 1.7020416259765625, 1.755767822265625, 1.8094940185546875, 1.86322021484375, 1.9169464111328125, 1.970672607421875, 2.0243988037109375, 2.078125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 4.0, 12.0, 36.0, 39.0, 58.0, 105.0, 526.0, 93.0, 58.0, 23.0, 23.0, 7.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.39476013183594, -70.82308959960938, -68.25141143798828, -65.67974090576172, -63.108062744140625, -60.53639221191406, -57.964717864990234, -55.393043518066406, -52.82136917114258, -50.24969482421875, -47.67802047729492, -45.106346130371094, -42.53467559814453, -39.96299743652344, -37.391326904296875, -34.81965255737305, -32.24797821044922, -29.67630386352539, -27.104629516601562, -24.532957077026367, -21.96128273010254, -19.38960838317871, -16.817935943603516, -14.246261596679688, -11.67458724975586, -9.102912902832031, -6.5312395095825195, -3.9595656394958496, -1.3878917694091797, 1.1837825775146484, 3.75545597076416, 6.327129364013672, 8.898796081542969, 11.470470428466797, 14.042143821716309, 16.61381721496582, 19.18549156188965, 21.757165908813477, 24.328838348388672, 26.9005126953125, 29.472187042236328, 32.043861389160156, 34.615535736083984, 37.18721008300781, 39.758880615234375, 42.33055877685547, 44.90222930908203, 47.47390365600586, 50.04557800292969, 52.617252349853516, 55.188926696777344, 57.76060104370117, 60.332275390625, 62.90394592285156, 65.47562408447266, 68.04729461669922, 70.61897277832031, 73.19064331054688, 75.76232147216797, 78.33399200439453, 80.90567016601562, 83.47734069824219, 86.04901885986328, 88.62068939208984, 91.1923599243164]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0, 1.0, 2.0, 5.0, 4.0, 6.0, 3.0, 6.0, 7.0, 12.0, 16.0, 12.0, 21.0, 25.0, 25.0, 25.0, 27.0, 39.0, 93.0, 232.0, 185.0, 39.0, 24.0, 27.0, 27.0, 26.0, 29.0, 18.0, 18.0, 5.0, 4.0, 8.0, 7.0, 8.0, 3.0, 7.0, 4.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.49089431762695, -39.99684143066406, -38.50278854370117, -37.00873565673828, -35.514678955078125, -34.020626068115234, -32.526573181152344, -31.032520294189453, -29.53846549987793, -28.04441261291504, -26.550357818603516, -25.056304931640625, -23.562252044677734, -22.06819725036621, -20.57414436340332, -19.080089569091797, -17.586036682128906, -16.091983795166016, -14.597929000854492, -13.103876113891602, -11.609822273254395, -10.115768432617188, -8.621715545654297, -7.12766170501709, -5.633607864379883, -4.139554023742676, -2.645500659942627, -1.1514472961425781, 0.3426065444946289, 1.836660385131836, 3.3307132720947266, 4.824767112731934, 6.318817138671875, 7.812870979309082, 9.306924819946289, 10.80097770690918, 12.295031547546387, 13.789085388183594, 15.283138275146484, 16.777191162109375, 18.2712459564209, 19.76529884338379, 21.259353637695312, 22.753406524658203, 24.247459411621094, 25.741514205932617, 27.235567092895508, 28.72962188720703, 30.223674774169922, 31.717727661132812, 33.2117805480957, 34.705833435058594, 36.19989013671875, 37.69394302368164, 39.18799591064453, 40.68204879760742, 42.17610168457031, 43.6701545715332, 45.164207458496094, 46.65826416015625, 48.15231704711914, 49.64636993408203, 51.14042282104492, 52.63447570800781, 54.12853240966797]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 6.0, 6.0, 5.0, 10.0, 11.0, 24.0, 16.0, 28.0, 35.0, 44.0, 48.0, 52.0, 150.0, 285.0, 64.0, 46.0, 32.0, 28.0, 24.0, 22.0, 28.0, 10.0, 15.0, 8.0, 2.0, 8.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.9453125, -4.79156494140625, -4.6378173828125, -4.48406982421875, -4.330322265625, -4.17657470703125, -4.0228271484375, -3.86907958984375, -3.71533203125, -3.56158447265625, -3.4078369140625, -3.25408935546875, -3.100341796875, -2.94659423828125, -2.7928466796875, -2.63909912109375, -2.4853515625, -2.33160400390625, -2.1778564453125, -2.02410888671875, -1.870361328125, -1.71661376953125, -1.5628662109375, -1.40911865234375, -1.25537109375, -1.10162353515625, -0.9478759765625, -0.79412841796875, -0.640380859375, -0.48663330078125, -0.3328857421875, -0.17913818359375, -0.025390625, 0.12835693359375, 0.2821044921875, 0.43585205078125, 0.589599609375, 0.74334716796875, 0.8970947265625, 1.05084228515625, 1.20458984375, 1.35833740234375, 1.5120849609375, 1.66583251953125, 1.819580078125, 1.97332763671875, 2.1270751953125, 2.28082275390625, 2.4345703125, 2.58831787109375, 2.7420654296875, 2.89581298828125, 3.049560546875, 3.20330810546875, 3.3570556640625, 3.51080322265625, 3.66455078125, 3.81829833984375, 3.9720458984375, 4.12579345703125, 4.279541015625, 4.43328857421875, 4.5870361328125, 4.74078369140625, 4.89453125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 8.0, 4.0, 8.0, 5.0, 18.0, 7.0, 17.0, 44.0, 55.0, 115.0, 214.0, 556.0, 2101.0, 17332.0, 8356451.0, 9291.0, 1541.0, 441.0, 153.0, 92.0, 45.0, 18.0, 21.0, 8.0, 15.0, 9.0, 12.0, 6.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-37.30021667480469, -35.83097457885742, -34.36172866821289, -32.892486572265625, -31.423240661621094, -29.953998565673828, -28.48475456237793, -27.01551055908203, -25.546266555786133, -24.077022552490234, -22.607778549194336, -21.138534545898438, -19.669292449951172, -18.20004653930664, -16.730804443359375, -15.261560440063477, -13.792316436767578, -12.32307243347168, -10.853828430175781, -9.3845853805542, -7.915341377258301, -6.446097373962402, -4.97685432434082, -3.507610321044922, -2.0383663177490234, -0.5691225528717041, 0.9001212120056152, 2.3693647384643555, 3.838608741760254, 5.307852745056152, 6.777095794677734, 8.246339797973633, 9.715579986572266, 11.184823989868164, 12.654067993164062, 14.123311042785645, 15.592555046081543, 17.061798095703125, 18.531042098999023, 20.000286102294922, 21.46953010559082, 22.93877410888672, 24.408018112182617, 25.877262115478516, 27.34650421142578, 28.815750122070312, 30.284992218017578, 31.754236221313477, 33.223480224609375, 34.69272232055664, 36.16196823120117, 37.63121032714844, 39.10045623779297, 40.569698333740234, 42.0389404296875, 43.50818634033203, 44.97743225097656, 46.44667434692383, 47.91592025756836, 49.385162353515625, 50.854408264160156, 52.32365036010742, 53.79289245605469, 55.26213836669922, 56.731380462646484]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 1.0, 6.0, 0.0, 4.0, 1.0, 4.0, 6.0, 5.0, 11.0, 7.0, 9.0, 12.0, 2.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-85.37743377685547, -82.17849731445312, -78.97956085205078, -75.78062438964844, -72.58169555664062, -69.38275909423828, -66.18382263183594, -62.984886169433594, -59.78594970703125, -56.587013244628906, -53.38807678222656, -50.189144134521484, -46.99020767211914, -43.7912712097168, -40.59233856201172, -37.393402099609375, -34.19446563720703, -30.995529174804688, -27.796594619750977, -24.597660064697266, -21.398723602294922, -18.199787139892578, -15.000852584838867, -11.801918029785156, -8.602981567382812, -5.404046058654785, -2.205110549926758, 0.9938249588012695, 4.192760467529297, 7.391695976257324, 10.590631484985352, 13.789566040039062, 16.988494873046875, 20.18743133544922, 23.38636589050293, 26.58530044555664, 29.784236907958984, 32.98317337036133, 36.182106018066406, 39.38104248046875, 42.579978942871094, 45.77891540527344, 48.97785186767578, 52.17678451538086, 55.3757209777832, 58.57465744018555, 61.773590087890625, 64.97252655029297, 68.17146301269531, 71.37039947509766, 74.5693359375, 77.76827239990234, 80.96720886230469, 84.1661376953125, 87.36507415771484, 90.56401062011719, 93.76294708251953, 96.96188354492188, 100.16082000732422, 103.35975646972656, 106.55868530273438, 109.75762176513672, 112.95655822753906, 116.1554946899414, 119.35443115234375]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 6.0, 4.0, 10.0, 10.0, 18.0, 19.0, 29.0, 36.0, 68.0, 95.0, 160.0, 235.0, 451.0, 863.0, 1545.0, 3145.0, 6289.0, 14220.0, 33376.0, 83394.0, 169613.0, 123058.0, 49839.0, 20120.0, 8843.0, 4147.0, 2054.0, 1119.0, 592.0, 315.0, 221.0, 126.0, 85.0, 53.0, 41.0, 22.0, 10.0, 16.0, 7.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.671875, -19.0517578125, -18.431640625, -17.8115234375, -17.19140625, -16.5712890625, -15.951171875, -15.3310546875, -14.7109375, -14.0908203125, -13.470703125, -12.8505859375, -12.23046875, -11.6103515625, -10.990234375, -10.3701171875, -9.75, -9.1298828125, -8.509765625, -7.8896484375, -7.26953125, -6.6494140625, -6.029296875, -5.4091796875, -4.7890625, -4.1689453125, -3.548828125, -2.9287109375, -2.30859375, -1.6884765625, -1.068359375, -0.4482421875, 0.171875, 0.7919921875, 1.412109375, 2.0322265625, 2.65234375, 3.2724609375, 3.892578125, 4.5126953125, 5.1328125, 5.7529296875, 6.373046875, 6.9931640625, 7.61328125, 8.2333984375, 8.853515625, 9.4736328125, 10.09375, 10.7138671875, 11.333984375, 11.9541015625, 12.57421875, 13.1943359375, 13.814453125, 14.4345703125, 15.0546875, 15.6748046875, 16.294921875, 16.9150390625, 17.53515625, 18.1552734375, 18.775390625, 19.3955078125, 20.015625]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0, 2.0, 6.0, 6.0, 5.0, 11.0, 14.0, 23.0, 24.0, 18.0, 42.0, 36.0, 41.0, 50.0, 80.0, 84.0, 75.0, 71.0, 77.0, 72.0, 50.0, 42.0, 40.0, 36.0, 22.0, 25.0, 14.0, 14.0, 11.0, 4.0, 5.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3515625, -5.206512451171875, -5.06146240234375, -4.916412353515625, -4.7713623046875, -4.626312255859375, -4.48126220703125, -4.336212158203125, -4.191162109375, -4.046112060546875, -3.90106201171875, -3.756011962890625, -3.6109619140625, -3.465911865234375, -3.32086181640625, -3.175811767578125, -3.03076171875, -2.885711669921875, -2.74066162109375, -2.595611572265625, -2.4505615234375, -2.305511474609375, -2.16046142578125, -2.015411376953125, -1.870361328125, -1.725311279296875, -1.58026123046875, -1.435211181640625, -1.2901611328125, -1.145111083984375, -1.00006103515625, -0.855010986328125, -0.7099609375, -0.564910888671875, -0.41986083984375, -0.274810791015625, -0.1297607421875, 0.015289306640625, 0.16033935546875, 0.305389404296875, 0.450439453125, 0.595489501953125, 0.74053955078125, 0.885589599609375, 1.0306396484375, 1.175689697265625, 1.32073974609375, 1.465789794921875, 1.61083984375, 1.755889892578125, 1.90093994140625, 2.045989990234375, 2.1910400390625, 2.336090087890625, 2.48114013671875, 2.626190185546875, 2.771240234375, 2.916290283203125, 3.06134033203125, 3.206390380859375, 3.3514404296875, 3.496490478515625, 3.64154052734375, 3.786590576171875, 3.931640625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 4.0, 3.0, 13.0, 13.0, 25.0, 70.0, 88.0, 87.0, 72.0, 42.0, 13.0, 6.0, 12.0, 10.0, 9.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.99530029296875, -35.039794921875, -34.08428955078125, -33.1287841796875, -32.17327880859375, -31.217775344848633, -30.262269973754883, -29.306764602661133, -28.351259231567383, -27.395753860473633, -26.440248489379883, -25.484745025634766, -24.529239654541016, -23.573734283447266, -22.618228912353516, -21.662723541259766, -20.707218170166016, -19.751712799072266, -18.796207427978516, -17.840702056884766, -16.88519859313965, -15.929693222045898, -14.974187850952148, -14.018682479858398, -13.063179016113281, -12.107673645019531, -11.152169227600098, -10.196663856506348, -9.241158485412598, -8.285654067993164, -7.330148696899414, -6.374643325805664, -5.419137954711914, -4.463633060455322, -3.5081276893615723, -2.5526227951049805, -1.5971176624298096, -0.6416125297546387, 0.3138923645019531, 1.2693977355957031, 2.224902629852295, 3.180407762527466, 4.135912895202637, 5.0914177894592285, 6.04692268371582, 7.00242805480957, 7.957932949066162, 8.91343879699707, 9.868943214416504, 10.824448585510254, 11.779953002929688, 12.735458374023438, 13.690963745117188, 14.646469116210938, 15.601973533630371, 16.557479858398438, 17.512983322143555, 18.468488693237305, 19.423994064331055, 20.379497528076172, 21.335002899169922, 22.290508270263672, 23.246013641357422, 24.201519012451172, 25.157024383544922]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 5.0, 3.0, 4.0, 3.0, 4.0, 11.0, 14.0, 13.0, 45.0, 71.0, 84.0, 70.0, 45.0, 31.0, 20.0, 12.0, 6.0, 8.0, 4.0, 1.0, 4.0, 5.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 5.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.503015518188477, -17.868295669555664, -17.23357391357422, -16.598854064941406, -15.964132308959961, -15.329411506652832, -14.694690704345703, -14.05997085571289, -13.425249099731445, -12.790528297424316, -12.155807495117188, -11.521086692810059, -10.88636589050293, -10.2516450881958, -9.616924285888672, -8.98220443725586, -8.34748363494873, -7.712762832641602, -7.078042030334473, -6.443321228027344, -5.808600425720215, -5.173879623413086, -4.539159297943115, -3.9044384956359863, -3.2697176933288574, -2.6349968910217285, -2.0002760887145996, -1.3655555248260498, -0.7308347225189209, -0.09611392021179199, 0.5386066436767578, 1.1733274459838867, 1.8080482482910156, 2.4427690505981445, 3.0774898529052734, 3.7122104167938232, 4.346931457519531, 4.98165225982666, 5.616372585296631, 6.25109338760376, 6.885814189910889, 7.520534992218018, 8.155255317687988, 8.789976119995117, 9.424696922302246, 10.059417724609375, 10.694138526916504, 11.328859329223633, 11.963580131530762, 12.59830093383789, 13.23302173614502, 13.867742538452148, 14.502463340759277, 15.137184143066406, 15.771903991699219, 16.406625747680664, 17.041345596313477, 17.67606544494629, 18.310787200927734, 18.945507049560547, 19.580228805541992, 20.214948654174805, 20.84967041015625, 21.484390258789062, 22.119112014770508]}, "eval/loss": 4.259012699127197, "eval/wer": 2.4146370487901625, "eval/runtime": 1113.1839, "eval/samples_per_second": 2.373, "eval/steps_per_second": 0.297, "train/train_runtime": 8505.8878, "train/train_samples_per_second": 3.355, "train/train_steps_per_second": 0.21, "train/total_flos": 0.0, "train/train_loss": 4.4116124524129345, "_wandb": {"runtime": 9990}}