{"train/loss": 4.5256, "train/learning_rate": 1.1940000000000001e-05, "train/epoch": 0.78, "train/global_step": 200, "_runtime": 3707, "_timestamp": 1646154545, "_step": 199, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 108.0, 891.0, 16.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-177.56703186035156, -149.70550537109375, -121.84396362304688, -93.98242950439453, -66.12089538574219, -38.25935363769531, -10.3978271484375, 17.463699340820312, 45.32524108886719, 73.18677520751953, 101.04830932617188, 128.90985107421875, 156.77137756347656, 184.63291931152344, 212.49444580078125, 240.35597229003906, 268.217529296875, 296.0790710449219, 323.94061279296875, 351.8021240234375, 379.6636657714844, 407.52520751953125, 435.38671875, 463.2482604980469, 491.10980224609375, 518.9713134765625, 546.8328857421875, 574.6943969726562, 602.555908203125, 630.41748046875, 658.2789916992188, 686.1405029296875, 714.0020751953125, 741.8635864257812, 769.7251586914062, 797.586669921875, 825.4482421875, 853.3097534179688, 881.1712646484375, 909.0328369140625, 936.8943481445312, 964.755859375, 992.617431640625, 1020.4789428710938, 1048.3404541015625, 1076.2020263671875, 1104.0635986328125, 1131.925048828125, 1159.78662109375, 1187.648193359375, 1215.5096435546875, 1243.3712158203125, 1271.2327880859375, 1299.09423828125, 1326.955810546875, 1354.8173828125, 1382.678955078125, 1410.54052734375, 1438.4019775390625, 1466.2635498046875, 1494.1251220703125, 1521.986572265625, 1549.84814453125, 1577.709716796875, 1605.5711669921875]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 7.0, 5.0, 7.0, 6.0, 7.0, 12.0, 13.0, 17.0, 24.0, 21.0, 27.0, 27.0, 39.0, 43.0, 54.0, 52.0, 43.0, 43.0, 50.0, 48.0, 53.0, 54.0, 52.0, 48.0, 46.0, 36.0, 28.0, 28.0, 26.0, 17.0, 14.0, 11.0, 10.0, 8.0, 3.0, 6.0, 11.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-118.32357788085938, -114.09513092041016, -109.8666763305664, -105.63822937011719, -101.40977478027344, -97.18132781982422, -92.952880859375, -88.72442626953125, -84.4959716796875, -80.26752471923828, -76.03907012939453, -71.81062316894531, -67.58216857910156, -63.353721618652344, -59.12527084350586, -54.896820068359375, -50.668373107910156, -46.43992233276367, -42.21147155761719, -37.98302459716797, -33.75457000732422, -29.526121139526367, -25.297672271728516, -21.06922149658203, -16.840770721435547, -12.612319946289062, -8.383870124816895, -4.155420303344727, 0.07303047180175781, 4.301481246948242, 8.529930114746094, 12.758380889892578, 16.986831665039062, 21.215282440185547, 25.44373321533203, 29.672182083129883, 33.900634765625, 38.12908172607422, 42.3575325012207, 46.58598327636719, 50.81443405151367, 55.042884826660156, 59.27133560180664, 63.499786376953125, 67.72823333740234, 71.9566879272461, 76.18513488769531, 80.41358947753906, 84.64203643798828, 88.8704833984375, 93.09893798828125, 97.32738494873047, 101.55583953857422, 105.78428649902344, 110.01274108886719, 114.2411880493164, 118.46963500976562, 122.69808197021484, 126.9265365600586, 131.1549835205078, 135.38343811035156, 139.6118927001953, 143.84033203125, 148.06878662109375, 152.2972412109375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 7.0, 3.0, 3.0, 6.0, 7.0, 6.0, 7.0, 16.0, 12.0, 13.0, 18.0, 21.0, 32.0, 43.0, 46.0, 34.0, 41.0, 46.0, 46.0, 44.0, 51.0, 53.0, 57.0, 37.0, 54.0, 42.0, 36.0, 38.0, 38.0, 33.0, 26.0, 19.0, 15.0, 16.0, 14.0, 2.0, 9.0, 4.0, 5.0, 6.0, 2.0, 1.0, 4.0, 3.0, 1.0, 0.0, 1.0], "bins": [-12.0390625, -11.7215576171875, -11.404052734375, -11.0865478515625, -10.76904296875, -10.4515380859375, -10.134033203125, -9.8165283203125, -9.4990234375, -9.1815185546875, -8.864013671875, -8.5465087890625, -8.22900390625, -7.9114990234375, -7.593994140625, -7.2764892578125, -6.958984375, -6.6414794921875, -6.323974609375, -6.0064697265625, -5.68896484375, -5.3714599609375, -5.053955078125, -4.7364501953125, -4.4189453125, -4.1014404296875, -3.783935546875, -3.4664306640625, -3.14892578125, -2.8314208984375, -2.513916015625, -2.1964111328125, -1.87890625, -1.5614013671875, -1.243896484375, -0.9263916015625, -0.60888671875, -0.2913818359375, 0.026123046875, 0.3436279296875, 0.6611328125, 0.9786376953125, 1.296142578125, 1.6136474609375, 1.93115234375, 2.2486572265625, 2.566162109375, 2.8836669921875, 3.201171875, 3.5186767578125, 3.836181640625, 4.1536865234375, 4.47119140625, 4.7886962890625, 5.106201171875, 5.4237060546875, 5.7412109375, 6.0587158203125, 6.376220703125, 6.6937255859375, 7.01123046875, 7.3287353515625, 7.646240234375, 7.9637451171875, 8.28125]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 5.0, 6.0, 10.0, 14.0, 9.0, 16.0, 18.0, 29.0, 52.0, 64.0, 93.0, 129.0, 190.0, 246.0, 416.0, 617.0, 1099.0, 1963.0, 3895.0, 9985.0, 36436.0, 320618.0, 2775698.0, 941111.0, 74535.0, 15679.0, 5398.0, 2492.0, 1290.0, 771.0, 474.0, 283.0, 200.0, 127.0, 88.0, 87.0, 43.0, 30.0, 23.0, 21.0, 11.0, 15.0, 6.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-25.0625, -24.12353515625, -23.1845703125, -22.24560546875, -21.306640625, -20.36767578125, -19.4287109375, -18.48974609375, -17.55078125, -16.61181640625, -15.6728515625, -14.73388671875, -13.794921875, -12.85595703125, -11.9169921875, -10.97802734375, -10.0390625, -9.10009765625, -8.1611328125, -7.22216796875, -6.283203125, -5.34423828125, -4.4052734375, -3.46630859375, -2.52734375, -1.58837890625, -0.6494140625, 0.28955078125, 1.228515625, 2.16748046875, 3.1064453125, 4.04541015625, 4.984375, 5.92333984375, 6.8623046875, 7.80126953125, 8.740234375, 9.67919921875, 10.6181640625, 11.55712890625, 12.49609375, 13.43505859375, 14.3740234375, 15.31298828125, 16.251953125, 17.19091796875, 18.1298828125, 19.06884765625, 20.0078125, 20.94677734375, 21.8857421875, 22.82470703125, 23.763671875, 24.70263671875, 25.6416015625, 26.58056640625, 27.51953125, 28.45849609375, 29.3974609375, 30.33642578125, 31.275390625, 32.21435546875, 33.1533203125, 34.09228515625, 35.03125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 6.0, 5.0, 2.0, 10.0, 9.0, 13.0, 23.0, 19.0, 25.0, 45.0, 56.0, 83.0, 107.0, 183.0, 286.0, 395.0, 529.0, 628.0, 458.0, 379.0, 260.0, 166.0, 114.0, 65.0, 49.0, 39.0, 38.0, 24.0, 16.0, 7.0, 11.0, 3.0, 4.0, 3.0, 3.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-30.578125, -29.493408203125, -28.40869140625, -27.323974609375, -26.2392578125, -25.154541015625, -24.06982421875, -22.985107421875, -21.900390625, -20.815673828125, -19.73095703125, -18.646240234375, -17.5615234375, -16.476806640625, -15.39208984375, -14.307373046875, -13.22265625, -12.137939453125, -11.05322265625, -9.968505859375, -8.8837890625, -7.799072265625, -6.71435546875, -5.629638671875, -4.544921875, -3.460205078125, -2.37548828125, -1.290771484375, -0.2060546875, 0.878662109375, 1.96337890625, 3.048095703125, 4.1328125, 5.217529296875, 6.30224609375, 7.386962890625, 8.4716796875, 9.556396484375, 10.64111328125, 11.725830078125, 12.810546875, 13.895263671875, 14.97998046875, 16.064697265625, 17.1494140625, 18.234130859375, 19.31884765625, 20.403564453125, 21.48828125, 22.572998046875, 23.65771484375, 24.742431640625, 25.8271484375, 26.911865234375, 27.99658203125, 29.081298828125, 30.166015625, 31.250732421875, 32.33544921875, 33.420166015625, 34.5048828125, 35.589599609375, 36.67431640625, 37.759033203125, 38.84375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 2.0, 4.0, 12.0, 8.0, 19.0, 25.0, 35.0, 68.0, 85.0, 136.0, 221.0, 395.0, 742.0, 1776.0, 13189.0, 3872471.0, 297838.0, 4476.0, 1298.0, 611.0, 317.0, 190.0, 111.0, 63.0, 49.0, 34.0, 29.0, 17.0, 9.0, 12.0, 10.0, 8.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-167.25, -162.703125, -158.15625, -153.609375, -149.0625, -144.515625, -139.96875, -135.421875, -130.875, -126.328125, -121.78125, -117.234375, -112.6875, -108.140625, -103.59375, -99.046875, -94.5, -89.953125, -85.40625, -80.859375, -76.3125, -71.765625, -67.21875, -62.671875, -58.125, -53.578125, -49.03125, -44.484375, -39.9375, -35.390625, -30.84375, -26.296875, -21.75, -17.203125, -12.65625, -8.109375, -3.5625, 0.984375, 5.53125, 10.078125, 14.625, 19.171875, 23.71875, 28.265625, 32.8125, 37.359375, 41.90625, 46.453125, 51.0, 55.546875, 60.09375, 64.640625, 69.1875, 73.734375, 78.28125, 82.828125, 87.375, 91.921875, 96.46875, 101.015625, 105.5625, 110.109375, 114.65625, 119.203125, 123.75]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 6.0, 239.0, 750.0, 19.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-908.4951782226562, -885.8750610351562, -863.2548828125, -840.634765625, -818.0146484375, -795.39453125, -772.7743530273438, -750.1542358398438, -727.5340576171875, -704.9139404296875, -682.2937622070312, -659.6736450195312, -637.0535278320312, -614.433349609375, -591.813232421875, -569.193115234375, -546.572998046875, -523.952880859375, -501.3327331542969, -478.71258544921875, -456.09246826171875, -433.4723205566406, -410.8521728515625, -388.2320556640625, -365.6119079589844, -342.99176025390625, -320.37164306640625, -297.7514953613281, -275.13134765625, -252.51123046875, -229.89108276367188, -207.2709503173828, -184.65081787109375, -162.0306854248047, -139.41055297851562, -116.7904052734375, -94.17027282714844, -71.55014038085938, -48.92999267578125, -26.309860229492188, -3.689727783203125, 18.930408477783203, 41.55054473876953, 64.17068481445312, 86.79081726074219, 109.41094970703125, 132.03109741210938, 154.65122985839844, 177.2713623046875, 199.89149475097656, 222.51162719726562, 245.13177490234375, 267.75189208984375, 290.3720397949219, 312.9921875, 335.6123046875, 358.2324523925781, 380.85260009765625, 403.47271728515625, 426.0928649902344, 448.7130126953125, 471.3331298828125, 493.9532775878906, 516.5734252929688, 539.1935424804688]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 12.0, 7.0, 8.0, 14.0, 15.0, 15.0, 17.0, 30.0, 27.0, 39.0, 22.0, 35.0, 30.0, 37.0, 34.0, 53.0, 46.0, 40.0, 38.0, 47.0, 46.0, 55.0, 45.0, 40.0, 32.0, 37.0, 32.0, 23.0, 22.0, 16.0, 13.0, 17.0, 14.0, 12.0, 5.0, 4.0, 5.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.48583984375, -122.62747192382812, -118.76911163330078, -114.91075134277344, -111.05238342285156, -107.19401550292969, -103.33565521240234, -99.477294921875, -95.61892700195312, -91.76055908203125, -87.9021987915039, -84.04383850097656, -80.18547058105469, -76.32710266113281, -72.46874237060547, -68.61038208007812, -64.75201416015625, -60.89365005493164, -57.03528594970703, -53.17692184448242, -49.31855773925781, -45.4601936340332, -41.601829528808594, -37.743465423583984, -33.885101318359375, -30.026737213134766, -26.168373107910156, -22.310009002685547, -18.451644897460938, -14.593280792236328, -10.734916687011719, -6.876552581787109, -3.0181884765625, 0.8401756286621094, 4.698539733886719, 8.556903839111328, 12.415267944335938, 16.273632049560547, 20.131996154785156, 23.990360260009766, 27.848724365234375, 31.707088470458984, 35.565452575683594, 39.4238166809082, 43.28218078613281, 47.14054489135742, 50.99890899658203, 54.85727310180664, 58.71563720703125, 62.57400131225586, 66.43236541748047, 70.29072570800781, 74.14909362792969, 78.00746154785156, 81.8658218383789, 85.72418212890625, 89.58255004882812, 93.44091796875, 97.29927825927734, 101.15763854980469, 105.01600646972656, 108.87437438964844, 112.73273468017578, 116.59109497070312, 120.449462890625]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 10.0, 11.0, 8.0, 6.0, 17.0, 20.0, 24.0, 23.0, 23.0, 40.0, 34.0, 48.0, 45.0, 46.0, 36.0, 46.0, 47.0, 45.0, 48.0, 45.0, 42.0, 42.0, 31.0, 29.0, 26.0, 20.0, 27.0, 32.0, 24.0, 10.0, 17.0, 8.0, 15.0, 13.0, 7.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.546875, -10.2279052734375, -9.908935546875, -9.5899658203125, -9.27099609375, -8.9520263671875, -8.633056640625, -8.3140869140625, -7.9951171875, -7.6761474609375, -7.357177734375, -7.0382080078125, -6.71923828125, -6.4002685546875, -6.081298828125, -5.7623291015625, -5.443359375, -5.1243896484375, -4.805419921875, -4.4864501953125, -4.16748046875, -3.8485107421875, -3.529541015625, -3.2105712890625, -2.8916015625, -2.5726318359375, -2.253662109375, -1.9346923828125, -1.61572265625, -1.2967529296875, -0.977783203125, -0.6588134765625, -0.33984375, -0.0208740234375, 0.298095703125, 0.6170654296875, 0.93603515625, 1.2550048828125, 1.573974609375, 1.8929443359375, 2.2119140625, 2.5308837890625, 2.849853515625, 3.1688232421875, 3.48779296875, 3.8067626953125, 4.125732421875, 4.4447021484375, 4.763671875, 5.0826416015625, 5.401611328125, 5.7205810546875, 6.03955078125, 6.3585205078125, 6.677490234375, 6.9964599609375, 7.3154296875, 7.6343994140625, 7.953369140625, 8.2723388671875, 8.59130859375, 8.9102783203125, 9.229248046875, 9.5482177734375, 9.8671875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 8.0, 9.0, 12.0, 19.0, 37.0, 37.0, 63.0, 67.0, 111.0, 151.0, 228.0, 291.0, 428.0, 614.0, 923.0, 1343.0, 1923.0, 2709.0, 4241.0, 6276.0, 9364.0, 14635.0, 23008.0, 38041.0, 65877.0, 122590.0, 301764.0, 210116.0, 98138.0, 54975.0, 32608.0, 19975.0, 12771.0, 8258.0, 5406.0, 3604.0, 2430.0, 1681.0, 1161.0, 800.0, 523.0, 364.0, 287.0, 187.0, 145.0, 105.0, 77.0, 58.0, 38.0, 24.0, 23.0, 14.0, 6.0, 7.0, 5.0, 2.0, 2.0, 4.0], "bins": [-2.220703125, -2.153076171875, -2.08544921875, -2.017822265625, -1.9501953125, -1.882568359375, -1.81494140625, -1.747314453125, -1.6796875, -1.612060546875, -1.54443359375, -1.476806640625, -1.4091796875, -1.341552734375, -1.27392578125, -1.206298828125, -1.138671875, -1.071044921875, -1.00341796875, -0.935791015625, -0.8681640625, -0.800537109375, -0.73291015625, -0.665283203125, -0.59765625, -0.530029296875, -0.46240234375, -0.394775390625, -0.3271484375, -0.259521484375, -0.19189453125, -0.124267578125, -0.056640625, 0.010986328125, 0.07861328125, 0.146240234375, 0.2138671875, 0.281494140625, 0.34912109375, 0.416748046875, 0.484375, 0.552001953125, 0.61962890625, 0.687255859375, 0.7548828125, 0.822509765625, 0.89013671875, 0.957763671875, 1.025390625, 1.093017578125, 1.16064453125, 1.228271484375, 1.2958984375, 1.363525390625, 1.43115234375, 1.498779296875, 1.56640625, 1.634033203125, 1.70166015625, 1.769287109375, 1.8369140625, 1.904541015625, 1.97216796875, 2.039794921875, 2.107421875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 7.0, 10.0, 9.0, 6.0, 11.0, 11.0, 14.0, 18.0, 14.0, 20.0, 20.0, 19.0, 19.0, 28.0, 22.0, 34.0, 30.0, 21.0, 31.0, 43.0, 32.0, 29.0, 1070.0, 37.0, 32.0, 36.0, 36.0, 29.0, 32.0, 33.0, 29.0, 25.0, 28.0, 20.0, 21.0, 24.0, 14.0, 16.0, 13.0, 17.0, 10.0, 11.0, 9.0, 11.0, 4.0, 5.0, 5.0, 2.0, 1.0, 4.0, 5.0, 4.0, 0.0, 1.0], "bins": [-5.38671875, -5.22308349609375, -5.0594482421875, -4.89581298828125, -4.732177734375, -4.56854248046875, -4.4049072265625, -4.24127197265625, -4.07763671875, -3.91400146484375, -3.7503662109375, -3.58673095703125, -3.423095703125, -3.25946044921875, -3.0958251953125, -2.93218994140625, -2.7685546875, -2.60491943359375, -2.4412841796875, -2.27764892578125, -2.114013671875, -1.95037841796875, -1.7867431640625, -1.62310791015625, -1.45947265625, -1.29583740234375, -1.1322021484375, -0.96856689453125, -0.804931640625, -0.64129638671875, -0.4776611328125, -0.31402587890625, -0.150390625, 0.01324462890625, 0.1768798828125, 0.34051513671875, 0.504150390625, 0.66778564453125, 0.8314208984375, 0.99505615234375, 1.15869140625, 1.32232666015625, 1.4859619140625, 1.64959716796875, 1.813232421875, 1.97686767578125, 2.1405029296875, 2.30413818359375, 2.4677734375, 2.63140869140625, 2.7950439453125, 2.95867919921875, 3.122314453125, 3.28594970703125, 3.4495849609375, 3.61322021484375, 3.77685546875, 3.94049072265625, 4.1041259765625, 4.26776123046875, 4.431396484375, 4.59503173828125, 4.7586669921875, 4.92230224609375, 5.0859375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 6.0, 7.0, 8.0, 17.0, 21.0, 43.0, 69.0, 81.0, 106.0, 162.0, 248.0, 348.0, 490.0, 671.0, 973.0, 1394.0, 1940.0, 2578.0, 3651.0, 5116.0, 7027.0, 9813.0, 13608.0, 19436.0, 27927.0, 40621.0, 62020.0, 100287.0, 200057.0, 1279957.0, 108299.0, 66134.0, 43463.0, 29213.0, 20524.0, 14215.0, 10366.0, 7369.0, 5413.0, 3799.0, 2786.0, 2026.0, 1418.0, 1000.0, 747.0, 532.0, 384.0, 234.0, 174.0, 139.0, 81.0, 47.0, 37.0, 28.0, 15.0, 12.0, 5.0, 1.0, 3.0, 1.0, 1.0, 2.0], "bins": [-1.5361328125, -1.4866943359375, -1.437255859375, -1.3878173828125, -1.33837890625, -1.2889404296875, -1.239501953125, -1.1900634765625, -1.140625, -1.0911865234375, -1.041748046875, -0.9923095703125, -0.94287109375, -0.8934326171875, -0.843994140625, -0.7945556640625, -0.7451171875, -0.6956787109375, -0.646240234375, -0.5968017578125, -0.54736328125, -0.4979248046875, -0.448486328125, -0.3990478515625, -0.349609375, -0.3001708984375, -0.250732421875, -0.2012939453125, -0.15185546875, -0.1024169921875, -0.052978515625, -0.0035400390625, 0.0458984375, 0.0953369140625, 0.144775390625, 0.1942138671875, 0.24365234375, 0.2930908203125, 0.342529296875, 0.3919677734375, 0.44140625, 0.4908447265625, 0.540283203125, 0.5897216796875, 0.63916015625, 0.6885986328125, 0.738037109375, 0.7874755859375, 0.8369140625, 0.8863525390625, 0.935791015625, 0.9852294921875, 1.03466796875, 1.0841064453125, 1.133544921875, 1.1829833984375, 1.232421875, 1.2818603515625, 1.331298828125, 1.3807373046875, 1.43017578125, 1.4796142578125, 1.529052734375, 1.5784912109375, 1.6279296875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 7.0, 4.0, 4.0, 10.0, 7.0, 6.0, 12.0, 18.0, 15.0, 18.0, 33.0, 22.0, 37.0, 40.0, 69.0, 82.0, 84.0, 84.0, 71.0, 69.0, 63.0, 44.0, 45.0, 28.0, 23.0, 16.0, 14.0, 9.0, 15.0, 9.0, 7.0, 8.0, 4.0, 7.0, 4.0, 3.0, 2.0, 3.0, 2.0, 0.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0011472702026367188, -0.0011114329099655151, -0.0010755956172943115, -0.001039758324623108, -0.0010039210319519043, -0.0009680837392807007, -0.0009322464466094971, -0.0008964091539382935, -0.0008605718612670898, -0.0008247345685958862, -0.0007888972759246826, -0.000753059983253479, -0.0007172226905822754, -0.0006813853979110718, -0.0006455481052398682, -0.0006097108125686646, -0.0005738735198974609, -0.0005380362272262573, -0.0005021989345550537, -0.0004663616418838501, -0.0004305243492126465, -0.00039468705654144287, -0.00035884976387023926, -0.00032301247119903564, -0.00028717517852783203, -0.0002513378858566284, -0.0002155005931854248, -0.0001796633005142212, -0.00014382600784301758, -0.00010798871517181396, -7.215142250061035e-05, -3.631412982940674e-05, -4.76837158203125e-07, 3.536045551300049e-05, 7.11977481842041e-05, 0.00010703504085540771, 0.00014287233352661133, 0.00017870962619781494, 0.00021454691886901855, 0.00025038421154022217, 0.0002862215042114258, 0.0003220587968826294, 0.000357896089553833, 0.0003937333822250366, 0.00042957067489624023, 0.00046540796756744385, 0.0005012452602386475, 0.0005370825529098511, 0.0005729198455810547, 0.0006087571382522583, 0.0006445944309234619, 0.0006804317235946655, 0.0007162690162658691, 0.0007521063089370728, 0.0007879436016082764, 0.00082378089427948, 0.0008596181869506836, 0.0008954554796218872, 0.0009312927722930908, 0.0009671300649642944, 0.001002967357635498, 0.0010388046503067017, 0.0010746419429779053, 0.0011104792356491089, 0.0011463165283203125]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 4.0, 4.0, 3.0, 4.0, 7.0, 5.0, 13.0, 4.0, 14.0, 14.0, 23.0, 24.0, 26.0, 45.0, 53.0, 69.0, 79.0, 121.0, 173.0, 231.0, 280.0, 492.0, 1018.0, 891552.0, 151711.0, 917.0, 510.0, 316.0, 214.0, 161.0, 94.0, 77.0, 61.0, 45.0, 33.0, 31.0, 26.0, 28.0, 18.0, 18.0, 9.0, 5.0, 5.0, 9.0, 3.0, 2.0, 3.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.0213775634765625, -0.020728349685668945, -0.02007913589477539, -0.019429922103881836, -0.01878070831298828, -0.018131494522094727, -0.017482280731201172, -0.016833066940307617, -0.016183853149414062, -0.015534639358520508, -0.014885425567626953, -0.014236211776733398, -0.013586997985839844, -0.012937784194946289, -0.012288570404052734, -0.01163935661315918, -0.010990142822265625, -0.01034092903137207, -0.009691715240478516, -0.009042501449584961, -0.008393287658691406, -0.0077440738677978516, -0.007094860076904297, -0.006445646286010742, -0.0057964324951171875, -0.005147218704223633, -0.004498004913330078, -0.0038487911224365234, -0.0031995773315429688, -0.002550363540649414, -0.0019011497497558594, -0.0012519359588623047, -0.00060272216796875, 4.649162292480469e-05, 0.0006957054138183594, 0.001344919204711914, 0.0019941329956054688, 0.0026433467864990234, 0.003292560577392578, 0.003941774368286133, 0.0045909881591796875, 0.005240201950073242, 0.005889415740966797, 0.0065386295318603516, 0.007187843322753906, 0.007837057113647461, 0.008486270904541016, 0.00913548469543457, 0.009784698486328125, 0.01043391227722168, 0.011083126068115234, 0.011732339859008789, 0.012381553649902344, 0.013030767440795898, 0.013679981231689453, 0.014329195022583008, 0.014978408813476562, 0.015627622604370117, 0.016276836395263672, 0.016926050186157227, 0.01757526397705078, 0.018224477767944336, 0.01887369155883789, 0.019522905349731445, 0.020172119140625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 22.0, 203.0, 563.0, 204.0, 20.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027433899231255054, -0.0026901564560830593, -0.002636923221871257, -0.0025836897548288107, -0.002530456520617008, -0.002477223053574562, -0.002423989586532116, -0.0023707563523203135, -0.0023175228852778673, -0.002264289418235421, -0.0022110561840236187, -0.0021578227169811726, -0.00210458948276937, -0.002051356015726924, -0.0019981227815151215, -0.0019448893144726753, -0.0018916560802608728, -0.0018384227296337485, -0.0017851893790066242, -0.001731955911964178, -0.0016787225613370538, -0.0016254892107099295, -0.0015722558600828052, -0.0015190225094556808, -0.0014657890424132347, -0.0014125556917861104, -0.001359322341158986, -0.00130608887411654, -0.0012528555234894156, -0.0011996221728622913, -0.001146388822235167, -0.0010931554716080427, -0.0010399220045655966, -0.0009866886539384723, -0.000933455245103687, -0.0008802218944765627, -0.0008269885438494384, -0.0007737551350146532, -0.0007205217843875289, -0.0006672884337604046, -0.0006140550831332803, -0.000560821732506156, -0.0005075883236713707, -0.00045435497304424644, -0.0004011216224171221, -0.00034788824268616736, -0.0002946548629552126, -0.00024142151232808828, -0.00018818816170096397, -0.00013495479652192444, -8.172142406692728e-05, -2.8488051611930132e-05, 2.4745313567109406e-05, 7.797867874614894e-05, 0.0001312120584771037, 0.00018444540910422802, 0.00023767878883518279, 0.00029091216856613755, 0.00034414551919326186, 0.00039737889892421663, 0.0004506122786551714, 0.0005038456292822957, 0.00055707897990942, 0.0006103123305365443, 0.0006635457393713295]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0, 6.0, 3.0, 7.0, 4.0, 4.0, 10.0, 6.0, 14.0, 16.0, 12.0, 21.0, 9.0, 18.0, 19.0, 24.0, 24.0, 29.0, 29.0, 40.0, 30.0, 30.0, 40.0, 37.0, 43.0, 33.0, 48.0, 35.0, 46.0, 39.0, 38.0, 29.0, 36.0, 35.0, 32.0, 29.0, 21.0, 22.0, 16.0, 11.0, 17.0, 9.0, 6.0, 2.0, 4.0, 3.0, 8.0, 4.0, 1.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.0005633831024169922, -0.000546477735042572, -0.0005295723676681519, -0.0005126670002937317, -0.0004957616329193115, -0.00047885626554489136, -0.0004619508981704712, -0.000445045530796051, -0.00042814016342163086, -0.0004112347960472107, -0.00039432942867279053, -0.00037742406129837036, -0.0003605186939239502, -0.00034361332654953003, -0.00032670795917510986, -0.0003098025918006897, -0.00029289722442626953, -0.00027599185705184937, -0.0002590864896774292, -0.00024218112230300903, -0.00022527575492858887, -0.0002083703875541687, -0.00019146502017974854, -0.00017455965280532837, -0.0001576542854309082, -0.00014074891805648804, -0.00012384355068206787, -0.0001069381833076477, -9.003281593322754e-05, -7.312744855880737e-05, -5.622208118438721e-05, -3.931671380996704e-05, -2.2411346435546875e-05, -5.505979061126709e-06, 1.1399388313293457e-05, 2.8304755687713623e-05, 4.521012306213379e-05, 6.211549043655396e-05, 7.902085781097412e-05, 9.592622518539429e-05, 0.00011283159255981445, 0.00012973695993423462, 0.00014664232730865479, 0.00016354769468307495, 0.00018045306205749512, 0.00019735842943191528, 0.00021426379680633545, 0.00023116916418075562, 0.0002480745315551758, 0.00026497989892959595, 0.0002818852663040161, 0.0002987906336784363, 0.00031569600105285645, 0.0003326013684272766, 0.0003495067358016968, 0.00036641210317611694, 0.0003833174705505371, 0.0004002228379249573, 0.00041712820529937744, 0.0004340335726737976, 0.0004509389400482178, 0.00046784430742263794, 0.0004847496747970581, 0.0005016550421714783, 0.0005185604095458984]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 7.0, 10.0, 11.0, 8.0, 6.0, 17.0, 20.0, 24.0, 23.0, 23.0, 40.0, 34.0, 48.0, 45.0, 46.0, 36.0, 46.0, 47.0, 45.0, 48.0, 45.0, 42.0, 42.0, 31.0, 29.0, 26.0, 20.0, 27.0, 32.0, 24.0, 10.0, 17.0, 8.0, 15.0, 13.0, 7.0, 8.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.546875, -10.2279052734375, -9.908935546875, -9.5899658203125, -9.27099609375, -8.9520263671875, -8.633056640625, -8.3140869140625, -7.9951171875, -7.6761474609375, -7.357177734375, -7.0382080078125, -6.71923828125, -6.4002685546875, -6.081298828125, -5.7623291015625, -5.443359375, -5.1243896484375, -4.805419921875, -4.4864501953125, -4.16748046875, -3.8485107421875, -3.529541015625, -3.2105712890625, -2.8916015625, -2.5726318359375, -2.253662109375, -1.9346923828125, -1.61572265625, -1.2967529296875, -0.977783203125, -0.6588134765625, -0.33984375, -0.0208740234375, 0.298095703125, 0.6170654296875, 0.93603515625, 1.2550048828125, 1.573974609375, 1.8929443359375, 2.2119140625, 2.5308837890625, 2.849853515625, 3.1688232421875, 3.48779296875, 3.8067626953125, 4.125732421875, 4.4447021484375, 4.763671875, 5.0826416015625, 5.401611328125, 5.7205810546875, 6.03955078125, 6.3585205078125, 6.677490234375, 6.9964599609375, 7.3154296875, 7.6343994140625, 7.953369140625, 8.2723388671875, 8.59130859375, 8.9102783203125, 9.229248046875, 9.5482177734375, 9.8671875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 0.0, 2.0, 3.0, 4.0, 5.0, 12.0, 6.0, 11.0, 14.0, 42.0, 32.0, 44.0, 57.0, 111.0, 120.0, 165.0, 235.0, 330.0, 442.0, 652.0, 921.0, 1278.0, 1870.0, 2841.0, 4740.0, 8798.0, 23661.0, 622257.0, 337706.0, 20745.0, 8212.0, 4469.0, 2677.0, 1774.0, 1267.0, 865.0, 608.0, 434.0, 315.0, 231.0, 170.0, 111.0, 84.0, 60.0, 60.0, 35.0, 24.0, 19.0, 11.0, 12.0, 9.0, 4.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-75.1875, -72.833984375, -70.48046875, -68.126953125, -65.7734375, -63.419921875, -61.06640625, -58.712890625, -56.359375, -54.005859375, -51.65234375, -49.298828125, -46.9453125, -44.591796875, -42.23828125, -39.884765625, -37.53125, -35.177734375, -32.82421875, -30.470703125, -28.1171875, -25.763671875, -23.41015625, -21.056640625, -18.703125, -16.349609375, -13.99609375, -11.642578125, -9.2890625, -6.935546875, -4.58203125, -2.228515625, 0.125, 2.478515625, 4.83203125, 7.185546875, 9.5390625, 11.892578125, 14.24609375, 16.599609375, 18.953125, 21.306640625, 23.66015625, 26.013671875, 28.3671875, 30.720703125, 33.07421875, 35.427734375, 37.78125, 40.134765625, 42.48828125, 44.841796875, 47.1953125, 49.548828125, 51.90234375, 54.255859375, 56.609375, 58.962890625, 61.31640625, 63.669921875, 66.0234375, 68.376953125, 70.73046875, 73.083984375, 75.4375]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 3.0, 4.0, 6.0, 6.0, 4.0, 7.0, 13.0, 8.0, 19.0, 18.0, 16.0, 27.0, 24.0, 31.0, 27.0, 28.0, 42.0, 56.0, 47.0, 63.0, 101.0, 323.0, 1536.0, 165.0, 78.0, 46.0, 37.0, 38.0, 37.0, 38.0, 30.0, 30.0, 23.0, 12.0, 23.0, 12.0, 17.0, 17.0, 11.0, 7.0, 7.0, 8.0, 3.0, 4.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.53125, -27.58740234375, -26.6435546875, -25.69970703125, -24.755859375, -23.81201171875, -22.8681640625, -21.92431640625, -20.98046875, -20.03662109375, -19.0927734375, -18.14892578125, -17.205078125, -16.26123046875, -15.3173828125, -14.37353515625, -13.4296875, -12.48583984375, -11.5419921875, -10.59814453125, -9.654296875, -8.71044921875, -7.7666015625, -6.82275390625, -5.87890625, -4.93505859375, -3.9912109375, -3.04736328125, -2.103515625, -1.15966796875, -0.2158203125, 0.72802734375, 1.671875, 2.61572265625, 3.5595703125, 4.50341796875, 5.447265625, 6.39111328125, 7.3349609375, 8.27880859375, 9.22265625, 10.16650390625, 11.1103515625, 12.05419921875, 12.998046875, 13.94189453125, 14.8857421875, 15.82958984375, 16.7734375, 17.71728515625, 18.6611328125, 19.60498046875, 20.548828125, 21.49267578125, 22.4365234375, 23.38037109375, 24.32421875, 25.26806640625, 26.2119140625, 27.15576171875, 28.099609375, 29.04345703125, 29.9873046875, 30.93115234375, 31.875]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 5.0, 6.0, 9.0, 7.0, 13.0, 15.0, 16.0, 12.0, 22.0, 26.0, 32.0, 32.0, 47.0, 40.0, 64.0, 109.0, 227.0, 774.0, 8959.0, 3127961.0, 5981.0, 663.0, 230.0, 125.0, 72.0, 44.0, 36.0, 37.0, 31.0, 12.0, 19.0, 19.0, 15.0, 9.0, 9.0, 9.0, 7.0, 6.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-162.625, -158.0390625, -153.453125, -148.8671875, -144.28125, -139.6953125, -135.109375, -130.5234375, -125.9375, -121.3515625, -116.765625, -112.1796875, -107.59375, -103.0078125, -98.421875, -93.8359375, -89.25, -84.6640625, -80.078125, -75.4921875, -70.90625, -66.3203125, -61.734375, -57.1484375, -52.5625, -47.9765625, -43.390625, -38.8046875, -34.21875, -29.6328125, -25.046875, -20.4609375, -15.875, -11.2890625, -6.703125, -2.1171875, 2.46875, 7.0546875, 11.640625, 16.2265625, 20.8125, 25.3984375, 29.984375, 34.5703125, 39.15625, 43.7421875, 48.328125, 52.9140625, 57.5, 62.0859375, 66.671875, 71.2578125, 75.84375, 80.4296875, 85.015625, 89.6015625, 94.1875, 98.7734375, 103.359375, 107.9453125, 112.53125, 117.1171875, 121.703125, 126.2890625, 130.875]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 142.0, 869.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-236.32247924804688, -222.5504608154297, -208.77842712402344, -195.00640869140625, -181.234375, -167.4623565673828, -153.69033813476562, -139.91830444335938, -126.14628601074219, -112.37425994873047, -98.60223388671875, -84.83021545410156, -71.05818939208984, -57.286163330078125, -43.51414489746094, -29.74211883544922, -15.9700927734375, -2.198068618774414, 11.573955535888672, 25.345977783203125, 39.118003845214844, 52.89002990722656, 66.66204833984375, 80.43407440185547, 94.20610046386719, 107.9781265258789, 121.75015258789062, 135.5221710205078, 149.294189453125, 163.06622314453125, 176.83824157714844, 190.61026000976562, 204.38232421875, 218.1543426513672, 231.92637634277344, 245.69839477539062, 259.4704284667969, 273.242431640625, 287.01446533203125, 300.7864990234375, 314.55853271484375, 328.33056640625, 342.1025695800781, 355.8746032714844, 369.6466369628906, 383.41864013671875, 397.190673828125, 410.96270751953125, 424.7347106933594, 438.5067443847656, 452.27874755859375, 466.05078125, 479.82281494140625, 493.5948486328125, 507.3668518066406, 521.1388549804688, 534.910888671875, 548.6829223632812, 562.4549560546875, 576.2269287109375, 589.9989624023438, 603.77099609375, 617.5430297851562, 631.3150634765625, 645.0870971679688]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 6.0, 10.0, 10.0, 8.0, 13.0, 17.0, 13.0, 22.0, 17.0, 27.0, 28.0, 31.0, 27.0, 34.0, 34.0, 38.0, 37.0, 35.0, 27.0, 33.0, 34.0, 41.0, 55.0, 40.0, 49.0, 34.0, 32.0, 40.0, 31.0, 26.0, 30.0, 22.0, 17.0, 18.0, 10.0, 12.0, 16.0, 3.0, 13.0, 4.0, 1.0, 3.0, 4.0, 2.0, 0.0, 5.0], "bins": [-101.06277465820312, -98.22279357910156, -95.3828125, -92.54283142089844, -89.70285034179688, -86.86286163330078, -84.02288055419922, -81.18289947509766, -78.3429183959961, -75.50293731689453, -72.66295623779297, -69.8229751586914, -66.98298645019531, -64.14300537109375, -61.30302429199219, -58.463043212890625, -55.62306213378906, -52.7830810546875, -49.94309997558594, -47.10311508178711, -44.26313400268555, -41.423152923583984, -38.583168029785156, -35.743186950683594, -32.90320587158203, -30.06322479248047, -27.223241806030273, -24.383258819580078, -21.543277740478516, -18.703296661376953, -15.863313674926758, -13.023330688476562, -10.183349609375, -7.343367576599121, -4.503385543823242, -1.6634035110473633, 1.1765785217285156, 4.0165605545043945, 6.856542587280273, 9.696525573730469, 12.536506652832031, 15.37648868560791, 18.21647071838379, 21.056453704833984, 23.896434783935547, 26.73641586303711, 29.576398849487305, 32.4163818359375, 35.25636291503906, 38.096343994140625, 40.93632507324219, 43.776309967041016, 46.61629104614258, 49.45627212524414, 52.29625701904297, 55.13623809814453, 57.976219177246094, 60.816200256347656, 63.65618133544922, 66.49616241455078, 69.33615112304688, 72.17613220214844, 75.01611328125, 77.85609436035156, 80.69607543945312]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 1.0, 2.0, 4.0, 7.0, 9.0, 9.0, 6.0, 7.0, 8.0, 21.0, 20.0, 27.0, 24.0, 26.0, 32.0, 29.0, 38.0, 53.0, 40.0, 43.0, 43.0, 41.0, 52.0, 37.0, 55.0, 42.0, 39.0, 32.0, 29.0, 25.0, 21.0, 28.0, 26.0, 21.0, 23.0, 14.0, 11.0, 8.0, 14.0, 13.0, 8.0, 3.0, 3.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.9375, -10.608154296875, -10.27880859375, -9.949462890625, -9.6201171875, -9.290771484375, -8.96142578125, -8.632080078125, -8.302734375, -7.973388671875, -7.64404296875, -7.314697265625, -6.9853515625, -6.656005859375, -6.32666015625, -5.997314453125, -5.66796875, -5.338623046875, -5.00927734375, -4.679931640625, -4.3505859375, -4.021240234375, -3.69189453125, -3.362548828125, -3.033203125, -2.703857421875, -2.37451171875, -2.045166015625, -1.7158203125, -1.386474609375, -1.05712890625, -0.727783203125, -0.3984375, -0.069091796875, 0.26025390625, 0.589599609375, 0.9189453125, 1.248291015625, 1.57763671875, 1.906982421875, 2.236328125, 2.565673828125, 2.89501953125, 3.224365234375, 3.5537109375, 3.883056640625, 4.21240234375, 4.541748046875, 4.87109375, 5.200439453125, 5.52978515625, 5.859130859375, 6.1884765625, 6.517822265625, 6.84716796875, 7.176513671875, 7.505859375, 7.835205078125, 8.16455078125, 8.493896484375, 8.8232421875, 9.152587890625, 9.48193359375, 9.811279296875, 10.140625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 5.0, 4.0, 11.0, 5.0, 10.0, 19.0, 17.0, 28.0, 40.0, 46.0, 74.0, 128.0, 218.0, 360.0, 652.0, 1307.0, 2774.0, 6449.0, 16897.0, 64954.0, 2444714.0, 1576092.0, 52849.0, 15016.0, 6025.0, 2669.0, 1321.0, 631.0, 357.0, 212.0, 126.0, 86.0, 47.0, 32.0, 28.0, 25.0, 16.0, 12.0, 11.0, 4.0, 6.0, 5.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-78.4375, -76.056640625, -73.67578125, -71.294921875, -68.9140625, -66.533203125, -64.15234375, -61.771484375, -59.390625, -57.009765625, -54.62890625, -52.248046875, -49.8671875, -47.486328125, -45.10546875, -42.724609375, -40.34375, -37.962890625, -35.58203125, -33.201171875, -30.8203125, -28.439453125, -26.05859375, -23.677734375, -21.296875, -18.916015625, -16.53515625, -14.154296875, -11.7734375, -9.392578125, -7.01171875, -4.630859375, -2.25, 0.130859375, 2.51171875, 4.892578125, 7.2734375, 9.654296875, 12.03515625, 14.416015625, 16.796875, 19.177734375, 21.55859375, 23.939453125, 26.3203125, 28.701171875, 31.08203125, 33.462890625, 35.84375, 38.224609375, 40.60546875, 42.986328125, 45.3671875, 47.748046875, 50.12890625, 52.509765625, 54.890625, 57.271484375, 59.65234375, 62.033203125, 64.4140625, 66.794921875, 69.17578125, 71.556640625, 73.9375]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 8.0, 10.0, 10.0, 26.0, 21.0, 25.0, 30.0, 62.0, 102.0, 145.0, 221.0, 367.0, 624.0, 823.0, 563.0, 358.0, 220.0, 117.0, 101.0, 63.0, 45.0, 27.0, 25.0, 19.0, 21.0, 8.0, 7.0, 7.0, 5.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-81.25, -79.23974609375, -77.2294921875, -75.21923828125, -73.208984375, -71.19873046875, -69.1884765625, -67.17822265625, -65.16796875, -63.15771484375, -61.1474609375, -59.13720703125, -57.126953125, -55.11669921875, -53.1064453125, -51.09619140625, -49.0859375, -47.07568359375, -45.0654296875, -43.05517578125, -41.044921875, -39.03466796875, -37.0244140625, -35.01416015625, -33.00390625, -30.99365234375, -28.9833984375, -26.97314453125, -24.962890625, -22.95263671875, -20.9423828125, -18.93212890625, -16.921875, -14.91162109375, -12.9013671875, -10.89111328125, -8.880859375, -6.87060546875, -4.8603515625, -2.85009765625, -0.83984375, 1.17041015625, 3.1806640625, 5.19091796875, 7.201171875, 9.21142578125, 11.2216796875, 13.23193359375, 15.2421875, 17.25244140625, 19.2626953125, 21.27294921875, 23.283203125, 25.29345703125, 27.3037109375, 29.31396484375, 31.32421875, 33.33447265625, 35.3447265625, 37.35498046875, 39.365234375, 41.37548828125, 43.3857421875, 45.39599609375, 47.40625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 6.0, 10.0, 9.0, 12.0, 25.0, 24.0, 45.0, 51.0, 92.0, 138.0, 215.0, 384.0, 1146.0, 3426545.0, 763737.0, 947.0, 321.0, 196.0, 118.0, 80.0, 51.0, 41.0, 24.0, 21.0, 15.0, 9.0, 7.0, 6.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-247.0, -236.23828125, -225.4765625, -214.71484375, -203.953125, -193.19140625, -182.4296875, -171.66796875, -160.90625, -150.14453125, -139.3828125, -128.62109375, -117.859375, -107.09765625, -96.3359375, -85.57421875, -74.8125, -64.05078125, -53.2890625, -42.52734375, -31.765625, -21.00390625, -10.2421875, 0.51953125, 11.28125, 22.04296875, 32.8046875, 43.56640625, 54.328125, 65.08984375, 75.8515625, 86.61328125, 97.375, 108.13671875, 118.8984375, 129.66015625, 140.421875, 151.18359375, 161.9453125, 172.70703125, 183.46875, 194.23046875, 204.9921875, 215.75390625, 226.515625, 237.27734375, 248.0390625, 258.80078125, 269.5625, 280.32421875, 291.0859375, 301.84765625, 312.609375, 323.37109375, 334.1328125, 344.89453125, 355.65625, 366.41796875, 377.1796875, 387.94140625, 398.703125, 409.46484375, 420.2265625, 430.98828125, 441.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 16.0, 862.0, 135.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-169.61683654785156, -139.83148193359375, -110.0461196899414, -80.26075744628906, -50.47540283203125, -20.690048217773438, 9.095321655273438, 38.88067626953125, 68.66603088378906, 98.45138549804688, 128.23675537109375, 158.02210998535156, 187.80746459960938, 217.5928192138672, 247.37818908691406, 277.1635437011719, 306.94891357421875, 336.7342834472656, 366.5196228027344, 396.30499267578125, 426.09033203125, 455.8757019042969, 485.66107177734375, 515.4464111328125, 545.2317504882812, 575.01708984375, 604.802490234375, 634.5878295898438, 664.3731689453125, 694.1585693359375, 723.9439086914062, 753.729248046875, 783.5146484375, 813.2999877929688, 843.0853881835938, 872.8707275390625, 902.6560668945312, 932.44140625, 962.226806640625, 992.0121459960938, 1021.7974853515625, 1051.5828857421875, 1081.3681640625, 1111.153564453125, 1140.93896484375, 1170.7242431640625, 1200.5096435546875, 1230.2950439453125, 1260.080322265625, 1289.86572265625, 1319.6510009765625, 1349.4364013671875, 1379.2218017578125, 1409.007080078125, 1438.79248046875, 1468.577880859375, 1498.36328125, 1528.148681640625, 1557.9339599609375, 1587.7193603515625, 1617.5047607421875, 1647.2900390625, 1677.075439453125, 1706.86083984375, 1736.6461181640625]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 3.0, 5.0, 6.0, 12.0, 6.0, 14.0, 16.0, 11.0, 14.0, 17.0, 22.0, 14.0, 33.0, 25.0, 33.0, 36.0, 35.0, 35.0, 37.0, 37.0, 39.0, 37.0, 35.0, 40.0, 41.0, 49.0, 36.0, 36.0, 30.0, 23.0, 36.0, 30.0, 33.0, 20.0, 16.0, 16.0, 10.0, 19.0, 8.0, 10.0, 11.0, 5.0, 2.0, 5.0, 6.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-147.52682495117188, -142.51129150390625, -137.49574279785156, -132.48020935058594, -127.46467590332031, -122.44913482666016, -117.43359375, -112.41806030273438, -107.40251922607422, -102.38697814941406, -97.37144470214844, -92.35590362548828, -87.34036254882812, -82.3248291015625, -77.30928802490234, -72.29374694824219, -67.27821350097656, -62.26267623901367, -57.24713897705078, -52.231597900390625, -47.216060638427734, -42.200523376464844, -37.18498229980469, -32.1694450378418, -27.153907775878906, -22.138370513916016, -17.122831344604492, -12.107293128967285, -7.091754913330078, -2.0762176513671875, 2.939321517944336, 7.954860687255859, 12.970413208007812, 17.985950469970703, 23.001489639282227, 28.01702880859375, 33.03256607055664, 38.04810333251953, 43.06364440917969, 48.07918167114258, 53.09471893310547, 58.11025619506836, 63.12579345703125, 68.1413345336914, 73.15687561035156, 78.17240905761719, 83.18795013427734, 88.2034912109375, 93.21902465820312, 98.23456573486328, 103.2500991821289, 108.26564025878906, 113.28117370605469, 118.29671478271484, 123.312255859375, 128.32778930664062, 133.34332275390625, 138.35885620117188, 143.37440490722656, 148.3899383544922, 153.4054718017578, 158.4210205078125, 163.43655395507812, 168.45208740234375, 173.46763610839844]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 4.0, 2.0, 4.0, 3.0, 6.0, 9.0, 6.0, 12.0, 8.0, 11.0, 17.0, 19.0, 19.0, 28.0, 27.0, 37.0, 35.0, 44.0, 45.0, 42.0, 38.0, 48.0, 42.0, 37.0, 39.0, 39.0, 43.0, 31.0, 36.0, 39.0, 27.0, 33.0, 29.0, 26.0, 16.0, 21.0, 21.0, 9.0, 14.0, 6.0, 9.0, 7.0, 7.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.6328125, -10.3023681640625, -9.971923828125, -9.6414794921875, -9.31103515625, -8.9805908203125, -8.650146484375, -8.3197021484375, -7.9892578125, -7.6588134765625, -7.328369140625, -6.9979248046875, -6.66748046875, -6.3370361328125, -6.006591796875, -5.6761474609375, -5.345703125, -5.0152587890625, -4.684814453125, -4.3543701171875, -4.02392578125, -3.6934814453125, -3.363037109375, -3.0325927734375, -2.7021484375, -2.3717041015625, -2.041259765625, -1.7108154296875, -1.38037109375, -1.0499267578125, -0.719482421875, -0.3890380859375, -0.05859375, 0.2718505859375, 0.602294921875, 0.9327392578125, 1.26318359375, 1.5936279296875, 1.924072265625, 2.2545166015625, 2.5849609375, 2.9154052734375, 3.245849609375, 3.5762939453125, 3.90673828125, 4.2371826171875, 4.567626953125, 4.8980712890625, 5.228515625, 5.5589599609375, 5.889404296875, 6.2198486328125, 6.55029296875, 6.8807373046875, 7.211181640625, 7.5416259765625, 7.8720703125, 8.2025146484375, 8.532958984375, 8.8634033203125, 9.19384765625, 9.5242919921875, 9.854736328125, 10.1851806640625, 10.515625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 4.0, 5.0, 8.0, 18.0, 23.0, 29.0, 44.0, 71.0, 87.0, 117.0, 167.0, 232.0, 345.0, 529.0, 739.0, 1045.0, 1514.0, 2176.0, 3235.0, 4728.0, 7046.0, 10865.0, 16527.0, 26020.0, 41968.0, 70173.0, 127460.0, 303098.0, 187943.0, 94312.0, 54364.0, 32817.0, 20597.0, 13344.0, 8545.0, 5796.0, 3955.0, 2635.0, 1797.0, 1263.0, 870.0, 610.0, 421.0, 300.0, 230.0, 141.0, 108.0, 81.0, 53.0, 28.0, 26.0, 22.0, 14.0, 7.0, 4.0, 4.0, 1.0, 4.0, 0.0, 2.0], "bins": [-2.25, -2.17913818359375, -2.1082763671875, -2.03741455078125, -1.966552734375, -1.89569091796875, -1.8248291015625, -1.75396728515625, -1.68310546875, -1.61224365234375, -1.5413818359375, -1.47052001953125, -1.399658203125, -1.32879638671875, -1.2579345703125, -1.18707275390625, -1.1162109375, -1.04534912109375, -0.9744873046875, -0.90362548828125, -0.832763671875, -0.76190185546875, -0.6910400390625, -0.62017822265625, -0.54931640625, -0.47845458984375, -0.4075927734375, -0.33673095703125, -0.265869140625, -0.19500732421875, -0.1241455078125, -0.05328369140625, 0.017578125, 0.08843994140625, 0.1593017578125, 0.23016357421875, 0.301025390625, 0.37188720703125, 0.4427490234375, 0.51361083984375, 0.58447265625, 0.65533447265625, 0.7261962890625, 0.79705810546875, 0.867919921875, 0.93878173828125, 1.0096435546875, 1.08050537109375, 1.1513671875, 1.22222900390625, 1.2930908203125, 1.36395263671875, 1.434814453125, 1.50567626953125, 1.5765380859375, 1.64739990234375, 1.71826171875, 1.78912353515625, 1.8599853515625, 1.93084716796875, 2.001708984375, 2.07257080078125, 2.1434326171875, 2.21429443359375, 2.28515625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 5.0, 3.0, 3.0, 5.0, 6.0, 9.0, 8.0, 15.0, 13.0, 10.0, 15.0, 24.0, 26.0, 24.0, 41.0, 40.0, 35.0, 31.0, 30.0, 46.0, 41.0, 40.0, 47.0, 1051.0, 29.0, 36.0, 32.0, 36.0, 30.0, 38.0, 36.0, 31.0, 31.0, 15.0, 18.0, 17.0, 16.0, 16.0, 14.0, 9.0, 14.0, 14.0, 4.0, 3.0, 7.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 0.0, 1.0], "bins": [-7.08984375, -6.88446044921875, -6.6790771484375, -6.47369384765625, -6.268310546875, -6.06292724609375, -5.8575439453125, -5.65216064453125, -5.44677734375, -5.24139404296875, -5.0360107421875, -4.83062744140625, -4.625244140625, -4.41986083984375, -4.2144775390625, -4.00909423828125, -3.8037109375, -3.59832763671875, -3.3929443359375, -3.18756103515625, -2.982177734375, -2.77679443359375, -2.5714111328125, -2.36602783203125, -2.16064453125, -1.95526123046875, -1.7498779296875, -1.54449462890625, -1.339111328125, -1.13372802734375, -0.9283447265625, -0.72296142578125, -0.517578125, -0.31219482421875, -0.1068115234375, 0.09857177734375, 0.303955078125, 0.50933837890625, 0.7147216796875, 0.92010498046875, 1.12548828125, 1.33087158203125, 1.5362548828125, 1.74163818359375, 1.947021484375, 2.15240478515625, 2.3577880859375, 2.56317138671875, 2.7685546875, 2.97393798828125, 3.1793212890625, 3.38470458984375, 3.590087890625, 3.79547119140625, 4.0008544921875, 4.20623779296875, 4.41162109375, 4.61700439453125, 4.8223876953125, 5.02777099609375, 5.233154296875, 5.43853759765625, 5.6439208984375, 5.84930419921875, 6.0546875]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 6.0, 12.0, 14.0, 26.0, 37.0, 42.0, 79.0, 108.0, 137.0, 204.0, 304.0, 359.0, 555.0, 803.0, 1088.0, 1525.0, 2262.0, 3027.0, 4427.0, 6189.0, 9216.0, 13233.0, 20072.0, 30581.0, 47462.0, 76712.0, 133392.0, 1318704.0, 169463.0, 92552.0, 55797.0, 35555.0, 23194.0, 15498.0, 10320.0, 7216.0, 4966.0, 3550.0, 2419.0, 1791.0, 1255.0, 851.0, 646.0, 436.0, 330.0, 204.0, 174.0, 94.0, 80.0, 57.0, 38.0, 20.0, 17.0, 19.0, 10.0, 9.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-1.861328125, -1.798614501953125, -1.73590087890625, -1.673187255859375, -1.6104736328125, -1.547760009765625, -1.48504638671875, -1.422332763671875, -1.359619140625, -1.296905517578125, -1.23419189453125, -1.171478271484375, -1.1087646484375, -1.046051025390625, -0.98333740234375, -0.920623779296875, -0.85791015625, -0.795196533203125, -0.73248291015625, -0.669769287109375, -0.6070556640625, -0.544342041015625, -0.48162841796875, -0.418914794921875, -0.356201171875, -0.293487548828125, -0.23077392578125, -0.168060302734375, -0.1053466796875, -0.042633056640625, 0.02008056640625, 0.082794189453125, 0.1455078125, 0.208221435546875, 0.27093505859375, 0.333648681640625, 0.3963623046875, 0.459075927734375, 0.52178955078125, 0.584503173828125, 0.647216796875, 0.709930419921875, 0.77264404296875, 0.835357666015625, 0.8980712890625, 0.960784912109375, 1.02349853515625, 1.086212158203125, 1.14892578125, 1.211639404296875, 1.27435302734375, 1.337066650390625, 1.3997802734375, 1.462493896484375, 1.52520751953125, 1.587921142578125, 1.650634765625, 1.713348388671875, 1.77606201171875, 1.838775634765625, 1.9014892578125, 1.964202880859375, 2.02691650390625, 2.089630126953125, 2.15234375]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 6.0, 6.0, 3.0, 9.0, 4.0, 8.0, 13.0, 12.0, 17.0, 16.0, 19.0, 22.0, 29.0, 51.0, 52.0, 46.0, 61.0, 68.0, 89.0, 89.0, 62.0, 49.0, 42.0, 37.0, 37.0, 26.0, 25.0, 18.0, 12.0, 17.0, 8.0, 7.0, 5.0, 9.0, 3.0, 5.0, 9.0, 5.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.00152587890625, -0.0014729350805282593, -0.0014199912548065186, -0.0013670474290847778, -0.0013141036033630371, -0.0012611597776412964, -0.0012082159519195557, -0.001155272126197815, -0.0011023283004760742, -0.0010493844747543335, -0.0009964406490325928, -0.000943496823310852, -0.0008905529975891113, -0.0008376091718673706, -0.0007846653461456299, -0.0007317215204238892, -0.0006787776947021484, -0.0006258338689804077, -0.000572890043258667, -0.0005199462175369263, -0.00046700239181518555, -0.0004140585660934448, -0.0003611147403717041, -0.0003081709146499634, -0.00025522708892822266, -0.00020228326320648193, -0.0001493394374847412, -9.639561176300049e-05, -4.3451786041259766e-05, 9.492039680480957e-06, 6.243586540222168e-05, 0.0001153796911239624, 0.00016832351684570312, 0.00022126734256744385, 0.00027421116828918457, 0.0003271549940109253, 0.000380098819732666, 0.00043304264545440674, 0.00048598647117614746, 0.0005389302968978882, 0.0005918741226196289, 0.0006448179483413696, 0.0006977617740631104, 0.0007507055997848511, 0.0008036494255065918, 0.0008565932512283325, 0.0009095370769500732, 0.000962480902671814, 0.0010154247283935547, 0.0010683685541152954, 0.0011213123798370361, 0.0011742562055587769, 0.0012272000312805176, 0.0012801438570022583, 0.001333087682723999, 0.0013860315084457397, 0.0014389753341674805, 0.0014919191598892212, 0.001544862985610962, 0.0015978068113327026, 0.0016507506370544434, 0.001703694462776184, 0.0017566382884979248, 0.0018095821142196655, 0.0018625259399414062]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 2.0, 4.0, 8.0, 6.0, 13.0, 5.0, 6.0, 10.0, 13.0, 13.0, 22.0, 21.0, 39.0, 52.0, 71.0, 175.0, 257.0, 684.0, 935135.0, 110673.0, 631.0, 279.0, 126.0, 90.0, 55.0, 31.0, 26.0, 16.0, 18.0, 13.0, 12.0, 7.0, 12.0, 4.0, 3.0, 8.0, 7.0, 2.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.05267333984375, -0.05116605758666992, -0.049658775329589844, -0.048151493072509766, -0.04664421081542969, -0.04513692855834961, -0.04362964630126953, -0.04212236404418945, -0.040615081787109375, -0.0391077995300293, -0.03760051727294922, -0.03609323501586914, -0.03458595275878906, -0.033078670501708984, -0.031571388244628906, -0.030064105987548828, -0.02855682373046875, -0.027049541473388672, -0.025542259216308594, -0.024034976959228516, -0.022527694702148438, -0.02102041244506836, -0.01951313018798828, -0.018005847930908203, -0.016498565673828125, -0.014991283416748047, -0.013484001159667969, -0.01197671890258789, -0.010469436645507812, -0.008962154388427734, -0.007454872131347656, -0.005947589874267578, -0.0044403076171875, -0.002933025360107422, -0.0014257431030273438, 8.153915405273438e-05, 0.0015888214111328125, 0.0030961036682128906, 0.004603385925292969, 0.006110668182373047, 0.007617950439453125, 0.009125232696533203, 0.010632514953613281, 0.01213979721069336, 0.013647079467773438, 0.015154361724853516, 0.016661643981933594, 0.018168926239013672, 0.01967620849609375, 0.021183490753173828, 0.022690773010253906, 0.024198055267333984, 0.025705337524414062, 0.02721261978149414, 0.02871990203857422, 0.030227184295654297, 0.031734466552734375, 0.03324174880981445, 0.03474903106689453, 0.03625631332397461, 0.03776359558105469, 0.039270877838134766, 0.040778160095214844, 0.04228544235229492, 0.043792724609375]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 48.0, 963.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0038304217159748077, -0.0035962783731520176, -0.0033621350303292274, -0.003127991920337081, -0.002893848577514291, -0.0026597052346915007, -0.002425562124699354, -0.002191418781876564, -0.001957275439053774, -0.0017231320962309837, -0.0014889888698235154, -0.001254845643416047, -0.001020702300593257, -0.0007865589577704668, -0.0005524157313629985, -0.00031827250495553017, -8.412916213274002e-05, 0.0001500141224823892, 0.00038415740709751844, 0.0006183006917126477, 0.0008524439763277769, 0.001086587319150567, 0.0013207305455580354, 0.0015548737719655037, 0.0017890171147882938, 0.002023160457611084, 0.002257303800433874, 0.0024914469104260206, 0.0027255902532488108, 0.002959733596071601, 0.0031938767060637474, 0.0034280200488865376, 0.0036621633917093277, 0.003896306734532118, 0.004130450077354908, 0.004364593420177698, 0.004598736763000488, 0.004832879640161991, 0.005067022982984781, 0.005301166325807571, 0.0055353096686303616, 0.005769453011453152, 0.006003596354275942, 0.006237739697098732, 0.006471882574260235, 0.006706026382744312, 0.006940169259905815, 0.007174312602728605, 0.007408455945551395, 0.0076425992883741856, 0.007876742631196976, 0.008110885508358479, 0.008345029316842556, 0.008579172194004059, 0.008813316002488136, 0.009047458879649639, 0.009281601756811142, 0.009515744633972645, 0.009749888442456722, 0.009984031319618225, 0.010218175128102303, 0.010452318005263805, 0.010686461813747883, 0.010920604690909386, 0.011154748499393463]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 5.0, 3.0, 5.0, 5.0, 8.0, 11.0, 4.0, 10.0, 14.0, 23.0, 18.0, 27.0, 30.0, 23.0, 31.0, 33.0, 38.0, 44.0, 41.0, 40.0, 50.0, 51.0, 41.0, 47.0, 42.0, 46.0, 35.0, 29.0, 30.0, 29.0, 26.0, 30.0, 16.0, 13.0, 16.0, 18.0, 21.0, 14.0, 10.0, 8.0, 6.0, 5.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.000966191291809082, -0.0009376080706715584, -0.0009090248495340347, -0.0008804416283965111, -0.0008518584072589874, -0.0008232751861214638, -0.0007946919649839401, -0.0007661087438464165, -0.0007375255227088928, -0.0007089423015713692, -0.0006803590804338455, -0.0006517758592963219, -0.0006231926381587982, -0.0005946094170212746, -0.0005660261958837509, -0.0005374429747462273, -0.0005088597536087036, -0.00048027653247117996, -0.0004516933113336563, -0.00042311009019613266, -0.000394526869058609, -0.00036594364792108536, -0.0003373604267835617, -0.00030877720564603806, -0.0002801939845085144, -0.00025161076337099075, -0.0002230275422334671, -0.00019444432109594345, -0.0001658610999584198, -0.00013727787882089615, -0.0001086946576833725, -8.011143654584885e-05, -5.1528215408325195e-05, -2.2944994270801544e-05, 5.638226866722107e-06, 3.422144800424576e-05, 6.280466914176941e-05, 9.138789027929306e-05, 0.00011997111141681671, 0.00014855433255434036, 0.00017713755369186401, 0.00020572077482938766, 0.00023430399596691132, 0.00026288721710443497, 0.0002914704382419586, 0.00032005365937948227, 0.0003486368805170059, 0.00037722010165452957, 0.0004058033227920532, 0.0004343865439295769, 0.0004629697650671005, 0.0004915529862046242, 0.0005201362073421478, 0.0005487194284796715, 0.0005773026496171951, 0.0006058858707547188, 0.0006344690918922424, 0.0006630523130297661, 0.0006916355341672897, 0.0007202187553048134, 0.000748801976442337, 0.0007773851975798607, 0.0008059684187173843, 0.000834551639854908, 0.0008631348609924316]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 0.0, 4.0, 2.0, 4.0, 3.0, 6.0, 9.0, 6.0, 12.0, 8.0, 11.0, 17.0, 19.0, 19.0, 28.0, 27.0, 37.0, 35.0, 44.0, 45.0, 42.0, 38.0, 48.0, 42.0, 37.0, 39.0, 39.0, 43.0, 31.0, 36.0, 39.0, 27.0, 33.0, 29.0, 26.0, 16.0, 21.0, 21.0, 9.0, 14.0, 6.0, 9.0, 7.0, 7.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.6328125, -10.3023681640625, -9.971923828125, -9.6414794921875, -9.31103515625, -8.9805908203125, -8.650146484375, -8.3197021484375, -7.9892578125, -7.6588134765625, -7.328369140625, -6.9979248046875, -6.66748046875, -6.3370361328125, -6.006591796875, -5.6761474609375, -5.345703125, -5.0152587890625, -4.684814453125, -4.3543701171875, -4.02392578125, -3.6934814453125, -3.363037109375, -3.0325927734375, -2.7021484375, -2.3717041015625, -2.041259765625, -1.7108154296875, -1.38037109375, -1.0499267578125, -0.719482421875, -0.3890380859375, -0.05859375, 0.2718505859375, 0.602294921875, 0.9327392578125, 1.26318359375, 1.5936279296875, 1.924072265625, 2.2545166015625, 2.5849609375, 2.9154052734375, 3.245849609375, 3.5762939453125, 3.90673828125, 4.2371826171875, 4.567626953125, 4.8980712890625, 5.228515625, 5.5589599609375, 5.889404296875, 6.2198486328125, 6.55029296875, 6.8807373046875, 7.211181640625, 7.5416259765625, 7.8720703125, 8.2025146484375, 8.532958984375, 8.8634033203125, 9.19384765625, 9.5242919921875, 9.854736328125, 10.1851806640625, 10.515625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 10.0, 5.0, 8.0, 4.0, 14.0, 18.0, 27.0, 29.0, 42.0, 37.0, 68.0, 98.0, 124.0, 154.0, 223.0, 399.0, 620.0, 983.0, 2018.0, 4160.0, 9588.0, 25550.0, 79953.0, 308867.0, 438611.0, 118104.0, 35088.0, 12745.0, 5192.0, 2380.0, 1272.0, 735.0, 455.0, 252.0, 212.0, 139.0, 92.0, 62.0, 68.0, 38.0, 31.0, 16.0, 23.0, 18.0, 5.0, 4.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-9.875, -9.5579833984375, -9.240966796875, -8.9239501953125, -8.60693359375, -8.2899169921875, -7.972900390625, -7.6558837890625, -7.3388671875, -7.0218505859375, -6.704833984375, -6.3878173828125, -6.07080078125, -5.7537841796875, -5.436767578125, -5.1197509765625, -4.802734375, -4.4857177734375, -4.168701171875, -3.8516845703125, -3.53466796875, -3.2176513671875, -2.900634765625, -2.5836181640625, -2.2666015625, -1.9495849609375, -1.632568359375, -1.3155517578125, -0.99853515625, -0.6815185546875, -0.364501953125, -0.0474853515625, 0.26953125, 0.5865478515625, 0.903564453125, 1.2205810546875, 1.53759765625, 1.8546142578125, 2.171630859375, 2.4886474609375, 2.8056640625, 3.1226806640625, 3.439697265625, 3.7567138671875, 4.07373046875, 4.3907470703125, 4.707763671875, 5.0247802734375, 5.341796875, 5.6588134765625, 5.975830078125, 6.2928466796875, 6.60986328125, 6.9268798828125, 7.243896484375, 7.5609130859375, 7.8779296875, 8.1949462890625, 8.511962890625, 8.8289794921875, 9.14599609375, 9.4630126953125, 9.780029296875, 10.0970458984375, 10.4140625]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0, 5.0, 3.0, 1.0, 3.0, 7.0, 7.0, 14.0, 13.0, 15.0, 11.0, 23.0, 23.0, 37.0, 32.0, 31.0, 32.0, 41.0, 39.0, 41.0, 47.0, 75.0, 240.0, 1721.0, 133.0, 76.0, 53.0, 41.0, 43.0, 34.0, 32.0, 18.0, 25.0, 25.0, 12.0, 18.0, 15.0, 23.0, 9.0, 4.0, 8.0, 5.0, 5.0, 6.0, 4.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-36.34375, -35.18310546875, -34.0224609375, -32.86181640625, -31.701171875, -30.54052734375, -29.3798828125, -28.21923828125, -27.05859375, -25.89794921875, -24.7373046875, -23.57666015625, -22.416015625, -21.25537109375, -20.0947265625, -18.93408203125, -17.7734375, -16.61279296875, -15.4521484375, -14.29150390625, -13.130859375, -11.97021484375, -10.8095703125, -9.64892578125, -8.48828125, -7.32763671875, -6.1669921875, -5.00634765625, -3.845703125, -2.68505859375, -1.5244140625, -0.36376953125, 0.796875, 1.95751953125, 3.1181640625, 4.27880859375, 5.439453125, 6.60009765625, 7.7607421875, 8.92138671875, 10.08203125, 11.24267578125, 12.4033203125, 13.56396484375, 14.724609375, 15.88525390625, 17.0458984375, 18.20654296875, 19.3671875, 20.52783203125, 21.6884765625, 22.84912109375, 24.009765625, 25.17041015625, 26.3310546875, 27.49169921875, 28.65234375, 29.81298828125, 30.9736328125, 32.13427734375, 33.294921875, 34.45556640625, 35.6162109375, 36.77685546875, 37.9375]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 1.0, 7.0, 5.0, 5.0, 7.0, 7.0, 13.0, 19.0, 17.0, 18.0, 20.0, 24.0, 30.0, 34.0, 47.0, 64.0, 100.0, 176.0, 311.0, 962.0, 8086.0, 3109770.0, 23657.0, 1223.0, 426.0, 177.0, 122.0, 62.0, 62.0, 46.0, 41.0, 35.0, 29.0, 14.0, 12.0, 20.0, 11.0, 10.0, 9.0, 9.0, 4.0, 2.0, 2.0, 5.0, 3.0, 3.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.25, -83.6044921875, -80.958984375, -78.3134765625, -75.66796875, -73.0224609375, -70.376953125, -67.7314453125, -65.0859375, -62.4404296875, -59.794921875, -57.1494140625, -54.50390625, -51.8583984375, -49.212890625, -46.5673828125, -43.921875, -41.2763671875, -38.630859375, -35.9853515625, -33.33984375, -30.6943359375, -28.048828125, -25.4033203125, -22.7578125, -20.1123046875, -17.466796875, -14.8212890625, -12.17578125, -9.5302734375, -6.884765625, -4.2392578125, -1.59375, 1.0517578125, 3.697265625, 6.3427734375, 8.98828125, 11.6337890625, 14.279296875, 16.9248046875, 19.5703125, 22.2158203125, 24.861328125, 27.5068359375, 30.15234375, 32.7978515625, 35.443359375, 38.0888671875, 40.734375, 43.3798828125, 46.025390625, 48.6708984375, 51.31640625, 53.9619140625, 56.607421875, 59.2529296875, 61.8984375, 64.5439453125, 67.189453125, 69.8349609375, 72.48046875, 75.1259765625, 77.771484375, 80.4169921875, 83.0625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 19.0, 738.0, 259.0, 4.0], "bins": [-455.5243225097656, -448.15130615234375, -440.7783203125, -433.4053039550781, -426.03228759765625, -418.6593017578125, -411.2862854003906, -403.91326904296875, -396.5402526855469, -389.167236328125, -381.79425048828125, -374.4212341308594, -367.0482177734375, -359.67523193359375, -352.3022155761719, -344.92919921875, -337.55621337890625, -330.1831970214844, -322.8102111816406, -315.43719482421875, -308.0641784667969, -300.691162109375, -293.31817626953125, -285.9451599121094, -278.5721435546875, -271.1991271972656, -263.8261413574219, -256.453125, -249.08010864257812, -241.7071075439453, -234.3341064453125, -226.96109008789062, -219.5880889892578, -212.215087890625, -204.84207153320312, -197.4690704345703, -190.09605407714844, -182.72305297851562, -175.35003662109375, -167.97703552246094, -160.60403442382812, -153.2310333251953, -145.85801696777344, -138.48501586914062, -131.11199951171875, -123.73899841308594, -116.3659896850586, -108.99298095703125, -101.61997985839844, -94.2469711303711, -86.87396240234375, -79.50096130371094, -72.1279525756836, -64.75494384765625, -57.381935119628906, -50.00893020629883, -42.63591766357422, -35.262908935546875, -27.889904022216797, -20.516895294189453, -13.143888473510742, -5.770881652832031, 1.6021270751953125, 8.97513198852539, 16.348140716552734]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 7.0, 4.0, 2.0, 3.0, 5.0, 9.0, 10.0, 18.0, 11.0, 15.0, 23.0, 28.0, 27.0, 35.0, 33.0, 33.0, 38.0, 42.0, 35.0, 37.0, 50.0, 44.0, 44.0, 54.0, 54.0, 47.0, 49.0, 31.0, 28.0, 30.0, 26.0, 28.0, 17.0, 22.0, 14.0, 15.0, 8.0, 5.0, 7.0, 5.0, 6.0, 5.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-110.15283203125, -106.2305679321289, -102.30829620361328, -98.38603210449219, -94.46376037597656, -90.54149627685547, -86.61923217773438, -82.69696044921875, -78.77468872070312, -74.85242462158203, -70.9301528930664, -67.00788879394531, -63.08561706542969, -59.163352966308594, -55.241085052490234, -51.318817138671875, -47.39655303955078, -43.47428512573242, -39.55201721191406, -35.62975311279297, -31.707483291625977, -27.785215377807617, -23.86294937133789, -19.94068145751953, -16.018413543701172, -12.096145629882812, -8.17387866973877, -4.251611709594727, -0.3293437957763672, 3.592924118041992, 7.515190124511719, 11.437458038330078, 15.359725952148438, 19.281993865966797, 23.204261779785156, 27.126527786254883, 31.048795700073242, 34.97106170654297, 38.89332962036133, 42.81559753417969, 46.73786544799805, 50.660133361816406, 54.582401275634766, 58.504669189453125, 62.42693328857422, 66.34920501708984, 70.27146911621094, 74.19374084472656, 78.11600494384766, 82.03826904296875, 85.96054077148438, 89.88280487060547, 93.8050765991211, 97.72734069824219, 101.64961242675781, 105.5718765258789, 109.494140625, 113.4164047241211, 117.33867645263672, 121.26094055175781, 125.18321228027344, 129.10548400878906, 133.02774047851562, 136.95001220703125, 140.87228393554688]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 2.0, 1.0, 3.0, 8.0, 3.0, 8.0, 4.0, 8.0, 11.0, 7.0, 15.0, 23.0, 16.0, 20.0, 21.0, 31.0, 32.0, 40.0, 42.0, 43.0, 44.0, 43.0, 42.0, 42.0, 38.0, 42.0, 39.0, 34.0, 34.0, 39.0, 41.0, 30.0, 27.0, 25.0, 29.0, 18.0, 22.0, 20.0, 11.0, 8.0, 10.0, 7.0, 4.0, 11.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-10.71875, -10.3843994140625, -10.050048828125, -9.7156982421875, -9.38134765625, -9.0469970703125, -8.712646484375, -8.3782958984375, -8.0439453125, -7.7095947265625, -7.375244140625, -7.0408935546875, -6.70654296875, -6.3721923828125, -6.037841796875, -5.7034912109375, -5.369140625, -5.0347900390625, -4.700439453125, -4.3660888671875, -4.03173828125, -3.6973876953125, -3.363037109375, -3.0286865234375, -2.6943359375, -2.3599853515625, -2.025634765625, -1.6912841796875, -1.35693359375, -1.0225830078125, -0.688232421875, -0.3538818359375, -0.01953125, 0.3148193359375, 0.649169921875, 0.9835205078125, 1.31787109375, 1.6522216796875, 1.986572265625, 2.3209228515625, 2.6552734375, 2.9896240234375, 3.323974609375, 3.6583251953125, 3.99267578125, 4.3270263671875, 4.661376953125, 4.9957275390625, 5.330078125, 5.6644287109375, 5.998779296875, 6.3331298828125, 6.66748046875, 7.0018310546875, 7.336181640625, 7.6705322265625, 8.0048828125, 8.3392333984375, 8.673583984375, 9.0079345703125, 9.34228515625, 9.6766357421875, 10.010986328125, 10.3453369140625, 10.6796875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 3.0, 3.0, 8.0, 4.0, 6.0, 8.0, 10.0, 13.0, 17.0, 29.0, 31.0, 37.0, 48.0, 80.0, 104.0, 179.0, 323.0, 809.0, 2962.0, 20566.0, 377862.0, 3172372.0, 584510.0, 28679.0, 3748.0, 913.0, 382.0, 185.0, 109.0, 69.0, 52.0, 30.0, 27.0, 30.0, 23.0, 15.0, 16.0, 6.0, 5.0, 6.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-37.59375, -36.439453125, -35.28515625, -34.130859375, -32.9765625, -31.822265625, -30.66796875, -29.513671875, -28.359375, -27.205078125, -26.05078125, -24.896484375, -23.7421875, -22.587890625, -21.43359375, -20.279296875, -19.125, -17.970703125, -16.81640625, -15.662109375, -14.5078125, -13.353515625, -12.19921875, -11.044921875, -9.890625, -8.736328125, -7.58203125, -6.427734375, -5.2734375, -4.119140625, -2.96484375, -1.810546875, -0.65625, 0.498046875, 1.65234375, 2.806640625, 3.9609375, 5.115234375, 6.26953125, 7.423828125, 8.578125, 9.732421875, 10.88671875, 12.041015625, 13.1953125, 14.349609375, 15.50390625, 16.658203125, 17.8125, 18.966796875, 20.12109375, 21.275390625, 22.4296875, 23.583984375, 24.73828125, 25.892578125, 27.046875, 28.201171875, 29.35546875, 30.509765625, 31.6640625, 32.818359375, 33.97265625, 35.126953125, 36.28125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 6.0, 8.0, 9.0, 16.0, 33.0, 59.0, 97.0, 155.0, 285.0, 464.0, 871.0, 864.0, 547.0, 282.0, 144.0, 105.0, 63.0, 26.0, 20.0, 13.0, 6.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.9375, -86.59619140625, -84.2548828125, -81.91357421875, -79.572265625, -77.23095703125, -74.8896484375, -72.54833984375, -70.20703125, -67.86572265625, -65.5244140625, -63.18310546875, -60.841796875, -58.50048828125, -56.1591796875, -53.81787109375, -51.4765625, -49.13525390625, -46.7939453125, -44.45263671875, -42.111328125, -39.77001953125, -37.4287109375, -35.08740234375, -32.74609375, -30.40478515625, -28.0634765625, -25.72216796875, -23.380859375, -21.03955078125, -18.6982421875, -16.35693359375, -14.015625, -11.67431640625, -9.3330078125, -6.99169921875, -4.650390625, -2.30908203125, 0.0322265625, 2.37353515625, 4.71484375, 7.05615234375, 9.3974609375, 11.73876953125, 14.080078125, 16.42138671875, 18.7626953125, 21.10400390625, 23.4453125, 25.78662109375, 28.1279296875, 30.46923828125, 32.810546875, 35.15185546875, 37.4931640625, 39.83447265625, 42.17578125, 44.51708984375, 46.8583984375, 49.19970703125, 51.541015625, 53.88232421875, 56.2236328125, 58.56494140625, 60.90625]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 6.0, 9.0, 15.0, 25.0, 55.0, 76.0, 126.0, 226.0, 394.0, 1263.0, 1167448.0, 3022398.0, 1297.0, 382.0, 229.0, 130.0, 71.0, 50.0, 28.0, 19.0, 11.0, 7.0, 4.0, 6.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-231.25, -223.28515625, -215.3203125, -207.35546875, -199.390625, -191.42578125, -183.4609375, -175.49609375, -167.53125, -159.56640625, -151.6015625, -143.63671875, -135.671875, -127.70703125, -119.7421875, -111.77734375, -103.8125, -95.84765625, -87.8828125, -79.91796875, -71.953125, -63.98828125, -56.0234375, -48.05859375, -40.09375, -32.12890625, -24.1640625, -16.19921875, -8.234375, -0.26953125, 7.6953125, 15.66015625, 23.625, 31.58984375, 39.5546875, 47.51953125, 55.484375, 63.44921875, 71.4140625, 79.37890625, 87.34375, 95.30859375, 103.2734375, 111.23828125, 119.203125, 127.16796875, 135.1328125, 143.09765625, 151.0625, 159.02734375, 166.9921875, 174.95703125, 182.921875, 190.88671875, 198.8515625, 206.81640625, 214.78125, 222.74609375, 230.7109375, 238.67578125, 246.640625, 254.60546875, 262.5703125, 270.53515625, 278.5]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 8.0, 56.0, 348.0, 459.0, 131.0, 13.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-705.4849243164062, -692.4681396484375, -679.4513549804688, -666.4345703125, -653.4177856445312, -640.4010009765625, -627.38427734375, -614.367431640625, -601.3507080078125, -588.3339233398438, -575.317138671875, -562.3003540039062, -549.2835693359375, -536.2667846679688, -523.25, -510.2332458496094, -497.2164306640625, -484.19964599609375, -471.182861328125, -458.16607666015625, -445.1493225097656, -432.1325378417969, -419.1157531738281, -406.0989685058594, -393.08221435546875, -380.0654296875, -367.04864501953125, -354.0318603515625, -341.0151062011719, -327.9983215332031, -314.9815368652344, -301.9647521972656, -288.947998046875, -275.93121337890625, -262.9144287109375, -249.8976593017578, -236.88087463378906, -223.86410522460938, -210.84732055664062, -197.83053588867188, -184.81375122070312, -171.79696655273438, -158.7801971435547, -145.76341247558594, -132.7466278076172, -119.72985076904297, -106.71307373046875, -93.6962890625, -80.67950439453125, -67.66272735595703, -54.64594268798828, -41.62916564941406, -28.612384796142578, -15.595603942871094, -2.578826904296875, 10.437957763671875, 23.454734802246094, 36.47151565551758, 49.48829650878906, 62.50507354736328, 75.5218505859375, 88.53863525390625, 101.55541229248047, 114.57219696044922, 127.58897399902344]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 8.0, 3.0, 7.0, 9.0, 11.0, 5.0, 9.0, 26.0, 16.0, 15.0, 24.0, 22.0, 19.0, 25.0, 31.0, 48.0, 33.0, 43.0, 44.0, 41.0, 49.0, 36.0, 59.0, 46.0, 48.0, 31.0, 34.0, 30.0, 31.0, 29.0, 29.0, 21.0, 21.0, 16.0, 25.0, 14.0, 10.0, 8.0, 12.0, 5.0, 4.0, 3.0, 5.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-167.39956665039062, -162.64743041992188, -157.8953094482422, -153.14317321777344, -148.3910369873047, -143.638916015625, -138.88677978515625, -134.1346435546875, -129.38250732421875, -124.63037872314453, -119.87824249267578, -115.12611389160156, -110.37397766113281, -105.6218490600586, -100.86972045898438, -96.11758422851562, -91.36546325683594, -86.61333465576172, -81.86119842529297, -77.10906982421875, -72.35693359375, -67.60480499267578, -62.85267639160156, -58.10054397583008, -53.348411560058594, -48.59627914428711, -43.844146728515625, -39.092018127441406, -34.33988571166992, -29.587753295898438, -24.835622787475586, -20.083492279052734, -15.33135986328125, -10.579228401184082, -5.827096939086914, -1.074965476989746, 3.677165985107422, 8.429298400878906, 13.181428909301758, 17.93355941772461, 22.685691833496094, 27.437824249267578, 32.18995666503906, 36.94208526611328, 41.694217681884766, 46.44635009765625, 51.19847869873047, 55.95061111450195, 60.70274353027344, 65.45487213134766, 70.2070083618164, 74.95913696289062, 79.71127319335938, 84.4634017944336, 89.21553039550781, 93.96766662597656, 98.71979522705078, 103.471923828125, 108.22406005859375, 112.97618865966797, 117.72831726074219, 122.48045349121094, 127.23258209228516, 131.98471069335938, 136.73684692382812]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 4.0, 2.0, 5.0, 13.0, 3.0, 17.0, 13.0, 15.0, 13.0, 17.0, 35.0, 31.0, 33.0, 33.0, 39.0, 45.0, 53.0, 56.0, 32.0, 41.0, 40.0, 42.0, 42.0, 48.0, 34.0, 40.0, 33.0, 35.0, 28.0, 25.0, 27.0, 31.0, 8.0, 11.0, 10.0, 8.0, 9.0, 7.0, 6.0, 3.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.8203125, -11.4608154296875, -11.101318359375, -10.7418212890625, -10.38232421875, -10.0228271484375, -9.663330078125, -9.3038330078125, -8.9443359375, -8.5848388671875, -8.225341796875, -7.8658447265625, -7.50634765625, -7.1468505859375, -6.787353515625, -6.4278564453125, -6.068359375, -5.7088623046875, -5.349365234375, -4.9898681640625, -4.63037109375, -4.2708740234375, -3.911376953125, -3.5518798828125, -3.1923828125, -2.8328857421875, -2.473388671875, -2.1138916015625, -1.75439453125, -1.3948974609375, -1.035400390625, -0.6759033203125, -0.31640625, 0.0430908203125, 0.402587890625, 0.7620849609375, 1.12158203125, 1.4810791015625, 1.840576171875, 2.2000732421875, 2.5595703125, 2.9190673828125, 3.278564453125, 3.6380615234375, 3.99755859375, 4.3570556640625, 4.716552734375, 5.0760498046875, 5.435546875, 5.7950439453125, 6.154541015625, 6.5140380859375, 6.87353515625, 7.2330322265625, 7.592529296875, 7.9520263671875, 8.3115234375, 8.6710205078125, 9.030517578125, 9.3900146484375, 9.74951171875, 10.1090087890625, 10.468505859375, 10.8280029296875, 11.1875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 5.0, 1.0, 8.0, 8.0, 11.0, 26.0, 20.0, 39.0, 54.0, 93.0, 119.0, 161.0, 212.0, 347.0, 515.0, 721.0, 1002.0, 1461.0, 2021.0, 2923.0, 4455.0, 6163.0, 9445.0, 13970.0, 21692.0, 33457.0, 54152.0, 93831.0, 187722.0, 298391.0, 124683.0, 69318.0, 41982.0, 26571.0, 17174.0, 11461.0, 7664.0, 5078.0, 3494.0, 2473.0, 1778.0, 1160.0, 811.0, 574.0, 400.0, 284.0, 190.0, 134.0, 105.0, 75.0, 39.0, 31.0, 19.0, 12.0, 11.0, 7.0, 7.0, 3.0, 2.0, 3.0, 1.0], "bins": [-2.263671875, -2.193450927734375, -2.12322998046875, -2.053009033203125, -1.9827880859375, -1.912567138671875, -1.84234619140625, -1.772125244140625, -1.701904296875, -1.631683349609375, -1.56146240234375, -1.491241455078125, -1.4210205078125, -1.350799560546875, -1.28057861328125, -1.210357666015625, -1.14013671875, -1.069915771484375, -0.99969482421875, -0.929473876953125, -0.8592529296875, -0.789031982421875, -0.71881103515625, -0.648590087890625, -0.578369140625, -0.508148193359375, -0.43792724609375, -0.367706298828125, -0.2974853515625, -0.227264404296875, -0.15704345703125, -0.086822509765625, -0.0166015625, 0.053619384765625, 0.12384033203125, 0.194061279296875, 0.2642822265625, 0.334503173828125, 0.40472412109375, 0.474945068359375, 0.545166015625, 0.615386962890625, 0.68560791015625, 0.755828857421875, 0.8260498046875, 0.896270751953125, 0.96649169921875, 1.036712646484375, 1.10693359375, 1.177154541015625, 1.24737548828125, 1.317596435546875, 1.3878173828125, 1.458038330078125, 1.52825927734375, 1.598480224609375, 1.668701171875, 1.738922119140625, 1.80914306640625, 1.879364013671875, 1.9495849609375, 2.019805908203125, 2.09002685546875, 2.160247802734375, 2.23046875]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 4.0, 6.0, 2.0, 7.0, 4.0, 9.0, 11.0, 16.0, 14.0, 14.0, 22.0, 26.0, 29.0, 28.0, 35.0, 38.0, 35.0, 43.0, 34.0, 35.0, 46.0, 31.0, 1063.0, 46.0, 47.0, 41.0, 39.0, 39.0, 29.0, 30.0, 31.0, 38.0, 24.0, 13.0, 18.0, 18.0, 8.0, 12.0, 12.0, 9.0, 16.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.0546875, -6.8350830078125, -6.615478515625, -6.3958740234375, -6.17626953125, -5.9566650390625, -5.737060546875, -5.5174560546875, -5.2978515625, -5.0782470703125, -4.858642578125, -4.6390380859375, -4.41943359375, -4.1998291015625, -3.980224609375, -3.7606201171875, -3.541015625, -3.3214111328125, -3.101806640625, -2.8822021484375, -2.66259765625, -2.4429931640625, -2.223388671875, -2.0037841796875, -1.7841796875, -1.5645751953125, -1.344970703125, -1.1253662109375, -0.90576171875, -0.6861572265625, -0.466552734375, -0.2469482421875, -0.02734375, 0.1922607421875, 0.411865234375, 0.6314697265625, 0.85107421875, 1.0706787109375, 1.290283203125, 1.5098876953125, 1.7294921875, 1.9490966796875, 2.168701171875, 2.3883056640625, 2.60791015625, 2.8275146484375, 3.047119140625, 3.2667236328125, 3.486328125, 3.7059326171875, 3.925537109375, 4.1451416015625, 4.36474609375, 4.5843505859375, 4.803955078125, 5.0235595703125, 5.2431640625, 5.4627685546875, 5.682373046875, 5.9019775390625, 6.12158203125, 6.3411865234375, 6.560791015625, 6.7803955078125, 7.0]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 9.0, 4.0, 11.0, 15.0, 16.0, 28.0, 49.0, 60.0, 94.0, 146.0, 203.0, 338.0, 456.0, 690.0, 1032.0, 1471.0, 2114.0, 3283.0, 4912.0, 7271.0, 10885.0, 16460.0, 25734.0, 40457.0, 66238.0, 115113.0, 1303279.0, 221489.0, 105273.0, 61419.0, 37552.0, 24285.0, 15727.0, 10132.0, 6875.0, 4542.0, 2984.0, 2173.0, 1415.0, 934.0, 666.0, 430.0, 261.0, 205.0, 124.0, 99.0, 63.0, 41.0, 29.0, 23.0, 17.0, 6.0, 3.0, 7.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.134765625, -2.067901611328125, -2.00103759765625, -1.934173583984375, -1.8673095703125, -1.800445556640625, -1.73358154296875, -1.666717529296875, -1.599853515625, -1.532989501953125, -1.46612548828125, -1.399261474609375, -1.3323974609375, -1.265533447265625, -1.19866943359375, -1.131805419921875, -1.06494140625, -0.998077392578125, -0.93121337890625, -0.864349365234375, -0.7974853515625, -0.730621337890625, -0.66375732421875, -0.596893310546875, -0.530029296875, -0.463165283203125, -0.39630126953125, -0.329437255859375, -0.2625732421875, -0.195709228515625, -0.12884521484375, -0.061981201171875, 0.0048828125, 0.071746826171875, 0.13861083984375, 0.205474853515625, 0.2723388671875, 0.339202880859375, 0.40606689453125, 0.472930908203125, 0.539794921875, 0.606658935546875, 0.67352294921875, 0.740386962890625, 0.8072509765625, 0.874114990234375, 0.94097900390625, 1.007843017578125, 1.07470703125, 1.141571044921875, 1.20843505859375, 1.275299072265625, 1.3421630859375, 1.409027099609375, 1.47589111328125, 1.542755126953125, 1.609619140625, 1.676483154296875, 1.74334716796875, 1.810211181640625, 1.8770751953125, 1.943939208984375, 2.01080322265625, 2.077667236328125, 2.14453125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 6.0, 6.0, 4.0, 6.0, 8.0, 12.0, 13.0, 25.0, 27.0, 43.0, 64.0, 85.0, 118.0, 134.0, 121.0, 87.0, 59.0, 52.0, 26.0, 25.0, 18.0, 16.0, 10.0, 9.0, 5.0, 3.0, 11.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00228118896484375, -0.0022012293338775635, -0.002121269702911377, -0.0020413100719451904, -0.001961350440979004, -0.0018813908100128174, -0.0018014311790466309, -0.0017214715480804443, -0.0016415119171142578, -0.0015615522861480713, -0.0014815926551818848, -0.0014016330242156982, -0.0013216733932495117, -0.0012417137622833252, -0.0011617541313171387, -0.0010817945003509521, -0.0010018348693847656, -0.0009218752384185791, -0.0008419156074523926, -0.0007619559764862061, -0.0006819963455200195, -0.000602036714553833, -0.0005220770835876465, -0.00044211745262145996, -0.00036215782165527344, -0.0002821981906890869, -0.0002022385597229004, -0.00012227892875671387, -4.2319297790527344e-05, 3.764033317565918e-05, 0.0001175999641418457, 0.00019755959510803223, 0.00027751922607421875, 0.0003574788570404053, 0.0004374384880065918, 0.0005173981189727783, 0.0005973577499389648, 0.0006773173809051514, 0.0007572770118713379, 0.0008372366428375244, 0.0009171962738037109, 0.0009971559047698975, 0.001077115535736084, 0.0011570751667022705, 0.001237034797668457, 0.0013169944286346436, 0.00139695405960083, 0.0014769136905670166, 0.0015568733215332031, 0.0016368329524993896, 0.0017167925834655762, 0.0017967522144317627, 0.0018767118453979492, 0.0019566714763641357, 0.0020366311073303223, 0.002116590738296509, 0.0021965503692626953, 0.002276510000228882, 0.0023564696311950684, 0.002436429262161255, 0.0025163888931274414, 0.002596348524093628, 0.0026763081550598145, 0.002756267786026001, 0.0028362274169921875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 7.0, 7.0, 10.0, 20.0, 26.0, 29.0, 42.0, 84.0, 129.0, 297.0, 1239.0, 1045113.0, 939.0, 261.0, 126.0, 75.0, 44.0, 33.0, 17.0, 9.0, 16.0, 2.0, 5.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.07550048828125, -0.07336950302124023, -0.07123851776123047, -0.0691075325012207, -0.06697654724121094, -0.06484556198120117, -0.0627145767211914, -0.06058359146118164, -0.058452606201171875, -0.05632162094116211, -0.054190635681152344, -0.05205965042114258, -0.04992866516113281, -0.04779767990112305, -0.04566669464111328, -0.043535709381103516, -0.04140472412109375, -0.039273738861083984, -0.03714275360107422, -0.03501176834106445, -0.03288078308105469, -0.030749797821044922, -0.028618812561035156, -0.02648782730102539, -0.024356842041015625, -0.02222585678100586, -0.020094871520996094, -0.017963886260986328, -0.015832901000976562, -0.013701915740966797, -0.011570930480957031, -0.009439945220947266, -0.0073089599609375, -0.005177974700927734, -0.0030469894409179688, -0.0009160041809082031, 0.0012149810791015625, 0.003345966339111328, 0.005476951599121094, 0.007607936859130859, 0.009738922119140625, 0.01186990737915039, 0.014000892639160156, 0.016131877899169922, 0.018262863159179688, 0.020393848419189453, 0.02252483367919922, 0.024655818939208984, 0.02678680419921875, 0.028917789459228516, 0.03104877471923828, 0.03317975997924805, 0.03531074523925781, 0.03744173049926758, 0.039572715759277344, 0.04170370101928711, 0.043834686279296875, 0.04596567153930664, 0.048096656799316406, 0.05022764205932617, 0.05235862731933594, 0.0544896125793457, 0.05662059783935547, 0.058751583099365234, 0.060882568359375]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 6.0, 28.0, 272.0, 524.0, 168.0, 16.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.004810418002307415, -0.004726535174995661, -0.004642652813345194, -0.00455876998603344, -0.004474887624382973, -0.0043910047970712185, -0.004307121969759464, -0.004223239608108997, -0.004139356780797243, -0.004055473953485489, -0.003971591591835022, -0.0038877087645232677, -0.003803826170042157, -0.0037199435755610466, -0.003636060981079936, -0.0035521783865988255, -0.003468295792117715, -0.0033844131976366043, -0.0033005306031554937, -0.003216648008674383, -0.003132765181362629, -0.0030488825868815184, -0.002964999992400408, -0.0028811173979192972, -0.0027972348034381866, -0.002713352208957076, -0.0026294696144759655, -0.0025455867871642113, -0.0024617041926831007, -0.00237782159820199, -0.0022939390037208796, -0.002210056409239769, -0.0021261735819280148, -0.002042290987446904, -0.0019584083929657936, -0.0018745256820693612, -0.0017906429711729288, -0.0017067603766918182, -0.0016228777822107077, -0.001538995187729597, -0.0014551124768331647, -0.0013712298823520541, -0.0012873471714556217, -0.0012034645769745111, -0.0011195819824934006, -0.0010356992715969682, -0.0009518166771158576, -0.0008679340244270861, -0.0007840513717383146, -0.0007001687190495431, -0.0006162860663607717, -0.0005324034718796611, -0.0004485208191908896, -0.0003646381665021181, -0.00028075557202100754, -0.00019687291933223605, -0.00011299026664346457, -2.9107628506608307e-05, 5.477500963024795e-05, 0.00013865763321518898, 0.00022254028590396047, 0.00030642293859273195, 0.0003903055330738425, 0.000474188185762614, 0.0005580708384513855]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 9.0, 7.0, 9.0, 7.0, 10.0, 15.0, 15.0, 19.0, 23.0, 23.0, 32.0, 18.0, 27.0, 29.0, 33.0, 35.0, 47.0, 49.0, 51.0, 48.0, 56.0, 34.0, 52.0, 33.0, 43.0, 27.0, 40.0, 33.0, 32.0, 21.0, 25.0, 15.0, 20.0, 20.0, 10.0, 10.0, 9.0, 9.0, 0.0, 3.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0010797977447509766, -0.0010486738756299019, -0.0010175500065088272, -0.0009864261373877525, -0.0009553022682666779, -0.0009241783991456032, -0.0008930545300245285, -0.0008619306609034538, -0.0008308067917823792, -0.0007996829226613045, -0.0007685590535402298, -0.0007374351844191551, -0.0007063113152980804, -0.0006751874461770058, -0.0006440635770559311, -0.0006129397079348564, -0.0005818158388137817, -0.0005506919696927071, -0.0005195681005716324, -0.0004884442314505577, -0.00045732036232948303, -0.00042619649320840836, -0.0003950726240873337, -0.000363948754966259, -0.0003328248858451843, -0.00030170101672410965, -0.000270577147603035, -0.0002394532784819603, -0.00020832940936088562, -0.00017720554023981094, -0.00014608167111873627, -0.00011495780199766159, -8.383393287658691e-05, -5.271006375551224e-05, -2.158619463443756e-05, 9.537674486637115e-06, 4.066154360771179e-05, 7.178541272878647e-05, 0.00010290928184986115, 0.00013403315097093582, 0.0001651570200920105, 0.00019628088921308517, 0.00022740475833415985, 0.00025852862745523453, 0.0002896524965763092, 0.0003207763656973839, 0.00035190023481845856, 0.00038302410393953323, 0.0004141479730606079, 0.0004452718421816826, 0.00047639571130275726, 0.0005075195804238319, 0.0005386434495449066, 0.0005697673186659813, 0.000600891187787056, 0.0006320150569081306, 0.0006631389260292053, 0.00069426279515028, 0.0007253866642713547, 0.0007565105333924294, 0.000787634402513504, 0.0008187582716345787, 0.0008498821407556534, 0.0008810060098767281, 0.0009121298789978027]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 4.0, 2.0, 5.0, 13.0, 3.0, 17.0, 13.0, 15.0, 13.0, 17.0, 35.0, 31.0, 33.0, 33.0, 39.0, 45.0, 53.0, 56.0, 32.0, 41.0, 40.0, 42.0, 42.0, 48.0, 34.0, 40.0, 33.0, 35.0, 28.0, 25.0, 27.0, 31.0, 8.0, 11.0, 10.0, 8.0, 9.0, 7.0, 6.0, 3.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.8203125, -11.4608154296875, -11.101318359375, -10.7418212890625, -10.38232421875, -10.0228271484375, -9.663330078125, -9.3038330078125, -8.9443359375, -8.5848388671875, -8.225341796875, -7.8658447265625, -7.50634765625, -7.1468505859375, -6.787353515625, -6.4278564453125, -6.068359375, -5.7088623046875, -5.349365234375, -4.9898681640625, -4.63037109375, -4.2708740234375, -3.911376953125, -3.5518798828125, -3.1923828125, -2.8328857421875, -2.473388671875, -2.1138916015625, -1.75439453125, -1.3948974609375, -1.035400390625, -0.6759033203125, -0.31640625, 0.0430908203125, 0.402587890625, 0.7620849609375, 1.12158203125, 1.4810791015625, 1.840576171875, 2.2000732421875, 2.5595703125, 2.9190673828125, 3.278564453125, 3.6380615234375, 3.99755859375, 4.3570556640625, 4.716552734375, 5.0760498046875, 5.435546875, 5.7950439453125, 6.154541015625, 6.5140380859375, 6.87353515625, 7.2330322265625, 7.592529296875, 7.9520263671875, 8.3115234375, 8.6710205078125, 9.030517578125, 9.3900146484375, 9.74951171875, 10.1090087890625, 10.468505859375, 10.8280029296875, 11.1875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 9.0, 5.0, 13.0, 23.0, 22.0, 32.0, 36.0, 57.0, 94.0, 163.0, 188.0, 254.0, 462.0, 689.0, 1142.0, 1884.0, 3243.0, 6081.0, 12544.0, 29524.0, 82625.0, 313434.0, 421225.0, 107457.0, 35735.0, 15116.0, 7060.0, 3719.0, 2116.0, 1281.0, 779.0, 513.0, 338.0, 220.0, 140.0, 110.0, 64.0, 48.0, 35.0, 31.0, 15.0, 11.0, 7.0, 3.0, 6.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.46875, -8.196533203125, -7.92431640625, -7.652099609375, -7.3798828125, -7.107666015625, -6.83544921875, -6.563232421875, -6.291015625, -6.018798828125, -5.74658203125, -5.474365234375, -5.2021484375, -4.929931640625, -4.65771484375, -4.385498046875, -4.11328125, -3.841064453125, -3.56884765625, -3.296630859375, -3.0244140625, -2.752197265625, -2.47998046875, -2.207763671875, -1.935546875, -1.663330078125, -1.39111328125, -1.118896484375, -0.8466796875, -0.574462890625, -0.30224609375, -0.030029296875, 0.2421875, 0.514404296875, 0.78662109375, 1.058837890625, 1.3310546875, 1.603271484375, 1.87548828125, 2.147705078125, 2.419921875, 2.692138671875, 2.96435546875, 3.236572265625, 3.5087890625, 3.781005859375, 4.05322265625, 4.325439453125, 4.59765625, 4.869873046875, 5.14208984375, 5.414306640625, 5.6865234375, 5.958740234375, 6.23095703125, 6.503173828125, 6.775390625, 7.047607421875, 7.31982421875, 7.592041015625, 7.8642578125, 8.136474609375, 8.40869140625, 8.680908203125, 8.953125]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 9.0, 6.0, 11.0, 8.0, 13.0, 14.0, 11.0, 14.0, 17.0, 26.0, 28.0, 28.0, 29.0, 30.0, 32.0, 42.0, 41.0, 46.0, 51.0, 83.0, 1756.0, 237.0, 67.0, 38.0, 48.0, 43.0, 36.0, 40.0, 26.0, 32.0, 31.0, 22.0, 17.0, 18.0, 13.0, 20.0, 9.0, 7.0, 6.0, 16.0, 6.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-35.0, -33.9326171875, -32.865234375, -31.7978515625, -30.73046875, -29.6630859375, -28.595703125, -27.5283203125, -26.4609375, -25.3935546875, -24.326171875, -23.2587890625, -22.19140625, -21.1240234375, -20.056640625, -18.9892578125, -17.921875, -16.8544921875, -15.787109375, -14.7197265625, -13.65234375, -12.5849609375, -11.517578125, -10.4501953125, -9.3828125, -8.3154296875, -7.248046875, -6.1806640625, -5.11328125, -4.0458984375, -2.978515625, -1.9111328125, -0.84375, 0.2236328125, 1.291015625, 2.3583984375, 3.42578125, 4.4931640625, 5.560546875, 6.6279296875, 7.6953125, 8.7626953125, 9.830078125, 10.8974609375, 11.96484375, 13.0322265625, 14.099609375, 15.1669921875, 16.234375, 17.3017578125, 18.369140625, 19.4365234375, 20.50390625, 21.5712890625, 22.638671875, 23.7060546875, 24.7734375, 25.8408203125, 26.908203125, 27.9755859375, 29.04296875, 30.1103515625, 31.177734375, 32.2451171875, 33.3125]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 1.0, 2.0, 1.0, 6.0, 10.0, 12.0, 6.0, 9.0, 14.0, 15.0, 17.0, 21.0, 22.0, 28.0, 33.0, 48.0, 68.0, 86.0, 140.0, 199.0, 423.0, 1013.0, 6069.0, 2358128.0, 772388.0, 4902.0, 914.0, 371.0, 199.0, 129.0, 89.0, 62.0, 52.0, 41.0, 36.0, 29.0, 17.0, 19.0, 13.0, 10.0, 14.0, 13.0, 8.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 2.0, 2.0], "bins": [-58.3125, -56.48779296875, -54.6630859375, -52.83837890625, -51.013671875, -49.18896484375, -47.3642578125, -45.53955078125, -43.71484375, -41.89013671875, -40.0654296875, -38.24072265625, -36.416015625, -34.59130859375, -32.7666015625, -30.94189453125, -29.1171875, -27.29248046875, -25.4677734375, -23.64306640625, -21.818359375, -19.99365234375, -18.1689453125, -16.34423828125, -14.51953125, -12.69482421875, -10.8701171875, -9.04541015625, -7.220703125, -5.39599609375, -3.5712890625, -1.74658203125, 0.078125, 1.90283203125, 3.7275390625, 5.55224609375, 7.376953125, 9.20166015625, 11.0263671875, 12.85107421875, 14.67578125, 16.50048828125, 18.3251953125, 20.14990234375, 21.974609375, 23.79931640625, 25.6240234375, 27.44873046875, 29.2734375, 31.09814453125, 32.9228515625, 34.74755859375, 36.572265625, 38.39697265625, 40.2216796875, 42.04638671875, 43.87109375, 45.69580078125, 47.5205078125, 49.34521484375, 51.169921875, 52.99462890625, 54.8193359375, 56.64404296875, 58.46875]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 898.0, 115.0, 0.0, 1.0], "bins": [-1066.22705078125, -1048.6787109375, -1031.13037109375, -1013.5820922851562, -996.0337524414062, -978.4854125976562, -960.9371337890625, -943.3887939453125, -925.8404541015625, -908.2921142578125, -890.7438354492188, -873.1954956054688, -855.6471557617188, -838.0988159179688, -820.550537109375, -803.002197265625, -785.453857421875, -767.905517578125, -750.3572387695312, -732.8088989257812, -715.2605590820312, -697.7122192382812, -680.1639404296875, -662.6156005859375, -645.0673217773438, -627.5189819335938, -609.970703125, -592.42236328125, -574.8740234375, -557.32568359375, -539.7774047851562, -522.2290649414062, -504.68072509765625, -487.1324157714844, -469.5840759277344, -452.0357666015625, -434.4874267578125, -416.9391174316406, -399.39080810546875, -381.84246826171875, -364.29412841796875, -346.7458190917969, -329.1974792480469, -311.649169921875, -294.100830078125, -276.5525207519531, -259.00421142578125, -241.45587158203125, -223.90756225585938, -206.35923767089844, -188.8109130859375, -171.26260375976562, -153.71426391601562, -136.16595458984375, -118.61763000488281, -101.06930541992188, -83.52098083496094, -65.97265625, -48.42433547973633, -30.876014709472656, -13.327690124511719, 4.220634460449219, 21.768951416015625, 39.31727600097656, 56.8656005859375]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 6.0, 1.0, 1.0, 4.0, 6.0, 6.0, 4.0, 5.0, 1.0, 13.0, 16.0, 8.0, 11.0, 21.0, 20.0, 18.0, 24.0, 23.0, 36.0, 33.0, 30.0, 36.0, 35.0, 43.0, 29.0, 26.0, 38.0, 39.0, 44.0, 39.0, 35.0, 36.0, 38.0, 28.0, 35.0, 38.0, 36.0, 20.0, 15.0, 22.0, 19.0, 21.0, 10.0, 11.0, 8.0, 8.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-112.30756378173828, -108.8187484741211, -105.3299331665039, -101.84111785888672, -98.35230255126953, -94.86349487304688, -91.37467956542969, -87.8858642578125, -84.39704895019531, -80.90823364257812, -77.41941833496094, -73.93060302734375, -70.44178771972656, -66.95297241210938, -63.46416091918945, -59.97534942626953, -56.48653030395508, -52.99771499633789, -49.5088996887207, -46.02008819580078, -42.531272888183594, -39.042457580566406, -35.55364227294922, -32.06482696533203, -28.576013565063477, -25.08719825744629, -21.598384857177734, -18.109569549560547, -14.620755195617676, -11.131940841674805, -7.643125534057617, -4.1543121337890625, -0.665496826171875, 2.823317766189575, 6.312132358551025, 9.800947189331055, 13.289761543273926, 16.778575897216797, 20.267391204833984, 23.75620460510254, 27.245019912719727, 30.733835220336914, 34.22264862060547, 37.711463928222656, 41.200279235839844, 44.68909454345703, 48.17790985107422, 51.66672134399414, 55.15553665161133, 58.644351959228516, 62.1331672668457, 65.62197875976562, 69.11079406738281, 72.599609375, 76.08842468261719, 79.57723999023438, 83.06605529785156, 86.55487060546875, 90.04368591308594, 93.53250122070312, 97.02131652832031, 100.5101318359375, 103.99894714355469, 107.48775482177734, 110.97657012939453]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 6.0, 3.0, 5.0, 8.0, 5.0, 7.0, 11.0, 10.0, 20.0, 12.0, 14.0, 29.0, 24.0, 31.0, 37.0, 44.0, 35.0, 36.0, 54.0, 47.0, 55.0, 29.0, 31.0, 43.0, 48.0, 43.0, 43.0, 36.0, 32.0, 29.0, 31.0, 28.0, 21.0, 22.0, 17.0, 10.0, 7.0, 7.0, 13.0, 4.0, 8.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-11.921875, -11.5560302734375, -11.190185546875, -10.8243408203125, -10.45849609375, -10.0926513671875, -9.726806640625, -9.3609619140625, -8.9951171875, -8.6292724609375, -8.263427734375, -7.8975830078125, -7.53173828125, -7.1658935546875, -6.800048828125, -6.4342041015625, -6.068359375, -5.7025146484375, -5.336669921875, -4.9708251953125, -4.60498046875, -4.2391357421875, -3.873291015625, -3.5074462890625, -3.1416015625, -2.7757568359375, -2.409912109375, -2.0440673828125, -1.67822265625, -1.3123779296875, -0.946533203125, -0.5806884765625, -0.21484375, 0.1510009765625, 0.516845703125, 0.8826904296875, 1.24853515625, 1.6143798828125, 1.980224609375, 2.3460693359375, 2.7119140625, 3.0777587890625, 3.443603515625, 3.8094482421875, 4.17529296875, 4.5411376953125, 4.906982421875, 5.2728271484375, 5.638671875, 6.0045166015625, 6.370361328125, 6.7362060546875, 7.10205078125, 7.4678955078125, 7.833740234375, 8.1995849609375, 8.5654296875, 8.9312744140625, 9.297119140625, 9.6629638671875, 10.02880859375, 10.3946533203125, 10.760498046875, 11.1263427734375, 11.4921875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 1.0, 7.0, 4.0, 4.0, 3.0, 14.0, 9.0, 14.0, 16.0, 10.0, 23.0, 28.0, 20.0, 32.0, 35.0, 39.0, 43.0, 64.0, 126.0, 771.0, 16785.0, 3424031.0, 747275.0, 4174.0, 326.0, 85.0, 48.0, 44.0, 33.0, 29.0, 29.0, 28.0, 28.0, 21.0, 13.0, 11.0, 10.0, 9.0, 15.0, 7.0, 2.0, 6.0, 5.0, 7.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-76.4375, -74.1083984375, -71.779296875, -69.4501953125, -67.12109375, -64.7919921875, -62.462890625, -60.1337890625, -57.8046875, -55.4755859375, -53.146484375, -50.8173828125, -48.48828125, -46.1591796875, -43.830078125, -41.5009765625, -39.171875, -36.8427734375, -34.513671875, -32.1845703125, -29.85546875, -27.5263671875, -25.197265625, -22.8681640625, -20.5390625, -18.2099609375, -15.880859375, -13.5517578125, -11.22265625, -8.8935546875, -6.564453125, -4.2353515625, -1.90625, 0.4228515625, 2.751953125, 5.0810546875, 7.41015625, 9.7392578125, 12.068359375, 14.3974609375, 16.7265625, 19.0556640625, 21.384765625, 23.7138671875, 26.04296875, 28.3720703125, 30.701171875, 33.0302734375, 35.359375, 37.6884765625, 40.017578125, 42.3466796875, 44.67578125, 47.0048828125, 49.333984375, 51.6630859375, 53.9921875, 56.3212890625, 58.650390625, 60.9794921875, 63.30859375, 65.6376953125, 67.966796875, 70.2958984375, 72.625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 6.0, 1.0, 5.0, 5.0, 13.0, 22.0, 29.0, 55.0, 95.0, 134.0, 237.0, 423.0, 701.0, 846.0, 626.0, 368.0, 221.0, 113.0, 64.0, 41.0, 33.0, 16.0, 16.0, 7.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.25, -51.37109375, -49.4921875, -47.61328125, -45.734375, -43.85546875, -41.9765625, -40.09765625, -38.21875, -36.33984375, -34.4609375, -32.58203125, -30.703125, -28.82421875, -26.9453125, -25.06640625, -23.1875, -21.30859375, -19.4296875, -17.55078125, -15.671875, -13.79296875, -11.9140625, -10.03515625, -8.15625, -6.27734375, -4.3984375, -2.51953125, -0.640625, 1.23828125, 3.1171875, 4.99609375, 6.875, 8.75390625, 10.6328125, 12.51171875, 14.390625, 16.26953125, 18.1484375, 20.02734375, 21.90625, 23.78515625, 25.6640625, 27.54296875, 29.421875, 31.30078125, 33.1796875, 35.05859375, 36.9375, 38.81640625, 40.6953125, 42.57421875, 44.453125, 46.33203125, 48.2109375, 50.08984375, 51.96875, 53.84765625, 55.7265625, 57.60546875, 59.484375, 61.36328125, 63.2421875, 65.12109375, 67.0]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 6.0, 7.0, 6.0, 17.0, 22.0, 30.0, 63.0, 73.0, 121.0, 216.0, 370.0, 1038.0, 1158946.0, 3031375.0, 1050.0, 408.0, 205.0, 116.0, 82.0, 60.0, 46.0, 16.0, 6.0, 4.0, 5.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-299.0, -290.46484375, -281.9296875, -273.39453125, -264.859375, -256.32421875, -247.7890625, -239.25390625, -230.71875, -222.18359375, -213.6484375, -205.11328125, -196.578125, -188.04296875, -179.5078125, -170.97265625, -162.4375, -153.90234375, -145.3671875, -136.83203125, -128.296875, -119.76171875, -111.2265625, -102.69140625, -94.15625, -85.62109375, -77.0859375, -68.55078125, -60.015625, -51.48046875, -42.9453125, -34.41015625, -25.875, -17.33984375, -8.8046875, -0.26953125, 8.265625, 16.80078125, 25.3359375, 33.87109375, 42.40625, 50.94140625, 59.4765625, 68.01171875, 76.546875, 85.08203125, 93.6171875, 102.15234375, 110.6875, 119.22265625, 127.7578125, 136.29296875, 144.828125, 153.36328125, 161.8984375, 170.43359375, 178.96875, 187.50390625, 196.0390625, 204.57421875, 213.109375, 221.64453125, 230.1796875, 238.71484375, 247.25]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 30.0, 317.0, 519.0, 130.0, 16.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-827.2380981445312, -811.9957275390625, -796.7533569335938, -781.510986328125, -766.2686767578125, -751.0263061523438, -735.783935546875, -720.5415649414062, -705.2991943359375, -690.0568237304688, -674.814453125, -659.5721435546875, -644.3297729492188, -629.08740234375, -613.8450317382812, -598.6026611328125, -583.3603515625, -568.1179809570312, -552.8756103515625, -537.63330078125, -522.3909301757812, -507.1485595703125, -491.90618896484375, -476.663818359375, -461.42144775390625, -446.1790771484375, -430.9367370605469, -415.6943664550781, -400.4519958496094, -385.20965576171875, -369.96728515625, -354.72491455078125, -339.4825134277344, -324.2401428222656, -308.997802734375, -293.75543212890625, -278.5130615234375, -263.27069091796875, -248.02835083007812, -232.78598022460938, -217.5436248779297, -202.30126953125, -187.05889892578125, -171.81654357910156, -156.57418823242188, -141.33181762695312, -126.08946228027344, -110.84709930419922, -95.604736328125, -80.36237335205078, -65.12001037597656, -49.877655029296875, -34.635292053222656, -19.392929077148438, -4.15057373046875, 11.091789245605469, 26.334152221679688, 41.576515197753906, 56.81887435913086, 72.06123352050781, 87.30359649658203, 102.54595947265625, 117.78831481933594, 133.03067016601562, 148.27304077148438]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 3.0, 4.0, 7.0, 10.0, 15.0, 9.0, 12.0, 25.0, 25.0, 31.0, 27.0, 36.0, 31.0, 50.0, 37.0, 43.0, 48.0, 38.0, 36.0, 33.0, 43.0, 40.0, 37.0, 45.0, 34.0, 39.0, 34.0, 24.0, 26.0, 23.0, 22.0, 25.0, 15.0, 15.0, 12.0, 15.0, 7.0, 8.0, 10.0, 3.0, 3.0, 5.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.25936889648438, -111.35108184814453, -107.44278717041016, -103.53450012207031, -99.62620544433594, -95.7179183959961, -91.80962371826172, -87.90133666992188, -83.9930419921875, -80.08475494384766, -76.17646026611328, -72.26817321777344, -68.35987854003906, -64.45159149169922, -60.543296813964844, -56.635009765625, -52.72671890258789, -48.81842803955078, -44.91013717651367, -41.00184631347656, -37.09355545043945, -33.185264587402344, -29.276975631713867, -25.368684768676758, -21.46039390563965, -17.55210304260254, -13.64381217956543, -9.735522270202637, -5.827231407165527, -1.9189414978027344, 1.989349365234375, 5.897640228271484, 9.805931091308594, 13.714221954345703, 17.622512817382812, 21.530803680419922, 25.43909454345703, 29.347383499145508, 33.25567626953125, 37.163963317871094, 41.07225799560547, 44.98054885864258, 48.88883972167969, 52.7971305847168, 56.705421447753906, 60.61370849609375, 64.52200317382812, 68.43029022216797, 72.33857727050781, 76.24686431884766, 80.15515899658203, 84.06344604492188, 87.97174072265625, 91.8800277709961, 95.78832244873047, 99.69660949707031, 103.60490417480469, 107.51319122314453, 111.4214859008789, 115.32977294921875, 119.23806762695312, 123.14635467529297, 127.05464935302734, 130.9629364013672, 134.87123107910156]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 7.0, 8.0, 7.0, 6.0, 4.0, 7.0, 10.0, 17.0, 26.0, 17.0, 24.0, 32.0, 31.0, 29.0, 35.0, 39.0, 44.0, 54.0, 42.0, 48.0, 37.0, 43.0, 36.0, 47.0, 45.0, 33.0, 23.0, 34.0, 34.0, 29.0, 27.0, 22.0, 17.0, 17.0, 16.0, 7.0, 10.0, 5.0, 9.0, 6.0, 10.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.1953125, -11.830810546875, -11.46630859375, -11.101806640625, -10.7373046875, -10.372802734375, -10.00830078125, -9.643798828125, -9.279296875, -8.914794921875, -8.55029296875, -8.185791015625, -7.8212890625, -7.456787109375, -7.09228515625, -6.727783203125, -6.36328125, -5.998779296875, -5.63427734375, -5.269775390625, -4.9052734375, -4.540771484375, -4.17626953125, -3.811767578125, -3.447265625, -3.082763671875, -2.71826171875, -2.353759765625, -1.9892578125, -1.624755859375, -1.26025390625, -0.895751953125, -0.53125, -0.166748046875, 0.19775390625, 0.562255859375, 0.9267578125, 1.291259765625, 1.65576171875, 2.020263671875, 2.384765625, 2.749267578125, 3.11376953125, 3.478271484375, 3.8427734375, 4.207275390625, 4.57177734375, 4.936279296875, 5.30078125, 5.665283203125, 6.02978515625, 6.394287109375, 6.7587890625, 7.123291015625, 7.48779296875, 7.852294921875, 8.216796875, 8.581298828125, 8.94580078125, 9.310302734375, 9.6748046875, 10.039306640625, 10.40380859375, 10.768310546875, 11.1328125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 10.0, 10.0, 21.0, 21.0, 36.0, 35.0, 55.0, 66.0, 150.0, 167.0, 252.0, 389.0, 530.0, 725.0, 1021.0, 1339.0, 1958.0, 2762.0, 4020.0, 5635.0, 7864.0, 12216.0, 18017.0, 27023.0, 42050.0, 67888.0, 119560.0, 274485.0, 195573.0, 97579.0, 57249.0, 35792.0, 23374.0, 15838.0, 10610.0, 7230.0, 5069.0, 3468.0, 2466.0, 1718.0, 1218.0, 901.0, 670.0, 450.0, 334.0, 228.0, 147.0, 100.0, 77.0, 56.0, 36.0, 30.0, 13.0, 15.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0], "bins": [-2.197265625, -2.12823486328125, -2.0592041015625, -1.99017333984375, -1.921142578125, -1.85211181640625, -1.7830810546875, -1.71405029296875, -1.64501953125, -1.57598876953125, -1.5069580078125, -1.43792724609375, -1.368896484375, -1.29986572265625, -1.2308349609375, -1.16180419921875, -1.0927734375, -1.02374267578125, -0.9547119140625, -0.88568115234375, -0.816650390625, -0.74761962890625, -0.6785888671875, -0.60955810546875, -0.54052734375, -0.47149658203125, -0.4024658203125, -0.33343505859375, -0.264404296875, -0.19537353515625, -0.1263427734375, -0.05731201171875, 0.01171875, 0.08074951171875, 0.1497802734375, 0.21881103515625, 0.287841796875, 0.35687255859375, 0.4259033203125, 0.49493408203125, 0.56396484375, 0.63299560546875, 0.7020263671875, 0.77105712890625, 0.840087890625, 0.90911865234375, 0.9781494140625, 1.04718017578125, 1.1162109375, 1.18524169921875, 1.2542724609375, 1.32330322265625, 1.392333984375, 1.46136474609375, 1.5303955078125, 1.59942626953125, 1.66845703125, 1.73748779296875, 1.8065185546875, 1.87554931640625, 1.944580078125, 2.01361083984375, 2.0826416015625, 2.15167236328125, 2.220703125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 2.0, 8.0, 2.0, 13.0, 7.0, 11.0, 7.0, 11.0, 15.0, 13.0, 19.0, 27.0, 25.0, 15.0, 27.0, 37.0, 36.0, 46.0, 39.0, 37.0, 41.0, 45.0, 1064.0, 39.0, 37.0, 48.0, 48.0, 41.0, 25.0, 34.0, 26.0, 28.0, 25.0, 22.0, 17.0, 11.0, 14.0, 8.0, 13.0, 11.0, 7.0, 8.0, 5.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0546875, -6.8380126953125, -6.621337890625, -6.4046630859375, -6.18798828125, -5.9713134765625, -5.754638671875, -5.5379638671875, -5.3212890625, -5.1046142578125, -4.887939453125, -4.6712646484375, -4.45458984375, -4.2379150390625, -4.021240234375, -3.8045654296875, -3.587890625, -3.3712158203125, -3.154541015625, -2.9378662109375, -2.72119140625, -2.5045166015625, -2.287841796875, -2.0711669921875, -1.8544921875, -1.6378173828125, -1.421142578125, -1.2044677734375, -0.98779296875, -0.7711181640625, -0.554443359375, -0.3377685546875, -0.12109375, 0.0955810546875, 0.312255859375, 0.5289306640625, 0.74560546875, 0.9622802734375, 1.178955078125, 1.3956298828125, 1.6123046875, 1.8289794921875, 2.045654296875, 2.2623291015625, 2.47900390625, 2.6956787109375, 2.912353515625, 3.1290283203125, 3.345703125, 3.5623779296875, 3.779052734375, 3.9957275390625, 4.21240234375, 4.4290771484375, 4.645751953125, 4.8624267578125, 5.0791015625, 5.2957763671875, 5.512451171875, 5.7291259765625, 5.94580078125, 6.1624755859375, 6.379150390625, 6.5958251953125, 6.8125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 10.0, 15.0, 17.0, 29.0, 45.0, 73.0, 106.0, 155.0, 237.0, 337.0, 482.0, 737.0, 1052.0, 1429.0, 2170.0, 3005.0, 4294.0, 6416.0, 8939.0, 13407.0, 20103.0, 30537.0, 49404.0, 83325.0, 157289.0, 1350381.0, 147137.0, 79104.0, 46991.0, 29394.0, 19212.0, 12876.0, 8715.0, 5895.0, 4266.0, 2912.0, 2036.0, 1449.0, 988.0, 684.0, 498.0, 306.0, 230.0, 142.0, 109.0, 67.0, 45.0, 29.0, 24.0, 14.0, 8.0, 8.0, 6.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.078125, -2.012054443359375, -1.94598388671875, -1.879913330078125, -1.8138427734375, -1.747772216796875, -1.68170166015625, -1.615631103515625, -1.549560546875, -1.483489990234375, -1.41741943359375, -1.351348876953125, -1.2852783203125, -1.219207763671875, -1.15313720703125, -1.087066650390625, -1.02099609375, -0.954925537109375, -0.88885498046875, -0.822784423828125, -0.7567138671875, -0.690643310546875, -0.62457275390625, -0.558502197265625, -0.492431640625, -0.426361083984375, -0.36029052734375, -0.294219970703125, -0.2281494140625, -0.162078857421875, -0.09600830078125, -0.029937744140625, 0.0361328125, 0.102203369140625, 0.16827392578125, 0.234344482421875, 0.3004150390625, 0.366485595703125, 0.43255615234375, 0.498626708984375, 0.564697265625, 0.630767822265625, 0.69683837890625, 0.762908935546875, 0.8289794921875, 0.895050048828125, 0.96112060546875, 1.027191162109375, 1.09326171875, 1.159332275390625, 1.22540283203125, 1.291473388671875, 1.3575439453125, 1.423614501953125, 1.48968505859375, 1.555755615234375, 1.621826171875, 1.687896728515625, 1.75396728515625, 1.820037841796875, 1.8861083984375, 1.952178955078125, 2.01824951171875, 2.084320068359375, 2.150390625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 5.0, 1.0, 3.0, 3.0, 4.0, 5.0, 4.0, 6.0, 5.0, 9.0, 11.0, 11.0, 16.0, 14.0, 22.0, 22.0, 41.0, 42.0, 38.0, 92.0, 107.0, 97.0, 98.0, 68.0, 58.0, 44.0, 25.0, 17.0, 21.0, 15.0, 16.0, 19.0, 11.0, 13.0, 6.0, 11.0, 10.0, 6.0, 5.0, 1.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0020236968994140625, -0.0019647032022476196, -0.0019057095050811768, -0.0018467158079147339, -0.001787722110748291, -0.0017287284135818481, -0.0016697347164154053, -0.0016107410192489624, -0.0015517473220825195, -0.0014927536249160767, -0.0014337599277496338, -0.001374766230583191, -0.001315772533416748, -0.0012567788362503052, -0.0011977851390838623, -0.0011387914419174194, -0.0010797977447509766, -0.0010208040475845337, -0.0009618103504180908, -0.000902816653251648, -0.0008438229560852051, -0.0007848292589187622, -0.0007258355617523193, -0.0006668418645858765, -0.0006078481674194336, -0.0005488544702529907, -0.0004898607730865479, -0.000430867075920105, -0.0003718733787536621, -0.00031287968158721924, -0.00025388598442077637, -0.0001948922872543335, -0.00013589859008789062, -7.690489292144775e-05, -1.7911195755004883e-05, 4.108250141143799e-05, 0.00010007619857788086, 0.00015906989574432373, 0.0002180635929107666, 0.00027705729007720947, 0.00033605098724365234, 0.0003950446844100952, 0.0004540383815765381, 0.000513032078742981, 0.0005720257759094238, 0.0006310194730758667, 0.0006900131702423096, 0.0007490068674087524, 0.0008080005645751953, 0.0008669942617416382, 0.0009259879589080811, 0.000984981656074524, 0.0010439753532409668, 0.0011029690504074097, 0.0011619627475738525, 0.0012209564447402954, 0.0012799501419067383, 0.0013389438390731812, 0.001397937536239624, 0.001456931233406067, 0.0015159249305725098, 0.0015749186277389526, 0.0016339123249053955, 0.0016929060220718384, 0.0017518997192382812]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 7.0, 7.0, 7.0, 10.0, 12.0, 15.0, 16.0, 15.0, 25.0, 35.0, 52.0, 66.0, 107.0, 151.0, 266.0, 727.0, 276675.0, 768805.0, 751.0, 284.0, 129.0, 101.0, 75.0, 48.0, 30.0, 26.0, 23.0, 13.0, 14.0, 14.0, 11.0, 2.0, 6.0, 2.0, 3.0, 5.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03594970703125, -0.03451347351074219, -0.033077239990234375, -0.03164100646972656, -0.03020477294921875, -0.028768539428710938, -0.027332305908203125, -0.025896072387695312, -0.0244598388671875, -0.023023605346679688, -0.021587371826171875, -0.020151138305664062, -0.01871490478515625, -0.017278671264648438, -0.015842437744140625, -0.014406204223632812, -0.012969970703125, -0.011533737182617188, -0.010097503662109375, -0.008661270141601562, -0.00722503662109375, -0.0057888031005859375, -0.004352569580078125, -0.0029163360595703125, -0.0014801025390625, -4.38690185546875e-05, 0.001392364501953125, 0.0028285980224609375, 0.00426483154296875, 0.0057010650634765625, 0.007137298583984375, 0.008573532104492188, 0.010009765625, 0.011445999145507812, 0.012882232666015625, 0.014318466186523438, 0.01575469970703125, 0.017190933227539062, 0.018627166748046875, 0.020063400268554688, 0.0214996337890625, 0.022935867309570312, 0.024372100830078125, 0.025808334350585938, 0.02724456787109375, 0.028680801391601562, 0.030117034912109375, 0.03155326843261719, 0.032989501953125, 0.03442573547363281, 0.035861968994140625, 0.03729820251464844, 0.03873443603515625, 0.04017066955566406, 0.041606903076171875, 0.04304313659667969, 0.0444793701171875, 0.04591560363769531, 0.047351837158203125, 0.04878807067871094, 0.05022430419921875, 0.05166053771972656, 0.053096771240234375, 0.05453300476074219, 0.05596923828125]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 5.0, 12.0, 16.0, 41.0, 54.0, 80.0, 111.0, 156.0, 162.0, 118.0, 104.0, 64.0, 31.0, 22.0, 17.0, 6.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007034657173790038, -0.0006776724476367235, -0.0006518791196867824, -0.0006260858499445021, -0.000600292521994561, -0.0005744992522522807, -0.0005487059243023396, -0.0005229126545600593, -0.0004971193848177791, -0.00047132608597166836, -0.00044553278712555766, -0.0004197395173832774, -0.00039394618943333626, -0.000368152919691056, -0.0003423596208449453, -0.0003165663219988346, -0.00029077299404889345, -0.00026497969520278275, -0.00023918639635667205, -0.00021339311206247658, -0.00018759981321636587, -0.00016180651437025517, -0.0001360132300760597, -0.000110219931229949, -8.44266323838383e-05, -5.86333371757064e-05, -3.284004196757451e-05, -7.04675039742142e-06, 1.8746548448689282e-05, 4.4539847294799984e-05, 7.033313158899546e-05, 9.612643043510616e-05, 0.00012191972928121686, 0.00014771302812732756, 0.00017350632697343826, 0.00019929961126763374, 0.00022509291011374444, 0.0002508861944079399, 0.0002766794932540506, 0.0003024727921001613, 0.000328266090946272, 0.0003540593897923827, 0.0003798526886384934, 0.0004056459874846041, 0.00043143925722688437, 0.0004572325851768255, 0.00048302585491910577, 0.000508819124661386, 0.0005346124526113272, 0.0005604057223536074, 0.0005861990503035486, 0.0006119923200458288, 0.00063778564799577, 0.0006635789177380502, 0.0006893721874803305, 0.0007151655154302716, 0.0007409588433802128, 0.000766752113122493, 0.0007925454410724342, 0.0008183387108147144, 0.0008441320387646556, 0.0008699253085069358, 0.0008957185782492161, 0.0009215119061991572, 0.0009473051759414375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 0.0, 2.0, 4.0, 6.0, 7.0, 10.0, 13.0, 14.0, 8.0, 18.0, 15.0, 19.0, 26.0, 26.0, 28.0, 26.0, 42.0, 34.0, 32.0, 45.0, 38.0, 44.0, 43.0, 48.0, 42.0, 32.0, 33.0, 47.0, 33.0, 35.0, 23.0, 18.0, 21.0, 24.0, 30.0, 24.0, 19.0, 18.0, 10.0, 11.0, 8.0, 8.0, 10.0, 4.0, 5.0, 5.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008897185325622559, -0.0008610868826508522, -0.0008324552327394485, -0.0008038235828280449, -0.0007751919329166412, -0.0007465602830052376, -0.0007179286330938339, -0.0006892969831824303, -0.0006606653332710266, -0.000632033683359623, -0.0006034020334482193, -0.0005747703835368156, -0.000546138733625412, -0.0005175070837140083, -0.0004888754338026047, -0.000460243783891201, -0.00043161213397979736, -0.0004029804840683937, -0.00037434883415699005, -0.0003457171842455864, -0.00031708553433418274, -0.0002884538844227791, -0.00025982223451137543, -0.00023119058459997177, -0.00020255893468856812, -0.00017392728477716446, -0.0001452956348657608, -0.00011666398495435715, -8.803233504295349e-05, -5.9400685131549835e-05, -3.076903522014618e-05, -2.137385308742523e-06, 2.6494264602661133e-05, 5.512591451406479e-05, 8.375756442546844e-05, 0.0001123892143368721, 0.00014102086424827576, 0.0001696525141596794, 0.00019828416407108307, 0.00022691581398248672, 0.0002555474638938904, 0.00028417911380529404, 0.0003128107637166977, 0.00034144241362810135, 0.000370074063539505, 0.00039870571345090866, 0.0004273373633623123, 0.000455969013273716, 0.00048460066318511963, 0.0005132323130965233, 0.0005418639630079269, 0.0005704956129193306, 0.0005991272628307343, 0.0006277589127421379, 0.0006563905626535416, 0.0006850222125649452, 0.0007136538624763489, 0.0007422855123877525, 0.0007709171622991562, 0.0007995488122105598, 0.0008281804621219635, 0.0008568121120333672, 0.0008854437619447708, 0.0009140754118561745, 0.0009427070617675781]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 4.0, 4.0, 7.0, 8.0, 7.0, 6.0, 4.0, 7.0, 10.0, 17.0, 26.0, 17.0, 24.0, 32.0, 31.0, 29.0, 35.0, 39.0, 44.0, 54.0, 42.0, 48.0, 37.0, 43.0, 36.0, 47.0, 45.0, 33.0, 23.0, 34.0, 34.0, 29.0, 27.0, 22.0, 17.0, 17.0, 16.0, 7.0, 10.0, 5.0, 9.0, 6.0, 10.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.1953125, -11.830810546875, -11.46630859375, -11.101806640625, -10.7373046875, -10.372802734375, -10.00830078125, -9.643798828125, -9.279296875, -8.914794921875, -8.55029296875, -8.185791015625, -7.8212890625, -7.456787109375, -7.09228515625, -6.727783203125, -6.36328125, -5.998779296875, -5.63427734375, -5.269775390625, -4.9052734375, -4.540771484375, -4.17626953125, -3.811767578125, -3.447265625, -3.082763671875, -2.71826171875, -2.353759765625, -1.9892578125, -1.624755859375, -1.26025390625, -0.895751953125, -0.53125, -0.166748046875, 0.19775390625, 0.562255859375, 0.9267578125, 1.291259765625, 1.65576171875, 2.020263671875, 2.384765625, 2.749267578125, 3.11376953125, 3.478271484375, 3.8427734375, 4.207275390625, 4.57177734375, 4.936279296875, 5.30078125, 5.665283203125, 6.02978515625, 6.394287109375, 6.7587890625, 7.123291015625, 7.48779296875, 7.852294921875, 8.216796875, 8.581298828125, 8.94580078125, 9.310302734375, 9.6748046875, 10.039306640625, 10.40380859375, 10.768310546875, 11.1328125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 3.0, 7.0, 13.0, 9.0, 10.0, 23.0, 21.0, 48.0, 60.0, 91.0, 121.0, 182.0, 247.0, 376.0, 630.0, 979.0, 1600.0, 3091.0, 6167.0, 14941.0, 47877.0, 231303.0, 566906.0, 122489.0, 30095.0, 10376.0, 4676.0, 2521.0, 1365.0, 810.0, 494.0, 311.0, 226.0, 137.0, 118.0, 59.0, 50.0, 40.0, 29.0, 22.0, 12.0, 7.0, 7.0, 7.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.90625, -7.6168212890625, -7.327392578125, -7.0379638671875, -6.74853515625, -6.4591064453125, -6.169677734375, -5.8802490234375, -5.5908203125, -5.3013916015625, -5.011962890625, -4.7225341796875, -4.43310546875, -4.1436767578125, -3.854248046875, -3.5648193359375, -3.275390625, -2.9859619140625, -2.696533203125, -2.4071044921875, -2.11767578125, -1.8282470703125, -1.538818359375, -1.2493896484375, -0.9599609375, -0.6705322265625, -0.381103515625, -0.0916748046875, 0.19775390625, 0.4871826171875, 0.776611328125, 1.0660400390625, 1.35546875, 1.6448974609375, 1.934326171875, 2.2237548828125, 2.51318359375, 2.8026123046875, 3.092041015625, 3.3814697265625, 3.6708984375, 3.9603271484375, 4.249755859375, 4.5391845703125, 4.82861328125, 5.1180419921875, 5.407470703125, 5.6968994140625, 5.986328125, 6.2757568359375, 6.565185546875, 6.8546142578125, 7.14404296875, 7.4334716796875, 7.722900390625, 8.0123291015625, 8.3017578125, 8.5911865234375, 8.880615234375, 9.1700439453125, 9.45947265625, 9.7489013671875, 10.038330078125, 10.3277587890625, 10.6171875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 5.0, 2.0, 5.0, 4.0, 4.0, 7.0, 17.0, 14.0, 18.0, 14.0, 24.0, 28.0, 30.0, 37.0, 34.0, 39.0, 43.0, 43.0, 76.0, 118.0, 1895.0, 130.0, 93.0, 53.0, 50.0, 38.0, 49.0, 35.0, 22.0, 18.0, 21.0, 11.0, 15.0, 10.0, 9.0, 9.0, 7.0, 6.0, 3.0, 1.0, 8.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-46.15625, -44.7373046875, -43.318359375, -41.8994140625, -40.48046875, -39.0615234375, -37.642578125, -36.2236328125, -34.8046875, -33.3857421875, -31.966796875, -30.5478515625, -29.12890625, -27.7099609375, -26.291015625, -24.8720703125, -23.453125, -22.0341796875, -20.615234375, -19.1962890625, -17.77734375, -16.3583984375, -14.939453125, -13.5205078125, -12.1015625, -10.6826171875, -9.263671875, -7.8447265625, -6.42578125, -5.0068359375, -3.587890625, -2.1689453125, -0.75, 0.6689453125, 2.087890625, 3.5068359375, 4.92578125, 6.3447265625, 7.763671875, 9.1826171875, 10.6015625, 12.0205078125, 13.439453125, 14.8583984375, 16.27734375, 17.6962890625, 19.115234375, 20.5341796875, 21.953125, 23.3720703125, 24.791015625, 26.2099609375, 27.62890625, 29.0478515625, 30.466796875, 31.8857421875, 33.3046875, 34.7236328125, 36.142578125, 37.5615234375, 38.98046875, 40.3994140625, 41.818359375, 43.2373046875, 44.65625]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 5.0, 5.0, 2.0, 6.0, 7.0, 7.0, 7.0, 7.0, 12.0, 17.0, 16.0, 28.0, 28.0, 37.0, 73.0, 85.0, 115.0, 201.0, 476.0, 1501.0, 32135.0, 3098175.0, 10666.0, 1038.0, 385.0, 208.0, 120.0, 81.0, 53.0, 48.0, 33.0, 25.0, 20.0, 18.0, 19.0, 15.0, 4.0, 7.0, 4.0, 4.0, 4.0, 5.0, 3.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-72.4375, -70.1298828125, -67.822265625, -65.5146484375, -63.20703125, -60.8994140625, -58.591796875, -56.2841796875, -53.9765625, -51.6689453125, -49.361328125, -47.0537109375, -44.74609375, -42.4384765625, -40.130859375, -37.8232421875, -35.515625, -33.2080078125, -30.900390625, -28.5927734375, -26.28515625, -23.9775390625, -21.669921875, -19.3623046875, -17.0546875, -14.7470703125, -12.439453125, -10.1318359375, -7.82421875, -5.5166015625, -3.208984375, -0.9013671875, 1.40625, 3.7138671875, 6.021484375, 8.3291015625, 10.63671875, 12.9443359375, 15.251953125, 17.5595703125, 19.8671875, 22.1748046875, 24.482421875, 26.7900390625, 29.09765625, 31.4052734375, 33.712890625, 36.0205078125, 38.328125, 40.6357421875, 42.943359375, 45.2509765625, 47.55859375, 49.8662109375, 52.173828125, 54.4814453125, 56.7890625, 59.0966796875, 61.404296875, 63.7119140625, 66.01953125, 68.3271484375, 70.634765625, 72.9423828125, 75.25]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 9.0, 604.0, 395.0, 9.0], "bins": [-481.2646484375, -473.4877624511719, -465.71087646484375, -457.9339904785156, -450.1571044921875, -442.3802185058594, -434.60333251953125, -426.826416015625, -419.049560546875, -411.2726745605469, -403.49578857421875, -395.7189025878906, -387.9420166015625, -380.1651306152344, -372.38824462890625, -364.611328125, -356.8344421386719, -349.05755615234375, -341.2806701660156, -333.5037841796875, -325.7268981933594, -317.95001220703125, -310.1731262207031, -302.396240234375, -294.61932373046875, -286.8424377441406, -279.0655517578125, -271.2886657714844, -263.51177978515625, -255.73489379882812, -247.95799255371094, -240.1811065673828, -232.4042510986328, -224.6273651123047, -216.85047912597656, -209.07359313964844, -201.29669189453125, -193.51980590820312, -185.742919921875, -177.96603393554688, -170.18914794921875, -162.41226196289062, -154.6353759765625, -146.85848999023438, -139.08160400390625, -131.30471801757812, -123.52781677246094, -115.75093078613281, -107.97404479980469, -100.19715881347656, -92.42027282714844, -84.64337921142578, -76.86649322509766, -69.08960723876953, -61.31271743774414, -53.53582763671875, -45.75893783569336, -37.98204803466797, -30.205162048339844, -22.428274154663086, -14.651386260986328, -6.874500274658203, 0.9023895263671875, 8.679279327392578, 16.456165313720703]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 7.0, 6.0, 3.0, 8.0, 6.0, 15.0, 11.0, 12.0, 26.0, 24.0, 21.0, 21.0, 20.0, 24.0, 31.0, 37.0, 34.0, 36.0, 37.0, 36.0, 41.0, 37.0, 44.0, 39.0, 30.0, 44.0, 37.0, 29.0, 32.0, 34.0, 25.0, 16.0, 28.0, 20.0, 16.0, 15.0, 20.0, 16.0, 5.0, 12.0, 6.0, 8.0, 6.0, 3.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-119.96376037597656, -116.13307189941406, -112.3023910522461, -108.4717025756836, -104.64102172851562, -100.81033325195312, -96.97965240478516, -93.14896392822266, -89.31828308105469, -85.48759460449219, -81.65691375732422, -77.82622528076172, -73.99554443359375, -70.16485595703125, -66.33417510986328, -62.50348663330078, -58.67280197143555, -54.84211730957031, -51.01143264770508, -47.180747985839844, -43.35006332397461, -39.519378662109375, -35.688690185546875, -31.858007431030273, -28.02732276916504, -24.196638107299805, -20.36595344543457, -16.535266876220703, -12.704583168029785, -8.873897552490234, -5.043212890625, -1.2125282287597656, 2.6181564331054688, 6.448841094970703, 10.279525756835938, 14.110211372375488, 17.940895080566406, 21.771581649780273, 25.602266311645508, 29.432950973510742, 33.263633728027344, 37.09431838989258, 40.92500305175781, 44.75568771362305, 48.58637237548828, 52.41706085205078, 56.24774169921875, 60.07843017578125, 63.909114837646484, 67.73979949951172, 71.57048797607422, 75.40116882324219, 79.23185729980469, 83.06253814697266, 86.89322662353516, 90.72390747070312, 94.55459594726562, 98.38528442382812, 102.2159652709961, 106.0466537475586, 109.87733459472656, 113.70802307128906, 117.53870391845703, 121.36939239501953, 125.2000732421875]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 6.0, 7.0, 9.0, 8.0, 2.0, 4.0, 10.0, 8.0, 19.0, 17.0, 26.0, 19.0, 30.0, 32.0, 29.0, 30.0, 37.0, 47.0, 47.0, 45.0, 41.0, 40.0, 42.0, 44.0, 41.0, 47.0, 30.0, 28.0, 31.0, 36.0, 27.0, 27.0, 31.0, 16.0, 18.0, 18.0, 10.0, 4.0, 9.0, 10.0, 11.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-12.3515625, -11.985595703125, -11.61962890625, -11.253662109375, -10.8876953125, -10.521728515625, -10.15576171875, -9.789794921875, -9.423828125, -9.057861328125, -8.69189453125, -8.325927734375, -7.9599609375, -7.593994140625, -7.22802734375, -6.862060546875, -6.49609375, -6.130126953125, -5.76416015625, -5.398193359375, -5.0322265625, -4.666259765625, -4.30029296875, -3.934326171875, -3.568359375, -3.202392578125, -2.83642578125, -2.470458984375, -2.1044921875, -1.738525390625, -1.37255859375, -1.006591796875, -0.640625, -0.274658203125, 0.09130859375, 0.457275390625, 0.8232421875, 1.189208984375, 1.55517578125, 1.921142578125, 2.287109375, 2.653076171875, 3.01904296875, 3.385009765625, 3.7509765625, 4.116943359375, 4.48291015625, 4.848876953125, 5.21484375, 5.580810546875, 5.94677734375, 6.312744140625, 6.6787109375, 7.044677734375, 7.41064453125, 7.776611328125, 8.142578125, 8.508544921875, 8.87451171875, 9.240478515625, 9.6064453125, 9.972412109375, 10.33837890625, 10.704345703125, 11.0703125]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 3.0, 8.0, 7.0, 13.0, 13.0, 25.0, 27.0, 35.0, 51.0, 85.0, 135.0, 172.0, 427.0, 1019.0, 2713.0, 10280.0, 56597.0, 487455.0, 2286492.0, 1174818.0, 144445.0, 21882.0, 4752.0, 1499.0, 569.0, 260.0, 152.0, 102.0, 55.0, 43.0, 33.0, 31.0, 22.0, 20.0, 10.0, 12.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-23.25, -22.51708984375, -21.7841796875, -21.05126953125, -20.318359375, -19.58544921875, -18.8525390625, -18.11962890625, -17.38671875, -16.65380859375, -15.9208984375, -15.18798828125, -14.455078125, -13.72216796875, -12.9892578125, -12.25634765625, -11.5234375, -10.79052734375, -10.0576171875, -9.32470703125, -8.591796875, -7.85888671875, -7.1259765625, -6.39306640625, -5.66015625, -4.92724609375, -4.1943359375, -3.46142578125, -2.728515625, -1.99560546875, -1.2626953125, -0.52978515625, 0.203125, 0.93603515625, 1.6689453125, 2.40185546875, 3.134765625, 3.86767578125, 4.6005859375, 5.33349609375, 6.06640625, 6.79931640625, 7.5322265625, 8.26513671875, 8.998046875, 9.73095703125, 10.4638671875, 11.19677734375, 11.9296875, 12.66259765625, 13.3955078125, 14.12841796875, 14.861328125, 15.59423828125, 16.3271484375, 17.06005859375, 17.79296875, 18.52587890625, 19.2587890625, 19.99169921875, 20.724609375, 21.45751953125, 22.1904296875, 22.92333984375, 23.65625]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 5.0, 5.0, 6.0, 13.0, 18.0, 20.0, 28.0, 33.0, 38.0, 54.0, 85.0, 116.0, 151.0, 221.0, 290.0, 411.0, 574.0, 501.0, 415.0, 296.0, 234.0, 164.0, 88.0, 86.0, 58.0, 36.0, 27.0, 25.0, 22.0, 14.0, 13.0, 11.0, 5.0, 1.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-36.34375, -35.1728515625, -34.001953125, -32.8310546875, -31.66015625, -30.4892578125, -29.318359375, -28.1474609375, -26.9765625, -25.8056640625, -24.634765625, -23.4638671875, -22.29296875, -21.1220703125, -19.951171875, -18.7802734375, -17.609375, -16.4384765625, -15.267578125, -14.0966796875, -12.92578125, -11.7548828125, -10.583984375, -9.4130859375, -8.2421875, -7.0712890625, -5.900390625, -4.7294921875, -3.55859375, -2.3876953125, -1.216796875, -0.0458984375, 1.125, 2.2958984375, 3.466796875, 4.6376953125, 5.80859375, 6.9794921875, 8.150390625, 9.3212890625, 10.4921875, 11.6630859375, 12.833984375, 14.0048828125, 15.17578125, 16.3466796875, 17.517578125, 18.6884765625, 19.859375, 21.0302734375, 22.201171875, 23.3720703125, 24.54296875, 25.7138671875, 26.884765625, 28.0556640625, 29.2265625, 30.3974609375, 31.568359375, 32.7392578125, 33.91015625, 35.0810546875, 36.251953125, 37.4228515625, 38.59375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 4.0, 3.0, 3.0, 15.0, 14.0, 19.0, 21.0, 41.0, 33.0, 57.0, 84.0, 116.0, 192.0, 351.0, 823.0, 12770.0, 4159892.0, 17946.0, 910.0, 355.0, 182.0, 151.0, 92.0, 50.0, 41.0, 34.0, 28.0, 18.0, 11.0, 16.0, 7.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-195.875, -189.662109375, -183.44921875, -177.236328125, -171.0234375, -164.810546875, -158.59765625, -152.384765625, -146.171875, -139.958984375, -133.74609375, -127.533203125, -121.3203125, -115.107421875, -108.89453125, -102.681640625, -96.46875, -90.255859375, -84.04296875, -77.830078125, -71.6171875, -65.404296875, -59.19140625, -52.978515625, -46.765625, -40.552734375, -34.33984375, -28.126953125, -21.9140625, -15.701171875, -9.48828125, -3.275390625, 2.9375, 9.150390625, 15.36328125, 21.576171875, 27.7890625, 34.001953125, 40.21484375, 46.427734375, 52.640625, 58.853515625, 65.06640625, 71.279296875, 77.4921875, 83.705078125, 89.91796875, 96.130859375, 102.34375, 108.556640625, 114.76953125, 120.982421875, 127.1953125, 133.408203125, 139.62109375, 145.833984375, 152.046875, 158.259765625, 164.47265625, 170.685546875, 176.8984375, 183.111328125, 189.32421875, 195.537109375, 201.75]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 16.0, 82.0, 247.0, 392.0, 223.0, 42.0, 12.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.6908721923828, -147.70152282714844, -136.712158203125, -125.72280883789062, -114.73344421386719, -103.74409484863281, -92.7547378540039, -81.765380859375, -70.7760238647461, -59.78666687011719, -48.79730987548828, -37.80795669555664, -26.818599700927734, -15.829242706298828, -4.8398895263671875, 6.149467468261719, 17.138824462890625, 28.12818145751953, 39.11753845214844, 50.10689163208008, 61.096248626708984, 72.08560180664062, 83.07495880126953, 94.06431579589844, 105.05367279052734, 116.04302978515625, 127.03238677978516, 138.02174377441406, 149.01109313964844, 160.00045776367188, 170.98980712890625, 181.97915649414062, 192.96853637695312, 203.9578857421875, 214.94725036621094, 225.9365997314453, 236.92596435546875, 247.91531372070312, 258.9046630859375, 269.89404296875, 280.8833923339844, 291.87274169921875, 302.8620910644531, 313.8514709472656, 324.8408203125, 335.8301696777344, 346.81951904296875, 357.80889892578125, 368.7982177734375, 379.7875671386719, 390.77691650390625, 401.76629638671875, 412.7556457519531, 423.7449951171875, 434.7343444824219, 445.72369384765625, 456.71307373046875, 467.7024230957031, 478.6917724609375, 489.68115234375, 500.6705017089844, 511.65985107421875, 522.6492309570312, 533.6385498046875, 544.6279296875]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 10.0, 11.0, 11.0, 10.0, 9.0, 17.0, 13.0, 25.0, 12.0, 29.0, 33.0, 25.0, 37.0, 24.0, 35.0, 33.0, 37.0, 41.0, 30.0, 17.0, 38.0, 52.0, 46.0, 35.0, 34.0, 32.0, 35.0, 24.0, 25.0, 31.0, 22.0, 17.0, 30.0, 15.0, 19.0, 14.0, 16.0, 5.0, 9.0, 6.0, 8.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-114.02655029296875, -110.62129974365234, -107.21604919433594, -103.81079864501953, -100.40554809570312, -97.00029754638672, -93.59504699707031, -90.1897964477539, -86.7845458984375, -83.3792953491211, -79.97404479980469, -76.56879425048828, -73.16354370117188, -69.75829315185547, -66.35304260253906, -62.947792053222656, -59.542537689208984, -56.13728713989258, -52.73203659057617, -49.326786041259766, -45.92153549194336, -42.51628112792969, -39.11103057861328, -35.705780029296875, -32.30052947998047, -28.895278930664062, -25.490028381347656, -22.08477783203125, -18.679527282714844, -15.274274826049805, -11.869024276733398, -8.463773727416992, -5.058525085449219, -1.6532742977142334, 1.751976490020752, 5.157227516174316, 8.562478065490723, 11.967729568481445, 15.372980117797852, 18.778230667114258, 22.183481216430664, 25.58873176574707, 28.993982315063477, 32.399234771728516, 35.80448532104492, 39.20973587036133, 42.614986419677734, 46.02023696899414, 49.42548751831055, 52.83073806762695, 56.23598861694336, 59.641239166259766, 63.04648971557617, 66.45174407958984, 69.85699462890625, 73.26224517822266, 76.66749572753906, 80.07274627685547, 83.47799682617188, 86.88324737548828, 90.28849792480469, 93.6937484741211, 97.0989990234375, 100.5042495727539, 103.90950012207031]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 8.0, 7.0, 9.0, 11.0, 8.0, 8.0, 10.0, 13.0, 13.0, 18.0, 20.0, 29.0, 25.0, 28.0, 31.0, 39.0, 39.0, 31.0, 47.0, 40.0, 51.0, 28.0, 45.0, 44.0, 43.0, 43.0, 39.0, 42.0, 26.0, 25.0, 23.0, 32.0, 23.0, 19.0, 22.0, 7.0, 11.0, 13.0, 8.0, 4.0, 2.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.578125, -12.21240234375, -11.8466796875, -11.48095703125, -11.115234375, -10.74951171875, -10.3837890625, -10.01806640625, -9.65234375, -9.28662109375, -8.9208984375, -8.55517578125, -8.189453125, -7.82373046875, -7.4580078125, -7.09228515625, -6.7265625, -6.36083984375, -5.9951171875, -5.62939453125, -5.263671875, -4.89794921875, -4.5322265625, -4.16650390625, -3.80078125, -3.43505859375, -3.0693359375, -2.70361328125, -2.337890625, -1.97216796875, -1.6064453125, -1.24072265625, -0.875, -0.50927734375, -0.1435546875, 0.22216796875, 0.587890625, 0.95361328125, 1.3193359375, 1.68505859375, 2.05078125, 2.41650390625, 2.7822265625, 3.14794921875, 3.513671875, 3.87939453125, 4.2451171875, 4.61083984375, 4.9765625, 5.34228515625, 5.7080078125, 6.07373046875, 6.439453125, 6.80517578125, 7.1708984375, 7.53662109375, 7.90234375, 8.26806640625, 8.6337890625, 8.99951171875, 9.365234375, 9.73095703125, 10.0966796875, 10.46240234375, 10.828125]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 5.0, 9.0, 10.0, 17.0, 29.0, 47.0, 59.0, 82.0, 113.0, 202.0, 224.0, 364.0, 600.0, 871.0, 1433.0, 2236.0, 3568.0, 5732.0, 9615.0, 16138.0, 28619.0, 52728.0, 106322.0, 284059.0, 300302.0, 109349.0, 54123.0, 29342.0, 16631.0, 9790.0, 5818.0, 3658.0, 2271.0, 1422.0, 891.0, 620.0, 413.0, 288.0, 176.0, 107.0, 70.0, 63.0, 40.0, 30.0, 22.0, 18.0, 11.0, 9.0, 4.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-3.318359375, -3.217864990234375, -3.11737060546875, -3.016876220703125, -2.9163818359375, -2.815887451171875, -2.71539306640625, -2.614898681640625, -2.514404296875, -2.413909912109375, -2.31341552734375, -2.212921142578125, -2.1124267578125, -2.011932373046875, -1.91143798828125, -1.810943603515625, -1.71044921875, -1.609954833984375, -1.50946044921875, -1.408966064453125, -1.3084716796875, -1.207977294921875, -1.10748291015625, -1.006988525390625, -0.906494140625, -0.805999755859375, -0.70550537109375, -0.605010986328125, -0.5045166015625, -0.404022216796875, -0.30352783203125, -0.203033447265625, -0.1025390625, -0.002044677734375, 0.09844970703125, 0.198944091796875, 0.2994384765625, 0.399932861328125, 0.50042724609375, 0.600921630859375, 0.701416015625, 0.801910400390625, 0.90240478515625, 1.002899169921875, 1.1033935546875, 1.203887939453125, 1.30438232421875, 1.404876708984375, 1.50537109375, 1.605865478515625, 1.70635986328125, 1.806854248046875, 1.9073486328125, 2.007843017578125, 2.10833740234375, 2.208831787109375, 2.309326171875, 2.409820556640625, 2.51031494140625, 2.610809326171875, 2.7113037109375, 2.811798095703125, 2.91229248046875, 3.012786865234375, 3.11328125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 5.0, 5.0, 7.0, 9.0, 12.0, 11.0, 15.0, 20.0, 21.0, 19.0, 31.0, 28.0, 28.0, 22.0, 38.0, 29.0, 37.0, 31.0, 41.0, 43.0, 45.0, 1058.0, 58.0, 36.0, 43.0, 49.0, 35.0, 38.0, 33.0, 22.0, 20.0, 21.0, 21.0, 11.0, 17.0, 15.0, 12.0, 6.0, 9.0, 9.0, 4.0, 7.0, 4.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.55859375, -7.31561279296875, -7.0726318359375, -6.82965087890625, -6.586669921875, -6.34368896484375, -6.1007080078125, -5.85772705078125, -5.61474609375, -5.37176513671875, -5.1287841796875, -4.88580322265625, -4.642822265625, -4.39984130859375, -4.1568603515625, -3.91387939453125, -3.6708984375, -3.42791748046875, -3.1849365234375, -2.94195556640625, -2.698974609375, -2.45599365234375, -2.2130126953125, -1.97003173828125, -1.72705078125, -1.48406982421875, -1.2410888671875, -0.99810791015625, -0.755126953125, -0.51214599609375, -0.2691650390625, -0.02618408203125, 0.216796875, 0.45977783203125, 0.7027587890625, 0.94573974609375, 1.188720703125, 1.43170166015625, 1.6746826171875, 1.91766357421875, 2.16064453125, 2.40362548828125, 2.6466064453125, 2.88958740234375, 3.132568359375, 3.37554931640625, 3.6185302734375, 3.86151123046875, 4.1044921875, 4.34747314453125, 4.5904541015625, 4.83343505859375, 5.076416015625, 5.31939697265625, 5.5623779296875, 5.80535888671875, 6.04833984375, 6.29132080078125, 6.5343017578125, 6.77728271484375, 7.020263671875, 7.26324462890625, 7.5062255859375, 7.74920654296875, 7.9921875]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 5.0, 11.0, 15.0, 20.0, 39.0, 55.0, 69.0, 111.0, 160.0, 262.0, 321.0, 533.0, 742.0, 1088.0, 1592.0, 2388.0, 3454.0, 4973.0, 7664.0, 10928.0, 16437.0, 24942.0, 39085.0, 63000.0, 109216.0, 1300108.0, 233357.0, 105089.0, 60602.0, 37488.0, 24098.0, 15790.0, 10690.0, 7187.0, 5023.0, 3367.0, 2271.0, 1593.0, 1071.0, 722.0, 523.0, 353.0, 217.0, 141.0, 109.0, 75.0, 49.0, 29.0, 30.0, 18.0, 11.0, 8.0, 2.0, 5.0, 3.0, 0.0, 1.0], "bins": [-2.4375, -2.363555908203125, -2.28961181640625, -2.215667724609375, -2.1417236328125, -2.067779541015625, -1.99383544921875, -1.919891357421875, -1.845947265625, -1.772003173828125, -1.69805908203125, -1.624114990234375, -1.5501708984375, -1.476226806640625, -1.40228271484375, -1.328338623046875, -1.25439453125, -1.180450439453125, -1.10650634765625, -1.032562255859375, -0.9586181640625, -0.884674072265625, -0.81072998046875, -0.736785888671875, -0.662841796875, -0.588897705078125, -0.51495361328125, -0.441009521484375, -0.3670654296875, -0.293121337890625, -0.21917724609375, -0.145233154296875, -0.0712890625, 0.002655029296875, 0.07659912109375, 0.150543212890625, 0.2244873046875, 0.298431396484375, 0.37237548828125, 0.446319580078125, 0.520263671875, 0.594207763671875, 0.66815185546875, 0.742095947265625, 0.8160400390625, 0.889984130859375, 0.96392822265625, 1.037872314453125, 1.11181640625, 1.185760498046875, 1.25970458984375, 1.333648681640625, 1.4075927734375, 1.481536865234375, 1.55548095703125, 1.629425048828125, 1.703369140625, 1.777313232421875, 1.85125732421875, 1.925201416015625, 1.9991455078125, 2.073089599609375, 2.14703369140625, 2.220977783203125, 2.294921875]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 0.0, 6.0, 8.0, 3.0, 5.0, 9.0, 13.0, 19.0, 15.0, 18.0, 37.0, 50.0, 51.0, 58.0, 86.0, 89.0, 74.0, 116.0, 64.0, 57.0, 56.0, 37.0, 30.0, 19.0, 19.0, 23.0, 13.0, 4.0, 7.0, 9.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0012998580932617188, -0.001256793737411499, -0.0012137293815612793, -0.0011706650257110596, -0.0011276006698608398, -0.0010845363140106201, -0.0010414719581604004, -0.0009984076023101807, -0.0009553432464599609, -0.0009122788906097412, -0.0008692145347595215, -0.0008261501789093018, -0.000783085823059082, -0.0007400214672088623, -0.0006969571113586426, -0.0006538927555084229, -0.0006108283996582031, -0.0005677640438079834, -0.0005246996879577637, -0.00048163533210754395, -0.0004385709762573242, -0.0003955066204071045, -0.00035244226455688477, -0.00030937790870666504, -0.0002663135528564453, -0.00022324919700622559, -0.00018018484115600586, -0.00013712048530578613, -9.40561294555664e-05, -5.099177360534668e-05, -7.927417755126953e-06, 3.5136938095092773e-05, 7.82012939453125e-05, 0.00012126564979553223, 0.00016433000564575195, 0.00020739436149597168, 0.0002504587173461914, 0.00029352307319641113, 0.00033658742904663086, 0.0003796517848968506, 0.0004227161407470703, 0.00046578049659729004, 0.0005088448524475098, 0.0005519092082977295, 0.0005949735641479492, 0.0006380379199981689, 0.0006811022758483887, 0.0007241666316986084, 0.0007672309875488281, 0.0008102953433990479, 0.0008533596992492676, 0.0008964240550994873, 0.000939488410949707, 0.0009825527667999268, 0.0010256171226501465, 0.0010686814785003662, 0.001111745834350586, 0.0011548101902008057, 0.0011978745460510254, 0.0012409389019012451, 0.0012840032577514648, 0.0013270676136016846, 0.0013701319694519043, 0.001413196325302124, 0.0014562606811523438]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 5.0, 0.0, 0.0, 4.0, 6.0, 3.0, 4.0, 12.0, 8.0, 10.0, 30.0, 28.0, 21.0, 61.0, 106.0, 121.0, 209.0, 336.0, 837.0, 83893.0, 960139.0, 1526.0, 460.0, 266.0, 153.0, 107.0, 60.0, 36.0, 30.0, 31.0, 15.0, 10.0, 13.0, 9.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.034210205078125, -0.03317832946777344, -0.032146453857421875, -0.031114578247070312, -0.03008270263671875, -0.029050827026367188, -0.028018951416015625, -0.026987075805664062, -0.0259552001953125, -0.024923324584960938, -0.023891448974609375, -0.022859573364257812, -0.02182769775390625, -0.020795822143554688, -0.019763946533203125, -0.018732070922851562, -0.0177001953125, -0.016668319702148438, -0.015636444091796875, -0.014604568481445312, -0.01357269287109375, -0.012540817260742188, -0.011508941650390625, -0.010477066040039062, -0.0094451904296875, -0.008413314819335938, -0.007381439208984375, -0.0063495635986328125, -0.00531768798828125, -0.0042858123779296875, -0.003253936767578125, -0.0022220611572265625, -0.001190185546875, -0.0001583099365234375, 0.000873565673828125, 0.0019054412841796875, 0.00293731689453125, 0.0039691925048828125, 0.005001068115234375, 0.0060329437255859375, 0.0070648193359375, 0.008096694946289062, 0.009128570556640625, 0.010160446166992188, 0.01119232177734375, 0.012224197387695312, 0.013256072998046875, 0.014287948608398438, 0.01531982421875, 0.016351699829101562, 0.017383575439453125, 0.018415451049804688, 0.01944732666015625, 0.020479202270507812, 0.021511077880859375, 0.022542953491210938, 0.0235748291015625, 0.024606704711914062, 0.025638580322265625, 0.026670455932617188, 0.02770233154296875, 0.028734207153320312, 0.029766082763671875, 0.030797958374023438, 0.031829833984375]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 28.0, 89.0, 241.0, 313.0, 221.0, 74.0, 30.0, 7.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002491489052772522, -0.0024327789433300495, -0.002374068833887577, -0.0023153589572757483, -0.002256648847833276, -0.0021979387383908033, -0.0021392288617789745, -0.002080518752336502, -0.0020218086428940296, -0.001963098533451557, -0.0019043885404244065, -0.001845678547397256, -0.0017869684379547834, -0.001728258328512311, -0.0016695483354851604, -0.0016108383424580097, -0.0015521282330155373, -0.0014934181235730648, -0.0014347081305459142, -0.0013759981375187635, -0.001317288028076291, -0.0012585779186338186, -0.001199867925606668, -0.0011411579325795174, -0.001082447823137045, -0.0010237377136945724, -0.0009650277206674218, -0.0009063176694326103, -0.0008476076181977987, -0.0007888975669629872, -0.0007301875157281756, -0.0006714774644933641, -0.0006127674132585526, -0.000554057362023741, -0.0004953473107889295, -0.0004366372595541179, -0.0003779272083193064, -0.00031921715708449483, -0.0002605071058496833, -0.00020179705461487174, -0.0001430870033800602, -8.437695214524865e-05, -2.5666900910437107e-05, 3.304315032437444e-05, 9.175320155918598e-05, 0.00015046325279399753, 0.00020917330402880907, 0.0002678833552636206, 0.00032659340649843216, 0.0003853034577332437, 0.00044401350896805525, 0.0005027235602028668, 0.0005614336114376783, 0.0006201436626724899, 0.0006788537139073014, 0.000737563765142113, 0.0007962738163769245, 0.0008549838676117361, 0.0009136939188465476, 0.0009724039700813591, 0.0010311140213161707, 0.0010898241307586432, 0.0011485341237857938, 0.0012072441168129444, 0.0012659542262554169]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 4.0, 5.0, 1.0, 3.0, 7.0, 7.0, 10.0, 6.0, 15.0, 7.0, 6.0, 16.0, 20.0, 23.0, 19.0, 24.0, 21.0, 34.0, 19.0, 37.0, 43.0, 38.0, 39.0, 32.0, 54.0, 37.0, 43.0, 29.0, 33.0, 31.0, 32.0, 26.0, 25.0, 32.0, 24.0, 26.0, 21.0, 25.0, 15.0, 21.0, 10.0, 11.0, 12.0, 15.0, 14.0, 9.0, 2.0, 6.0, 5.0, 4.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00041806697845458984, -0.00040322355926036835, -0.00038838014006614685, -0.00037353672087192535, -0.00035869330167770386, -0.00034384988248348236, -0.00032900646328926086, -0.00031416304409503937, -0.00029931962490081787, -0.0002844762057065964, -0.0002696327865123749, -0.0002547893673181534, -0.00023994594812393188, -0.0002251025289297104, -0.0002102591097354889, -0.0001954156905412674, -0.0001805722713470459, -0.0001657288521528244, -0.0001508854329586029, -0.0001360420137643814, -0.00012119859457015991, -0.00010635517537593842, -9.151175618171692e-05, -7.666833698749542e-05, -6.182491779327393e-05, -4.698149859905243e-05, -3.213807940483093e-05, -1.7294660210609436e-05, -2.4512410163879395e-06, 1.2392178177833557e-05, 2.7235597372055054e-05, 4.207901656627655e-05, 5.692243576049805e-05, 7.176585495471954e-05, 8.660927414894104e-05, 0.00010145269334316254, 0.00011629611253738403, 0.00013113953173160553, 0.00014598295092582703, 0.00016082637012004852, 0.00017566978931427002, 0.00019051320850849152, 0.000205356627702713, 0.0002202000468969345, 0.000235043466091156, 0.0002498868852853775, 0.000264730304479599, 0.0002795737236738205, 0.000294417142868042, 0.0003092605620622635, 0.000324103981256485, 0.0003389474004507065, 0.000353790819644928, 0.0003686342388391495, 0.00038347765803337097, 0.00039832107722759247, 0.00041316449642181396, 0.00042800791561603546, 0.00044285133481025696, 0.00045769475400447845, 0.00047253817319869995, 0.00048738159239292145, 0.0005022250115871429, 0.0005170684307813644, 0.0005319118499755859]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 1.0, 8.0, 7.0, 9.0, 11.0, 8.0, 8.0, 10.0, 13.0, 13.0, 18.0, 20.0, 29.0, 25.0, 28.0, 31.0, 39.0, 39.0, 31.0, 47.0, 40.0, 51.0, 28.0, 45.0, 44.0, 43.0, 43.0, 39.0, 42.0, 26.0, 25.0, 23.0, 32.0, 23.0, 19.0, 22.0, 7.0, 11.0, 13.0, 8.0, 4.0, 2.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-12.578125, -12.21240234375, -11.8466796875, -11.48095703125, -11.115234375, -10.74951171875, -10.3837890625, -10.01806640625, -9.65234375, -9.28662109375, -8.9208984375, -8.55517578125, -8.189453125, -7.82373046875, -7.4580078125, -7.09228515625, -6.7265625, -6.36083984375, -5.9951171875, -5.62939453125, -5.263671875, -4.89794921875, -4.5322265625, -4.16650390625, -3.80078125, -3.43505859375, -3.0693359375, -2.70361328125, -2.337890625, -1.97216796875, -1.6064453125, -1.24072265625, -0.875, -0.50927734375, -0.1435546875, 0.22216796875, 0.587890625, 0.95361328125, 1.3193359375, 1.68505859375, 2.05078125, 2.41650390625, 2.7822265625, 3.14794921875, 3.513671875, 3.87939453125, 4.2451171875, 4.61083984375, 4.9765625, 5.34228515625, 5.7080078125, 6.07373046875, 6.439453125, 6.80517578125, 7.1708984375, 7.53662109375, 7.90234375, 8.26806640625, 8.6337890625, 8.99951171875, 9.365234375, 9.73095703125, 10.0966796875, 10.46240234375, 10.828125]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 7.0, 6.0, 10.0, 12.0, 15.0, 20.0, 37.0, 35.0, 63.0, 121.0, 170.0, 293.0, 464.0, 720.0, 1243.0, 2184.0, 4110.0, 8390.0, 19490.0, 55024.0, 186239.0, 444570.0, 220201.0, 63489.0, 22007.0, 9329.0, 4446.0, 2377.0, 1365.0, 773.0, 492.0, 306.0, 205.0, 110.0, 86.0, 45.0, 34.0, 23.0, 13.0, 9.0, 5.0, 5.0, 2.0, 5.0, 5.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-7.81640625, -7.59027099609375, -7.3641357421875, -7.13800048828125, -6.911865234375, -6.68572998046875, -6.4595947265625, -6.23345947265625, -6.00732421875, -5.78118896484375, -5.5550537109375, -5.32891845703125, -5.102783203125, -4.87664794921875, -4.6505126953125, -4.42437744140625, -4.1982421875, -3.97210693359375, -3.7459716796875, -3.51983642578125, -3.293701171875, -3.06756591796875, -2.8414306640625, -2.61529541015625, -2.38916015625, -2.16302490234375, -1.9368896484375, -1.71075439453125, -1.484619140625, -1.25848388671875, -1.0323486328125, -0.80621337890625, -0.580078125, -0.35394287109375, -0.1278076171875, 0.09832763671875, 0.324462890625, 0.55059814453125, 0.7767333984375, 1.00286865234375, 1.22900390625, 1.45513916015625, 1.6812744140625, 1.90740966796875, 2.133544921875, 2.35968017578125, 2.5858154296875, 2.81195068359375, 3.0380859375, 3.26422119140625, 3.4903564453125, 3.71649169921875, 3.942626953125, 4.16876220703125, 4.3948974609375, 4.62103271484375, 4.84716796875, 5.07330322265625, 5.2994384765625, 5.52557373046875, 5.751708984375, 5.97784423828125, 6.2039794921875, 6.43011474609375, 6.65625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 3.0, 6.0, 3.0, 7.0, 8.0, 18.0, 13.0, 19.0, 22.0, 24.0, 22.0, 26.0, 39.0, 26.0, 34.0, 41.0, 41.0, 44.0, 66.0, 270.0, 1764.0, 122.0, 50.0, 48.0, 50.0, 41.0, 38.0, 29.0, 29.0, 28.0, 16.0, 18.0, 17.0, 16.0, 8.0, 14.0, 5.0, 6.0, 3.0, 4.0, 6.0, 3.0, 2.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.4375, -41.03564453125, -39.6337890625, -38.23193359375, -36.830078125, -35.42822265625, -34.0263671875, -32.62451171875, -31.22265625, -29.82080078125, -28.4189453125, -27.01708984375, -25.615234375, -24.21337890625, -22.8115234375, -21.40966796875, -20.0078125, -18.60595703125, -17.2041015625, -15.80224609375, -14.400390625, -12.99853515625, -11.5966796875, -10.19482421875, -8.79296875, -7.39111328125, -5.9892578125, -4.58740234375, -3.185546875, -1.78369140625, -0.3818359375, 1.02001953125, 2.421875, 3.82373046875, 5.2255859375, 6.62744140625, 8.029296875, 9.43115234375, 10.8330078125, 12.23486328125, 13.63671875, 15.03857421875, 16.4404296875, 17.84228515625, 19.244140625, 20.64599609375, 22.0478515625, 23.44970703125, 24.8515625, 26.25341796875, 27.6552734375, 29.05712890625, 30.458984375, 31.86083984375, 33.2626953125, 34.66455078125, 36.06640625, 37.46826171875, 38.8701171875, 40.27197265625, 41.673828125, 43.07568359375, 44.4775390625, 45.87939453125, 47.28125]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 5.0, 4.0, 6.0, 6.0, 10.0, 13.0, 16.0, 17.0, 17.0, 29.0, 28.0, 47.0, 57.0, 86.0, 115.0, 187.0, 329.0, 815.0, 6278.0, 3091448.0, 43652.0, 1317.0, 403.0, 244.0, 167.0, 100.0, 56.0, 55.0, 30.0, 25.0, 30.0, 22.0, 21.0, 17.0, 15.0, 5.0, 6.0, 9.0, 3.0, 3.0, 5.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-76.1875, -73.8564453125, -71.525390625, -69.1943359375, -66.86328125, -64.5322265625, -62.201171875, -59.8701171875, -57.5390625, -55.2080078125, -52.876953125, -50.5458984375, -48.21484375, -45.8837890625, -43.552734375, -41.2216796875, -38.890625, -36.5595703125, -34.228515625, -31.8974609375, -29.56640625, -27.2353515625, -24.904296875, -22.5732421875, -20.2421875, -17.9111328125, -15.580078125, -13.2490234375, -10.91796875, -8.5869140625, -6.255859375, -3.9248046875, -1.59375, 0.7373046875, 3.068359375, 5.3994140625, 7.73046875, 10.0615234375, 12.392578125, 14.7236328125, 17.0546875, 19.3857421875, 21.716796875, 24.0478515625, 26.37890625, 28.7099609375, 31.041015625, 33.3720703125, 35.703125, 38.0341796875, 40.365234375, 42.6962890625, 45.02734375, 47.3583984375, 49.689453125, 52.0205078125, 54.3515625, 56.6826171875, 59.013671875, 61.3447265625, 63.67578125, 66.0068359375, 68.337890625, 70.6689453125, 73.0]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 10.0, 52.0, 222.0, 443.0, 219.0, 56.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-101.6822280883789, -98.4548568725586, -95.22748565673828, -92.00011444091797, -88.77274322509766, -85.54537200927734, -82.31800079345703, -79.09062957763672, -75.8632583618164, -72.6358871459961, -69.40851593017578, -66.18114471435547, -62.953773498535156, -59.726402282714844, -56.49903106689453, -53.27165985107422, -50.044288635253906, -46.816917419433594, -43.58954620361328, -40.36217498779297, -37.134803771972656, -33.907432556152344, -30.68006134033203, -27.45269012451172, -24.225318908691406, -20.997947692871094, -17.77057647705078, -14.543205261230469, -11.315834045410156, -8.088462829589844, -4.861091613769531, -1.6337203979492188, 1.5936508178710938, 4.821022033691406, 8.048393249511719, 11.275764465332031, 14.503135681152344, 17.730506896972656, 20.95787811279297, 24.18524932861328, 27.412620544433594, 30.639991760253906, 33.86736297607422, 37.09473419189453, 40.322105407714844, 43.549476623535156, 46.77684783935547, 50.00421905517578, 53.231590270996094, 56.458961486816406, 59.68633270263672, 62.91370391845703, 66.14107513427734, 69.36844635009766, 72.59581756591797, 75.82318878173828, 79.0505599975586, 82.2779312133789, 85.50530242919922, 88.73267364501953, 91.96004486083984, 95.18741607666016, 98.41478729248047, 101.64215850830078, 104.8695297241211]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 4.0, 2.0, 3.0, 11.0, 6.0, 4.0, 5.0, 15.0, 12.0, 18.0, 16.0, 26.0, 24.0, 36.0, 30.0, 40.0, 36.0, 44.0, 43.0, 36.0, 39.0, 49.0, 53.0, 43.0, 54.0, 49.0, 42.0, 32.0, 30.0, 27.0, 20.0, 34.0, 29.0, 20.0, 11.0, 9.0, 14.0, 12.0, 8.0, 5.0, 3.0, 3.0, 5.0, 0.0, 0.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-153.2041473388672, -148.4302520751953, -143.65635681152344, -138.88246154785156, -134.1085662841797, -129.3346710205078, -124.56077575683594, -119.78688049316406, -115.01298522949219, -110.23908996582031, -105.46519470214844, -100.69129943847656, -95.91740417480469, -91.14350891113281, -86.36961364746094, -81.59571838378906, -76.82182312011719, -72.04792785644531, -67.27403259277344, -62.50013732910156, -57.72624206542969, -52.95234680175781, -48.17845153808594, -43.40455627441406, -38.63066101074219, -33.85676574707031, -29.082870483398438, -24.308975219726562, -19.535079956054688, -14.761184692382812, -9.987289428710938, -5.2133941650390625, -0.43951416015625, 4.334381103515625, 9.1082763671875, 13.882171630859375, 18.65606689453125, 23.429962158203125, 28.203857421875, 32.977752685546875, 37.75164794921875, 42.525543212890625, 47.2994384765625, 52.073333740234375, 56.84722900390625, 61.621124267578125, 66.39501953125, 71.16891479492188, 75.94281005859375, 80.71670532226562, 85.4906005859375, 90.26449584960938, 95.03839111328125, 99.81228637695312, 104.586181640625, 109.36007690429688, 114.13397216796875, 118.90786743164062, 123.6817626953125, 128.45565795898438, 133.22955322265625, 138.00344848632812, 142.77734375, 147.55123901367188, 152.32513427734375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 0.0, 1.0, 10.0, 3.0, 8.0, 7.0, 15.0, 8.0, 6.0, 12.0, 12.0, 14.0, 15.0, 22.0, 35.0, 31.0, 24.0, 32.0, 31.0, 37.0, 34.0, 39.0, 42.0, 40.0, 42.0, 48.0, 43.0, 38.0, 34.0, 41.0, 41.0, 22.0, 25.0, 29.0, 19.0, 27.0, 23.0, 20.0, 14.0, 11.0, 9.0, 6.0, 9.0, 3.0, 3.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-12.234375, -11.8782958984375, -11.522216796875, -11.1661376953125, -10.81005859375, -10.4539794921875, -10.097900390625, -9.7418212890625, -9.3857421875, -9.0296630859375, -8.673583984375, -8.3175048828125, -7.96142578125, -7.6053466796875, -7.249267578125, -6.8931884765625, -6.537109375, -6.1810302734375, -5.824951171875, -5.4688720703125, -5.11279296875, -4.7567138671875, -4.400634765625, -4.0445556640625, -3.6884765625, -3.3323974609375, -2.976318359375, -2.6202392578125, -2.26416015625, -1.9080810546875, -1.552001953125, -1.1959228515625, -0.83984375, -0.4837646484375, -0.127685546875, 0.2283935546875, 0.58447265625, 0.9405517578125, 1.296630859375, 1.6527099609375, 2.0087890625, 2.3648681640625, 2.720947265625, 3.0770263671875, 3.43310546875, 3.7891845703125, 4.145263671875, 4.5013427734375, 4.857421875, 5.2135009765625, 5.569580078125, 5.9256591796875, 6.28173828125, 6.6378173828125, 6.993896484375, 7.3499755859375, 7.7060546875, 8.0621337890625, 8.418212890625, 8.7742919921875, 9.13037109375, 9.4864501953125, 9.842529296875, 10.1986083984375, 10.5546875]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 8.0, 4.0, 5.0, 8.0, 6.0, 12.0, 10.0, 12.0, 12.0, 15.0, 25.0, 22.0, 32.0, 58.0, 56.0, 73.0, 125.0, 210.0, 505.0, 2011.0, 12709.0, 167446.0, 2435214.0, 1486505.0, 78959.0, 7825.0, 1324.0, 431.0, 202.0, 110.0, 72.0, 52.0, 48.0, 30.0, 24.0, 17.0, 20.0, 14.0, 13.0, 11.0, 15.0, 10.0, 4.0, 5.0, 6.0, 0.0, 0.0, 1.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0], "bins": [-34.78125, -33.72314453125, -32.6650390625, -31.60693359375, -30.548828125, -29.49072265625, -28.4326171875, -27.37451171875, -26.31640625, -25.25830078125, -24.2001953125, -23.14208984375, -22.083984375, -21.02587890625, -19.9677734375, -18.90966796875, -17.8515625, -16.79345703125, -15.7353515625, -14.67724609375, -13.619140625, -12.56103515625, -11.5029296875, -10.44482421875, -9.38671875, -8.32861328125, -7.2705078125, -6.21240234375, -5.154296875, -4.09619140625, -3.0380859375, -1.97998046875, -0.921875, 0.13623046875, 1.1943359375, 2.25244140625, 3.310546875, 4.36865234375, 5.4267578125, 6.48486328125, 7.54296875, 8.60107421875, 9.6591796875, 10.71728515625, 11.775390625, 12.83349609375, 13.8916015625, 14.94970703125, 16.0078125, 17.06591796875, 18.1240234375, 19.18212890625, 20.240234375, 21.29833984375, 22.3564453125, 23.41455078125, 24.47265625, 25.53076171875, 26.5888671875, 27.64697265625, 28.705078125, 29.76318359375, 30.8212890625, 31.87939453125, 32.9375]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 8.0, 10.0, 9.0, 17.0, 20.0, 29.0, 41.0, 64.0, 77.0, 116.0, 137.0, 205.0, 313.0, 415.0, 503.0, 537.0, 424.0, 289.0, 241.0, 167.0, 127.0, 93.0, 73.0, 36.0, 31.0, 36.0, 19.0, 12.0, 7.0, 7.0, 3.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.75, -40.59326171875, -39.4365234375, -38.27978515625, -37.123046875, -35.96630859375, -34.8095703125, -33.65283203125, -32.49609375, -31.33935546875, -30.1826171875, -29.02587890625, -27.869140625, -26.71240234375, -25.5556640625, -24.39892578125, -23.2421875, -22.08544921875, -20.9287109375, -19.77197265625, -18.615234375, -17.45849609375, -16.3017578125, -15.14501953125, -13.98828125, -12.83154296875, -11.6748046875, -10.51806640625, -9.361328125, -8.20458984375, -7.0478515625, -5.89111328125, -4.734375, -3.57763671875, -2.4208984375, -1.26416015625, -0.107421875, 1.04931640625, 2.2060546875, 3.36279296875, 4.51953125, 5.67626953125, 6.8330078125, 7.98974609375, 9.146484375, 10.30322265625, 11.4599609375, 12.61669921875, 13.7734375, 14.93017578125, 16.0869140625, 17.24365234375, 18.400390625, 19.55712890625, 20.7138671875, 21.87060546875, 23.02734375, 24.18408203125, 25.3408203125, 26.49755859375, 27.654296875, 28.81103515625, 29.9677734375, 31.12451171875, 32.28125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 5.0, 4.0, 4.0, 13.0, 13.0, 28.0, 36.0, 39.0, 74.0, 102.0, 148.0, 249.0, 425.0, 1247.0, 63493.0, 4120405.0, 6241.0, 781.0, 346.0, 211.0, 136.0, 89.0, 60.0, 49.0, 30.0, 16.0, 11.0, 8.0, 8.0, 7.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-151.875, -145.876953125, -139.87890625, -133.880859375, -127.8828125, -121.884765625, -115.88671875, -109.888671875, -103.890625, -97.892578125, -91.89453125, -85.896484375, -79.8984375, -73.900390625, -67.90234375, -61.904296875, -55.90625, -49.908203125, -43.91015625, -37.912109375, -31.9140625, -25.916015625, -19.91796875, -13.919921875, -7.921875, -1.923828125, 4.07421875, 10.072265625, 16.0703125, 22.068359375, 28.06640625, 34.064453125, 40.0625, 46.060546875, 52.05859375, 58.056640625, 64.0546875, 70.052734375, 76.05078125, 82.048828125, 88.046875, 94.044921875, 100.04296875, 106.041015625, 112.0390625, 118.037109375, 124.03515625, 130.033203125, 136.03125, 142.029296875, 148.02734375, 154.025390625, 160.0234375, 166.021484375, 172.01953125, 178.017578125, 184.015625, 190.013671875, 196.01171875, 202.009765625, 208.0078125, 214.005859375, 220.00390625, 226.001953125, 232.0]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 28.0, 72.0, 175.0, 275.0, 239.0, 127.0, 55.0, 19.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.33699035644531, -107.52052307128906, -99.70406341552734, -91.8875961303711, -84.07113647460938, -76.25466918945312, -68.43820190429688, -60.62173843383789, -52.805274963378906, -44.98881149291992, -37.17234802246094, -29.355880737304688, -21.539417266845703, -13.722953796386719, -5.906486511230469, 1.9099769592285156, 9.7264404296875, 17.542903900146484, 25.3593692779541, 33.17583465576172, 40.9922981262207, 48.80876159667969, 56.62522888183594, 64.44169616699219, 72.2581558227539, 80.07462310791016, 87.89108276367188, 95.70755004882812, 103.52401733398438, 111.3404769897461, 119.15694427490234, 126.97340393066406, 134.78985595703125, 142.6063232421875, 150.42279052734375, 158.2392578125, 166.0557098388672, 173.87217712402344, 181.6886444091797, 189.50511169433594, 197.32156372070312, 205.13803100585938, 212.95449829101562, 220.77096557617188, 228.58741760253906, 236.4038848876953, 244.22035217285156, 252.0368194580078, 259.853271484375, 267.66973876953125, 275.4862060546875, 283.30267333984375, 291.119140625, 298.93560791015625, 306.7520751953125, 314.5685119628906, 322.385009765625, 330.20147705078125, 338.0179443359375, 345.83441162109375, 353.65087890625, 361.46734619140625, 369.2838134765625, 377.1002502441406, 384.9167175292969]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 3.0, 2.0, 5.0, 2.0, 3.0, 17.0, 9.0, 10.0, 14.0, 16.0, 16.0, 24.0, 23.0, 23.0, 36.0, 41.0, 28.0, 40.0, 46.0, 41.0, 52.0, 46.0, 47.0, 53.0, 45.0, 44.0, 39.0, 34.0, 39.0, 32.0, 33.0, 27.0, 26.0, 11.0, 17.0, 17.0, 11.0, 6.0, 8.0, 4.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0], "bins": [-132.92840576171875, -129.0357208251953, -125.14303588867188, -121.25035095214844, -117.357666015625, -113.46498107910156, -109.5722885131836, -105.67960357666016, -101.78691864013672, -97.89423370361328, -94.00154876708984, -90.1088638305664, -86.21617126464844, -82.323486328125, -78.43080139160156, -74.53811645507812, -70.64543151855469, -66.75274658203125, -62.86006164550781, -58.96737289428711, -55.07468795776367, -51.182003021240234, -47.28931427001953, -43.396629333496094, -39.503944396972656, -35.61125946044922, -31.71857261657715, -27.825885772705078, -23.93320083618164, -20.040515899658203, -16.147829055786133, -12.255142211914062, -8.362457275390625, -4.469771385192871, -0.5770854949951172, 3.3156003952026367, 7.208286285400391, 11.100971221923828, 14.993658065795898, 18.88634490966797, 22.779029846191406, 26.671714782714844, 30.564401626586914, 34.457088470458984, 38.34977340698242, 42.24245834350586, 46.13514709472656, 50.02783203125, 53.92051696777344, 57.813201904296875, 61.70588684082031, 65.59857177734375, 69.49125671386719, 73.38394165039062, 77.2766342163086, 81.16931915283203, 85.06200408935547, 88.9546890258789, 92.84737396240234, 96.74005889892578, 100.63275146484375, 104.52543640136719, 108.41812133789062, 112.31080627441406, 116.2034912109375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 13.0, 8.0, 8.0, 14.0, 9.0, 12.0, 15.0, 20.0, 17.0, 21.0, 28.0, 33.0, 27.0, 33.0, 44.0, 27.0, 39.0, 37.0, 39.0, 44.0, 47.0, 46.0, 42.0, 31.0, 38.0, 35.0, 30.0, 26.0, 23.0, 31.0, 29.0, 17.0, 14.0, 15.0, 11.0, 15.0, 12.0, 9.0, 5.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0], "bins": [-12.5625, -12.2005615234375, -11.838623046875, -11.4766845703125, -11.11474609375, -10.7528076171875, -10.390869140625, -10.0289306640625, -9.6669921875, -9.3050537109375, -8.943115234375, -8.5811767578125, -8.21923828125, -7.8572998046875, -7.495361328125, -7.1334228515625, -6.771484375, -6.4095458984375, -6.047607421875, -5.6856689453125, -5.32373046875, -4.9617919921875, -4.599853515625, -4.2379150390625, -3.8759765625, -3.5140380859375, -3.152099609375, -2.7901611328125, -2.42822265625, -2.0662841796875, -1.704345703125, -1.3424072265625, -0.98046875, -0.6185302734375, -0.256591796875, 0.1053466796875, 0.46728515625, 0.8292236328125, 1.191162109375, 1.5531005859375, 1.9150390625, 2.2769775390625, 2.638916015625, 3.0008544921875, 3.36279296875, 3.7247314453125, 4.086669921875, 4.4486083984375, 4.810546875, 5.1724853515625, 5.534423828125, 5.8963623046875, 6.25830078125, 6.6202392578125, 6.982177734375, 7.3441162109375, 7.7060546875, 8.0679931640625, 8.429931640625, 8.7918701171875, 9.15380859375, 9.5157470703125, 9.877685546875, 10.2396240234375, 10.6015625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 9.0, 6.0, 13.0, 18.0, 29.0, 31.0, 43.0, 54.0, 74.0, 110.0, 155.0, 232.0, 348.0, 529.0, 725.0, 1063.0, 1617.0, 2336.0, 3597.0, 5335.0, 7912.0, 12430.0, 19048.0, 30807.0, 49748.0, 86192.0, 166215.0, 320679.0, 140123.0, 76325.0, 44614.0, 27450.0, 17330.0, 11047.0, 7448.0, 4768.0, 3266.0, 2191.0, 1515.0, 987.0, 618.0, 414.0, 300.0, 241.0, 179.0, 129.0, 93.0, 64.0, 31.0, 15.0, 8.0, 10.0, 7.0, 8.0, 5.0, 7.0, 5.0, 6.0, 5.0, 2.0, 3.0, 1.0], "bins": [-2.451171875, -2.367767333984375, -2.28436279296875, -2.200958251953125, -2.1175537109375, -2.034149169921875, -1.95074462890625, -1.867340087890625, -1.783935546875, -1.700531005859375, -1.61712646484375, -1.533721923828125, -1.4503173828125, -1.366912841796875, -1.28350830078125, -1.200103759765625, -1.11669921875, -1.033294677734375, -0.94989013671875, -0.866485595703125, -0.7830810546875, -0.699676513671875, -0.61627197265625, -0.532867431640625, -0.449462890625, -0.366058349609375, -0.28265380859375, -0.199249267578125, -0.1158447265625, -0.032440185546875, 0.05096435546875, 0.134368896484375, 0.2177734375, 0.301177978515625, 0.38458251953125, 0.467987060546875, 0.5513916015625, 0.634796142578125, 0.71820068359375, 0.801605224609375, 0.885009765625, 0.968414306640625, 1.05181884765625, 1.135223388671875, 1.2186279296875, 1.302032470703125, 1.38543701171875, 1.468841552734375, 1.55224609375, 1.635650634765625, 1.71905517578125, 1.802459716796875, 1.8858642578125, 1.969268798828125, 2.05267333984375, 2.136077880859375, 2.219482421875, 2.302886962890625, 2.38629150390625, 2.469696044921875, 2.5531005859375, 2.636505126953125, 2.71990966796875, 2.803314208984375, 2.88671875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 5.0, 8.0, 10.0, 3.0, 8.0, 11.0, 11.0, 10.0, 16.0, 17.0, 27.0, 18.0, 32.0, 18.0, 25.0, 28.0, 30.0, 32.0, 29.0, 37.0, 21.0, 30.0, 42.0, 35.0, 1053.0, 29.0, 44.0, 36.0, 34.0, 39.0, 29.0, 40.0, 26.0, 16.0, 22.0, 19.0, 24.0, 18.0, 11.0, 17.0, 16.0, 14.0, 7.0, 7.0, 7.0, 5.0, 1.0, 6.0, 8.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.96484375, -5.75469970703125, -5.5445556640625, -5.33441162109375, -5.124267578125, -4.91412353515625, -4.7039794921875, -4.49383544921875, -4.28369140625, -4.07354736328125, -3.8634033203125, -3.65325927734375, -3.443115234375, -3.23297119140625, -3.0228271484375, -2.81268310546875, -2.6025390625, -2.39239501953125, -2.1822509765625, -1.97210693359375, -1.761962890625, -1.55181884765625, -1.3416748046875, -1.13153076171875, -0.92138671875, -0.71124267578125, -0.5010986328125, -0.29095458984375, -0.080810546875, 0.12933349609375, 0.3394775390625, 0.54962158203125, 0.759765625, 0.96990966796875, 1.1800537109375, 1.39019775390625, 1.600341796875, 1.81048583984375, 2.0206298828125, 2.23077392578125, 2.44091796875, 2.65106201171875, 2.8612060546875, 3.07135009765625, 3.281494140625, 3.49163818359375, 3.7017822265625, 3.91192626953125, 4.1220703125, 4.33221435546875, 4.5423583984375, 4.75250244140625, 4.962646484375, 5.17279052734375, 5.3829345703125, 5.59307861328125, 5.80322265625, 6.01336669921875, 6.2235107421875, 6.43365478515625, 6.643798828125, 6.85394287109375, 7.0640869140625, 7.27423095703125, 7.484375]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 0.0, 9.0, 17.0, 25.0, 23.0, 44.0, 75.0, 129.0, 188.0, 252.0, 437.0, 598.0, 871.0, 1319.0, 1830.0, 2587.0, 3935.0, 5395.0, 7905.0, 11172.0, 16462.0, 23556.0, 35462.0, 54234.0, 86014.0, 153898.0, 1318215.0, 138071.0, 79372.0, 50262.0, 32853.0, 21949.0, 15222.0, 10588.0, 7372.0, 5143.0, 3617.0, 2561.0, 1731.0, 1178.0, 852.0, 539.0, 376.0, 283.0, 187.0, 121.0, 77.0, 58.0, 27.0, 17.0, 12.0, 10.0, 4.0, 1.0, 1.0, 2.0], "bins": [-2.287109375, -2.2206573486328125, -2.154205322265625, -2.0877532958984375, -2.02130126953125, -1.9548492431640625, -1.888397216796875, -1.8219451904296875, -1.7554931640625, -1.6890411376953125, -1.622589111328125, -1.5561370849609375, -1.48968505859375, -1.4232330322265625, -1.356781005859375, -1.2903289794921875, -1.223876953125, -1.1574249267578125, -1.090972900390625, -1.0245208740234375, -0.95806884765625, -0.8916168212890625, -0.825164794921875, -0.7587127685546875, -0.6922607421875, -0.6258087158203125, -0.559356689453125, -0.4929046630859375, -0.42645263671875, -0.3600006103515625, -0.293548583984375, -0.2270965576171875, -0.16064453125, -0.0941925048828125, -0.027740478515625, 0.0387115478515625, 0.10516357421875, 0.1716156005859375, 0.238067626953125, 0.3045196533203125, 0.3709716796875, 0.4374237060546875, 0.503875732421875, 0.5703277587890625, 0.63677978515625, 0.7032318115234375, 0.769683837890625, 0.8361358642578125, 0.902587890625, 0.9690399169921875, 1.035491943359375, 1.1019439697265625, 1.16839599609375, 1.2348480224609375, 1.301300048828125, 1.3677520751953125, 1.4342041015625, 1.5006561279296875, 1.567108154296875, 1.6335601806640625, 1.70001220703125, 1.7664642333984375, 1.832916259765625, 1.8993682861328125, 1.9658203125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 1.0, 1.0, 5.0, 6.0, 10.0, 5.0, 14.0, 16.0, 20.0, 26.0, 29.0, 31.0, 40.0, 55.0, 73.0, 79.0, 90.0, 78.0, 82.0, 70.0, 61.0, 38.0, 27.0, 32.0, 14.0, 11.0, 10.0, 15.0, 18.0, 12.0, 4.0, 2.0, 3.0, 5.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0018072128295898438, -0.001753881573677063, -0.0017005503177642822, -0.0016472190618515015, -0.0015938878059387207, -0.00154055655002594, -0.0014872252941131592, -0.0014338940382003784, -0.0013805627822875977, -0.001327231526374817, -0.0012739002704620361, -0.0012205690145492554, -0.0011672377586364746, -0.0011139065027236938, -0.001060575246810913, -0.0010072439908981323, -0.0009539127349853516, -0.0009005814790725708, -0.00084725022315979, -0.0007939189672470093, -0.0007405877113342285, -0.0006872564554214478, -0.000633925199508667, -0.0005805939435958862, -0.0005272626876831055, -0.0004739314317703247, -0.00042060017585754395, -0.0003672689199447632, -0.0003139376640319824, -0.00026060640811920166, -0.0002072751522064209, -0.00015394389629364014, -0.00010061264038085938, -4.728138446807861e-05, 6.0498714447021484e-06, 5.938112735748291e-05, 0.00011271238327026367, 0.00016604363918304443, 0.0002193748950958252, 0.00027270615100860596, 0.0003260374069213867, 0.0003793686628341675, 0.00043269991874694824, 0.000486031174659729, 0.0005393624305725098, 0.0005926936864852905, 0.0006460249423980713, 0.000699356198310852, 0.0007526874542236328, 0.0008060187101364136, 0.0008593499660491943, 0.0009126812219619751, 0.0009660124778747559, 0.0010193437337875366, 0.0010726749897003174, 0.0011260062456130981, 0.001179337501525879, 0.0012326687574386597, 0.0012860000133514404, 0.0013393312692642212, 0.001392662525177002, 0.0014459937810897827, 0.0014993250370025635, 0.0015526562929153442, 0.001605987548828125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 5.0, 10.0, 6.0, 16.0, 14.0, 17.0, 28.0, 42.0, 56.0, 51.0, 118.0, 224.0, 552.0, 11856.0, 1033320.0, 1351.0, 396.0, 148.0, 105.0, 60.0, 34.0, 39.0, 26.0, 16.0, 11.0, 7.0, 8.0, 8.0, 4.0, 6.0, 2.0, 1.0, 2.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.04461669921875, -0.04323530197143555, -0.041853904724121094, -0.04047250747680664, -0.03909111022949219, -0.037709712982177734, -0.03632831573486328, -0.03494691848754883, -0.033565521240234375, -0.03218412399291992, -0.03080272674560547, -0.029421329498291016, -0.028039932250976562, -0.02665853500366211, -0.025277137756347656, -0.023895740509033203, -0.02251434326171875, -0.021132946014404297, -0.019751548767089844, -0.01837015151977539, -0.016988754272460938, -0.015607357025146484, -0.014225959777832031, -0.012844562530517578, -0.011463165283203125, -0.010081768035888672, -0.008700370788574219, -0.007318973541259766, -0.0059375762939453125, -0.004556179046630859, -0.0031747817993164062, -0.0017933845520019531, -0.0004119873046875, 0.0009694099426269531, 0.0023508071899414062, 0.0037322044372558594, 0.0051136016845703125, 0.006494998931884766, 0.007876396179199219, 0.009257793426513672, 0.010639190673828125, 0.012020587921142578, 0.013401985168457031, 0.014783382415771484, 0.016164779663085938, 0.01754617691040039, 0.018927574157714844, 0.020308971405029297, 0.02169036865234375, 0.023071765899658203, 0.024453163146972656, 0.02583456039428711, 0.027215957641601562, 0.028597354888916016, 0.02997875213623047, 0.03136014938354492, 0.032741546630859375, 0.03412294387817383, 0.03550434112548828, 0.036885738372802734, 0.03826713562011719, 0.03964853286743164, 0.041029930114746094, 0.04241132736206055, 0.043792724609375]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 10.0, 23.0, 63.0, 106.0, 187.0, 262.0, 192.0, 85.0, 54.0, 18.0, 10.0, 1.0, 2.0], "bins": [-0.002659847494214773, -0.0026126750744879246, -0.0025655024219304323, -0.0025183300022035837, -0.002471157582476735, -0.002423984929919243, -0.0023768125101923943, -0.0023296400904655457, -0.002282467670738697, -0.0022352952510118484, -0.002188122598454356, -0.0021409501787275076, -0.002093777759000659, -0.0020466051064431667, -0.001999432686716318, -0.0019522602669894695, -0.0019050876144319773, -0.0018579150782898068, -0.0018107426585629582, -0.0017635701224207878, -0.0017163977026939392, -0.0016692251665517688, -0.0016220526304095984, -0.0015748802106827497, -0.0015277076745405793, -0.0014805351383984089, -0.0014333627186715603, -0.0013861901825293899, -0.0013390176463872194, -0.0012918452266603708, -0.0012446726905182004, -0.00119750015437603, -0.0011503278510645032, -0.0011031553149223328, -0.0010559828951954842, -0.0010088103590533137, -0.0009616378811188042, -0.0009144654031842947, -0.0008672928670421243, -0.0008201203891076148, -0.0007729479111731052, -0.0007257754332385957, -0.0006786029553040862, -0.0006314304191619158, -0.0005842579412274063, -0.0005370854632928967, -0.0004899129271507263, -0.0004427404492162168, -0.00039556794217787683, -0.00034839543513953686, -0.00030122295720502734, -0.0002540504792705178, -0.00020687797223217785, -0.0001597054797457531, -0.00011253298725932837, -6.536048022098839e-05, -1.8188002286478877e-05, 2.8984490199945867e-05, 7.615698268637061e-05, 0.00012332947517279536, 0.0001705019676592201, 0.00021767446014564484, 0.0002648469526320696, 0.00031201945967040956, 0.0003591919376049191]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 5.0, 9.0, 9.0, 15.0, 20.0, 21.0, 16.0, 24.0, 21.0, 17.0, 26.0, 30.0, 35.0, 32.0, 56.0, 44.0, 29.0, 37.0, 39.0, 53.0, 44.0, 37.0, 40.0, 42.0, 45.0, 34.0, 29.0, 25.0, 18.0, 16.0, 21.0, 23.0, 24.0, 14.0, 12.0, 8.0, 8.0, 3.0, 3.0, 1.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007435083389282227, -0.0007173418998718262, -0.0006911754608154297, -0.0006650090217590332, -0.0006388425827026367, -0.0006126761436462402, -0.0005865097045898438, -0.0005603432655334473, -0.0005341768264770508, -0.0005080103874206543, -0.0004818439483642578, -0.00045567750930786133, -0.00042951107025146484, -0.00040334463119506836, -0.0003771781921386719, -0.0003510117530822754, -0.0003248453140258789, -0.0002986788749694824, -0.00027251243591308594, -0.00024634599685668945, -0.00022017955780029297, -0.00019401311874389648, -0.0001678466796875, -0.00014168024063110352, -0.00011551380157470703, -8.934736251831055e-05, -6.318092346191406e-05, -3.701448440551758e-05, -1.0848045349121094e-05, 1.531839370727539e-05, 4.1484832763671875e-05, 6.765127182006836e-05, 9.381771087646484e-05, 0.00011998414993286133, 0.0001461505889892578, 0.0001723170280456543, 0.00019848346710205078, 0.00022464990615844727, 0.00025081634521484375, 0.00027698278427124023, 0.0003031492233276367, 0.0003293156623840332, 0.0003554821014404297, 0.00038164854049682617, 0.00040781497955322266, 0.00043398141860961914, 0.0004601478576660156, 0.0004863142967224121, 0.0005124807357788086, 0.0005386471748352051, 0.0005648136138916016, 0.000590980052947998, 0.0006171464920043945, 0.000643312931060791, 0.0006694793701171875, 0.000695645809173584, 0.0007218122482299805, 0.000747978687286377, 0.0007741451263427734, 0.0008003115653991699, 0.0008264780044555664, 0.0008526444435119629, 0.0008788108825683594, 0.0009049773216247559, 0.0009311437606811523]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 7.0, 6.0, 13.0, 8.0, 8.0, 14.0, 9.0, 12.0, 15.0, 20.0, 17.0, 21.0, 28.0, 33.0, 27.0, 33.0, 44.0, 27.0, 39.0, 37.0, 39.0, 44.0, 47.0, 46.0, 42.0, 31.0, 38.0, 35.0, 30.0, 26.0, 23.0, 31.0, 29.0, 17.0, 14.0, 15.0, 11.0, 15.0, 12.0, 9.0, 5.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 3.0, 0.0, 3.0], "bins": [-12.5625, -12.2005615234375, -11.838623046875, -11.4766845703125, -11.11474609375, -10.7528076171875, -10.390869140625, -10.0289306640625, -9.6669921875, -9.3050537109375, -8.943115234375, -8.5811767578125, -8.21923828125, -7.8572998046875, -7.495361328125, -7.1334228515625, -6.771484375, -6.4095458984375, -6.047607421875, -5.6856689453125, -5.32373046875, -4.9617919921875, -4.599853515625, -4.2379150390625, -3.8759765625, -3.5140380859375, -3.152099609375, -2.7901611328125, -2.42822265625, -2.0662841796875, -1.704345703125, -1.3424072265625, -0.98046875, -0.6185302734375, -0.256591796875, 0.1053466796875, 0.46728515625, 0.8292236328125, 1.191162109375, 1.5531005859375, 1.9150390625, 2.2769775390625, 2.638916015625, 3.0008544921875, 3.36279296875, 3.7247314453125, 4.086669921875, 4.4486083984375, 4.810546875, 5.1724853515625, 5.534423828125, 5.8963623046875, 6.25830078125, 6.6202392578125, 6.982177734375, 7.3441162109375, 7.7060546875, 8.0679931640625, 8.429931640625, 8.7918701171875, 9.15380859375, 9.5157470703125, 9.877685546875, 10.2396240234375, 10.6015625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 5.0, 5.0, 9.0, 4.0, 5.0, 10.0, 20.0, 19.0, 35.0, 47.0, 74.0, 80.0, 130.0, 207.0, 248.0, 412.0, 667.0, 977.0, 1448.0, 2401.0, 3860.0, 6582.0, 11832.0, 23096.0, 57370.0, 209408.0, 518561.0, 127381.0, 41486.0, 18220.0, 9348.0, 5352.0, 3312.0, 2038.0, 1283.0, 872.0, 570.0, 385.0, 255.0, 151.0, 111.0, 85.0, 56.0, 43.0, 39.0, 12.0, 12.0, 12.0, 11.0, 4.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-10.0625, -9.7694091796875, -9.476318359375, -9.1832275390625, -8.89013671875, -8.5970458984375, -8.303955078125, -8.0108642578125, -7.7177734375, -7.4246826171875, -7.131591796875, -6.8385009765625, -6.54541015625, -6.2523193359375, -5.959228515625, -5.6661376953125, -5.373046875, -5.0799560546875, -4.786865234375, -4.4937744140625, -4.20068359375, -3.9075927734375, -3.614501953125, -3.3214111328125, -3.0283203125, -2.7352294921875, -2.442138671875, -2.1490478515625, -1.85595703125, -1.5628662109375, -1.269775390625, -0.9766845703125, -0.68359375, -0.3905029296875, -0.097412109375, 0.1956787109375, 0.48876953125, 0.7818603515625, 1.074951171875, 1.3680419921875, 1.6611328125, 1.9542236328125, 2.247314453125, 2.5404052734375, 2.83349609375, 3.1265869140625, 3.419677734375, 3.7127685546875, 4.005859375, 4.2989501953125, 4.592041015625, 4.8851318359375, 5.17822265625, 5.4713134765625, 5.764404296875, 6.0574951171875, 6.3505859375, 6.6436767578125, 6.936767578125, 7.2298583984375, 7.52294921875, 7.8160400390625, 8.109130859375, 8.4022216796875, 8.6953125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 3.0, 9.0, 9.0, 8.0, 14.0, 15.0, 17.0, 22.0, 30.0, 32.0, 23.0, 40.0, 37.0, 52.0, 48.0, 53.0, 102.0, 1745.0, 293.0, 73.0, 59.0, 51.0, 60.0, 39.0, 36.0, 29.0, 30.0, 17.0, 18.0, 19.0, 14.0, 15.0, 7.0, 5.0, 6.0, 6.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-58.6875, -57.0947265625, -55.501953125, -53.9091796875, -52.31640625, -50.7236328125, -49.130859375, -47.5380859375, -45.9453125, -44.3525390625, -42.759765625, -41.1669921875, -39.57421875, -37.9814453125, -36.388671875, -34.7958984375, -33.203125, -31.6103515625, -30.017578125, -28.4248046875, -26.83203125, -25.2392578125, -23.646484375, -22.0537109375, -20.4609375, -18.8681640625, -17.275390625, -15.6826171875, -14.08984375, -12.4970703125, -10.904296875, -9.3115234375, -7.71875, -6.1259765625, -4.533203125, -2.9404296875, -1.34765625, 0.2451171875, 1.837890625, 3.4306640625, 5.0234375, 6.6162109375, 8.208984375, 9.8017578125, 11.39453125, 12.9873046875, 14.580078125, 16.1728515625, 17.765625, 19.3583984375, 20.951171875, 22.5439453125, 24.13671875, 25.7294921875, 27.322265625, 28.9150390625, 30.5078125, 32.1005859375, 33.693359375, 35.2861328125, 36.87890625, 38.4716796875, 40.064453125, 41.6572265625, 43.25]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 6.0, 4.0, 8.0, 4.0, 9.0, 17.0, 26.0, 23.0, 33.0, 34.0, 71.0, 91.0, 144.0, 246.0, 467.0, 1877.0, 105725.0, 3030454.0, 4854.0, 714.0, 330.0, 168.0, 123.0, 64.0, 58.0, 44.0, 33.0, 19.0, 19.0, 11.0, 7.0, 7.0, 5.0, 6.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-119.0625, -115.580078125, -112.09765625, -108.615234375, -105.1328125, -101.650390625, -98.16796875, -94.685546875, -91.203125, -87.720703125, -84.23828125, -80.755859375, -77.2734375, -73.791015625, -70.30859375, -66.826171875, -63.34375, -59.861328125, -56.37890625, -52.896484375, -49.4140625, -45.931640625, -42.44921875, -38.966796875, -35.484375, -32.001953125, -28.51953125, -25.037109375, -21.5546875, -18.072265625, -14.58984375, -11.107421875, -7.625, -4.142578125, -0.66015625, 2.822265625, 6.3046875, 9.787109375, 13.26953125, 16.751953125, 20.234375, 23.716796875, 27.19921875, 30.681640625, 34.1640625, 37.646484375, 41.12890625, 44.611328125, 48.09375, 51.576171875, 55.05859375, 58.541015625, 62.0234375, 65.505859375, 68.98828125, 72.470703125, 75.953125, 79.435546875, 82.91796875, 86.400390625, 89.8828125, 93.365234375, 96.84765625, 100.330078125, 103.8125]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 63.0, 906.0, 46.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-740.4804077148438, -726.63134765625, -712.7822875976562, -698.9332275390625, -685.084228515625, -671.2351684570312, -657.3861083984375, -643.5370483398438, -629.68798828125, -615.8389282226562, -601.9898681640625, -588.140869140625, -574.2918090820312, -560.4427490234375, -546.5936889648438, -532.74462890625, -518.8956298828125, -505.04656982421875, -491.1975402832031, -477.3484802246094, -463.4994201660156, -449.650390625, -435.80133056640625, -421.9522705078125, -408.10321044921875, -394.254150390625, -380.4051208496094, -366.5560607910156, -352.7070007324219, -338.85797119140625, -325.0089111328125, -311.15985107421875, -297.31085205078125, -283.4617919921875, -269.6127624511719, -255.76370239257812, -241.91465759277344, -228.06561279296875, -214.216552734375, -200.3675079345703, -186.5184326171875, -172.6693878173828, -158.82032775878906, -144.97128295898438, -131.1222381591797, -117.27318572998047, -103.42413330078125, -89.57508850097656, -75.72604370117188, -61.87699508666992, -48.02794647216797, -34.17889404296875, -20.329845428466797, -6.480796813964844, 7.368255615234375, 21.217300415039062, 35.06635284423828, 48.915401458740234, 62.76445007324219, 76.6135025024414, 90.46255493164062, 104.31159973144531, 118.16065216064453, 132.00970458984375, 145.85874938964844]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 1.0, 4.0, 2.0, 4.0, 14.0, 9.0, 5.0, 13.0, 15.0, 10.0, 22.0, 9.0, 26.0, 15.0, 22.0, 29.0, 26.0, 27.0, 25.0, 29.0, 42.0, 31.0, 36.0, 42.0, 40.0, 41.0, 27.0, 35.0, 34.0, 28.0, 40.0, 29.0, 23.0, 22.0, 32.0, 23.0, 19.0, 22.0, 17.0, 23.0, 10.0, 14.0, 14.0, 11.0, 5.0, 12.0, 5.0, 7.0, 1.0, 6.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0], "bins": [-109.12353515625, -105.5908432006836, -102.05815124511719, -98.52545928955078, -94.99276733398438, -91.46007537841797, -87.92738342285156, -84.39469146728516, -80.86199951171875, -77.32930755615234, -73.79661560058594, -70.26392364501953, -66.73123168945312, -63.19853973388672, -59.66584777832031, -56.133155822753906, -52.600460052490234, -49.06776809692383, -45.53507614135742, -42.002384185791016, -38.46969223022461, -34.93699645996094, -31.404306411743164, -27.871614456176758, -24.33892250061035, -20.806230545043945, -17.27353858947754, -13.740845680236816, -10.20815372467041, -6.6754608154296875, -3.1427688598632812, 0.389923095703125, 3.9226150512695312, 7.4553070068359375, 10.987998962402344, 14.520691871643066, 18.053382873535156, 21.586076736450195, 25.1187686920166, 28.651460647583008, 32.18415069580078, 35.71684265136719, 39.249534606933594, 42.7822265625, 46.314918518066406, 49.84761047363281, 53.38030242919922, 56.912994384765625, 60.4456901550293, 63.9783821105957, 67.51107788085938, 71.04376983642578, 74.57646179199219, 78.1091537475586, 81.641845703125, 85.1745376586914, 88.70722961425781, 92.23992156982422, 95.77261352539062, 99.30530548095703, 102.83799743652344, 106.37068939208984, 109.90338134765625, 113.43607330322266, 116.96876525878906]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 6.0, 9.0, 9.0, 13.0, 10.0, 7.0, 7.0, 13.0, 19.0, 17.0, 30.0, 21.0, 28.0, 22.0, 37.0, 35.0, 30.0, 36.0, 43.0, 32.0, 42.0, 43.0, 41.0, 48.0, 41.0, 36.0, 25.0, 30.0, 33.0, 29.0, 29.0, 28.0, 28.0, 18.0, 8.0, 17.0, 14.0, 19.0, 9.0, 6.0, 6.0, 6.0, 6.0, 4.0, 5.0, 1.0, 3.0, 0.0, 3.0, 3.0, 1.0, 1.0], "bins": [-12.2890625, -11.923095703125, -11.55712890625, -11.191162109375, -10.8251953125, -10.459228515625, -10.09326171875, -9.727294921875, -9.361328125, -8.995361328125, -8.62939453125, -8.263427734375, -7.8974609375, -7.531494140625, -7.16552734375, -6.799560546875, -6.43359375, -6.067626953125, -5.70166015625, -5.335693359375, -4.9697265625, -4.603759765625, -4.23779296875, -3.871826171875, -3.505859375, -3.139892578125, -2.77392578125, -2.407958984375, -2.0419921875, -1.676025390625, -1.31005859375, -0.944091796875, -0.578125, -0.212158203125, 0.15380859375, 0.519775390625, 0.8857421875, 1.251708984375, 1.61767578125, 1.983642578125, 2.349609375, 2.715576171875, 3.08154296875, 3.447509765625, 3.8134765625, 4.179443359375, 4.54541015625, 4.911376953125, 5.27734375, 5.643310546875, 6.00927734375, 6.375244140625, 6.7412109375, 7.107177734375, 7.47314453125, 7.839111328125, 8.205078125, 8.571044921875, 8.93701171875, 9.302978515625, 9.6689453125, 10.034912109375, 10.40087890625, 10.766845703125, 11.1328125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 9.0, 13.0, 24.0, 29.0, 32.0, 52.0, 72.0, 97.0, 143.0, 245.0, 411.0, 783.0, 1670.0, 3824.0, 9742.0, 29396.0, 113462.0, 458315.0, 1373108.0, 1483464.0, 532674.0, 131896.0, 35224.0, 11395.0, 4253.0, 1766.0, 939.0, 448.0, 255.0, 169.0, 121.0, 70.0, 58.0, 30.0, 23.0, 23.0, 9.0, 13.0, 8.0, 1.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6796875, -14.20703125, -13.734375, -13.26171875, -12.7890625, -12.31640625, -11.84375, -11.37109375, -10.8984375, -10.42578125, -9.953125, -9.48046875, -9.0078125, -8.53515625, -8.0625, -7.58984375, -7.1171875, -6.64453125, -6.171875, -5.69921875, -5.2265625, -4.75390625, -4.28125, -3.80859375, -3.3359375, -2.86328125, -2.390625, -1.91796875, -1.4453125, -0.97265625, -0.5, -0.02734375, 0.4453125, 0.91796875, 1.390625, 1.86328125, 2.3359375, 2.80859375, 3.28125, 3.75390625, 4.2265625, 4.69921875, 5.171875, 5.64453125, 6.1171875, 6.58984375, 7.0625, 7.53515625, 8.0078125, 8.48046875, 8.953125, 9.42578125, 9.8984375, 10.37109375, 10.84375, 11.31640625, 11.7890625, 12.26171875, 12.734375, 13.20703125, 13.6796875, 14.15234375, 14.625, 15.09765625, 15.5703125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 7.0, 6.0, 10.0, 21.0, 22.0, 22.0, 24.0, 49.0, 54.0, 73.0, 97.0, 126.0, 141.0, 193.0, 273.0, 350.0, 425.0, 447.0, 418.0, 328.0, 234.0, 188.0, 133.0, 111.0, 70.0, 72.0, 34.0, 39.0, 31.0, 29.0, 17.0, 9.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-38.6875, -37.70361328125, -36.7197265625, -35.73583984375, -34.751953125, -33.76806640625, -32.7841796875, -31.80029296875, -30.81640625, -29.83251953125, -28.8486328125, -27.86474609375, -26.880859375, -25.89697265625, -24.9130859375, -23.92919921875, -22.9453125, -21.96142578125, -20.9775390625, -19.99365234375, -19.009765625, -18.02587890625, -17.0419921875, -16.05810546875, -15.07421875, -14.09033203125, -13.1064453125, -12.12255859375, -11.138671875, -10.15478515625, -9.1708984375, -8.18701171875, -7.203125, -6.21923828125, -5.2353515625, -4.25146484375, -3.267578125, -2.28369140625, -1.2998046875, -0.31591796875, 0.66796875, 1.65185546875, 2.6357421875, 3.61962890625, 4.603515625, 5.58740234375, 6.5712890625, 7.55517578125, 8.5390625, 9.52294921875, 10.5068359375, 11.49072265625, 12.474609375, 13.45849609375, 14.4423828125, 15.42626953125, 16.41015625, 17.39404296875, 18.3779296875, 19.36181640625, 20.345703125, 21.32958984375, 22.3134765625, 23.29736328125, 24.28125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 5.0, 3.0, 7.0, 13.0, 13.0, 11.0, 15.0, 38.0, 41.0, 59.0, 58.0, 86.0, 112.0, 225.0, 305.0, 736.0, 16392.0, 4146280.0, 27878.0, 907.0, 343.0, 238.0, 138.0, 101.0, 78.0, 49.0, 37.0, 24.0, 23.0, 30.0, 11.0, 9.0, 11.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-144.375, -138.935546875, -133.49609375, -128.056640625, -122.6171875, -117.177734375, -111.73828125, -106.298828125, -100.859375, -95.419921875, -89.98046875, -84.541015625, -79.1015625, -73.662109375, -68.22265625, -62.783203125, -57.34375, -51.904296875, -46.46484375, -41.025390625, -35.5859375, -30.146484375, -24.70703125, -19.267578125, -13.828125, -8.388671875, -2.94921875, 2.490234375, 7.9296875, 13.369140625, 18.80859375, 24.248046875, 29.6875, 35.126953125, 40.56640625, 46.005859375, 51.4453125, 56.884765625, 62.32421875, 67.763671875, 73.203125, 78.642578125, 84.08203125, 89.521484375, 94.9609375, 100.400390625, 105.83984375, 111.279296875, 116.71875, 122.158203125, 127.59765625, 133.037109375, 138.4765625, 143.916015625, 149.35546875, 154.794921875, 160.234375, 165.673828125, 171.11328125, 176.552734375, 181.9921875, 187.431640625, 192.87109375, 198.310546875, 203.75]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 6.0, 36.0, 182.0, 406.0, 301.0, 75.0, 11.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-513.5125732421875, -500.25885009765625, -487.0051574707031, -473.7514343261719, -460.49774169921875, -447.2440185546875, -433.99029541015625, -420.7366027832031, -407.4828796386719, -394.2291564941406, -380.9754638671875, -367.72174072265625, -354.4680480957031, -341.2143249511719, -327.96063232421875, -314.7069091796875, -301.45318603515625, -288.199462890625, -274.9457702636719, -261.6920471191406, -248.43833923339844, -235.18463134765625, -221.93092346191406, -208.67721557617188, -195.42352294921875, -182.16981506347656, -168.91610717773438, -155.66238403320312, -142.40867614746094, -129.15496826171875, -115.90126037597656, -102.64754486083984, -89.39382934570312, -76.14012145996094, -62.88640594482422, -49.63269805908203, -36.37898635864258, -23.125274658203125, -9.871566772460938, 3.3821487426757812, 16.63585662841797, 29.889568328857422, 43.143280029296875, 56.39698791503906, 69.65069580078125, 82.90441131591797, 96.15811920166016, 109.41183471679688, 122.66554260253906, 135.91925048828125, 149.17295837402344, 162.42666625976562, 175.68038940429688, 188.93409729003906, 202.18780517578125, 215.4415283203125, 228.69522094726562, 241.9489288330078, 255.20263671875, 268.45635986328125, 281.7100524902344, 294.9637756347656, 308.21746826171875, 321.47119140625, 334.72491455078125]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 4.0, 7.0, 5.0, 11.0, 4.0, 8.0, 8.0, 12.0, 13.0, 21.0, 22.0, 21.0, 22.0, 25.0, 37.0, 42.0, 35.0, 36.0, 40.0, 44.0, 33.0, 48.0, 32.0, 45.0, 47.0, 39.0, 37.0, 40.0, 27.0, 24.0, 25.0, 23.0, 26.0, 21.0, 18.0, 20.0, 15.0, 14.0, 15.0, 10.0, 4.0, 8.0, 6.0, 7.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-107.12677001953125, -103.61946868896484, -100.1121597290039, -96.6048583984375, -93.09754943847656, -89.59024810791016, -86.08294677734375, -82.57563781738281, -79.0683364868164, -75.56103515625, -72.05372619628906, -68.54642486572266, -65.03911590576172, -61.53181457519531, -58.02450942993164, -54.51720428466797, -51.0098991394043, -47.502593994140625, -43.99528884887695, -40.48798370361328, -36.980682373046875, -33.4733772277832, -29.96607208251953, -26.458768844604492, -22.95146369934082, -19.44415855407715, -15.93685531616211, -12.429550170898438, -8.922245979309082, -5.414941787719727, -1.9076366424560547, 1.5996665954589844, 5.106971740722656, 8.614275932312012, 12.121580123901367, 15.628885269165039, 19.136188507080078, 22.64349365234375, 26.150798797607422, 29.65810203552246, 33.1654052734375, 36.67271041870117, 40.180015563964844, 43.68731689453125, 47.19462203979492, 50.701927185058594, 54.209232330322266, 57.71653747558594, 61.22384262084961, 64.73114776611328, 68.23844909667969, 71.74575805664062, 75.25305938720703, 78.76036071777344, 82.26766967773438, 85.77497100830078, 89.28227996826172, 92.78958129882812, 96.29689025878906, 99.80419158935547, 103.3115005493164, 106.81880187988281, 110.32611083984375, 113.83341217041016, 117.34071350097656]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 6.0, 7.0, 10.0, 14.0, 6.0, 11.0, 12.0, 22.0, 18.0, 21.0, 25.0, 20.0, 34.0, 34.0, 39.0, 32.0, 39.0, 40.0, 47.0, 33.0, 42.0, 48.0, 41.0, 40.0, 31.0, 39.0, 34.0, 30.0, 30.0, 23.0, 28.0, 19.0, 19.0, 22.0, 16.0, 14.0, 7.0, 8.0, 10.0, 7.0, 1.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-13.1640625, -12.771728515625, -12.37939453125, -11.987060546875, -11.5947265625, -11.202392578125, -10.81005859375, -10.417724609375, -10.025390625, -9.633056640625, -9.24072265625, -8.848388671875, -8.4560546875, -8.063720703125, -7.67138671875, -7.279052734375, -6.88671875, -6.494384765625, -6.10205078125, -5.709716796875, -5.3173828125, -4.925048828125, -4.53271484375, -4.140380859375, -3.748046875, -3.355712890625, -2.96337890625, -2.571044921875, -2.1787109375, -1.786376953125, -1.39404296875, -1.001708984375, -0.609375, -0.217041015625, 0.17529296875, 0.567626953125, 0.9599609375, 1.352294921875, 1.74462890625, 2.136962890625, 2.529296875, 2.921630859375, 3.31396484375, 3.706298828125, 4.0986328125, 4.490966796875, 4.88330078125, 5.275634765625, 5.66796875, 6.060302734375, 6.45263671875, 6.844970703125, 7.2373046875, 7.629638671875, 8.02197265625, 8.414306640625, 8.806640625, 9.198974609375, 9.59130859375, 9.983642578125, 10.3759765625, 10.768310546875, 11.16064453125, 11.552978515625, 11.9453125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 7.0, 7.0, 22.0, 25.0, 24.0, 45.0, 47.0, 71.0, 119.0, 129.0, 170.0, 278.0, 365.0, 505.0, 698.0, 943.0, 1338.0, 1878.0, 2654.0, 3727.0, 5300.0, 7673.0, 11720.0, 17168.0, 26193.0, 41052.0, 65266.0, 113926.0, 292388.0, 199806.0, 92707.0, 55854.0, 35161.0, 22820.0, 15175.0, 10025.0, 6857.0, 4820.0, 3339.0, 2271.0, 1674.0, 1211.0, 871.0, 598.0, 452.0, 301.0, 264.0, 171.0, 132.0, 95.0, 66.0, 53.0, 39.0, 22.0, 17.0, 12.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0], "bins": [-2.427734375, -2.3489990234375, -2.270263671875, -2.1915283203125, -2.11279296875, -2.0340576171875, -1.955322265625, -1.8765869140625, -1.7978515625, -1.7191162109375, -1.640380859375, -1.5616455078125, -1.48291015625, -1.4041748046875, -1.325439453125, -1.2467041015625, -1.16796875, -1.0892333984375, -1.010498046875, -0.9317626953125, -0.85302734375, -0.7742919921875, -0.695556640625, -0.6168212890625, -0.5380859375, -0.4593505859375, -0.380615234375, -0.3018798828125, -0.22314453125, -0.1444091796875, -0.065673828125, 0.0130615234375, 0.091796875, 0.1705322265625, 0.249267578125, 0.3280029296875, 0.40673828125, 0.4854736328125, 0.564208984375, 0.6429443359375, 0.7216796875, 0.8004150390625, 0.879150390625, 0.9578857421875, 1.03662109375, 1.1153564453125, 1.194091796875, 1.2728271484375, 1.3515625, 1.4302978515625, 1.509033203125, 1.5877685546875, 1.66650390625, 1.7452392578125, 1.823974609375, 1.9027099609375, 1.9814453125, 2.0601806640625, 2.138916015625, 2.2176513671875, 2.29638671875, 2.3751220703125, 2.453857421875, 2.5325927734375, 2.611328125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 6.0, 5.0, 3.0, 6.0, 11.0, 8.0, 10.0, 9.0, 12.0, 14.0, 10.0, 16.0, 21.0, 24.0, 19.0, 25.0, 32.0, 34.0, 42.0, 36.0, 34.0, 34.0, 43.0, 1065.0, 29.0, 39.0, 51.0, 44.0, 40.0, 38.0, 25.0, 24.0, 39.0, 18.0, 24.0, 29.0, 18.0, 21.0, 14.0, 12.0, 14.0, 9.0, 9.0, 3.0, 3.0, 2.0, 4.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.69140625, -7.45068359375, -7.2099609375, -6.96923828125, -6.728515625, -6.48779296875, -6.2470703125, -6.00634765625, -5.765625, -5.52490234375, -5.2841796875, -5.04345703125, -4.802734375, -4.56201171875, -4.3212890625, -4.08056640625, -3.83984375, -3.59912109375, -3.3583984375, -3.11767578125, -2.876953125, -2.63623046875, -2.3955078125, -2.15478515625, -1.9140625, -1.67333984375, -1.4326171875, -1.19189453125, -0.951171875, -0.71044921875, -0.4697265625, -0.22900390625, 0.01171875, 0.25244140625, 0.4931640625, 0.73388671875, 0.974609375, 1.21533203125, 1.4560546875, 1.69677734375, 1.9375, 2.17822265625, 2.4189453125, 2.65966796875, 2.900390625, 3.14111328125, 3.3818359375, 3.62255859375, 3.86328125, 4.10400390625, 4.3447265625, 4.58544921875, 4.826171875, 5.06689453125, 5.3076171875, 5.54833984375, 5.7890625, 6.02978515625, 6.2705078125, 6.51123046875, 6.751953125, 6.99267578125, 7.2333984375, 7.47412109375, 7.71484375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 4.0, 8.0, 13.0, 12.0, 25.0, 47.0, 42.0, 85.0, 105.0, 144.0, 219.0, 326.0, 408.0, 658.0, 917.0, 1335.0, 1795.0, 2660.0, 3676.0, 5460.0, 7782.0, 11416.0, 16621.0, 24834.0, 38364.0, 61866.0, 106118.0, 225154.0, 1290266.0, 111309.0, 64389.0, 40066.0, 25879.0, 17139.0, 11616.0, 8035.0, 5574.0, 3868.0, 2637.0, 1904.0, 1273.0, 909.0, 653.0, 465.0, 313.0, 206.0, 183.0, 106.0, 81.0, 56.0, 44.0, 35.0, 17.0, 10.0, 10.0, 5.0, 3.0, 0.0, 1.0, 2.0], "bins": [-2.365234375, -2.291412353515625, -2.21759033203125, -2.143768310546875, -2.0699462890625, -1.996124267578125, -1.92230224609375, -1.848480224609375, -1.774658203125, -1.700836181640625, -1.62701416015625, -1.553192138671875, -1.4793701171875, -1.405548095703125, -1.33172607421875, -1.257904052734375, -1.18408203125, -1.110260009765625, -1.03643798828125, -0.962615966796875, -0.8887939453125, -0.814971923828125, -0.74114990234375, -0.667327880859375, -0.593505859375, -0.519683837890625, -0.44586181640625, -0.372039794921875, -0.2982177734375, -0.224395751953125, -0.15057373046875, -0.076751708984375, -0.0029296875, 0.070892333984375, 0.14471435546875, 0.218536376953125, 0.2923583984375, 0.366180419921875, 0.44000244140625, 0.513824462890625, 0.587646484375, 0.661468505859375, 0.73529052734375, 0.809112548828125, 0.8829345703125, 0.956756591796875, 1.03057861328125, 1.104400634765625, 1.17822265625, 1.252044677734375, 1.32586669921875, 1.399688720703125, 1.4735107421875, 1.547332763671875, 1.62115478515625, 1.694976806640625, 1.768798828125, 1.842620849609375, 1.91644287109375, 1.990264892578125, 2.0640869140625, 2.137908935546875, 2.21173095703125, 2.285552978515625, 2.359375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 4.0, 11.0, 10.0, 8.0, 15.0, 13.0, 17.0, 28.0, 27.0, 36.0, 53.0, 50.0, 65.0, 81.0, 94.0, 84.0, 70.0, 61.0, 49.0, 33.0, 36.0, 24.0, 19.0, 16.0, 10.0, 11.0, 9.0, 7.0, 13.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0013990402221679688, -0.0013519078493118286, -0.0013047754764556885, -0.0012576431035995483, -0.0012105107307434082, -0.001163378357887268, -0.001116245985031128, -0.0010691136121749878, -0.0010219812393188477, -0.0009748488664627075, -0.0009277164936065674, -0.0008805841207504272, -0.0008334517478942871, -0.000786319375038147, -0.0007391870021820068, -0.0006920546293258667, -0.0006449222564697266, -0.0005977898836135864, -0.0005506575107574463, -0.0005035251379013062, -0.000456392765045166, -0.0004092603921890259, -0.00036212801933288574, -0.0003149956464767456, -0.00026786327362060547, -0.00022073090076446533, -0.0001735985279083252, -0.00012646615505218506, -7.933378219604492e-05, -3.2201409339904785e-05, 1.4930963516235352e-05, 6.206333637237549e-05, 0.00010919570922851562, 0.00015632808208465576, 0.0002034604549407959, 0.00025059282779693604, 0.00029772520065307617, 0.0003448575735092163, 0.00039198994636535645, 0.0004391223192214966, 0.0004862546920776367, 0.0005333870649337769, 0.000580519437789917, 0.0006276518106460571, 0.0006747841835021973, 0.0007219165563583374, 0.0007690489292144775, 0.0008161813020706177, 0.0008633136749267578, 0.000910446047782898, 0.0009575784206390381, 0.0010047107934951782, 0.0010518431663513184, 0.0010989755392074585, 0.0011461079120635986, 0.0011932402849197388, 0.001240372657775879, 0.001287505030632019, 0.0013346374034881592, 0.0013817697763442993, 0.0014289021492004395, 0.0014760345220565796, 0.0015231668949127197, 0.0015702992677688599, 0.001617431640625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 9.0, 12.0, 4.0, 7.0, 15.0, 8.0, 14.0, 20.0, 29.0, 40.0, 46.0, 95.0, 194.0, 396.0, 1353.0, 1014781.0, 30200.0, 648.0, 239.0, 146.0, 83.0, 47.0, 31.0, 19.0, 17.0, 21.0, 14.0, 8.0, 7.0, 5.0, 2.0, 3.0, 7.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0], "bins": [-0.044708251953125, -0.04342222213745117, -0.042136192321777344, -0.040850162506103516, -0.03956413269042969, -0.03827810287475586, -0.03699207305908203, -0.0357060432434082, -0.034420013427734375, -0.03313398361206055, -0.03184795379638672, -0.03056192398071289, -0.029275894165039062, -0.027989864349365234, -0.026703834533691406, -0.025417804718017578, -0.02413177490234375, -0.022845745086669922, -0.021559715270996094, -0.020273685455322266, -0.018987655639648438, -0.01770162582397461, -0.01641559600830078, -0.015129566192626953, -0.013843536376953125, -0.012557506561279297, -0.011271476745605469, -0.00998544692993164, -0.008699417114257812, -0.007413387298583984, -0.006127357482910156, -0.004841327667236328, -0.0035552978515625, -0.002269268035888672, -0.0009832382202148438, 0.0003027915954589844, 0.0015888214111328125, 0.0028748512268066406, 0.004160881042480469, 0.005446910858154297, 0.006732940673828125, 0.008018970489501953, 0.009305000305175781, 0.01059103012084961, 0.011877059936523438, 0.013163089752197266, 0.014449119567871094, 0.015735149383544922, 0.01702117919921875, 0.018307209014892578, 0.019593238830566406, 0.020879268646240234, 0.022165298461914062, 0.02345132827758789, 0.02473735809326172, 0.026023387908935547, 0.027309417724609375, 0.028595447540283203, 0.02988147735595703, 0.03116750717163086, 0.03245353698730469, 0.033739566802978516, 0.035025596618652344, 0.03631162643432617, 0.03759765625]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 44.0, 561.0, 379.0, 28.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005722501780837774, -0.005558581557124853, -0.005394661333411932, -0.0052307406440377235, -0.005066820420324802, -0.004902900196611881, -0.00473897997289896, -0.004575059749186039, -0.004411139525473118, -0.004247219301760197, -0.0040832990780472755, -0.003919378854334354, -0.003755458164960146, -0.003591537941247225, -0.0034276177175343037, -0.0032636974938213825, -0.003099776804447174, -0.002935856580734253, -0.002771936124190688, -0.002608015900477767, -0.002444095443934202, -0.002280175220221281, -0.00211625499650836, -0.001952334656380117, -0.001788414316251874, -0.001624493976123631, -0.001460573635995388, -0.0012966534122824669, -0.001132733072154224, -0.000968812732025981, -0.0008048925083130598, -0.0006409721681848168, -0.00047705182805657387, -0.00031313151703216136, -0.00014921120600774884, 1.4709075912833214e-05, 0.00017862941604107618, 0.00034254975616931915, 0.0005064699798822403, 0.0006703903200104833, 0.0008343106601387262, 0.0009982310002669692, 0.0011621513403952122, 0.0013260715641081333, 0.0014899919042363763, 0.0016539122443646193, 0.0018178324680775404, 0.001981752924621105, 0.0021456731483340263, 0.0023095933720469475, 0.0024735138285905123, 0.0026374340523034334, 0.002801354508846998, 0.0029652747325599194, 0.0031291949562728405, 0.0032931151799857616, 0.0034570356365293264, 0.0036209558602422476, 0.0037848763167858124, 0.0039487965404987335, 0.004112716764211655, 0.004276636987924576, 0.004440557211637497, 0.004604477901011705, 0.0047683981247246265]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 5.0, 4.0, 8.0, 11.0, 11.0, 10.0, 15.0, 21.0, 14.0, 24.0, 16.0, 29.0, 34.0, 33.0, 39.0, 34.0, 48.0, 32.0, 45.0, 45.0, 34.0, 40.0, 46.0, 37.0, 50.0, 43.0, 42.0, 32.0, 21.0, 29.0, 20.0, 15.0, 22.0, 15.0, 9.0, 12.0, 14.0, 11.0, 7.0, 8.0, 1.0, 3.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0007356405258178711, -0.000712202861905098, -0.0006887651979923248, -0.0006653275340795517, -0.0006418898701667786, -0.0006184522062540054, -0.0005950145423412323, -0.0005715768784284592, -0.000548139214515686, -0.0005247015506029129, -0.0005012638866901398, -0.00047782622277736664, -0.0004543885588645935, -0.0004309508949518204, -0.00040751323103904724, -0.0003840755671262741, -0.000360637903213501, -0.00033720023930072784, -0.0003137625753879547, -0.0002903249114751816, -0.00026688724756240845, -0.00024344958364963531, -0.00022001191973686218, -0.00019657425582408905, -0.00017313659191131592, -0.00014969892799854279, -0.00012626126408576965, -0.00010282360017299652, -7.938593626022339e-05, -5.5948272347450256e-05, -3.2510608434677124e-05, -9.072944521903992e-06, 1.436471939086914e-05, 3.780238330364227e-05, 6.12400472164154e-05, 8.467771112918854e-05, 0.00010811537504196167, 0.0001315530389547348, 0.00015499070286750793, 0.00017842836678028107, 0.0002018660306930542, 0.00022530369460582733, 0.00024874135851860046, 0.0002721790224313736, 0.00029561668634414673, 0.00031905435025691986, 0.000342492014169693, 0.0003659296780824661, 0.00038936734199523926, 0.0004128050059080124, 0.0004362426698207855, 0.00045968033373355865, 0.0004831179976463318, 0.0005065556615591049, 0.000529993325471878, 0.0005534309893846512, 0.0005768686532974243, 0.0006003063172101974, 0.0006237439811229706, 0.0006471816450357437, 0.0006706193089485168, 0.00069405697286129, 0.0007174946367740631, 0.0007409323006868362, 0.0007643699645996094]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 2.0, 6.0, 7.0, 10.0, 14.0, 6.0, 11.0, 12.0, 22.0, 18.0, 21.0, 25.0, 20.0, 34.0, 34.0, 39.0, 32.0, 39.0, 40.0, 47.0, 33.0, 42.0, 48.0, 41.0, 40.0, 31.0, 39.0, 34.0, 30.0, 30.0, 23.0, 28.0, 19.0, 19.0, 22.0, 16.0, 14.0, 7.0, 8.0, 10.0, 7.0, 1.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-13.1640625, -12.771728515625, -12.37939453125, -11.987060546875, -11.5947265625, -11.202392578125, -10.81005859375, -10.417724609375, -10.025390625, -9.633056640625, -9.24072265625, -8.848388671875, -8.4560546875, -8.063720703125, -7.67138671875, -7.279052734375, -6.88671875, -6.494384765625, -6.10205078125, -5.709716796875, -5.3173828125, -4.925048828125, -4.53271484375, -4.140380859375, -3.748046875, -3.355712890625, -2.96337890625, -2.571044921875, -2.1787109375, -1.786376953125, -1.39404296875, -1.001708984375, -0.609375, -0.217041015625, 0.17529296875, 0.567626953125, 0.9599609375, 1.352294921875, 1.74462890625, 2.136962890625, 2.529296875, 2.921630859375, 3.31396484375, 3.706298828125, 4.0986328125, 4.490966796875, 4.88330078125, 5.275634765625, 5.66796875, 6.060302734375, 6.45263671875, 6.844970703125, 7.2373046875, 7.629638671875, 8.02197265625, 8.414306640625, 8.806640625, 9.198974609375, 9.59130859375, 9.983642578125, 10.3759765625, 10.768310546875, 11.16064453125, 11.552978515625, 11.9453125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 12.0, 16.0, 23.0, 30.0, 32.0, 56.0, 82.0, 129.0, 219.0, 336.0, 690.0, 1246.0, 2527.0, 5654.0, 12709.0, 32739.0, 101399.0, 395171.0, 352936.0, 90619.0, 29906.0, 11796.0, 5076.0, 2395.0, 1183.0, 650.0, 349.0, 180.0, 128.0, 68.0, 56.0, 42.0, 30.0, 16.0, 9.0, 7.0, 9.0, 5.0, 4.0, 3.0, 4.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.78125, -10.44384765625, -10.1064453125, -9.76904296875, -9.431640625, -9.09423828125, -8.7568359375, -8.41943359375, -8.08203125, -7.74462890625, -7.4072265625, -7.06982421875, -6.732421875, -6.39501953125, -6.0576171875, -5.72021484375, -5.3828125, -5.04541015625, -4.7080078125, -4.37060546875, -4.033203125, -3.69580078125, -3.3583984375, -3.02099609375, -2.68359375, -2.34619140625, -2.0087890625, -1.67138671875, -1.333984375, -0.99658203125, -0.6591796875, -0.32177734375, 0.015625, 0.35302734375, 0.6904296875, 1.02783203125, 1.365234375, 1.70263671875, 2.0400390625, 2.37744140625, 2.71484375, 3.05224609375, 3.3896484375, 3.72705078125, 4.064453125, 4.40185546875, 4.7392578125, 5.07666015625, 5.4140625, 5.75146484375, 6.0888671875, 6.42626953125, 6.763671875, 7.10107421875, 7.4384765625, 7.77587890625, 8.11328125, 8.45068359375, 8.7880859375, 9.12548828125, 9.462890625, 9.80029296875, 10.1376953125, 10.47509765625, 10.8125]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 9.0, 4.0, 2.0, 4.0, 4.0, 10.0, 13.0, 6.0, 14.0, 12.0, 23.0, 26.0, 26.0, 33.0, 32.0, 32.0, 33.0, 37.0, 49.0, 65.0, 61.0, 149.0, 1588.0, 280.0, 88.0, 57.0, 58.0, 38.0, 41.0, 27.0, 22.0, 32.0, 28.0, 21.0, 19.0, 16.0, 15.0, 12.0, 22.0, 15.0, 7.0, 8.0, 4.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-45.1875, -43.84619140625, -42.5048828125, -41.16357421875, -39.822265625, -38.48095703125, -37.1396484375, -35.79833984375, -34.45703125, -33.11572265625, -31.7744140625, -30.43310546875, -29.091796875, -27.75048828125, -26.4091796875, -25.06787109375, -23.7265625, -22.38525390625, -21.0439453125, -19.70263671875, -18.361328125, -17.02001953125, -15.6787109375, -14.33740234375, -12.99609375, -11.65478515625, -10.3134765625, -8.97216796875, -7.630859375, -6.28955078125, -4.9482421875, -3.60693359375, -2.265625, -0.92431640625, 0.4169921875, 1.75830078125, 3.099609375, 4.44091796875, 5.7822265625, 7.12353515625, 8.46484375, 9.80615234375, 11.1474609375, 12.48876953125, 13.830078125, 15.17138671875, 16.5126953125, 17.85400390625, 19.1953125, 20.53662109375, 21.8779296875, 23.21923828125, 24.560546875, 25.90185546875, 27.2431640625, 28.58447265625, 29.92578125, 31.26708984375, 32.6083984375, 33.94970703125, 35.291015625, 36.63232421875, 37.9736328125, 39.31494140625, 40.65625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 5.0, 5.0, 7.0, 5.0, 7.0, 7.0, 11.0, 19.0, 15.0, 24.0, 22.0, 29.0, 41.0, 61.0, 78.0, 84.0, 136.0, 169.0, 284.0, 448.0, 1615.0, 26734.0, 3089528.0, 23387.0, 1546.0, 472.0, 277.0, 164.0, 124.0, 92.0, 56.0, 65.0, 45.0, 34.0, 32.0, 15.0, 10.0, 24.0, 7.0, 6.0, 4.0, 6.0, 2.0, 9.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0], "bins": [-98.5, -95.55859375, -92.6171875, -89.67578125, -86.734375, -83.79296875, -80.8515625, -77.91015625, -74.96875, -72.02734375, -69.0859375, -66.14453125, -63.203125, -60.26171875, -57.3203125, -54.37890625, -51.4375, -48.49609375, -45.5546875, -42.61328125, -39.671875, -36.73046875, -33.7890625, -30.84765625, -27.90625, -24.96484375, -22.0234375, -19.08203125, -16.140625, -13.19921875, -10.2578125, -7.31640625, -4.375, -1.43359375, 1.5078125, 4.44921875, 7.390625, 10.33203125, 13.2734375, 16.21484375, 19.15625, 22.09765625, 25.0390625, 27.98046875, 30.921875, 33.86328125, 36.8046875, 39.74609375, 42.6875, 45.62890625, 48.5703125, 51.51171875, 54.453125, 57.39453125, 60.3359375, 63.27734375, 66.21875, 69.16015625, 72.1015625, 75.04296875, 77.984375, 80.92578125, 83.8671875, 86.80859375, 89.75]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 26.0, 415.0, 541.0, 32.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-435.5154113769531, -426.97894287109375, -418.44244384765625, -409.9059753417969, -401.3694763183594, -392.8330078125, -384.2965087890625, -375.7600402832031, -367.2235412597656, -358.68707275390625, -350.15057373046875, -341.6141052246094, -333.0776062011719, -324.5411376953125, -316.004638671875, -307.4681701660156, -298.93170166015625, -290.3952331542969, -281.8587341308594, -273.322265625, -264.7857666015625, -256.2492980957031, -247.71279907226562, -239.17633056640625, -230.63983154296875, -222.1033477783203, -213.56686401367188, -205.03038024902344, -196.493896484375, -187.95741271972656, -179.42092895507812, -170.88446044921875, -162.34793090820312, -153.8114471435547, -145.27496337890625, -136.7384796142578, -128.20199584960938, -119.66551208496094, -111.12903594970703, -102.5925521850586, -94.05607604980469, -85.51959228515625, -76.98310852050781, -68.44662475585938, -59.9101448059082, -51.373661041259766, -42.837181091308594, -34.300697326660156, -25.76421356201172, -17.22772979736328, -8.691247940063477, -0.15476608276367188, 8.381717681884766, 16.918201446533203, 25.454681396484375, 33.99116516113281, 42.52764892578125, 51.06413269042969, 59.600616455078125, 68.13710021972656, 76.673583984375, 85.21006774902344, 93.74654388427734, 102.28302764892578, 110.81951141357422]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [4.0, 0.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 5.0, 10.0, 6.0, 5.0, 11.0, 18.0, 14.0, 11.0, 13.0, 17.0, 20.0, 27.0, 26.0, 27.0, 34.0, 36.0, 24.0, 38.0, 35.0, 30.0, 35.0, 32.0, 49.0, 40.0, 36.0, 27.0, 41.0, 31.0, 30.0, 28.0, 24.0, 24.0, 24.0, 10.0, 22.0, 18.0, 20.0, 23.0, 19.0, 4.0, 11.0, 9.0, 9.0, 3.0, 5.0, 1.0, 3.0, 3.0, 5.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0], "bins": [-89.90013122558594, -86.91744232177734, -83.93475341796875, -80.95206451416016, -77.96937561035156, -74.98668670654297, -72.00399780273438, -69.02130126953125, -66.03861999511719, -63.055931091308594, -60.0732421875, -57.090553283691406, -54.10786437988281, -51.12517547607422, -48.14248275756836, -45.159793853759766, -42.177101135253906, -39.19441223144531, -36.21172332763672, -33.229034423828125, -30.2463436126709, -27.263654708862305, -24.280963897705078, -21.298274993896484, -18.31558609008789, -15.332897186279297, -12.350207328796387, -9.367517471313477, -6.384828567504883, -3.402139663696289, -0.4194488525390625, 2.5632400512695312, 5.545936584472656, 8.52862548828125, 11.51131534576416, 14.49400520324707, 17.476694107055664, 20.459383010864258, 23.442073822021484, 26.424762725830078, 29.407451629638672, 32.390140533447266, 35.37282943725586, 38.35552215576172, 41.33821105957031, 44.320899963378906, 47.3035888671875, 50.286277770996094, 53.26896667480469, 56.25165557861328, 59.234344482421875, 62.21703338623047, 65.19972229003906, 68.18241119384766, 71.16510009765625, 74.14779663085938, 77.13047790527344, 80.11316680908203, 83.09585571289062, 86.07854461669922, 89.06123352050781, 92.0439224243164, 95.026611328125, 98.00930786132812, 100.99199676513672]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 6.0, 12.0, 4.0, 10.0, 18.0, 12.0, 13.0, 28.0, 24.0, 27.0, 27.0, 29.0, 31.0, 49.0, 31.0, 40.0, 42.0, 43.0, 48.0, 44.0, 39.0, 41.0, 36.0, 39.0, 39.0, 34.0, 24.0, 35.0, 20.0, 23.0, 26.0, 22.0, 12.0, 7.0, 12.0, 9.0, 9.0, 4.0, 3.0, 8.0, 3.0, 6.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0], "bins": [-14.1171875, -13.7012939453125, -13.285400390625, -12.8695068359375, -12.45361328125, -12.0377197265625, -11.621826171875, -11.2059326171875, -10.7900390625, -10.3741455078125, -9.958251953125, -9.5423583984375, -9.12646484375, -8.7105712890625, -8.294677734375, -7.8787841796875, -7.462890625, -7.0469970703125, -6.631103515625, -6.2152099609375, -5.79931640625, -5.3834228515625, -4.967529296875, -4.5516357421875, -4.1357421875, -3.7198486328125, -3.303955078125, -2.8880615234375, -2.47216796875, -2.0562744140625, -1.640380859375, -1.2244873046875, -0.80859375, -0.3927001953125, 0.023193359375, 0.4390869140625, 0.85498046875, 1.2708740234375, 1.686767578125, 2.1026611328125, 2.5185546875, 2.9344482421875, 3.350341796875, 3.7662353515625, 4.18212890625, 4.5980224609375, 5.013916015625, 5.4298095703125, 5.845703125, 6.2615966796875, 6.677490234375, 7.0933837890625, 7.50927734375, 7.9251708984375, 8.341064453125, 8.7569580078125, 9.1728515625, 9.5887451171875, 10.004638671875, 10.4205322265625, 10.83642578125, 11.2523193359375, 11.668212890625, 12.0841064453125, 12.5]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 7.0, 9.0, 7.0, 6.0, 13.0, 15.0, 13.0, 15.0, 21.0, 24.0, 22.0, 41.0, 32.0, 63.0, 78.0, 114.0, 174.0, 403.0, 3283.0, 381040.0, 3773541.0, 33320.0, 1210.0, 273.0, 116.0, 98.0, 59.0, 44.0, 34.0, 40.0, 24.0, 22.0, 24.0, 11.0, 12.0, 16.0, 9.0, 8.0, 8.0, 5.0, 4.0, 6.0, 2.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0], "bins": [-81.5625, -79.251953125, -76.94140625, -74.630859375, -72.3203125, -70.009765625, -67.69921875, -65.388671875, -63.078125, -60.767578125, -58.45703125, -56.146484375, -53.8359375, -51.525390625, -49.21484375, -46.904296875, -44.59375, -42.283203125, -39.97265625, -37.662109375, -35.3515625, -33.041015625, -30.73046875, -28.419921875, -26.109375, -23.798828125, -21.48828125, -19.177734375, -16.8671875, -14.556640625, -12.24609375, -9.935546875, -7.625, -5.314453125, -3.00390625, -0.693359375, 1.6171875, 3.927734375, 6.23828125, 8.548828125, 10.859375, 13.169921875, 15.48046875, 17.791015625, 20.1015625, 22.412109375, 24.72265625, 27.033203125, 29.34375, 31.654296875, 33.96484375, 36.275390625, 38.5859375, 40.896484375, 43.20703125, 45.517578125, 47.828125, 50.138671875, 52.44921875, 54.759765625, 57.0703125, 59.380859375, 61.69140625, 64.001953125, 66.3125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 22.0, 7.0, 26.0, 22.0, 28.0, 55.0, 68.0, 87.0, 109.0, 150.0, 216.0, 320.0, 397.0, 489.0, 468.0, 423.0, 312.0, 235.0, 165.0, 125.0, 86.0, 56.0, 50.0, 41.0, 23.0, 27.0, 8.0, 11.0, 12.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.5625, -28.580078125, -27.59765625, -26.615234375, -25.6328125, -24.650390625, -23.66796875, -22.685546875, -21.703125, -20.720703125, -19.73828125, -18.755859375, -17.7734375, -16.791015625, -15.80859375, -14.826171875, -13.84375, -12.861328125, -11.87890625, -10.896484375, -9.9140625, -8.931640625, -7.94921875, -6.966796875, -5.984375, -5.001953125, -4.01953125, -3.037109375, -2.0546875, -1.072265625, -0.08984375, 0.892578125, 1.875, 2.857421875, 3.83984375, 4.822265625, 5.8046875, 6.787109375, 7.76953125, 8.751953125, 9.734375, 10.716796875, 11.69921875, 12.681640625, 13.6640625, 14.646484375, 15.62890625, 16.611328125, 17.59375, 18.576171875, 19.55859375, 20.541015625, 21.5234375, 22.505859375, 23.48828125, 24.470703125, 25.453125, 26.435546875, 27.41796875, 28.400390625, 29.3828125, 30.365234375, 31.34765625, 32.330078125, 33.3125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 3.0, 5.0, 5.0, 7.0, 6.0, 21.0, 20.0, 17.0, 30.0, 46.0, 51.0, 64.0, 88.0, 99.0, 130.0, 183.0, 312.0, 637.0, 1755.0, 108683.0, 4065689.0, 13778.0, 1118.0, 475.0, 277.0, 184.0, 146.0, 107.0, 74.0, 59.0, 64.0, 34.0, 27.0, 16.0, 24.0, 13.0, 12.0, 5.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-128.0, -123.482421875, -118.96484375, -114.447265625, -109.9296875, -105.412109375, -100.89453125, -96.376953125, -91.859375, -87.341796875, -82.82421875, -78.306640625, -73.7890625, -69.271484375, -64.75390625, -60.236328125, -55.71875, -51.201171875, -46.68359375, -42.166015625, -37.6484375, -33.130859375, -28.61328125, -24.095703125, -19.578125, -15.060546875, -10.54296875, -6.025390625, -1.5078125, 3.009765625, 7.52734375, 12.044921875, 16.5625, 21.080078125, 25.59765625, 30.115234375, 34.6328125, 39.150390625, 43.66796875, 48.185546875, 52.703125, 57.220703125, 61.73828125, 66.255859375, 70.7734375, 75.291015625, 79.80859375, 84.326171875, 88.84375, 93.361328125, 97.87890625, 102.396484375, 106.9140625, 111.431640625, 115.94921875, 120.466796875, 124.984375, 129.501953125, 134.01953125, 138.537109375, 143.0546875, 147.572265625, 152.08984375, 156.607421875, 161.125]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 6.0, 4.0, 7.0, 17.0, 27.0, 40.0, 71.0, 82.0, 118.0, 127.0, 123.0, 115.0, 91.0, 62.0, 36.0, 33.0, 24.0, 15.0, 5.0, 5.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-71.47301483154297, -67.73322296142578, -63.99342346191406, -60.253631591796875, -56.51383590698242, -52.77404022216797, -49.03424835205078, -45.29445266723633, -41.554656982421875, -37.81486129760742, -34.07506561279297, -30.33527374267578, -26.595478057861328, -22.855682373046875, -19.115888595581055, -15.376094818115234, -11.636299133300781, -7.8965044021606445, -4.156709671020508, -0.4169149398803711, 3.3228797912597656, 7.062675476074219, 10.802469253540039, 14.54226303100586, 18.282058715820312, 22.021854400634766, 25.761648178100586, 29.501441955566406, 33.24123764038086, 36.98103332519531, 40.7208251953125, 44.46062088012695, 48.20042419433594, 51.94021987915039, 55.680015563964844, 59.41980743408203, 63.159603118896484, 66.89939880371094, 70.63919067382812, 74.37898254394531, 78.11878204345703, 81.85857391357422, 85.59837341308594, 89.33816528320312, 93.07795715332031, 96.81775665283203, 100.55754852294922, 104.29734802246094, 108.03713989257812, 111.77693176269531, 115.51673126220703, 119.25652313232422, 122.99632263183594, 126.73611450195312, 130.4759063720703, 134.2156982421875, 137.95550537109375, 141.69529724121094, 145.43508911132812, 149.17489624023438, 152.91468811035156, 156.65447998046875, 160.39427185058594, 164.13406372070312, 167.8738555908203]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 2.0, 8.0, 8.0, 10.0, 8.0, 11.0, 13.0, 12.0, 21.0, 21.0, 27.0, 32.0, 30.0, 22.0, 29.0, 25.0, 50.0, 44.0, 45.0, 31.0, 43.0, 28.0, 44.0, 55.0, 27.0, 34.0, 37.0, 26.0, 28.0, 32.0, 31.0, 26.0, 22.0, 20.0, 17.0, 12.0, 14.0, 10.0, 10.0, 10.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 2.0, 0.0, 1.0], "bins": [-107.52072143554688, -104.39474487304688, -101.26876831054688, -98.14279174804688, -95.0168228149414, -91.8908462524414, -88.7648696899414, -85.6388931274414, -82.51292419433594, -79.38694763183594, -76.26097106933594, -73.13499450683594, -70.00902557373047, -66.88304901123047, -63.75707244873047, -60.63109588623047, -57.50511932373047, -54.37914276123047, -51.253170013427734, -48.127193450927734, -45.001220703125, -41.875244140625, -38.749267578125, -35.623291015625, -32.497318267822266, -29.3713436126709, -26.24536895751953, -23.11939239501953, -19.993417739868164, -16.867443084716797, -13.741466522216797, -10.61549186706543, -7.4895172119140625, -4.363542079925537, -1.2375669479370117, 1.8884086608886719, 5.014383316040039, 8.140357971191406, 11.266334533691406, 14.392309188842773, 17.51828384399414, 20.644258499145508, 23.770233154296875, 26.896209716796875, 30.022184371948242, 33.14815902709961, 36.27413558959961, 39.400108337402344, 42.526084899902344, 45.652061462402344, 48.77803421020508, 51.90401077270508, 55.02998352050781, 58.15596008300781, 61.28193664550781, 64.40791320800781, 67.53388977050781, 70.65986633300781, 73.78584289550781, 76.91181945800781, 80.03778839111328, 83.16376495361328, 86.28974151611328, 89.41571807861328, 92.54168701171875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 3.0, 10.0, 12.0, 8.0, 12.0, 16.0, 15.0, 22.0, 27.0, 24.0, 37.0, 31.0, 30.0, 35.0, 43.0, 42.0, 59.0, 49.0, 44.0, 55.0, 39.0, 42.0, 47.0, 29.0, 55.0, 28.0, 17.0, 28.0, 30.0, 19.0, 14.0, 13.0, 10.0, 13.0, 11.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.171875, -14.7176513671875, -14.263427734375, -13.8092041015625, -13.35498046875, -12.9007568359375, -12.446533203125, -11.9923095703125, -11.5380859375, -11.0838623046875, -10.629638671875, -10.1754150390625, -9.72119140625, -9.2669677734375, -8.812744140625, -8.3585205078125, -7.904296875, -7.4500732421875, -6.995849609375, -6.5416259765625, -6.08740234375, -5.6331787109375, -5.178955078125, -4.7247314453125, -4.2705078125, -3.8162841796875, -3.362060546875, -2.9078369140625, -2.45361328125, -1.9993896484375, -1.545166015625, -1.0909423828125, -0.63671875, -0.1824951171875, 0.271728515625, 0.7259521484375, 1.18017578125, 1.6343994140625, 2.088623046875, 2.5428466796875, 2.9970703125, 3.4512939453125, 3.905517578125, 4.3597412109375, 4.81396484375, 5.2681884765625, 5.722412109375, 6.1766357421875, 6.630859375, 7.0850830078125, 7.539306640625, 7.9935302734375, 8.44775390625, 8.9019775390625, 9.356201171875, 9.8104248046875, 10.2646484375, 10.7188720703125, 11.173095703125, 11.6273193359375, 12.08154296875, 12.5357666015625, 12.989990234375, 13.4442138671875, 13.8984375]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 3.0, 5.0, 6.0, 10.0, 11.0, 25.0, 39.0, 45.0, 77.0, 120.0, 197.0, 290.0, 426.0, 716.0, 993.0, 1577.0, 2509.0, 4000.0, 6049.0, 9917.0, 15988.0, 26149.0, 44733.0, 81000.0, 170930.0, 366877.0, 142197.0, 70892.0, 40168.0, 23509.0, 14640.0, 8914.0, 5534.0, 3566.0, 2274.0, 1438.0, 916.0, 639.0, 397.0, 269.0, 179.0, 128.0, 68.0, 49.0, 32.0, 26.0, 14.0, 8.0, 8.0, 2.0, 3.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.43359375, -3.330780029296875, -3.22796630859375, -3.125152587890625, -3.0223388671875, -2.919525146484375, -2.81671142578125, -2.713897705078125, -2.611083984375, -2.508270263671875, -2.40545654296875, -2.302642822265625, -2.1998291015625, -2.097015380859375, -1.99420166015625, -1.891387939453125, -1.78857421875, -1.685760498046875, -1.58294677734375, -1.480133056640625, -1.3773193359375, -1.274505615234375, -1.17169189453125, -1.068878173828125, -0.966064453125, -0.863250732421875, -0.76043701171875, -0.657623291015625, -0.5548095703125, -0.451995849609375, -0.34918212890625, -0.246368408203125, -0.1435546875, -0.040740966796875, 0.06207275390625, 0.164886474609375, 0.2677001953125, 0.370513916015625, 0.47332763671875, 0.576141357421875, 0.678955078125, 0.781768798828125, 0.88458251953125, 0.987396240234375, 1.0902099609375, 1.193023681640625, 1.29583740234375, 1.398651123046875, 1.50146484375, 1.604278564453125, 1.70709228515625, 1.809906005859375, 1.9127197265625, 2.015533447265625, 2.11834716796875, 2.221160888671875, 2.323974609375, 2.426788330078125, 2.52960205078125, 2.632415771484375, 2.7352294921875, 2.838043212890625, 2.94085693359375, 3.043670654296875, 3.146484375]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 5.0, 2.0, 2.0, 6.0, 5.0, 5.0, 7.0, 7.0, 12.0, 10.0, 24.0, 17.0, 29.0, 19.0, 26.0, 23.0, 38.0, 33.0, 41.0, 50.0, 42.0, 34.0, 38.0, 1060.0, 42.0, 41.0, 44.0, 33.0, 47.0, 39.0, 29.0, 30.0, 30.0, 25.0, 22.0, 17.0, 19.0, 12.0, 18.0, 9.0, 9.0, 5.0, 10.0, 4.0, 5.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-8.796875, -8.526611328125, -8.25634765625, -7.986083984375, -7.7158203125, -7.445556640625, -7.17529296875, -6.905029296875, -6.634765625, -6.364501953125, -6.09423828125, -5.823974609375, -5.5537109375, -5.283447265625, -5.01318359375, -4.742919921875, -4.47265625, -4.202392578125, -3.93212890625, -3.661865234375, -3.3916015625, -3.121337890625, -2.85107421875, -2.580810546875, -2.310546875, -2.040283203125, -1.77001953125, -1.499755859375, -1.2294921875, -0.959228515625, -0.68896484375, -0.418701171875, -0.1484375, 0.121826171875, 0.39208984375, 0.662353515625, 0.9326171875, 1.202880859375, 1.47314453125, 1.743408203125, 2.013671875, 2.283935546875, 2.55419921875, 2.824462890625, 3.0947265625, 3.364990234375, 3.63525390625, 3.905517578125, 4.17578125, 4.446044921875, 4.71630859375, 4.986572265625, 5.2568359375, 5.527099609375, 5.79736328125, 6.067626953125, 6.337890625, 6.608154296875, 6.87841796875, 7.148681640625, 7.4189453125, 7.689208984375, 7.95947265625, 8.229736328125, 8.5]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 8.0, 11.0, 29.0, 24.0, 37.0, 69.0, 98.0, 121.0, 231.0, 262.0, 426.0, 610.0, 899.0, 1227.0, 1872.0, 2660.0, 3954.0, 5803.0, 8575.0, 12729.0, 19178.0, 29958.0, 48327.0, 81318.0, 149750.0, 1344090.0, 157821.0, 84834.0, 50155.0, 31038.0, 20021.0, 13237.0, 8846.0, 5952.0, 4087.0, 2785.0, 1892.0, 1325.0, 906.0, 617.0, 426.0, 309.0, 190.0, 152.0, 90.0, 61.0, 46.0, 21.0, 24.0, 14.0, 7.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.599609375, -2.517181396484375, -2.43475341796875, -2.352325439453125, -2.2698974609375, -2.187469482421875, -2.10504150390625, -2.022613525390625, -1.940185546875, -1.857757568359375, -1.77532958984375, -1.692901611328125, -1.6104736328125, -1.528045654296875, -1.44561767578125, -1.363189697265625, -1.28076171875, -1.198333740234375, -1.11590576171875, -1.033477783203125, -0.9510498046875, -0.868621826171875, -0.78619384765625, -0.703765869140625, -0.621337890625, -0.538909912109375, -0.45648193359375, -0.374053955078125, -0.2916259765625, -0.209197998046875, -0.12677001953125, -0.044342041015625, 0.0380859375, 0.120513916015625, 0.20294189453125, 0.285369873046875, 0.3677978515625, 0.450225830078125, 0.53265380859375, 0.615081787109375, 0.697509765625, 0.779937744140625, 0.86236572265625, 0.944793701171875, 1.0272216796875, 1.109649658203125, 1.19207763671875, 1.274505615234375, 1.35693359375, 1.439361572265625, 1.52178955078125, 1.604217529296875, 1.6866455078125, 1.769073486328125, 1.85150146484375, 1.933929443359375, 2.016357421875, 2.098785400390625, 2.18121337890625, 2.263641357421875, 2.3460693359375, 2.428497314453125, 2.51092529296875, 2.593353271484375, 2.67578125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 2.0, 4.0, 3.0, 4.0, 7.0, 4.0, 8.0, 7.0, 14.0, 9.0, 21.0, 26.0, 31.0, 42.0, 39.0, 55.0, 75.0, 75.0, 109.0, 95.0, 76.0, 73.0, 28.0, 43.0, 26.0, 27.0, 16.0, 24.0, 16.0, 16.0, 6.0, 8.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0019216537475585938, -0.0018628090620040894, -0.001803964376449585, -0.0017451196908950806, -0.0016862750053405762, -0.0016274303197860718, -0.0015685856342315674, -0.001509740948677063, -0.0014508962631225586, -0.0013920515775680542, -0.0013332068920135498, -0.0012743622064590454, -0.001215517520904541, -0.0011566728353500366, -0.0010978281497955322, -0.0010389834642410278, -0.0009801387786865234, -0.000921294093132019, -0.0008624494075775146, -0.0008036047220230103, -0.0007447600364685059, -0.0006859153509140015, -0.0006270706653594971, -0.0005682259798049927, -0.0005093812942504883, -0.0004505366086959839, -0.0003916919231414795, -0.0003328472375869751, -0.0002740025520324707, -0.0002151578664779663, -0.00015631318092346191, -9.746849536895752e-05, -3.8623809814453125e-05, 2.022087574005127e-05, 7.906556129455566e-05, 0.00013791024684906006, 0.00019675493240356445, 0.00025559961795806885, 0.00031444430351257324, 0.00037328898906707764, 0.00043213367462158203, 0.0004909783601760864, 0.0005498230457305908, 0.0006086677312850952, 0.0006675124168395996, 0.000726357102394104, 0.0007852017879486084, 0.0008440464735031128, 0.0009028911590576172, 0.0009617358446121216, 0.001020580530166626, 0.0010794252157211304, 0.0011382699012756348, 0.0011971145868301392, 0.0012559592723846436, 0.001314803957939148, 0.0013736486434936523, 0.0014324933290481567, 0.0014913380146026611, 0.0015501827001571655, 0.00160902738571167, 0.0016678720712661743, 0.0017267167568206787, 0.001785561442375183, 0.0018444061279296875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 8.0, 10.0, 12.0, 23.0, 20.0, 24.0, 35.0, 40.0, 82.0, 139.0, 277.0, 636.0, 13382.0, 1029948.0, 2816.0, 510.0, 208.0, 123.0, 62.0, 55.0, 28.0, 19.0, 17.0, 13.0, 14.0, 14.0, 6.0, 2.0, 5.0, 6.0, 3.0, 2.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.04534912109375, -0.043947696685791016, -0.04254627227783203, -0.04114484786987305, -0.03974342346191406, -0.03834199905395508, -0.036940574645996094, -0.03553915023803711, -0.034137725830078125, -0.03273630142211914, -0.031334877014160156, -0.029933452606201172, -0.028532028198242188, -0.027130603790283203, -0.02572917938232422, -0.024327754974365234, -0.02292633056640625, -0.021524906158447266, -0.02012348175048828, -0.018722057342529297, -0.017320632934570312, -0.015919208526611328, -0.014517784118652344, -0.01311635971069336, -0.011714935302734375, -0.01031351089477539, -0.008912086486816406, -0.007510662078857422, -0.0061092376708984375, -0.004707813262939453, -0.0033063888549804688, -0.0019049644470214844, -0.0005035400390625, 0.0008978843688964844, 0.0022993087768554688, 0.003700733184814453, 0.0051021575927734375, 0.006503582000732422, 0.007905006408691406, 0.00930643081665039, 0.010707855224609375, 0.01210927963256836, 0.013510704040527344, 0.014912128448486328, 0.016313552856445312, 0.017714977264404297, 0.01911640167236328, 0.020517826080322266, 0.02191925048828125, 0.023320674896240234, 0.02472209930419922, 0.026123523712158203, 0.027524948120117188, 0.028926372528076172, 0.030327796936035156, 0.03172922134399414, 0.033130645751953125, 0.03453207015991211, 0.035933494567871094, 0.03733491897583008, 0.03873634338378906, 0.04013776779174805, 0.04153919219970703, 0.042940616607666016, 0.044342041015625]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 6.0, 29.0, 91.0, 202.0, 312.0, 233.0, 92.0, 33.0, 11.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0012997663579881191, -0.0012261336669325829, -0.0011525009758770466, -0.0010788682848215103, -0.001005235593765974, -0.0009316029027104378, -0.0008579701534472406, -0.0007843374623917043, -0.000710704771336168, -0.0006370720802806318, -0.0005634393892250955, -0.0004898066399618983, -0.0004161739780101925, -0.00034254128695465624, -0.0002689085667952895, -0.00019527587573975325, -0.00012164318468421698, -4.801048635272309e-05, 2.5622211978770792e-05, 9.925491758622229e-05, 0.00017288760864175856, 0.00024652029969729483, 0.00032015301985666156, 0.00039378571091219783, 0.0004674184019677341, 0.0005410510930232704, 0.0006146837840788066, 0.0006883165333420038, 0.0007619492243975401, 0.0008355819154530764, 0.0009092146065086126, 0.000982847297564149, 0.0010564799886196852, 0.0011301126796752214, 0.0012037453707307577, 0.001277378061786294, 0.0013510107528418303, 0.0014246434438973665, 0.0014982761349529028, 0.001571908826008439, 0.0016455415170639753, 0.0017191742081195116, 0.0017928068991750479, 0.0018664395902305841, 0.0019400722812861204, 0.0020137049723416567, 0.002087337663397193, 0.0021609703544527292, 0.002234603278338909, 0.0023082359693944454, 0.0023818686604499817, 0.002455501351505518, 0.0025291340425610542, 0.0026027667336165905, 0.0026763994246721268, 0.002750032115727663, 0.0028236648067831993, 0.0028972974978387356, 0.002970930188894272, 0.003044562879949808, 0.0031181955710053444, 0.0031918282620608807, 0.003265460953116417, 0.003339093644171953, 0.0034127263352274895]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 7.0, 13.0, 6.0, 10.0, 13.0, 15.0, 12.0, 11.0, 28.0, 16.0, 34.0, 24.0, 42.0, 39.0, 44.0, 46.0, 48.0, 45.0, 51.0, 44.0, 50.0, 48.0, 29.0, 36.0, 38.0, 31.0, 33.0, 33.0, 25.0, 31.0, 21.0, 13.0, 9.0, 19.0, 10.0, 5.0, 6.0, 5.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.0009680390357971191, -0.0009396960958838463, -0.0009113531559705734, -0.0008830102160573006, -0.0008546672761440277, -0.0008263243362307549, -0.000797981396317482, -0.0007696384564042091, -0.0007412955164909363, -0.0007129525765776634, -0.0006846096366643906, -0.0006562666967511177, -0.0006279237568378448, -0.000599580816924572, -0.0005712378770112991, -0.0005428949370980263, -0.0005145519971847534, -0.00048620905727148056, -0.0004578661173582077, -0.00042952317744493484, -0.000401180237531662, -0.00037283729761838913, -0.00034449435770511627, -0.0003161514177918434, -0.00028780847787857056, -0.0002594655379652977, -0.00023112259805202484, -0.00020277965813875198, -0.00017443671822547913, -0.00014609377831220627, -0.00011775083839893341, -8.940789848566055e-05, -6.10649585723877e-05, -3.272201865911484e-05, -4.37907874584198e-06, 2.3963861167430878e-05, 5.2306801080703735e-05, 8.064974099397659e-05, 0.00010899268090724945, 0.0001373356208205223, 0.00016567856073379517, 0.00019402150064706802, 0.00022236444056034088, 0.00025070738047361374, 0.0002790503203868866, 0.00030739326030015945, 0.0003357362002134323, 0.00036407914012670517, 0.00039242208003997803, 0.0004207650199532509, 0.00044910795986652374, 0.0004774508997797966, 0.0005057938396930695, 0.0005341367796063423, 0.0005624797195196152, 0.000590822659432888, 0.0006191655993461609, 0.0006475085392594337, 0.0006758514791727066, 0.0007041944190859795, 0.0007325373589992523, 0.0007608802989125252, 0.000789223238825798, 0.0008175661787390709, 0.0008459091186523438]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 4.0, 6.0, 3.0, 10.0, 12.0, 8.0, 12.0, 16.0, 15.0, 22.0, 27.0, 24.0, 37.0, 31.0, 30.0, 35.0, 43.0, 42.0, 59.0, 49.0, 44.0, 55.0, 39.0, 42.0, 47.0, 29.0, 55.0, 28.0, 17.0, 28.0, 30.0, 20.0, 13.0, 13.0, 10.0, 13.0, 11.0, 6.0, 3.0, 4.0, 4.0, 4.0, 2.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.171875, -14.7176513671875, -14.263427734375, -13.8092041015625, -13.35498046875, -12.9007568359375, -12.446533203125, -11.9923095703125, -11.5380859375, -11.0838623046875, -10.629638671875, -10.1754150390625, -9.72119140625, -9.2669677734375, -8.812744140625, -8.3585205078125, -7.904296875, -7.4500732421875, -6.995849609375, -6.5416259765625, -6.08740234375, -5.6331787109375, -5.178955078125, -4.7247314453125, -4.2705078125, -3.8162841796875, -3.362060546875, -2.9078369140625, -2.45361328125, -1.9993896484375, -1.545166015625, -1.0909423828125, -0.63671875, -0.1824951171875, 0.271728515625, 0.7259521484375, 1.18017578125, 1.6343994140625, 2.088623046875, 2.5428466796875, 2.9970703125, 3.4512939453125, 3.905517578125, 4.3597412109375, 4.81396484375, 5.2681884765625, 5.722412109375, 6.1766357421875, 6.630859375, 7.0850830078125, 7.539306640625, 7.9935302734375, 8.44775390625, 8.9019775390625, 9.356201171875, 9.8104248046875, 10.2646484375, 10.7188720703125, 11.173095703125, 11.6273193359375, 12.08154296875, 12.5357666015625, 12.989990234375, 13.4442138671875, 13.8984375]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 5.0, 7.0, 10.0, 14.0, 13.0, 34.0, 42.0, 72.0, 108.0, 156.0, 316.0, 450.0, 702.0, 1025.0, 1604.0, 2548.0, 4231.0, 6936.0, 12630.0, 23325.0, 46988.0, 106779.0, 282243.0, 325890.0, 121078.0, 52605.0, 25686.0, 13426.0, 7636.0, 4417.0, 2711.0, 1730.0, 1099.0, 700.0, 487.0, 290.0, 224.0, 121.0, 84.0, 52.0, 28.0, 15.0, 18.0, 10.0, 6.0, 7.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.55078125, -6.325439453125, -6.10009765625, -5.874755859375, -5.6494140625, -5.424072265625, -5.19873046875, -4.973388671875, -4.748046875, -4.522705078125, -4.29736328125, -4.072021484375, -3.8466796875, -3.621337890625, -3.39599609375, -3.170654296875, -2.9453125, -2.719970703125, -2.49462890625, -2.269287109375, -2.0439453125, -1.818603515625, -1.59326171875, -1.367919921875, -1.142578125, -0.917236328125, -0.69189453125, -0.466552734375, -0.2412109375, -0.015869140625, 0.20947265625, 0.434814453125, 0.66015625, 0.885498046875, 1.11083984375, 1.336181640625, 1.5615234375, 1.786865234375, 2.01220703125, 2.237548828125, 2.462890625, 2.688232421875, 2.91357421875, 3.138916015625, 3.3642578125, 3.589599609375, 3.81494140625, 4.040283203125, 4.265625, 4.490966796875, 4.71630859375, 4.941650390625, 5.1669921875, 5.392333984375, 5.61767578125, 5.843017578125, 6.068359375, 6.293701171875, 6.51904296875, 6.744384765625, 6.9697265625, 7.195068359375, 7.42041015625, 7.645751953125, 7.87109375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 6.0, 2.0, 1.0, 5.0, 6.0, 8.0, 6.0, 14.0, 12.0, 6.0, 14.0, 21.0, 30.0, 22.0, 35.0, 30.0, 33.0, 35.0, 47.0, 43.0, 64.0, 98.0, 337.0, 1580.0, 137.0, 60.0, 54.0, 54.0, 36.0, 41.0, 35.0, 31.0, 26.0, 24.0, 16.0, 24.0, 17.0, 10.0, 9.0, 3.0, 4.0, 6.0, 9.0, 4.0, 1.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.875, -38.220703125, -36.56640625, -34.912109375, -33.2578125, -31.603515625, -29.94921875, -28.294921875, -26.640625, -24.986328125, -23.33203125, -21.677734375, -20.0234375, -18.369140625, -16.71484375, -15.060546875, -13.40625, -11.751953125, -10.09765625, -8.443359375, -6.7890625, -5.134765625, -3.48046875, -1.826171875, -0.171875, 1.482421875, 3.13671875, 4.791015625, 6.4453125, 8.099609375, 9.75390625, 11.408203125, 13.0625, 14.716796875, 16.37109375, 18.025390625, 19.6796875, 21.333984375, 22.98828125, 24.642578125, 26.296875, 27.951171875, 29.60546875, 31.259765625, 32.9140625, 34.568359375, 36.22265625, 37.876953125, 39.53125, 41.185546875, 42.83984375, 44.494140625, 46.1484375, 47.802734375, 49.45703125, 51.111328125, 52.765625, 54.419921875, 56.07421875, 57.728515625, 59.3828125, 61.037109375, 62.69140625, 64.345703125, 66.0]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 9.0, 7.0, 16.0, 16.0, 13.0, 21.0, 46.0, 52.0, 92.0, 122.0, 169.0, 287.0, 548.0, 2076.0, 2802350.0, 337153.0, 1482.0, 462.0, 277.0, 167.0, 115.0, 63.0, 50.0, 35.0, 20.0, 17.0, 14.0, 10.0, 9.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.375, -138.73828125, -134.1015625, -129.46484375, -124.828125, -120.19140625, -115.5546875, -110.91796875, -106.28125, -101.64453125, -97.0078125, -92.37109375, -87.734375, -83.09765625, -78.4609375, -73.82421875, -69.1875, -64.55078125, -59.9140625, -55.27734375, -50.640625, -46.00390625, -41.3671875, -36.73046875, -32.09375, -27.45703125, -22.8203125, -18.18359375, -13.546875, -8.91015625, -4.2734375, 0.36328125, 5.0, 9.63671875, 14.2734375, 18.91015625, 23.546875, 28.18359375, 32.8203125, 37.45703125, 42.09375, 46.73046875, 51.3671875, 56.00390625, 60.640625, 65.27734375, 69.9140625, 74.55078125, 79.1875, 83.82421875, 88.4609375, 93.09765625, 97.734375, 102.37109375, 107.0078125, 111.64453125, 116.28125, 120.91796875, 125.5546875, 130.19140625, 134.828125, 139.46484375, 144.1015625, 148.73828125, 153.375]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 48.0, 824.0, 150.0], "bins": [-948.1953735351562, -933.05126953125, -917.9071655273438, -902.7630615234375, -887.6189575195312, -872.474853515625, -857.3307495117188, -842.1866455078125, -827.0425415039062, -811.8984375, -796.7543334960938, -781.6102294921875, -766.4661254882812, -751.322021484375, -736.1779174804688, -721.0338134765625, -705.8897705078125, -690.7456665039062, -675.6015625, -660.4574584960938, -645.3133544921875, -630.1692504882812, -615.025146484375, -599.8810424804688, -584.7369384765625, -569.5928344726562, -554.44873046875, -539.3046264648438, -524.1605224609375, -509.01641845703125, -493.872314453125, -478.7282409667969, -463.58416748046875, -448.4400634765625, -433.29595947265625, -418.15185546875, -403.00775146484375, -387.8636474609375, -372.71954345703125, -357.5754699707031, -342.43133544921875, -327.2872314453125, -312.14312744140625, -296.9990234375, -281.85491943359375, -266.7108154296875, -251.5667266845703, -236.42263793945312, -221.27853393554688, -206.13442993164062, -190.99032592773438, -175.84622192382812, -160.70213317871094, -145.5580291748047, -130.41392517089844, -115.26982879638672, -100.125732421875, -84.98162841796875, -69.83753204345703, -54.69342803955078, -39.5493278503418, -24.405227661132812, -9.261123657226562, 5.882972717285156, 21.02707862854004]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 4.0, 6.0, 7.0, 9.0, 6.0, 10.0, 18.0, 14.0, 15.0, 15.0, 18.0, 24.0, 23.0, 27.0, 35.0, 43.0, 31.0, 39.0, 37.0, 38.0, 38.0, 43.0, 49.0, 42.0, 41.0, 31.0, 28.0, 32.0, 27.0, 47.0, 36.0, 26.0, 18.0, 19.0, 21.0, 13.0, 17.0, 10.0, 9.0, 9.0, 6.0, 6.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-140.984619140625, -136.71524047851562, -132.44586181640625, -128.17648315429688, -123.90709686279297, -119.6377182006836, -115.36833953857422, -111.09896087646484, -106.82957458496094, -102.56019592285156, -98.29081726074219, -94.02143859863281, -89.7520523071289, -85.48267364501953, -81.21329498291016, -76.94391632080078, -72.6745376586914, -68.40515899658203, -64.13578033447266, -59.866397857666016, -55.597015380859375, -51.32763671875, -47.058258056640625, -42.78887939453125, -38.51949691772461, -34.250118255615234, -29.980735778808594, -25.71135711669922, -21.44197654724121, -17.172595977783203, -12.903217315673828, -8.63383674621582, -4.3644561767578125, -0.09507608413696289, 4.174304008483887, 8.443683624267578, 12.713064193725586, 16.982444763183594, 21.25182342529297, 25.521203994750977, 29.790584564208984, 34.05996322631836, 38.329345703125, 42.598724365234375, 46.86810302734375, 51.13748550415039, 55.406864166259766, 59.676246643066406, 63.94562530517578, 68.21500396728516, 72.48438262939453, 76.75376892089844, 81.02314758300781, 85.29252624511719, 89.56190490722656, 93.83128356933594, 98.10066223144531, 102.37004089355469, 106.63941955566406, 110.90879821777344, 115.17818450927734, 119.44756317138672, 123.7169418334961, 127.98632049560547, 132.25570678710938]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 7.0, 9.0, 14.0, 13.0, 11.0, 10.0, 26.0, 22.0, 25.0, 29.0, 25.0, 27.0, 33.0, 33.0, 45.0, 43.0, 51.0, 53.0, 40.0, 37.0, 48.0, 43.0, 41.0, 46.0, 30.0, 32.0, 29.0, 30.0, 21.0, 18.0, 14.0, 11.0, 18.0, 9.0, 17.0, 5.0, 6.0, 5.0, 1.0, 8.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.09375, -13.6448974609375, -13.196044921875, -12.7471923828125, -12.29833984375, -11.8494873046875, -11.400634765625, -10.9517822265625, -10.5029296875, -10.0540771484375, -9.605224609375, -9.1563720703125, -8.70751953125, -8.2586669921875, -7.809814453125, -7.3609619140625, -6.912109375, -6.4632568359375, -6.014404296875, -5.5655517578125, -5.11669921875, -4.6678466796875, -4.218994140625, -3.7701416015625, -3.3212890625, -2.8724365234375, -2.423583984375, -1.9747314453125, -1.52587890625, -1.0770263671875, -0.628173828125, -0.1793212890625, 0.26953125, 0.7183837890625, 1.167236328125, 1.6160888671875, 2.06494140625, 2.5137939453125, 2.962646484375, 3.4114990234375, 3.8603515625, 4.3092041015625, 4.758056640625, 5.2069091796875, 5.65576171875, 6.1046142578125, 6.553466796875, 7.0023193359375, 7.451171875, 7.9000244140625, 8.348876953125, 8.7977294921875, 9.24658203125, 9.6954345703125, 10.144287109375, 10.5931396484375, 11.0419921875, 11.4908447265625, 11.939697265625, 12.3885498046875, 12.83740234375, 13.2862548828125, 13.735107421875, 14.1839599609375, 14.6328125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 12.0, 8.0, 13.0, 10.0, 14.0, 17.0, 23.0, 19.0, 35.0, 45.0, 60.0, 77.0, 105.0, 162.0, 241.0, 384.0, 713.0, 1473.0, 3312.0, 9585.0, 38513.0, 197826.0, 925986.0, 1839262.0, 924958.0, 197537.0, 37440.0, 9749.0, 3352.0, 1460.0, 736.0, 354.0, 228.0, 146.0, 104.0, 75.0, 65.0, 42.0, 38.0, 25.0, 18.0, 19.0, 17.0, 6.0, 6.0, 8.0, 2.0, 1.0, 1.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.046875, -16.468994140625, -15.89111328125, -15.313232421875, -14.7353515625, -14.157470703125, -13.57958984375, -13.001708984375, -12.423828125, -11.845947265625, -11.26806640625, -10.690185546875, -10.1123046875, -9.534423828125, -8.95654296875, -8.378662109375, -7.80078125, -7.222900390625, -6.64501953125, -6.067138671875, -5.4892578125, -4.911376953125, -4.33349609375, -3.755615234375, -3.177734375, -2.599853515625, -2.02197265625, -1.444091796875, -0.8662109375, -0.288330078125, 0.28955078125, 0.867431640625, 1.4453125, 2.023193359375, 2.60107421875, 3.178955078125, 3.7568359375, 4.334716796875, 4.91259765625, 5.490478515625, 6.068359375, 6.646240234375, 7.22412109375, 7.802001953125, 8.3798828125, 8.957763671875, 9.53564453125, 10.113525390625, 10.69140625, 11.269287109375, 11.84716796875, 12.425048828125, 13.0029296875, 13.580810546875, 14.15869140625, 14.736572265625, 15.314453125, 15.892333984375, 16.47021484375, 17.048095703125, 17.6259765625, 18.203857421875, 18.78173828125, 19.359619140625, 19.9375]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 19.0, 24.0, 53.0, 94.0, 185.0, 294.0, 591.0, 852.0, 880.0, 496.0, 291.0, 138.0, 65.0, 54.0, 31.0, 11.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.0, -61.02783203125, -59.0556640625, -57.08349609375, -55.111328125, -53.13916015625, -51.1669921875, -49.19482421875, -47.22265625, -45.25048828125, -43.2783203125, -41.30615234375, -39.333984375, -37.36181640625, -35.3896484375, -33.41748046875, -31.4453125, -29.47314453125, -27.5009765625, -25.52880859375, -23.556640625, -21.58447265625, -19.6123046875, -17.64013671875, -15.66796875, -13.69580078125, -11.7236328125, -9.75146484375, -7.779296875, -5.80712890625, -3.8349609375, -1.86279296875, 0.109375, 2.08154296875, 4.0537109375, 6.02587890625, 7.998046875, 9.97021484375, 11.9423828125, 13.91455078125, 15.88671875, 17.85888671875, 19.8310546875, 21.80322265625, 23.775390625, 25.74755859375, 27.7197265625, 29.69189453125, 31.6640625, 33.63623046875, 35.6083984375, 37.58056640625, 39.552734375, 41.52490234375, 43.4970703125, 45.46923828125, 47.44140625, 49.41357421875, 51.3857421875, 53.35791015625, 55.330078125, 57.30224609375, 59.2744140625, 61.24658203125, 63.21875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 3.0, 2.0, 7.0, 7.0, 7.0, 14.0, 15.0, 11.0, 28.0, 44.0, 34.0, 52.0, 69.0, 104.0, 146.0, 285.0, 462.0, 1174.0, 38373.0, 4135168.0, 15927.0, 1061.0, 441.0, 241.0, 168.0, 110.0, 87.0, 61.0, 37.0, 37.0, 26.0, 16.0, 14.0, 17.0, 12.0, 11.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-144.875, -139.953125, -135.03125, -130.109375, -125.1875, -120.265625, -115.34375, -110.421875, -105.5, -100.578125, -95.65625, -90.734375, -85.8125, -80.890625, -75.96875, -71.046875, -66.125, -61.203125, -56.28125, -51.359375, -46.4375, -41.515625, -36.59375, -31.671875, -26.75, -21.828125, -16.90625, -11.984375, -7.0625, -2.140625, 2.78125, 7.703125, 12.625, 17.546875, 22.46875, 27.390625, 32.3125, 37.234375, 42.15625, 47.078125, 52.0, 56.921875, 61.84375, 66.765625, 71.6875, 76.609375, 81.53125, 86.453125, 91.375, 96.296875, 101.21875, 106.140625, 111.0625, 115.984375, 120.90625, 125.828125, 130.75, 135.671875, 140.59375, 145.515625, 150.4375, 155.359375, 160.28125, 165.203125, 170.125]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 12.0, 15.0, 28.0, 28.0, 38.0, 76.0, 72.0, 82.0, 111.0, 101.0, 95.0, 94.0, 75.0, 56.0, 47.0, 30.0, 18.0, 12.0, 5.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.92813110351562, -102.66979217529297, -99.41145324707031, -96.15310668945312, -92.89476776123047, -89.63642883300781, -86.37808990478516, -83.1197509765625, -79.86140441894531, -76.60306549072266, -73.3447265625, -70.08638000488281, -66.82804107666016, -63.5697021484375, -60.311363220214844, -57.05302429199219, -53.79468536376953, -50.536346435546875, -47.27800369262695, -44.0196647644043, -40.761322021484375, -37.50298309326172, -34.24464416503906, -30.986303329467773, -27.727962493896484, -24.469621658325195, -21.211280822753906, -17.95294189453125, -14.694601058959961, -11.436260223388672, -8.177921295166016, -4.919580459594727, -1.6612396240234375, 1.5971007347106934, 4.855441093444824, 8.113780975341797, 11.372121810913086, 14.630462646484375, 17.88880157470703, 21.14714241027832, 24.40548324584961, 27.6638240814209, 30.922164916992188, 34.180503845214844, 37.4388427734375, 40.69718551635742, 43.95552444458008, 47.2138671875, 50.472206115722656, 53.73054504394531, 56.988887786865234, 60.24722671508789, 63.50556945800781, 66.76390838623047, 70.02224731445312, 73.28058624267578, 76.53892517089844, 79.7972640991211, 83.05560302734375, 86.31394958496094, 89.5722885131836, 92.83062744140625, 96.0889663696289, 99.34730529785156, 102.60565185546875]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 7.0, 4.0, 8.0, 13.0, 13.0, 20.0, 16.0, 12.0, 25.0, 27.0, 31.0, 25.0, 33.0, 32.0, 39.0, 40.0, 37.0, 50.0, 40.0, 44.0, 41.0, 40.0, 40.0, 37.0, 35.0, 33.0, 33.0, 33.0, 30.0, 29.0, 19.0, 18.0, 17.0, 14.0, 17.0, 12.0, 10.0, 9.0, 5.0, 2.0, 4.0, 7.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-119.36882019042969, -115.9427719116211, -112.51671600341797, -109.09066772460938, -105.66461944580078, -102.23857116699219, -98.81251525878906, -95.38646697998047, -91.96041870117188, -88.53437042236328, -85.10831451416016, -81.68226623535156, -78.25621795654297, -74.83016967773438, -71.40411376953125, -67.97806549072266, -64.55201721191406, -61.1259651184082, -57.69991683959961, -54.27386474609375, -50.847816467285156, -47.4217643737793, -43.99571228027344, -40.569664001464844, -37.14360809326172, -33.71755599975586, -30.291507720947266, -26.865455627441406, -23.439407348632812, -20.013355255126953, -16.587305068969727, -13.1612548828125, -9.735206604003906, -6.30915641784668, -2.883105754852295, 0.5429449081420898, 3.9689950942993164, 7.395046234130859, 10.821096420288086, 14.247146606445312, 17.67319679260254, 21.099246978759766, 24.525297164916992, 27.95134735107422, 31.377399444580078, 34.80345153808594, 38.22949981689453, 41.655548095703125, 45.081600189208984, 48.507652282714844, 51.93370056152344, 55.3597526550293, 58.78580093383789, 62.21185302734375, 65.63790130615234, 69.06394958496094, 72.49000549316406, 75.91605377197266, 79.34210968017578, 82.76815795898438, 86.19420623779297, 89.62025451660156, 93.04631042480469, 96.47235870361328, 99.89840698242188]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 9.0, 14.0, 7.0, 6.0, 15.0, 15.0, 24.0, 22.0, 27.0, 25.0, 30.0, 30.0, 40.0, 35.0, 26.0, 37.0, 40.0, 56.0, 56.0, 44.0, 43.0, 37.0, 24.0, 41.0, 42.0, 32.0, 25.0, 27.0, 24.0, 18.0, 15.0, 16.0, 17.0, 12.0, 10.0, 6.0, 9.0, 7.0, 7.0, 3.0, 2.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.5, -13.07080078125, -12.6416015625, -12.21240234375, -11.783203125, -11.35400390625, -10.9248046875, -10.49560546875, -10.06640625, -9.63720703125, -9.2080078125, -8.77880859375, -8.349609375, -7.92041015625, -7.4912109375, -7.06201171875, -6.6328125, -6.20361328125, -5.7744140625, -5.34521484375, -4.916015625, -4.48681640625, -4.0576171875, -3.62841796875, -3.19921875, -2.77001953125, -2.3408203125, -1.91162109375, -1.482421875, -1.05322265625, -0.6240234375, -0.19482421875, 0.234375, 0.66357421875, 1.0927734375, 1.52197265625, 1.951171875, 2.38037109375, 2.8095703125, 3.23876953125, 3.66796875, 4.09716796875, 4.5263671875, 4.95556640625, 5.384765625, 5.81396484375, 6.2431640625, 6.67236328125, 7.1015625, 7.53076171875, 7.9599609375, 8.38916015625, 8.818359375, 9.24755859375, 9.6767578125, 10.10595703125, 10.53515625, 10.96435546875, 11.3935546875, 11.82275390625, 12.251953125, 12.68115234375, 13.1103515625, 13.53955078125, 13.96875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 3.0, 9.0, 17.0, 14.0, 28.0, 46.0, 52.0, 66.0, 102.0, 138.0, 206.0, 318.0, 434.0, 633.0, 855.0, 1169.0, 1786.0, 2606.0, 3738.0, 5489.0, 8123.0, 12011.0, 18526.0, 28477.0, 45665.0, 74153.0, 138274.0, 349647.0, 145530.0, 76556.0, 46721.0, 29302.0, 19123.0, 12419.0, 8349.0, 5618.0, 3731.0, 2631.0, 1819.0, 1246.0, 870.0, 637.0, 414.0, 325.0, 196.0, 141.0, 98.0, 72.0, 59.0, 40.0, 26.0, 18.0, 23.0, 6.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-2.943359375, -2.850006103515625, -2.75665283203125, -2.663299560546875, -2.5699462890625, -2.476593017578125, -2.38323974609375, -2.289886474609375, -2.196533203125, -2.103179931640625, -2.00982666015625, -1.916473388671875, -1.8231201171875, -1.729766845703125, -1.63641357421875, -1.543060302734375, -1.44970703125, -1.356353759765625, -1.26300048828125, -1.169647216796875, -1.0762939453125, -0.982940673828125, -0.88958740234375, -0.796234130859375, -0.702880859375, -0.609527587890625, -0.51617431640625, -0.422821044921875, -0.3294677734375, -0.236114501953125, -0.14276123046875, -0.049407958984375, 0.0439453125, 0.137298583984375, 0.23065185546875, 0.324005126953125, 0.4173583984375, 0.510711669921875, 0.60406494140625, 0.697418212890625, 0.790771484375, 0.884124755859375, 0.97747802734375, 1.070831298828125, 1.1641845703125, 1.257537841796875, 1.35089111328125, 1.444244384765625, 1.53759765625, 1.630950927734375, 1.72430419921875, 1.817657470703125, 1.9110107421875, 2.004364013671875, 2.09771728515625, 2.191070556640625, 2.284423828125, 2.377777099609375, 2.47113037109375, 2.564483642578125, 2.6578369140625, 2.751190185546875, 2.84454345703125, 2.937896728515625, 3.03125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 2.0, 6.0, 2.0, 4.0, 11.0, 4.0, 7.0, 7.0, 15.0, 21.0, 16.0, 22.0, 24.0, 19.0, 31.0, 39.0, 35.0, 48.0, 35.0, 37.0, 44.0, 49.0, 40.0, 1074.0, 41.0, 36.0, 32.0, 38.0, 41.0, 32.0, 28.0, 31.0, 27.0, 24.0, 16.0, 11.0, 14.0, 22.0, 15.0, 9.0, 8.0, 4.0, 5.0, 3.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.266357421875, -8.97802734375, -8.689697265625, -8.4013671875, -8.113037109375, -7.82470703125, -7.536376953125, -7.248046875, -6.959716796875, -6.67138671875, -6.383056640625, -6.0947265625, -5.806396484375, -5.51806640625, -5.229736328125, -4.94140625, -4.653076171875, -4.36474609375, -4.076416015625, -3.7880859375, -3.499755859375, -3.21142578125, -2.923095703125, -2.634765625, -2.346435546875, -2.05810546875, -1.769775390625, -1.4814453125, -1.193115234375, -0.90478515625, -0.616455078125, -0.328125, -0.039794921875, 0.24853515625, 0.536865234375, 0.8251953125, 1.113525390625, 1.40185546875, 1.690185546875, 1.978515625, 2.266845703125, 2.55517578125, 2.843505859375, 3.1318359375, 3.420166015625, 3.70849609375, 3.996826171875, 4.28515625, 4.573486328125, 4.86181640625, 5.150146484375, 5.4384765625, 5.726806640625, 6.01513671875, 6.303466796875, 6.591796875, 6.880126953125, 7.16845703125, 7.456787109375, 7.7451171875, 8.033447265625, 8.32177734375, 8.610107421875, 8.8984375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 3.0, 6.0, 10.0, 9.0, 13.0, 30.0, 39.0, 57.0, 86.0, 148.0, 191.0, 295.0, 480.0, 685.0, 990.0, 1504.0, 2267.0, 3175.0, 4925.0, 7145.0, 11034.0, 16519.0, 25744.0, 41245.0, 68066.0, 119360.0, 1332881.0, 202597.0, 98606.0, 57678.0, 35399.0, 22409.0, 14455.0, 9600.0, 6297.0, 4315.0, 2943.0, 1909.0, 1376.0, 874.0, 559.0, 405.0, 263.0, 174.0, 127.0, 91.0, 63.0, 30.0, 26.0, 17.0, 10.0, 4.0, 3.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.705078125, -2.61737060546875, -2.5296630859375, -2.44195556640625, -2.354248046875, -2.26654052734375, -2.1788330078125, -2.09112548828125, -2.00341796875, -1.91571044921875, -1.8280029296875, -1.74029541015625, -1.652587890625, -1.56488037109375, -1.4771728515625, -1.38946533203125, -1.3017578125, -1.21405029296875, -1.1263427734375, -1.03863525390625, -0.950927734375, -0.86322021484375, -0.7755126953125, -0.68780517578125, -0.60009765625, -0.51239013671875, -0.4246826171875, -0.33697509765625, -0.249267578125, -0.16156005859375, -0.0738525390625, 0.01385498046875, 0.1015625, 0.18927001953125, 0.2769775390625, 0.36468505859375, 0.452392578125, 0.54010009765625, 0.6278076171875, 0.71551513671875, 0.80322265625, 0.89093017578125, 0.9786376953125, 1.06634521484375, 1.154052734375, 1.24176025390625, 1.3294677734375, 1.41717529296875, 1.5048828125, 1.59259033203125, 1.6802978515625, 1.76800537109375, 1.855712890625, 1.94342041015625, 2.0311279296875, 2.11883544921875, 2.20654296875, 2.29425048828125, 2.3819580078125, 2.46966552734375, 2.557373046875, 2.64508056640625, 2.7327880859375, 2.82049560546875, 2.908203125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 4.0, 8.0, 8.0, 9.0, 10.0, 13.0, 15.0, 15.0, 22.0, 28.0, 28.0, 40.0, 49.0, 82.0, 73.0, 66.0, 94.0, 79.0, 66.0, 56.0, 43.0, 39.0, 27.0, 29.0, 17.0, 8.0, 13.0, 11.0, 10.0, 7.0, 10.0, 4.0, 6.0, 5.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.002017974853515625, -0.001955181360244751, -0.001892387866973877, -0.001829594373703003, -0.001766800880432129, -0.0017040073871612549, -0.0016412138938903809, -0.0015784204006195068, -0.0015156269073486328, -0.0014528334140777588, -0.0013900399208068848, -0.0013272464275360107, -0.0012644529342651367, -0.0012016594409942627, -0.0011388659477233887, -0.0010760724544525146, -0.0010132789611816406, -0.0009504854679107666, -0.0008876919746398926, -0.0008248984813690186, -0.0007621049880981445, -0.0006993114948272705, -0.0006365180015563965, -0.0005737245082855225, -0.0005109310150146484, -0.0004481375217437744, -0.0003853440284729004, -0.00032255053520202637, -0.00025975704193115234, -0.00019696354866027832, -0.0001341700553894043, -7.137656211853027e-05, -8.58306884765625e-06, 5.4210424423217773e-05, 0.0001170039176940918, 0.00017979741096496582, 0.00024259090423583984, 0.00030538439750671387, 0.0003681778907775879, 0.0004309713840484619, 0.0004937648773193359, 0.00055655837059021, 0.000619351863861084, 0.000682145357131958, 0.000744938850402832, 0.0008077323436737061, 0.0008705258369445801, 0.0009333193302154541, 0.0009961128234863281, 0.0010589063167572021, 0.0011216998100280762, 0.0011844933032989502, 0.0012472867965698242, 0.0013100802898406982, 0.0013728737831115723, 0.0014356672763824463, 0.0014984607696533203, 0.0015612542629241943, 0.0016240477561950684, 0.0016868412494659424, 0.0017496347427368164, 0.0018124282360076904, 0.0018752217292785645, 0.0019380152225494385, 0.0020008087158203125]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 2.0, 3.0, 4.0, 3.0, 8.0, 9.0, 9.0, 11.0, 13.0, 17.0, 19.0, 34.0, 42.0, 56.0, 118.0, 224.0, 647.0, 50917.0, 994637.0, 1105.0, 296.0, 136.0, 62.0, 54.0, 36.0, 18.0, 17.0, 18.0, 13.0, 9.0, 7.0, 5.0, 5.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05755615234375, -0.05576658248901367, -0.053977012634277344, -0.052187442779541016, -0.05039787292480469, -0.04860830307006836, -0.04681873321533203, -0.0450291633605957, -0.043239593505859375, -0.04145002365112305, -0.03966045379638672, -0.03787088394165039, -0.03608131408691406, -0.034291744232177734, -0.032502174377441406, -0.030712604522705078, -0.02892303466796875, -0.027133464813232422, -0.025343894958496094, -0.023554325103759766, -0.021764755249023438, -0.01997518539428711, -0.01818561553955078, -0.016396045684814453, -0.014606475830078125, -0.012816905975341797, -0.011027336120605469, -0.00923776626586914, -0.0074481964111328125, -0.005658626556396484, -0.0038690567016601562, -0.002079486846923828, -0.0002899169921875, 0.0014996528625488281, 0.0032892227172851562, 0.005078792572021484, 0.0068683624267578125, 0.00865793228149414, 0.010447502136230469, 0.012237071990966797, 0.014026641845703125, 0.015816211700439453, 0.01760578155517578, 0.01939535140991211, 0.021184921264648438, 0.022974491119384766, 0.024764060974121094, 0.026553630828857422, 0.02834320068359375, 0.030132770538330078, 0.031922340393066406, 0.033711910247802734, 0.03550148010253906, 0.03729104995727539, 0.03908061981201172, 0.04087018966674805, 0.042659759521484375, 0.0444493293762207, 0.04623889923095703, 0.04802846908569336, 0.04981803894042969, 0.051607608795166016, 0.053397178649902344, 0.05518674850463867, 0.056976318359375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 10.0, 28.0, 36.0, 80.0, 102.0, 165.0, 152.0, 165.0, 115.0, 69.0, 49.0, 20.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00137315783649683, -0.0013283267617225647, -0.0012834956869482994, -0.0012386646121740341, -0.0011938335373997688, -0.0011490023462101817, -0.0011041712714359164, -0.0010593401966616511, -0.0010145091218873858, -0.0009696780471131206, -0.0009248469723388553, -0.0008800158393569291, -0.0008351847645826638, -0.0007903536898083985, -0.0007455225568264723, -0.000700691482052207, -0.0006558604072779417, -0.0006110293325036764, -0.0005661982577294111, -0.0005213671247474849, -0.00047653604997321963, -0.00043170497519895434, -0.0003868738713208586, -0.00034204276744276285, -0.00029721169266849756, -0.0002523806178942323, -0.00020754951401613653, -0.000162718424689956, -0.00011788733536377549, -7.305624603759497e-05, -2.8225156711414456e-05, 1.660594716668129e-05, 6.14371383562684e-05, 0.00010626822768244892, 0.00015109931700862944, 0.00019593040633480996, 0.00024076149566099048, 0.00028559257043525577, 0.0003304236743133515, 0.00037525477819144726, 0.00042008585296571255, 0.00046491692773997784, 0.0005097480025142431, 0.0005545791354961693, 0.0005994102102704346, 0.0006442412850446999, 0.0006890724180266261, 0.0007339034928008914, 0.0007787345675751567, 0.000823565642349422, 0.0008683967171236873, 0.0009132278501056135, 0.0009580589248798788, 0.001002890057861805, 0.0010477211326360703, 0.0010925522074103355, 0.0011373832821846008, 0.0011822143569588661, 0.0012270454317331314, 0.0012718765065073967, 0.001316707581281662, 0.001361538772471249, 0.0014063698472455144, 0.0014512009220197797, 0.001496031996794045]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 2.0, 1.0, 2.0, 6.0, 6.0, 3.0, 10.0, 8.0, 12.0, 9.0, 13.0, 12.0, 17.0, 22.0, 31.0, 26.0, 23.0, 30.0, 35.0, 26.0, 37.0, 43.0, 48.0, 40.0, 38.0, 32.0, 38.0, 45.0, 33.0, 40.0, 29.0, 24.0, 37.0, 37.0, 26.0, 28.0, 15.0, 24.0, 14.0, 19.0, 12.0, 17.0, 11.0, 4.0, 10.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0007970333099365234, -0.000768955796957016, -0.0007408782839775085, -0.0007128007709980011, -0.0006847232580184937, -0.0006566457450389862, -0.0006285682320594788, -0.0006004907190799713, -0.0005724132061004639, -0.0005443356931209564, -0.000516258180141449, -0.00048818066716194153, -0.0004601031541824341, -0.00043202564120292664, -0.0004039481282234192, -0.00037587061524391174, -0.0003477931022644043, -0.00031971558928489685, -0.0002916380763053894, -0.00026356056332588196, -0.0002354830503463745, -0.00020740553736686707, -0.00017932802438735962, -0.00015125051140785217, -0.00012317299842834473, -9.509548544883728e-05, -6.701797246932983e-05, -3.894045948982239e-05, -1.0862946510314941e-05, 1.7214566469192505e-05, 4.529207944869995e-05, 7.33695924282074e-05, 0.00010144710540771484, 0.0001295246183872223, 0.00015760213136672974, 0.00018567964434623718, 0.00021375715732574463, 0.00024183467030525208, 0.0002699121832847595, 0.00029798969626426697, 0.0003260672092437744, 0.00035414472222328186, 0.0003822222352027893, 0.00041029974818229675, 0.0004383772611618042, 0.00046645477414131165, 0.0004945322871208191, 0.0005226098001003265, 0.000550687313079834, 0.0005787648260593414, 0.0006068423390388489, 0.0006349198520183563, 0.0006629973649978638, 0.0006910748779773712, 0.0007191523909568787, 0.0007472299039363861, 0.0007753074169158936, 0.000803384929895401, 0.0008314624428749084, 0.0008595399558544159, 0.0008876174688339233, 0.0009156949818134308, 0.0009437724947929382, 0.0009718500077724457, 0.0009999275207519531]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 4.0, 6.0, 8.0, 9.0, 14.0, 7.0, 6.0, 15.0, 15.0, 24.0, 22.0, 27.0, 25.0, 30.0, 30.0, 40.0, 35.0, 26.0, 37.0, 40.0, 56.0, 56.0, 44.0, 43.0, 37.0, 24.0, 41.0, 41.0, 33.0, 25.0, 27.0, 24.0, 18.0, 15.0, 16.0, 17.0, 12.0, 10.0, 6.0, 9.0, 7.0, 7.0, 3.0, 2.0, 3.0, 0.0, 5.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-13.5, -13.07080078125, -12.6416015625, -12.21240234375, -11.783203125, -11.35400390625, -10.9248046875, -10.49560546875, -10.06640625, -9.63720703125, -9.2080078125, -8.77880859375, -8.349609375, -7.92041015625, -7.4912109375, -7.06201171875, -6.6328125, -6.20361328125, -5.7744140625, -5.34521484375, -4.916015625, -4.48681640625, -4.0576171875, -3.62841796875, -3.19921875, -2.77001953125, -2.3408203125, -1.91162109375, -1.482421875, -1.05322265625, -0.6240234375, -0.19482421875, 0.234375, 0.66357421875, 1.0927734375, 1.52197265625, 1.951171875, 2.38037109375, 2.8095703125, 3.23876953125, 3.66796875, 4.09716796875, 4.5263671875, 4.95556640625, 5.384765625, 5.81396484375, 6.2431640625, 6.67236328125, 7.1015625, 7.53076171875, 7.9599609375, 8.38916015625, 8.818359375, 9.24755859375, 9.6767578125, 10.10595703125, 10.53515625, 10.96435546875, 11.3935546875, 11.82275390625, 12.251953125, 12.68115234375, 13.1103515625, 13.53955078125, 13.96875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 7.0, 15.0, 15.0, 16.0, 32.0, 21.0, 49.0, 41.0, 70.0, 90.0, 134.0, 174.0, 269.0, 408.0, 661.0, 1048.0, 1993.0, 3733.0, 7391.0, 15184.0, 32719.0, 71950.0, 171142.0, 347766.0, 221623.0, 92504.0, 40874.0, 19069.0, 9120.0, 4548.0, 2374.0, 1292.0, 726.0, 451.0, 283.0, 184.0, 152.0, 105.0, 68.0, 62.0, 48.0, 39.0, 23.0, 21.0, 13.0, 13.0, 9.0, 9.0, 3.0, 2.0, 6.0, 2.0, 1.0, 2.0, 2.0], "bins": [-8.484375, -8.2244873046875, -7.964599609375, -7.7047119140625, -7.44482421875, -7.1849365234375, -6.925048828125, -6.6651611328125, -6.4052734375, -6.1453857421875, -5.885498046875, -5.6256103515625, -5.36572265625, -5.1058349609375, -4.845947265625, -4.5860595703125, -4.326171875, -4.0662841796875, -3.806396484375, -3.5465087890625, -3.28662109375, -3.0267333984375, -2.766845703125, -2.5069580078125, -2.2470703125, -1.9871826171875, -1.727294921875, -1.4674072265625, -1.20751953125, -0.9476318359375, -0.687744140625, -0.4278564453125, -0.16796875, 0.0919189453125, 0.351806640625, 0.6116943359375, 0.87158203125, 1.1314697265625, 1.391357421875, 1.6512451171875, 1.9111328125, 2.1710205078125, 2.430908203125, 2.6907958984375, 2.95068359375, 3.2105712890625, 3.470458984375, 3.7303466796875, 3.990234375, 4.2501220703125, 4.510009765625, 4.7698974609375, 5.02978515625, 5.2896728515625, 5.549560546875, 5.8094482421875, 6.0693359375, 6.3292236328125, 6.589111328125, 6.8489990234375, 7.10888671875, 7.3687744140625, 7.628662109375, 7.8885498046875, 8.1484375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 5.0, 3.0, 8.0, 5.0, 6.0, 8.0, 9.0, 12.0, 10.0, 9.0, 17.0, 19.0, 32.0, 27.0, 39.0, 38.0, 43.0, 51.0, 78.0, 127.0, 1797.0, 234.0, 85.0, 54.0, 53.0, 40.0, 60.0, 23.0, 29.0, 31.0, 17.0, 24.0, 12.0, 11.0, 16.0, 9.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-71.375, -69.37158203125, -67.3681640625, -65.36474609375, -63.361328125, -61.35791015625, -59.3544921875, -57.35107421875, -55.34765625, -53.34423828125, -51.3408203125, -49.33740234375, -47.333984375, -45.33056640625, -43.3271484375, -41.32373046875, -39.3203125, -37.31689453125, -35.3134765625, -33.31005859375, -31.306640625, -29.30322265625, -27.2998046875, -25.29638671875, -23.29296875, -21.28955078125, -19.2861328125, -17.28271484375, -15.279296875, -13.27587890625, -11.2724609375, -9.26904296875, -7.265625, -5.26220703125, -3.2587890625, -1.25537109375, 0.748046875, 2.75146484375, 4.7548828125, 6.75830078125, 8.76171875, 10.76513671875, 12.7685546875, 14.77197265625, 16.775390625, 18.77880859375, 20.7822265625, 22.78564453125, 24.7890625, 26.79248046875, 28.7958984375, 30.79931640625, 32.802734375, 34.80615234375, 36.8095703125, 38.81298828125, 40.81640625, 42.81982421875, 44.8232421875, 46.82666015625, 48.830078125, 50.83349609375, 52.8369140625, 54.84033203125, 56.84375]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 6.0, 7.0, 11.0, 16.0, 15.0, 14.0, 27.0, 20.0, 48.0, 70.0, 79.0, 136.0, 160.0, 234.0, 412.0, 849.0, 18009.0, 3119009.0, 4869.0, 679.0, 308.0, 203.0, 141.0, 88.0, 66.0, 62.0, 44.0, 30.0, 21.0, 11.0, 17.0, 8.0, 12.0, 4.0, 7.0, 9.0, 3.0, 3.0, 2.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-128.375, -123.8515625, -119.328125, -114.8046875, -110.28125, -105.7578125, -101.234375, -96.7109375, -92.1875, -87.6640625, -83.140625, -78.6171875, -74.09375, -69.5703125, -65.046875, -60.5234375, -56.0, -51.4765625, -46.953125, -42.4296875, -37.90625, -33.3828125, -28.859375, -24.3359375, -19.8125, -15.2890625, -10.765625, -6.2421875, -1.71875, 2.8046875, 7.328125, 11.8515625, 16.375, 20.8984375, 25.421875, 29.9453125, 34.46875, 38.9921875, 43.515625, 48.0390625, 52.5625, 57.0859375, 61.609375, 66.1328125, 70.65625, 75.1796875, 79.703125, 84.2265625, 88.75, 93.2734375, 97.796875, 102.3203125, 106.84375, 111.3671875, 115.890625, 120.4140625, 124.9375, 129.4609375, 133.984375, 138.5078125, 143.03125, 147.5546875, 152.078125, 156.6015625, 161.125]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 56.0, 664.0, 286.0, 11.0], "bins": [-589.8202514648438, -580.2631225585938, -570.7059326171875, -561.1488037109375, -551.5916748046875, -542.0344848632812, -532.4773559570312, -522.9202270507812, -513.363037109375, -503.8058776855469, -494.2487487792969, -484.69158935546875, -475.1344299316406, -465.5773010253906, -456.0201416015625, -446.4630126953125, -436.9058837890625, -427.3487243652344, -417.7915954589844, -408.23443603515625, -398.6772766113281, -389.1201477050781, -379.56298828125, -370.005859375, -360.44866943359375, -350.8915100097656, -341.3343811035156, -331.7772216796875, -322.2200622558594, -312.6629333496094, -303.10577392578125, -293.54864501953125, -283.9914855957031, -274.434326171875, -264.877197265625, -255.32003784179688, -245.7628936767578, -236.20574951171875, -226.64859008789062, -217.09144592285156, -207.5343017578125, -197.97715759277344, -188.4199981689453, -178.86285400390625, -169.3057098388672, -159.74856567382812, -150.19140625, -140.63426208496094, -131.07711791992188, -121.51996612548828, -111.96282196044922, -102.40567016601562, -92.84852600097656, -83.29137420654297, -73.73422241210938, -64.17707824707031, -54.61992645263672, -45.06277847290039, -35.50563049316406, -25.94847869873047, -16.39133071899414, -6.8341827392578125, 2.7229690551757812, 12.280113220214844, 21.83726692199707]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 5.0, 6.0, 5.0, 3.0, 13.0, 10.0, 11.0, 18.0, 18.0, 23.0, 31.0, 25.0, 41.0, 33.0, 36.0, 32.0, 50.0, 41.0, 45.0, 47.0, 34.0, 41.0, 47.0, 44.0, 36.0, 42.0, 39.0, 28.0, 29.0, 23.0, 24.0, 25.0, 24.0, 15.0, 9.0, 14.0, 7.0, 7.0, 5.0, 3.0, 3.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.65896606445312, -125.3544692993164, -121.04997253417969, -116.74547576904297, -112.44097900390625, -108.13648223876953, -103.83198547363281, -99.52749633789062, -95.22299194335938, -90.91849517822266, -86.61399841308594, -82.30950164794922, -78.0050048828125, -73.70050811767578, -69.39601135253906, -65.09152221679688, -60.787025451660156, -56.48252868652344, -52.17803192138672, -47.87353515625, -43.56903839111328, -39.26454162597656, -34.96004867553711, -30.65555191040039, -26.351055145263672, -22.046558380126953, -17.742061614990234, -13.437566757202148, -9.13306999206543, -4.828573226928711, -0.524078369140625, 3.7804183959960938, 8.084915161132812, 12.389411926269531, 16.69390869140625, 20.998403549194336, 25.302900314331055, 29.607397079467773, 33.91189193725586, 38.21638870239258, 42.5208854675293, 46.825382232666016, 51.129878997802734, 55.43437194824219, 59.738868713378906, 64.04336547851562, 68.34786224365234, 72.65235900878906, 76.95685577392578, 81.2613525390625, 85.56584930419922, 89.87034606933594, 94.17484283447266, 98.47933959960938, 102.78382873535156, 107.08833312988281, 111.392822265625, 115.69731903076172, 120.00181579589844, 124.30631256103516, 128.61080932617188, 132.91529846191406, 137.2198028564453, 141.5242919921875, 145.82879638671875]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 11.0, 7.0, 8.0, 12.0, 7.0, 12.0, 13.0, 20.0, 20.0, 26.0, 20.0, 21.0, 35.0, 27.0, 32.0, 33.0, 34.0, 41.0, 50.0, 50.0, 41.0, 42.0, 46.0, 41.0, 32.0, 35.0, 32.0, 34.0, 33.0, 26.0, 25.0, 18.0, 18.0, 14.0, 8.0, 14.0, 11.0, 11.0, 7.0, 4.0, 10.0, 5.0, 3.0, 2.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-13.6015625, -13.169189453125, -12.73681640625, -12.304443359375, -11.8720703125, -11.439697265625, -11.00732421875, -10.574951171875, -10.142578125, -9.710205078125, -9.27783203125, -8.845458984375, -8.4130859375, -7.980712890625, -7.54833984375, -7.115966796875, -6.68359375, -6.251220703125, -5.81884765625, -5.386474609375, -4.9541015625, -4.521728515625, -4.08935546875, -3.656982421875, -3.224609375, -2.792236328125, -2.35986328125, -1.927490234375, -1.4951171875, -1.062744140625, -0.63037109375, -0.197998046875, 0.234375, 0.666748046875, 1.09912109375, 1.531494140625, 1.9638671875, 2.396240234375, 2.82861328125, 3.260986328125, 3.693359375, 4.125732421875, 4.55810546875, 4.990478515625, 5.4228515625, 5.855224609375, 6.28759765625, 6.719970703125, 7.15234375, 7.584716796875, 8.01708984375, 8.449462890625, 8.8818359375, 9.314208984375, 9.74658203125, 10.178955078125, 10.611328125, 11.043701171875, 11.47607421875, 11.908447265625, 12.3408203125, 12.773193359375, 13.20556640625, 13.637939453125, 14.0703125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 5.0, 8.0, 7.0, 10.0, 11.0, 9.0, 24.0, 19.0, 28.0, 25.0, 31.0, 50.0, 46.0, 93.0, 140.0, 253.0, 745.0, 5651.0, 245221.0, 3676762.0, 257957.0, 5617.0, 789.0, 234.0, 146.0, 90.0, 71.0, 45.0, 21.0, 35.0, 20.0, 16.0, 23.0, 14.0, 8.0, 10.0, 5.0, 10.0, 9.0, 3.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-57.25, -55.48876953125, -53.7275390625, -51.96630859375, -50.205078125, -48.44384765625, -46.6826171875, -44.92138671875, -43.16015625, -41.39892578125, -39.6376953125, -37.87646484375, -36.115234375, -34.35400390625, -32.5927734375, -30.83154296875, -29.0703125, -27.30908203125, -25.5478515625, -23.78662109375, -22.025390625, -20.26416015625, -18.5029296875, -16.74169921875, -14.98046875, -13.21923828125, -11.4580078125, -9.69677734375, -7.935546875, -6.17431640625, -4.4130859375, -2.65185546875, -0.890625, 0.87060546875, 2.6318359375, 4.39306640625, 6.154296875, 7.91552734375, 9.6767578125, 11.43798828125, 13.19921875, 14.96044921875, 16.7216796875, 18.48291015625, 20.244140625, 22.00537109375, 23.7666015625, 25.52783203125, 27.2890625, 29.05029296875, 30.8115234375, 32.57275390625, 34.333984375, 36.09521484375, 37.8564453125, 39.61767578125, 41.37890625, 43.14013671875, 44.9013671875, 46.66259765625, 48.423828125, 50.18505859375, 51.9462890625, 53.70751953125, 55.46875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 7.0, 16.0, 12.0, 21.0, 37.0, 53.0, 69.0, 128.0, 179.0, 280.0, 433.0, 586.0, 687.0, 554.0, 361.0, 231.0, 149.0, 101.0, 60.0, 40.0, 32.0, 13.0, 13.0, 9.0, 5.0, 4.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-53.84375, -52.505615234375, -51.16748046875, -49.829345703125, -48.4912109375, -47.153076171875, -45.81494140625, -44.476806640625, -43.138671875, -41.800537109375, -40.46240234375, -39.124267578125, -37.7861328125, -36.447998046875, -35.10986328125, -33.771728515625, -32.43359375, -31.095458984375, -29.75732421875, -28.419189453125, -27.0810546875, -25.742919921875, -24.40478515625, -23.066650390625, -21.728515625, -20.390380859375, -19.05224609375, -17.714111328125, -16.3759765625, -15.037841796875, -13.69970703125, -12.361572265625, -11.0234375, -9.685302734375, -8.34716796875, -7.009033203125, -5.6708984375, -4.332763671875, -2.99462890625, -1.656494140625, -0.318359375, 1.019775390625, 2.35791015625, 3.696044921875, 5.0341796875, 6.372314453125, 7.71044921875, 9.048583984375, 10.38671875, 11.724853515625, 13.06298828125, 14.401123046875, 15.7392578125, 17.077392578125, 18.41552734375, 19.753662109375, 21.091796875, 22.429931640625, 23.76806640625, 25.106201171875, 26.4443359375, 27.782470703125, 29.12060546875, 30.458740234375, 31.796875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 8.0, 15.0, 13.0, 9.0, 27.0, 23.0, 34.0, 63.0, 73.0, 108.0, 127.0, 208.0, 376.0, 830.0, 6729.0, 4122861.0, 60293.0, 1182.0, 455.0, 231.0, 151.0, 109.0, 91.0, 49.0, 48.0, 40.0, 31.0, 20.0, 12.0, 9.0, 14.0, 17.0, 6.0, 4.0, 3.0, 1.0, 3.0, 0.0, 2.0, 3.0], "bins": [-214.125, -208.7265625, -203.328125, -197.9296875, -192.53125, -187.1328125, -181.734375, -176.3359375, -170.9375, -165.5390625, -160.140625, -154.7421875, -149.34375, -143.9453125, -138.546875, -133.1484375, -127.75, -122.3515625, -116.953125, -111.5546875, -106.15625, -100.7578125, -95.359375, -89.9609375, -84.5625, -79.1640625, -73.765625, -68.3671875, -62.96875, -57.5703125, -52.171875, -46.7734375, -41.375, -35.9765625, -30.578125, -25.1796875, -19.78125, -14.3828125, -8.984375, -3.5859375, 1.8125, 7.2109375, 12.609375, 18.0078125, 23.40625, 28.8046875, 34.203125, 39.6015625, 45.0, 50.3984375, 55.796875, 61.1953125, 66.59375, 71.9921875, 77.390625, 82.7890625, 88.1875, 93.5859375, 98.984375, 104.3828125, 109.78125, 115.1796875, 120.578125, 125.9765625, 131.375]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 11.0, 94.0, 368.0, 406.0, 117.0, 14.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-508.1662902832031, -494.4316711425781, -480.6970520019531, -466.96246337890625, -453.22784423828125, -439.49322509765625, -425.75860595703125, -412.02398681640625, -398.28936767578125, -384.55474853515625, -370.82012939453125, -357.08551025390625, -343.3509216308594, -329.6163024902344, -315.8816833496094, -302.1470642089844, -288.4124755859375, -274.6778564453125, -260.9432373046875, -247.20863342285156, -233.47402954101562, -219.73941040039062, -206.00479125976562, -192.27017211914062, -178.5355682373047, -164.8009490966797, -151.06634521484375, -137.33172607421875, -123.59711456298828, -109.86250305175781, -96.12788391113281, -82.39327239990234, -68.65869140625, -54.92407989501953, -41.1894645690918, -27.454849243164062, -13.720237731933594, 0.014373779296875, 13.748992919921875, 27.483604431152344, 41.21821594238281, 54.95282745361328, 68.68743896484375, 82.42205810546875, 96.15666961669922, 109.89128112792969, 123.62590026855469, 137.36050415039062, 151.09512329101562, 164.82974243164062, 178.56434631347656, 192.29896545410156, 206.0335693359375, 219.7681884765625, 233.5028076171875, 247.2374267578125, 260.9720458984375, 274.7066650390625, 288.4412841796875, 302.1759033203125, 315.9104919433594, 329.6451110839844, 343.3797302246094, 357.1143493652344, 370.84893798828125]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 1.0, 6.0, 4.0, 6.0, 6.0, 5.0, 11.0, 10.0, 14.0, 17.0, 14.0, 30.0, 30.0, 31.0, 23.0, 25.0, 30.0, 29.0, 27.0, 36.0, 31.0, 38.0, 40.0, 42.0, 41.0, 46.0, 38.0, 46.0, 42.0, 28.0, 42.0, 28.0, 18.0, 34.0, 19.0, 26.0, 17.0, 14.0, 11.0, 13.0, 4.0, 10.0, 5.0, 11.0, 1.0, 6.0, 5.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-83.8360595703125, -80.85216522216797, -77.86827087402344, -74.8843765258789, -71.90048217773438, -68.91658782958984, -65.93269348144531, -62.94879913330078, -59.96490478515625, -56.98101043701172, -53.99711608886719, -51.013221740722656, -48.029327392578125, -45.045433044433594, -42.06153869628906, -39.07764434814453, -36.09375, -33.10985565185547, -30.125961303710938, -27.142066955566406, -24.158172607421875, -21.174278259277344, -18.190383911132812, -15.206489562988281, -12.22259521484375, -9.238700866699219, -6.2548065185546875, -3.2709121704101562, -0.287017822265625, 2.6968765258789062, 5.6807708740234375, 8.664665222167969, 11.6485595703125, 14.632453918457031, 17.616348266601562, 20.600242614746094, 23.584136962890625, 26.568031311035156, 29.551925659179688, 32.53582000732422, 35.51971435546875, 38.50360870361328, 41.48750305175781, 44.471397399902344, 47.455291748046875, 50.439186096191406, 53.42308044433594, 56.40697479248047, 59.390869140625, 62.37476348876953, 65.35865783691406, 68.3425521850586, 71.32644653320312, 74.31034088134766, 77.29423522949219, 80.27812957763672, 83.26202392578125, 86.24591827392578, 89.22981262207031, 92.21370697021484, 95.19760131835938, 98.1814956665039, 101.16539001464844, 104.14928436279297, 107.1331787109375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 2.0, 6.0, 9.0, 9.0, 5.0, 7.0, 16.0, 13.0, 22.0, 21.0, 21.0, 26.0, 23.0, 24.0, 25.0, 40.0, 31.0, 39.0, 37.0, 40.0, 41.0, 41.0, 41.0, 42.0, 54.0, 39.0, 36.0, 37.0, 25.0, 28.0, 28.0, 30.0, 21.0, 19.0, 16.0, 14.0, 15.0, 10.0, 12.0, 8.0, 3.0, 7.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.78125, -13.3477783203125, -12.914306640625, -12.4808349609375, -12.04736328125, -11.6138916015625, -11.180419921875, -10.7469482421875, -10.3134765625, -9.8800048828125, -9.446533203125, -9.0130615234375, -8.57958984375, -8.1461181640625, -7.712646484375, -7.2791748046875, -6.845703125, -6.4122314453125, -5.978759765625, -5.5452880859375, -5.11181640625, -4.6783447265625, -4.244873046875, -3.8114013671875, -3.3779296875, -2.9444580078125, -2.510986328125, -2.0775146484375, -1.64404296875, -1.2105712890625, -0.777099609375, -0.3436279296875, 0.08984375, 0.5233154296875, 0.956787109375, 1.3902587890625, 1.82373046875, 2.2572021484375, 2.690673828125, 3.1241455078125, 3.5576171875, 3.9910888671875, 4.424560546875, 4.8580322265625, 5.29150390625, 5.7249755859375, 6.158447265625, 6.5919189453125, 7.025390625, 7.4588623046875, 7.892333984375, 8.3258056640625, 8.75927734375, 9.1927490234375, 9.626220703125, 10.0596923828125, 10.4931640625, 10.9266357421875, 11.360107421875, 11.7935791015625, 12.22705078125, 12.6605224609375, 13.093994140625, 13.5274658203125, 13.9609375]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 5.0, 4.0, 5.0, 10.0, 23.0, 28.0, 34.0, 57.0, 75.0, 110.0, 169.0, 234.0, 322.0, 468.0, 663.0, 907.0, 1364.0, 1858.0, 2783.0, 3887.0, 5664.0, 8256.0, 12199.0, 17799.0, 26380.0, 40281.0, 63885.0, 113339.0, 275949.0, 208064.0, 96182.0, 56329.0, 35943.0, 23781.0, 16072.0, 10874.0, 7550.0, 5238.0, 3498.0, 2506.0, 1732.0, 1194.0, 853.0, 581.0, 420.0, 293.0, 231.0, 154.0, 94.0, 71.0, 54.0, 34.0, 22.0, 15.0, 12.0, 5.0, 6.0, 2.0, 2.0, 1.0, 1.0], "bins": [-2.8359375, -2.7469482421875, -2.657958984375, -2.5689697265625, -2.47998046875, -2.3909912109375, -2.302001953125, -2.2130126953125, -2.1240234375, -2.0350341796875, -1.946044921875, -1.8570556640625, -1.76806640625, -1.6790771484375, -1.590087890625, -1.5010986328125, -1.412109375, -1.3231201171875, -1.234130859375, -1.1451416015625, -1.05615234375, -0.9671630859375, -0.878173828125, -0.7891845703125, -0.7001953125, -0.6112060546875, -0.522216796875, -0.4332275390625, -0.34423828125, -0.2552490234375, -0.166259765625, -0.0772705078125, 0.01171875, 0.1007080078125, 0.189697265625, 0.2786865234375, 0.36767578125, 0.4566650390625, 0.545654296875, 0.6346435546875, 0.7236328125, 0.8126220703125, 0.901611328125, 0.9906005859375, 1.07958984375, 1.1685791015625, 1.257568359375, 1.3465576171875, 1.435546875, 1.5245361328125, 1.613525390625, 1.7025146484375, 1.79150390625, 1.8804931640625, 1.969482421875, 2.0584716796875, 2.1474609375, 2.2364501953125, 2.325439453125, 2.4144287109375, 2.50341796875, 2.5924072265625, 2.681396484375, 2.7703857421875, 2.859375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 5.0, 7.0, 9.0, 8.0, 10.0, 15.0, 19.0, 17.0, 26.0, 34.0, 25.0, 26.0, 35.0, 31.0, 34.0, 48.0, 35.0, 43.0, 39.0, 1070.0, 35.0, 45.0, 49.0, 32.0, 40.0, 34.0, 25.0, 32.0, 31.0, 29.0, 26.0, 18.0, 12.0, 16.0, 7.0, 15.0, 11.0, 8.0, 4.0, 6.0, 6.0, 5.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-9.7578125, -9.4759521484375, -9.194091796875, -8.9122314453125, -8.63037109375, -8.3485107421875, -8.066650390625, -7.7847900390625, -7.5029296875, -7.2210693359375, -6.939208984375, -6.6573486328125, -6.37548828125, -6.0936279296875, -5.811767578125, -5.5299072265625, -5.248046875, -4.9661865234375, -4.684326171875, -4.4024658203125, -4.12060546875, -3.8387451171875, -3.556884765625, -3.2750244140625, -2.9931640625, -2.7113037109375, -2.429443359375, -2.1475830078125, -1.86572265625, -1.5838623046875, -1.302001953125, -1.0201416015625, -0.73828125, -0.4564208984375, -0.174560546875, 0.1072998046875, 0.38916015625, 0.6710205078125, 0.952880859375, 1.2347412109375, 1.5166015625, 1.7984619140625, 2.080322265625, 2.3621826171875, 2.64404296875, 2.9259033203125, 3.207763671875, 3.4896240234375, 3.771484375, 4.0533447265625, 4.335205078125, 4.6170654296875, 4.89892578125, 5.1807861328125, 5.462646484375, 5.7445068359375, 6.0263671875, 6.3082275390625, 6.590087890625, 6.8719482421875, 7.15380859375, 7.4356689453125, 7.717529296875, 7.9993896484375, 8.28125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 7.0, 10.0, 7.0, 16.0, 25.0, 37.0, 50.0, 68.0, 129.0, 161.0, 248.0, 344.0, 584.0, 799.0, 1099.0, 1779.0, 2482.0, 3744.0, 5671.0, 8246.0, 12627.0, 19178.0, 29410.0, 46786.0, 77494.0, 141994.0, 1352307.0, 161935.0, 85554.0, 50733.0, 31804.0, 20813.0, 13507.0, 9050.0, 5958.0, 4048.0, 2717.0, 1782.0, 1341.0, 820.0, 573.0, 399.0, 283.0, 157.0, 130.0, 84.0, 49.0, 36.0, 24.0, 13.0, 11.0, 9.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-2.552734375, -2.466461181640625, -2.38018798828125, -2.293914794921875, -2.2076416015625, -2.121368408203125, -2.03509521484375, -1.948822021484375, -1.862548828125, -1.776275634765625, -1.69000244140625, -1.603729248046875, -1.5174560546875, -1.431182861328125, -1.34490966796875, -1.258636474609375, -1.17236328125, -1.086090087890625, -0.99981689453125, -0.913543701171875, -0.8272705078125, -0.740997314453125, -0.65472412109375, -0.568450927734375, -0.482177734375, -0.395904541015625, -0.30963134765625, -0.223358154296875, -0.1370849609375, -0.050811767578125, 0.03546142578125, 0.121734619140625, 0.2080078125, 0.294281005859375, 0.38055419921875, 0.466827392578125, 0.5531005859375, 0.639373779296875, 0.72564697265625, 0.811920166015625, 0.898193359375, 0.984466552734375, 1.07073974609375, 1.157012939453125, 1.2432861328125, 1.329559326171875, 1.41583251953125, 1.502105712890625, 1.58837890625, 1.674652099609375, 1.76092529296875, 1.847198486328125, 1.9334716796875, 2.019744873046875, 2.10601806640625, 2.192291259765625, 2.278564453125, 2.364837646484375, 2.45111083984375, 2.537384033203125, 2.6236572265625, 2.709930419921875, 2.79620361328125, 2.882476806640625, 2.96875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 0.0, 6.0, 4.0, 8.0, 3.0, 12.0, 7.0, 7.0, 8.0, 10.0, 20.0, 22.0, 24.0, 29.0, 37.0, 55.0, 59.0, 74.0, 68.0, 78.0, 79.0, 76.0, 52.0, 57.0, 32.0, 32.0, 25.0, 27.0, 20.0, 17.0, 14.0, 10.0, 4.0, 7.0, 8.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.00183868408203125, -0.0017825216054916382, -0.0017263591289520264, -0.0016701966524124146, -0.0016140341758728027, -0.001557871699333191, -0.001501709222793579, -0.0014455467462539673, -0.0013893842697143555, -0.0013332217931747437, -0.0012770593166351318, -0.00122089684009552, -0.0011647343635559082, -0.0011085718870162964, -0.0010524094104766846, -0.0009962469339370728, -0.0009400844573974609, -0.0008839219808578491, -0.0008277595043182373, -0.0007715970277786255, -0.0007154345512390137, -0.0006592720746994019, -0.00060310959815979, -0.0005469471216201782, -0.0004907846450805664, -0.0004346221685409546, -0.0003784596920013428, -0.00032229721546173096, -0.00026613473892211914, -0.00020997226238250732, -0.0001538097858428955, -9.764730930328369e-05, -4.1484832763671875e-05, 1.4677643775939941e-05, 7.084012031555176e-05, 0.00012700259685516357, 0.0001831650733947754, 0.0002393275499343872, 0.000295490026473999, 0.00035165250301361084, 0.00040781497955322266, 0.00046397745609283447, 0.0005201399326324463, 0.0005763024091720581, 0.0006324648857116699, 0.0006886273622512817, 0.0007447898387908936, 0.0008009523153305054, 0.0008571147918701172, 0.000913277268409729, 0.0009694397449493408, 0.0010256022214889526, 0.0010817646980285645, 0.0011379271745681763, 0.001194089651107788, 0.0012502521276474, 0.0013064146041870117, 0.0013625770807266235, 0.0014187395572662354, 0.0014749020338058472, 0.001531064510345459, 0.0015872269868850708, 0.0016433894634246826, 0.0016995519399642944, 0.0017557144165039062]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 4.0, 6.0, 14.0, 14.0, 14.0, 12.0, 18.0, 38.0, 36.0, 56.0, 70.0, 157.0, 390.0, 1332.0, 981770.0, 63058.0, 866.0, 274.0, 132.0, 77.0, 38.0, 31.0, 24.0, 19.0, 23.0, 12.0, 10.0, 7.0, 13.0, 4.0, 6.0, 8.0, 2.0, 2.0, 4.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.046783447265625, -0.04531383514404297, -0.04384422302246094, -0.042374610900878906, -0.040904998779296875, -0.039435386657714844, -0.03796577453613281, -0.03649616241455078, -0.03502655029296875, -0.03355693817138672, -0.03208732604980469, -0.030617713928222656, -0.029148101806640625, -0.027678489685058594, -0.026208877563476562, -0.02473926544189453, -0.0232696533203125, -0.02180004119873047, -0.020330429077148438, -0.018860816955566406, -0.017391204833984375, -0.015921592712402344, -0.014451980590820312, -0.012982368469238281, -0.01151275634765625, -0.010043144226074219, -0.008573532104492188, -0.007103919982910156, -0.005634307861328125, -0.004164695739746094, -0.0026950836181640625, -0.0012254714965820312, 0.000244140625, 0.0017137527465820312, 0.0031833648681640625, 0.004652976989746094, 0.006122589111328125, 0.007592201232910156, 0.009061813354492188, 0.010531425476074219, 0.01200103759765625, 0.013470649719238281, 0.014940261840820312, 0.016409873962402344, 0.017879486083984375, 0.019349098205566406, 0.020818710327148438, 0.02228832244873047, 0.0237579345703125, 0.02522754669189453, 0.026697158813476562, 0.028166770935058594, 0.029636383056640625, 0.031105995178222656, 0.03257560729980469, 0.03404521942138672, 0.03551483154296875, 0.03698444366455078, 0.03845405578613281, 0.039923667907714844, 0.041393280029296875, 0.042862892150878906, 0.04433250427246094, 0.04580211639404297, 0.047271728515625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 8.0, 80.0, 476.0, 389.0, 57.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007887964136898518, -0.0077416361309587955, -0.007595308590680361, -0.007448980584740639, -0.007302653044462204, -0.007156325038522482, -0.007009997498244047, -0.006863669492304325, -0.00671734195202589, -0.006571013946086168, -0.0064246864058077335, -0.0062783583998680115, -0.006132030859589577, -0.005985702853649855, -0.00583937531337142, -0.005693047307431698, -0.005546719301491976, -0.005400391295552254, -0.005254063755273819, -0.005107735749334097, -0.004961408209055662, -0.00481508020311594, -0.004668752662837505, -0.004522424656897783, -0.004376096650958061, -0.004229768645018339, -0.004083441104739904, -0.003937113098800182, -0.0037907855585217476, -0.0036444575525820255, -0.003498129779472947, -0.0033518020063638687, -0.003205474466085434, -0.0030591466929763556, -0.002912818919867277, -0.0027664911467581987, -0.0026201633736491203, -0.0024738353677093983, -0.00232750759460032, -0.0021811798214912415, -0.0020348518155515194, -0.001888524042442441, -0.0017421962693333626, -0.0015958683798089623, -0.001449540606699884, -0.0013032128335908055, -0.0011568849440664053, -0.0010105571709573269, -0.0008642295142635703, -0.0007179017411544919, -0.0005715739098377526, -0.0004252461076248437, -0.00027891830541193485, -0.00013259053230285645, 1.3737299013882875e-05, 0.0001600651303306222, 0.0003063929034397006, 0.00045272070565260947, 0.0005990485078655183, 0.0007453763391822577, 0.0008917041122913361, 0.0010380318854004145, 0.0011843596585094929, 0.001330687548033893, 0.0014770153211429715]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 6.0, 7.0, 7.0, 9.0, 6.0, 17.0, 13.0, 10.0, 15.0, 25.0, 24.0, 20.0, 24.0, 23.0, 23.0, 42.0, 34.0, 34.0, 36.0, 30.0, 34.0, 34.0, 45.0, 29.0, 33.0, 45.0, 28.0, 33.0, 37.0, 31.0, 23.0, 34.0, 35.0, 20.0, 20.0, 20.0, 14.0, 16.0, 12.0, 9.0, 10.0, 16.0, 5.0, 3.0, 6.0, 2.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.000870048999786377, -0.0008451696485280991, -0.0008202902972698212, -0.0007954109460115433, -0.0007705315947532654, -0.0007456522434949875, -0.0007207728922367096, -0.0006958935409784317, -0.0006710141897201538, -0.0006461348384618759, -0.000621255487203598, -0.0005963761359453201, -0.0005714967846870422, -0.0005466174334287643, -0.0005217380821704865, -0.0004968587309122086, -0.00047197937965393066, -0.00044710002839565277, -0.0004222206771373749, -0.000397341325879097, -0.0003724619746208191, -0.0003475826233625412, -0.0003227032721042633, -0.0002978239208459854, -0.0002729445695877075, -0.0002480652183294296, -0.00022318586707115173, -0.00019830651581287384, -0.00017342716455459595, -0.00014854781329631805, -0.00012366846203804016, -9.878911077976227e-05, -7.390975952148438e-05, -4.903040826320648e-05, -2.415105700492859e-05, 7.282942533493042e-07, 2.5607645511627197e-05, 5.048699676990509e-05, 7.536634802818298e-05, 0.00010024569928646088, 0.00012512505054473877, 0.00015000440180301666, 0.00017488375306129456, 0.00019976310431957245, 0.00022464245557785034, 0.00024952180683612823, 0.00027440115809440613, 0.000299280509352684, 0.0003241598606109619, 0.0003490392118692398, 0.0003739185631275177, 0.0003987979143857956, 0.0004236772656440735, 0.0004485566169023514, 0.00047343596816062927, 0.0004983153194189072, 0.0005231946706771851, 0.000548074021935463, 0.0005729533731937408, 0.0005978327244520187, 0.0006227120757102966, 0.0006475914269685745, 0.0006724707782268524, 0.0006973501294851303, 0.0007222294807434082]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 2.0, 6.0, 9.0, 9.0, 5.0, 7.0, 16.0, 13.0, 22.0, 21.0, 21.0, 26.0, 23.0, 24.0, 25.0, 40.0, 31.0, 39.0, 37.0, 40.0, 41.0, 41.0, 41.0, 42.0, 54.0, 39.0, 36.0, 37.0, 25.0, 28.0, 28.0, 30.0, 21.0, 19.0, 16.0, 14.0, 15.0, 10.0, 12.0, 8.0, 3.0, 7.0, 6.0, 4.0, 3.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-13.78125, -13.3477783203125, -12.914306640625, -12.4808349609375, -12.04736328125, -11.6138916015625, -11.180419921875, -10.7469482421875, -10.3134765625, -9.8800048828125, -9.446533203125, -9.0130615234375, -8.57958984375, -8.1461181640625, -7.712646484375, -7.2791748046875, -6.845703125, -6.4122314453125, -5.978759765625, -5.5452880859375, -5.11181640625, -4.6783447265625, -4.244873046875, -3.8114013671875, -3.3779296875, -2.9444580078125, -2.510986328125, -2.0775146484375, -1.64404296875, -1.2105712890625, -0.777099609375, -0.3436279296875, 0.08984375, 0.5233154296875, 0.956787109375, 1.3902587890625, 1.82373046875, 2.2572021484375, 2.690673828125, 3.1241455078125, 3.5576171875, 3.9910888671875, 4.424560546875, 4.8580322265625, 5.29150390625, 5.7249755859375, 6.158447265625, 6.5919189453125, 7.025390625, 7.4588623046875, 7.892333984375, 8.3258056640625, 8.75927734375, 9.1927490234375, 9.626220703125, 10.0596923828125, 10.4931640625, 10.9266357421875, 11.360107421875, 11.7935791015625, 12.22705078125, 12.6605224609375, 13.093994140625, 13.5274658203125, 13.9609375]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 13.0, 6.0, 12.0, 18.0, 14.0, 19.0, 33.0, 42.0, 47.0, 78.0, 106.0, 102.0, 162.0, 225.0, 246.0, 430.0, 617.0, 954.0, 1534.0, 2861.0, 6809.0, 19314.0, 66878.0, 262002.0, 515450.0, 117887.0, 32628.0, 10359.0, 4062.0, 1965.0, 1176.0, 689.0, 475.0, 329.0, 232.0, 216.0, 117.0, 102.0, 85.0, 63.0, 52.0, 35.0, 36.0, 23.0, 19.0, 4.0, 15.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 3.0], "bins": [-15.6796875, -15.2076416015625, -14.735595703125, -14.2635498046875, -13.79150390625, -13.3194580078125, -12.847412109375, -12.3753662109375, -11.9033203125, -11.4312744140625, -10.959228515625, -10.4871826171875, -10.01513671875, -9.5430908203125, -9.071044921875, -8.5989990234375, -8.126953125, -7.6549072265625, -7.182861328125, -6.7108154296875, -6.23876953125, -5.7667236328125, -5.294677734375, -4.8226318359375, -4.3505859375, -3.8785400390625, -3.406494140625, -2.9344482421875, -2.46240234375, -1.9903564453125, -1.518310546875, -1.0462646484375, -0.57421875, -0.1021728515625, 0.369873046875, 0.8419189453125, 1.31396484375, 1.7860107421875, 2.258056640625, 2.7301025390625, 3.2021484375, 3.6741943359375, 4.146240234375, 4.6182861328125, 5.09033203125, 5.5623779296875, 6.034423828125, 6.5064697265625, 6.978515625, 7.4505615234375, 7.922607421875, 8.3946533203125, 8.86669921875, 9.3387451171875, 9.810791015625, 10.2828369140625, 10.7548828125, 11.2269287109375, 11.698974609375, 12.1710205078125, 12.64306640625, 13.1151123046875, 13.587158203125, 14.0592041015625, 14.53125]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 5.0, 4.0, 6.0, 4.0, 12.0, 11.0, 14.0, 14.0, 9.0, 15.0, 18.0, 23.0, 43.0, 30.0, 35.0, 46.0, 42.0, 51.0, 61.0, 98.0, 407.0, 1548.0, 86.0, 80.0, 48.0, 54.0, 42.0, 39.0, 38.0, 31.0, 30.0, 17.0, 16.0, 11.0, 10.0, 11.0, 11.0, 9.0, 6.0, 4.0, 4.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-50.75, -49.16650390625, -47.5830078125, -45.99951171875, -44.416015625, -42.83251953125, -41.2490234375, -39.66552734375, -38.08203125, -36.49853515625, -34.9150390625, -33.33154296875, -31.748046875, -30.16455078125, -28.5810546875, -26.99755859375, -25.4140625, -23.83056640625, -22.2470703125, -20.66357421875, -19.080078125, -17.49658203125, -15.9130859375, -14.32958984375, -12.74609375, -11.16259765625, -9.5791015625, -7.99560546875, -6.412109375, -4.82861328125, -3.2451171875, -1.66162109375, -0.078125, 1.50537109375, 3.0888671875, 4.67236328125, 6.255859375, 7.83935546875, 9.4228515625, 11.00634765625, 12.58984375, 14.17333984375, 15.7568359375, 17.34033203125, 18.923828125, 20.50732421875, 22.0908203125, 23.67431640625, 25.2578125, 26.84130859375, 28.4248046875, 30.00830078125, 31.591796875, 33.17529296875, 34.7587890625, 36.34228515625, 37.92578125, 39.50927734375, 41.0927734375, 42.67626953125, 44.259765625, 45.84326171875, 47.4267578125, 49.01025390625, 50.59375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 3.0, 11.0, 9.0, 19.0, 26.0, 25.0, 46.0, 49.0, 101.0, 159.0, 238.0, 382.0, 1028.0, 98014.0, 3042304.0, 2000.0, 519.0, 242.0, 171.0, 125.0, 74.0, 38.0, 43.0, 33.0, 16.0, 16.0, 4.0, 6.0, 3.0, 2.0, 4.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-152.625, -147.005859375, -141.38671875, -135.767578125, -130.1484375, -124.529296875, -118.91015625, -113.291015625, -107.671875, -102.052734375, -96.43359375, -90.814453125, -85.1953125, -79.576171875, -73.95703125, -68.337890625, -62.71875, -57.099609375, -51.48046875, -45.861328125, -40.2421875, -34.623046875, -29.00390625, -23.384765625, -17.765625, -12.146484375, -6.52734375, -0.908203125, 4.7109375, 10.330078125, 15.94921875, 21.568359375, 27.1875, 32.806640625, 38.42578125, 44.044921875, 49.6640625, 55.283203125, 60.90234375, 66.521484375, 72.140625, 77.759765625, 83.37890625, 88.998046875, 94.6171875, 100.236328125, 105.85546875, 111.474609375, 117.09375, 122.712890625, 128.33203125, 133.951171875, 139.5703125, 145.189453125, 150.80859375, 156.427734375, 162.046875, 167.666015625, 173.28515625, 178.904296875, 184.5234375, 190.142578125, 195.76171875, 201.380859375, 207.0]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 8.0, 965.0, 43.0, 2.0, 1.0], "bins": [-1474.2449951171875, -1449.8985595703125, -1425.552001953125, -1401.20556640625, -1376.859130859375, -1352.5125732421875, -1328.1661376953125, -1303.819580078125, -1279.47314453125, -1255.126708984375, -1230.7801513671875, -1206.4337158203125, -1182.0872802734375, -1157.74072265625, -1133.394287109375, -1109.0478515625, -1084.7012939453125, -1060.3548583984375, -1036.00830078125, -1011.661865234375, -987.3153686523438, -962.9688720703125, -938.6224365234375, -914.2759399414062, -889.9295043945312, -865.5830078125, -841.236572265625, -816.8900756835938, -792.5435791015625, -768.1970825195312, -743.8506469726562, -719.504150390625, -695.15771484375, -670.8112182617188, -646.4647827148438, -622.1182861328125, -597.7717895507812, -573.42529296875, -549.078857421875, -524.7323608398438, -500.3858642578125, -476.0393981933594, -451.6929016113281, -427.346435546875, -402.99993896484375, -378.6534729003906, -354.3070068359375, -329.96051025390625, -305.614013671875, -281.2675476074219, -256.9210510253906, -232.5745849609375, -208.22808837890625, -183.88162231445312, -159.53514099121094, -135.18865966796875, -110.84219360351562, -86.49571228027344, -62.149234771728516, -37.802757263183594, -13.456275939941406, 10.890205383300781, 35.23667907714844, 59.583160400390625, 83.92964172363281]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 4.0, 3.0, 3.0, 6.0, 6.0, 4.0, 6.0, 8.0, 10.0, 18.0, 13.0, 10.0, 17.0, 17.0, 21.0, 16.0, 25.0, 31.0, 34.0, 30.0, 26.0, 36.0, 46.0, 31.0, 35.0, 41.0, 41.0, 43.0, 42.0, 42.0, 36.0, 40.0, 34.0, 33.0, 31.0, 26.0, 26.0, 13.0, 14.0, 13.0, 17.0, 17.0, 8.0, 8.0, 7.0, 5.0, 4.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.93619537353516, -113.8165283203125, -109.69686126708984, -105.57719421386719, -101.45752716064453, -97.33786010742188, -93.21820068359375, -89.09852600097656, -84.97886657714844, -80.85919952392578, -76.73953247070312, -72.61986541748047, -68.50019836425781, -64.38053131103516, -60.260868072509766, -56.14120101928711, -52.02153015136719, -47.90186309814453, -43.782196044921875, -39.66252899169922, -35.54286193847656, -31.42319679260254, -27.303531646728516, -23.18386459350586, -19.064197540283203, -14.944530487060547, -10.824864387512207, -6.705198287963867, -2.585531234741211, 1.5341358184814453, 5.653800964355469, 9.773468017578125, 13.893142700195312, 18.01280975341797, 22.132476806640625, 26.25214195251465, 30.371809005737305, 34.491477966308594, 38.611141204833984, 42.73080825805664, 46.8504753112793, 50.97014236450195, 55.08980941772461, 59.20947265625, 63.329139709472656, 67.44880676269531, 71.56847381591797, 75.68814086914062, 79.80780792236328, 83.92747497558594, 88.0471420288086, 92.16680908203125, 96.2864761352539, 100.40614318847656, 104.52580261230469, 108.64547729492188, 112.76513671875, 116.88480377197266, 121.00447082519531, 125.12413787841797, 129.24380493164062, 133.36346435546875, 137.48313903808594, 141.60279846191406, 145.72247314453125]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 2.0, 2.0, 10.0, 6.0, 5.0, 10.0, 9.0, 11.0, 10.0, 20.0, 25.0, 23.0, 23.0, 22.0, 25.0, 26.0, 35.0, 38.0, 38.0, 31.0, 51.0, 47.0, 41.0, 40.0, 49.0, 44.0, 40.0, 38.0, 31.0, 32.0, 28.0, 25.0, 21.0, 27.0, 15.0, 15.0, 21.0, 14.0, 6.0, 10.0, 10.0, 2.0, 10.0, 4.0, 5.0, 1.0, 7.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.40625, -14.9346923828125, -14.463134765625, -13.9915771484375, -13.52001953125, -13.0484619140625, -12.576904296875, -12.1053466796875, -11.6337890625, -11.1622314453125, -10.690673828125, -10.2191162109375, -9.74755859375, -9.2760009765625, -8.804443359375, -8.3328857421875, -7.861328125, -7.3897705078125, -6.918212890625, -6.4466552734375, -5.97509765625, -5.5035400390625, -5.031982421875, -4.5604248046875, -4.0888671875, -3.6173095703125, -3.145751953125, -2.6741943359375, -2.20263671875, -1.7310791015625, -1.259521484375, -0.7879638671875, -0.31640625, 0.1551513671875, 0.626708984375, 1.0982666015625, 1.56982421875, 2.0413818359375, 2.512939453125, 2.9844970703125, 3.4560546875, 3.9276123046875, 4.399169921875, 4.8707275390625, 5.34228515625, 5.8138427734375, 6.285400390625, 6.7569580078125, 7.228515625, 7.7000732421875, 8.171630859375, 8.6431884765625, 9.11474609375, 9.5863037109375, 10.057861328125, 10.5294189453125, 11.0009765625, 11.4725341796875, 11.944091796875, 12.4156494140625, 12.88720703125, 13.3587646484375, 13.830322265625, 14.3018798828125, 14.7734375]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 5.0, 5.0, 4.0, 6.0, 5.0, 8.0, 7.0, 8.0, 16.0, 14.0, 20.0, 23.0, 20.0, 18.0, 20.0, 23.0, 29.0, 39.0, 92.0, 156.0, 408.0, 1394.0, 12810.0, 1013965.0, 3090242.0, 70876.0, 2828.0, 607.0, 226.0, 98.0, 51.0, 33.0, 34.0, 27.0, 20.0, 26.0, 18.0, 17.0, 19.0, 11.0, 11.0, 9.0, 6.0, 7.0, 12.0, 7.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-56.09375, -54.3525390625, -52.611328125, -50.8701171875, -49.12890625, -47.3876953125, -45.646484375, -43.9052734375, -42.1640625, -40.4228515625, -38.681640625, -36.9404296875, -35.19921875, -33.4580078125, -31.716796875, -29.9755859375, -28.234375, -26.4931640625, -24.751953125, -23.0107421875, -21.26953125, -19.5283203125, -17.787109375, -16.0458984375, -14.3046875, -12.5634765625, -10.822265625, -9.0810546875, -7.33984375, -5.5986328125, -3.857421875, -2.1162109375, -0.375, 1.3662109375, 3.107421875, 4.8486328125, 6.58984375, 8.3310546875, 10.072265625, 11.8134765625, 13.5546875, 15.2958984375, 17.037109375, 18.7783203125, 20.51953125, 22.2607421875, 24.001953125, 25.7431640625, 27.484375, 29.2255859375, 30.966796875, 32.7080078125, 34.44921875, 36.1904296875, 37.931640625, 39.6728515625, 41.4140625, 43.1552734375, 44.896484375, 46.6376953125, 48.37890625, 50.1201171875, 51.861328125, 53.6025390625, 55.34375]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 2.0, 12.0, 15.0, 17.0, 26.0, 25.0, 40.0, 57.0, 91.0, 112.0, 135.0, 186.0, 264.0, 361.0, 513.0, 484.0, 483.0, 354.0, 259.0, 170.0, 133.0, 98.0, 63.0, 45.0, 35.0, 31.0, 7.0, 14.0, 8.0, 5.0, 8.0, 5.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.125, -38.10693359375, -37.0888671875, -36.07080078125, -35.052734375, -34.03466796875, -33.0166015625, -31.99853515625, -30.98046875, -29.96240234375, -28.9443359375, -27.92626953125, -26.908203125, -25.89013671875, -24.8720703125, -23.85400390625, -22.8359375, -21.81787109375, -20.7998046875, -19.78173828125, -18.763671875, -17.74560546875, -16.7275390625, -15.70947265625, -14.69140625, -13.67333984375, -12.6552734375, -11.63720703125, -10.619140625, -9.60107421875, -8.5830078125, -7.56494140625, -6.546875, -5.52880859375, -4.5107421875, -3.49267578125, -2.474609375, -1.45654296875, -0.4384765625, 0.57958984375, 1.59765625, 2.61572265625, 3.6337890625, 4.65185546875, 5.669921875, 6.68798828125, 7.7060546875, 8.72412109375, 9.7421875, 10.76025390625, 11.7783203125, 12.79638671875, 13.814453125, 14.83251953125, 15.8505859375, 16.86865234375, 17.88671875, 18.90478515625, 19.9228515625, 20.94091796875, 21.958984375, 22.97705078125, 23.9951171875, 25.01318359375, 26.03125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 3.0, 6.0, 8.0, 8.0, 6.0, 10.0, 20.0, 20.0, 22.0, 33.0, 40.0, 62.0, 70.0, 94.0, 104.0, 157.0, 237.0, 341.0, 556.0, 2258.0, 686687.0, 3497439.0, 3893.0, 708.0, 414.0, 225.0, 188.0, 147.0, 119.0, 77.0, 67.0, 55.0, 59.0, 27.0, 34.0, 18.0, 17.0, 15.0, 9.0, 10.0, 7.0, 7.0, 4.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-135.75, -131.0859375, -126.421875, -121.7578125, -117.09375, -112.4296875, -107.765625, -103.1015625, -98.4375, -93.7734375, -89.109375, -84.4453125, -79.78125, -75.1171875, -70.453125, -65.7890625, -61.125, -56.4609375, -51.796875, -47.1328125, -42.46875, -37.8046875, -33.140625, -28.4765625, -23.8125, -19.1484375, -14.484375, -9.8203125, -5.15625, -0.4921875, 4.171875, 8.8359375, 13.5, 18.1640625, 22.828125, 27.4921875, 32.15625, 36.8203125, 41.484375, 46.1484375, 50.8125, 55.4765625, 60.140625, 64.8046875, 69.46875, 74.1328125, 78.796875, 83.4609375, 88.125, 92.7890625, 97.453125, 102.1171875, 106.78125, 111.4453125, 116.109375, 120.7734375, 125.4375, 130.1015625, 134.765625, 139.4296875, 144.09375, 148.7578125, 153.421875, 158.0859375, 162.75]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 14.0, 152.0, 487.0, 316.0, 38.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-681.22265625, -665.6494750976562, -650.0762939453125, -634.5031127929688, -618.929931640625, -603.3567504882812, -587.7835693359375, -572.2103271484375, -556.63720703125, -541.0640258789062, -525.4908447265625, -509.91766357421875, -494.344482421875, -478.77130126953125, -463.1980895996094, -447.6249084472656, -432.05169677734375, -416.478515625, -400.90533447265625, -385.3321533203125, -369.75897216796875, -354.185791015625, -338.6125793457031, -323.0393981933594, -307.4662170410156, -291.8930358886719, -276.3198547363281, -260.7466735839844, -245.17347717285156, -229.6002960205078, -214.027099609375, -198.45391845703125, -182.88076782226562, -167.30758666992188, -151.73440551757812, -136.1612091064453, -120.58802795410156, -105.01484680175781, -89.44165802001953, -73.86846923828125, -58.2952880859375, -42.722103118896484, -27.14891815185547, -11.575733184814453, 3.9974517822265625, 19.570632934570312, 35.143821716308594, 50.717010498046875, 66.29019165039062, 81.86337280273438, 97.43656158447266, 113.00975036621094, 128.5829315185547, 144.15611267089844, 159.72930908203125, 175.302490234375, 190.87567138671875, 206.4488525390625, 222.02203369140625, 237.59523010253906, 253.1684112548828, 268.7415771484375, 284.3147888183594, 299.8879699707031, 315.4611511230469]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [3.0, 3.0, 3.0, 1.0, 3.0, 5.0, 4.0, 6.0, 8.0, 5.0, 7.0, 10.0, 10.0, 15.0, 10.0, 25.0, 26.0, 24.0, 18.0, 25.0, 21.0, 29.0, 29.0, 35.0, 39.0, 43.0, 35.0, 31.0, 41.0, 45.0, 42.0, 30.0, 53.0, 41.0, 26.0, 25.0, 23.0, 28.0, 26.0, 12.0, 27.0, 17.0, 19.0, 18.0, 10.0, 15.0, 10.0, 9.0, 4.0, 7.0, 11.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-89.46188354492188, -86.41546630859375, -83.36904907226562, -80.3226318359375, -77.2762222290039, -74.22980499267578, -71.18338775634766, -68.13697052001953, -65.09056091308594, -62.04414367675781, -58.99773025512695, -55.95131301879883, -52.90489959716797, -49.858482360839844, -46.81206512451172, -43.765647888183594, -40.71923065185547, -37.672813415527344, -34.626399993896484, -31.57998275756836, -28.533567428588867, -25.487152099609375, -22.44073486328125, -19.394319534301758, -16.347904205322266, -13.301488876342773, -10.255072593688965, -7.208656311035156, -4.162240982055664, -1.1158256530761719, 1.9305915832519531, 4.977006912231445, 8.023422241210938, 11.06983757019043, 14.116253852844238, 17.162670135498047, 20.20908546447754, 23.25550079345703, 26.301918029785156, 29.34833335876465, 32.39474868774414, 35.441165924072266, 38.487579345703125, 41.53399658203125, 44.580413818359375, 47.626827239990234, 50.67324447631836, 53.71965789794922, 56.766075134277344, 59.81249237060547, 62.85890579223633, 65.90531921386719, 68.95173645019531, 71.99815368652344, 75.04457092285156, 78.09098815917969, 81.13740539550781, 84.18382263183594, 87.23023986816406, 90.27665710449219, 93.32306671142578, 96.3694839477539, 99.41590118408203, 102.46231842041016, 105.50872802734375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 11.0, 7.0, 8.0, 10.0, 15.0, 19.0, 22.0, 12.0, 33.0, 27.0, 37.0, 27.0, 42.0, 30.0, 35.0, 44.0, 34.0, 52.0, 34.0, 45.0, 49.0, 43.0, 55.0, 32.0, 28.0, 38.0, 30.0, 20.0, 22.0, 19.0, 21.0, 23.0, 14.0, 9.0, 10.0, 8.0, 7.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3359375, -14.8524169921875, -14.368896484375, -13.8853759765625, -13.40185546875, -12.9183349609375, -12.434814453125, -11.9512939453125, -11.4677734375, -10.9842529296875, -10.500732421875, -10.0172119140625, -9.53369140625, -9.0501708984375, -8.566650390625, -8.0831298828125, -7.599609375, -7.1160888671875, -6.632568359375, -6.1490478515625, -5.66552734375, -5.1820068359375, -4.698486328125, -4.2149658203125, -3.7314453125, -3.2479248046875, -2.764404296875, -2.2808837890625, -1.79736328125, -1.3138427734375, -0.830322265625, -0.3468017578125, 0.13671875, 0.6202392578125, 1.103759765625, 1.5872802734375, 2.07080078125, 2.5543212890625, 3.037841796875, 3.5213623046875, 4.0048828125, 4.4884033203125, 4.971923828125, 5.4554443359375, 5.93896484375, 6.4224853515625, 6.906005859375, 7.3895263671875, 7.873046875, 8.3565673828125, 8.840087890625, 9.3236083984375, 9.80712890625, 10.2906494140625, 10.774169921875, 11.2576904296875, 11.7412109375, 12.2247314453125, 12.708251953125, 13.1917724609375, 13.67529296875, 14.1588134765625, 14.642333984375, 15.1258544921875, 15.609375]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 7.0, 6.0, 8.0, 10.0, 16.0, 27.0, 36.0, 53.0, 75.0, 101.0, 151.0, 232.0, 310.0, 427.0, 608.0, 860.0, 1290.0, 1753.0, 2624.0, 3775.0, 5581.0, 8166.0, 12090.0, 18102.0, 27419.0, 42811.0, 70389.0, 129322.0, 282811.0, 189143.0, 93144.0, 54529.0, 34270.0, 22212.0, 14693.0, 9945.0, 6554.0, 4688.0, 3094.0, 2238.0, 1497.0, 1064.0, 716.0, 519.0, 377.0, 238.0, 175.0, 125.0, 91.0, 60.0, 43.0, 29.0, 19.0, 17.0, 10.0, 6.0, 9.0, 2.0, 2.0, 0.0, 2.0], "bins": [-2.962890625, -2.86956787109375, -2.7762451171875, -2.68292236328125, -2.589599609375, -2.49627685546875, -2.4029541015625, -2.30963134765625, -2.21630859375, -2.12298583984375, -2.0296630859375, -1.93634033203125, -1.843017578125, -1.74969482421875, -1.6563720703125, -1.56304931640625, -1.4697265625, -1.37640380859375, -1.2830810546875, -1.18975830078125, -1.096435546875, -1.00311279296875, -0.9097900390625, -0.81646728515625, -0.72314453125, -0.62982177734375, -0.5364990234375, -0.44317626953125, -0.349853515625, -0.25653076171875, -0.1632080078125, -0.06988525390625, 0.0234375, 0.11676025390625, 0.2100830078125, 0.30340576171875, 0.396728515625, 0.49005126953125, 0.5833740234375, 0.67669677734375, 0.77001953125, 0.86334228515625, 0.9566650390625, 1.04998779296875, 1.143310546875, 1.23663330078125, 1.3299560546875, 1.42327880859375, 1.5166015625, 1.60992431640625, 1.7032470703125, 1.79656982421875, 1.889892578125, 1.98321533203125, 2.0765380859375, 2.16986083984375, 2.26318359375, 2.35650634765625, 2.4498291015625, 2.54315185546875, 2.636474609375, 2.72979736328125, 2.8231201171875, 2.91644287109375, 3.009765625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 2.0, 6.0, 5.0, 10.0, 11.0, 10.0, 14.0, 19.0, 24.0, 13.0, 23.0, 16.0, 33.0, 24.0, 32.0, 41.0, 33.0, 44.0, 38.0, 36.0, 1059.0, 42.0, 42.0, 46.0, 50.0, 39.0, 50.0, 43.0, 32.0, 32.0, 31.0, 19.0, 21.0, 21.0, 11.0, 11.0, 8.0, 13.0, 8.0, 10.0, 1.0, 4.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-9.078125, -8.7744140625, -8.470703125, -8.1669921875, -7.86328125, -7.5595703125, -7.255859375, -6.9521484375, -6.6484375, -6.3447265625, -6.041015625, -5.7373046875, -5.43359375, -5.1298828125, -4.826171875, -4.5224609375, -4.21875, -3.9150390625, -3.611328125, -3.3076171875, -3.00390625, -2.7001953125, -2.396484375, -2.0927734375, -1.7890625, -1.4853515625, -1.181640625, -0.8779296875, -0.57421875, -0.2705078125, 0.033203125, 0.3369140625, 0.640625, 0.9443359375, 1.248046875, 1.5517578125, 1.85546875, 2.1591796875, 2.462890625, 2.7666015625, 3.0703125, 3.3740234375, 3.677734375, 3.9814453125, 4.28515625, 4.5888671875, 4.892578125, 5.1962890625, 5.5, 5.8037109375, 6.107421875, 6.4111328125, 6.71484375, 7.0185546875, 7.322265625, 7.6259765625, 7.9296875, 8.2333984375, 8.537109375, 8.8408203125, 9.14453125, 9.4482421875, 9.751953125, 10.0556640625, 10.359375]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 4.0, 8.0, 8.0, 9.0, 16.0, 35.0, 36.0, 48.0, 80.0, 116.0, 174.0, 245.0, 380.0, 556.0, 824.0, 1243.0, 1884.0, 2794.0, 4228.0, 6339.0, 9179.0, 14264.0, 22007.0, 34877.0, 57061.0, 99645.0, 200583.0, 1326272.0, 126606.0, 70398.0, 41673.0, 26101.0, 16574.0, 10903.0, 7304.0, 4851.0, 3181.0, 2206.0, 1430.0, 1018.0, 631.0, 445.0, 302.0, 177.0, 129.0, 82.0, 76.0, 39.0, 33.0, 17.0, 15.0, 18.0, 6.0, 6.0, 3.0, 1.0, 3.0], "bins": [-3.16015625, -3.067718505859375, -2.97528076171875, -2.882843017578125, -2.7904052734375, -2.697967529296875, -2.60552978515625, -2.513092041015625, -2.420654296875, -2.328216552734375, -2.23577880859375, -2.143341064453125, -2.0509033203125, -1.958465576171875, -1.86602783203125, -1.773590087890625, -1.68115234375, -1.588714599609375, -1.49627685546875, -1.403839111328125, -1.3114013671875, -1.218963623046875, -1.12652587890625, -1.034088134765625, -0.941650390625, -0.849212646484375, -0.75677490234375, -0.664337158203125, -0.5718994140625, -0.479461669921875, -0.38702392578125, -0.294586181640625, -0.2021484375, -0.109710693359375, -0.01727294921875, 0.075164794921875, 0.1676025390625, 0.260040283203125, 0.35247802734375, 0.444915771484375, 0.537353515625, 0.629791259765625, 0.72222900390625, 0.814666748046875, 0.9071044921875, 0.999542236328125, 1.09197998046875, 1.184417724609375, 1.27685546875, 1.369293212890625, 1.46173095703125, 1.554168701171875, 1.6466064453125, 1.739044189453125, 1.83148193359375, 1.923919677734375, 2.016357421875, 2.108795166015625, 2.20123291015625, 2.293670654296875, 2.3861083984375, 2.478546142578125, 2.57098388671875, 2.663421630859375, 2.755859375]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 4.0, 0.0, 5.0, 4.0, 4.0, 8.0, 7.0, 10.0, 12.0, 18.0, 22.0, 30.0, 26.0, 31.0, 53.0, 55.0, 81.0, 101.0, 88.0, 82.0, 66.0, 56.0, 47.0, 39.0, 34.0, 32.0, 28.0, 15.0, 13.0, 8.0, 11.0, 2.0, 9.0, 7.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001251220703125, -0.0011951625347137451, -0.0011391043663024902, -0.0010830461978912354, -0.0010269880294799805, -0.0009709298610687256, -0.0009148716926574707, -0.0008588135242462158, -0.0008027553558349609, -0.0007466971874237061, -0.0006906390190124512, -0.0006345808506011963, -0.0005785226821899414, -0.0005224645137786865, -0.00046640634536743164, -0.00041034817695617676, -0.0003542900085449219, -0.000298231840133667, -0.0002421736717224121, -0.00018611550331115723, -0.00013005733489990234, -7.399916648864746e-05, -1.7940998077392578e-05, 3.8117170333862305e-05, 9.417533874511719e-05, 0.00015023350715637207, 0.00020629167556762695, 0.00026234984397888184, 0.0003184080123901367, 0.0003744661808013916, 0.0004305243492126465, 0.00048658251762390137, 0.0005426406860351562, 0.0005986988544464111, 0.000654757022857666, 0.0007108151912689209, 0.0007668733596801758, 0.0008229315280914307, 0.0008789896965026855, 0.0009350478649139404, 0.0009911060333251953, 0.0010471642017364502, 0.001103222370147705, 0.00115928053855896, 0.0012153387069702148, 0.0012713968753814697, 0.0013274550437927246, 0.0013835132122039795, 0.0014395713806152344, 0.0014956295490264893, 0.0015516877174377441, 0.001607745885848999, 0.001663804054260254, 0.0017198622226715088, 0.0017759203910827637, 0.0018319785594940186, 0.0018880367279052734, 0.0019440948963165283, 0.002000153064727783, 0.002056211233139038, 0.002112269401550293, 0.002168327569961548, 0.0022243857383728027, 0.0022804439067840576, 0.0023365020751953125]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 8.0, 4.0, 6.0, 18.0, 16.0, 33.0, 40.0, 51.0, 76.0, 119.0, 229.0, 658.0, 4580.0, 1038400.0, 3162.0, 607.0, 214.0, 110.0, 80.0, 41.0, 26.0, 13.0, 20.0, 10.0, 10.0, 6.0, 3.0, 5.0, 7.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0621337890625, -0.06047534942626953, -0.05881690979003906, -0.057158470153808594, -0.055500030517578125, -0.053841590881347656, -0.05218315124511719, -0.05052471160888672, -0.04886627197265625, -0.04720783233642578, -0.04554939270019531, -0.043890953063964844, -0.042232513427734375, -0.040574073791503906, -0.03891563415527344, -0.03725719451904297, -0.0355987548828125, -0.03394031524658203, -0.03228187561035156, -0.030623435974121094, -0.028964996337890625, -0.027306556701660156, -0.025648117065429688, -0.02398967742919922, -0.02233123779296875, -0.02067279815673828, -0.019014358520507812, -0.017355918884277344, -0.015697479248046875, -0.014039039611816406, -0.012380599975585938, -0.010722160339355469, -0.009063720703125, -0.007405281066894531, -0.0057468414306640625, -0.004088401794433594, -0.002429962158203125, -0.0007715225219726562, 0.0008869171142578125, 0.0025453567504882812, 0.00420379638671875, 0.005862236022949219, 0.0075206756591796875, 0.009179115295410156, 0.010837554931640625, 0.012495994567871094, 0.014154434204101562, 0.01581287384033203, 0.0174713134765625, 0.01912975311279297, 0.020788192749023438, 0.022446632385253906, 0.024105072021484375, 0.025763511657714844, 0.027421951293945312, 0.02908039093017578, 0.03073883056640625, 0.03239727020263672, 0.03405570983886719, 0.035714149475097656, 0.037372589111328125, 0.039031028747558594, 0.04068946838378906, 0.04234790802001953, 0.04400634765625]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 51.0, 363.0, 473.0, 122.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028919833712279797, -0.0027328943833708763, -0.002573805395513773, -0.0024147164076566696, -0.0022556274197995663, -0.002096538431942463, -0.0019374494440853596, -0.0017783604562282562, -0.0016192714683711529, -0.0014601824805140495, -0.0013010934926569462, -0.0011420045047998428, -0.0009829155169427395, -0.0008238265290856361, -0.0006647375412285328, -0.0005056485533714294, -0.0003465595655143261, -0.00018747057765722275, -2.83815898001194e-05, 0.00013070739805698395, 0.0002897963859140873, 0.00044888537377119064, 0.000607974361628294, 0.0007670633494853973, 0.0009261523373425007, 0.001085241325199604, 0.0012443303130567074, 0.0014034193009138107, 0.001562508288770914, 0.0017215972766280174, 0.0018806862644851208, 0.002039775252342224, 0.0021988647058606148, 0.002357953693717718, 0.0025170426815748215, 0.002676131669431925, 0.002835220657289028, 0.0029943096451461315, 0.003153398633003235, 0.003312487620860338, 0.0034715766087174416, 0.003630665596574545, 0.0037897545844316483, 0.003948843572288752, 0.004107932560145855, 0.004267021548002958, 0.004426110535860062, 0.004585199523717165, 0.004744288511574268, 0.004903377499431372, 0.005062466487288475, 0.005221555475145578, 0.005380644463002682, 0.005539733450859785, 0.005698822438716888, 0.005857911426573992, 0.006017000414431095, 0.0061760894022881985, 0.006335178390145302, 0.006494267378002405, 0.0066533563658595085, 0.006812445353716612, 0.006971534341573715, 0.0071306233294308186, 0.007289712317287922]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 4.0, 1.0, 4.0, 3.0, 3.0, 2.0, 4.0, 7.0, 3.0, 13.0, 9.0, 8.0, 21.0, 14.0, 30.0, 21.0, 29.0, 22.0, 24.0, 22.0, 36.0, 39.0, 31.0, 46.0, 36.0, 48.0, 49.0, 39.0, 28.0, 34.0, 42.0, 36.0, 30.0, 33.0, 38.0, 20.0, 22.0, 25.0, 15.0, 21.0, 19.0, 18.0, 13.0, 9.0, 13.0, 10.0, 6.0, 2.0, 4.0, 1.0, 2.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0007154941558837891, -0.0006936388090252876, -0.0006717834621667862, -0.0006499281153082848, -0.0006280727684497833, -0.0006062174215912819, -0.0005843620747327805, -0.000562506727874279, -0.0005406513810157776, -0.0005187960341572762, -0.0004969406872987747, -0.0004750853404402733, -0.00045322999358177185, -0.0004313746467232704, -0.000409519299864769, -0.00038766395300626755, -0.0003658086061477661, -0.0003439532592892647, -0.00032209791243076324, -0.0003002425655722618, -0.0002783872187137604, -0.00025653187185525894, -0.0002346765249967575, -0.00021282117813825607, -0.00019096583127975464, -0.0001691104844212532, -0.00014725513756275177, -0.00012539979070425034, -0.0001035444438457489, -8.168909698724747e-05, -5.983375012874603e-05, -3.79784032702446e-05, -1.6123056411743164e-05, 5.73229044675827e-06, 2.7587637305259705e-05, 4.944298416376114e-05, 7.129833102226257e-05, 9.315367788076401e-05, 0.00011500902473926544, 0.00013686437159776688, 0.0001587197184562683, 0.00018057506531476974, 0.00020243041217327118, 0.0002242857590317726, 0.00024614110589027405, 0.0002679964527487755, 0.0002898517996072769, 0.00031170714646577835, 0.0003335624933242798, 0.0003554178401827812, 0.00037727318704128265, 0.0003991285338997841, 0.0004209838807582855, 0.00044283922761678696, 0.0004646945744752884, 0.0004865499213337898, 0.0005084052681922913, 0.0005302606150507927, 0.0005521159619092941, 0.0005739713087677956, 0.000595826655626297, 0.0006176820024847984, 0.0006395373493432999, 0.0006613926962018013, 0.0006832480430603027]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 2.0, 11.0, 7.0, 8.0, 10.0, 15.0, 19.0, 22.0, 12.0, 33.0, 27.0, 37.0, 27.0, 42.0, 30.0, 35.0, 44.0, 34.0, 52.0, 34.0, 45.0, 49.0, 43.0, 55.0, 32.0, 28.0, 38.0, 30.0, 20.0, 22.0, 19.0, 21.0, 23.0, 14.0, 9.0, 10.0, 8.0, 7.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3359375, -14.8524169921875, -14.368896484375, -13.8853759765625, -13.40185546875, -12.9183349609375, -12.434814453125, -11.9512939453125, -11.4677734375, -10.9842529296875, -10.500732421875, -10.0172119140625, -9.53369140625, -9.0501708984375, -8.566650390625, -8.0831298828125, -7.599609375, -7.1160888671875, -6.632568359375, -6.1490478515625, -5.66552734375, -5.1820068359375, -4.698486328125, -4.2149658203125, -3.7314453125, -3.2479248046875, -2.764404296875, -2.2808837890625, -1.79736328125, -1.3138427734375, -0.830322265625, -0.3468017578125, 0.13671875, 0.6202392578125, 1.103759765625, 1.5872802734375, 2.07080078125, 2.5543212890625, 3.037841796875, 3.5213623046875, 4.0048828125, 4.4884033203125, 4.971923828125, 5.4554443359375, 5.93896484375, 6.4224853515625, 6.906005859375, 7.3895263671875, 7.873046875, 8.3565673828125, 8.840087890625, 9.3236083984375, 9.80712890625, 10.2906494140625, 10.774169921875, 11.2576904296875, 11.7412109375, 12.2247314453125, 12.708251953125, 13.1917724609375, 13.67529296875, 14.1588134765625, 14.642333984375, 15.1258544921875, 15.609375]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 3.0, 4.0, 5.0, 5.0, 5.0, 9.0, 18.0, 20.0, 23.0, 44.0, 40.0, 73.0, 78.0, 109.0, 159.0, 202.0, 307.0, 402.0, 651.0, 1031.0, 1764.0, 3071.0, 5645.0, 11667.0, 25343.0, 62684.0, 179335.0, 413842.0, 211444.0, 73329.0, 29144.0, 13148.0, 6265.0, 3364.0, 1905.0, 1067.0, 732.0, 476.0, 295.0, 227.0, 184.0, 114.0, 72.0, 65.0, 40.0, 34.0, 31.0, 24.0, 19.0, 16.0, 11.0, 5.0, 4.0, 5.0, 2.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-9.328125, -9.0230712890625, -8.718017578125, -8.4129638671875, -8.10791015625, -7.8028564453125, -7.497802734375, -7.1927490234375, -6.8876953125, -6.5826416015625, -6.277587890625, -5.9725341796875, -5.66748046875, -5.3624267578125, -5.057373046875, -4.7523193359375, -4.447265625, -4.1422119140625, -3.837158203125, -3.5321044921875, -3.22705078125, -2.9219970703125, -2.616943359375, -2.3118896484375, -2.0068359375, -1.7017822265625, -1.396728515625, -1.0916748046875, -0.78662109375, -0.4815673828125, -0.176513671875, 0.1285400390625, 0.43359375, 0.7386474609375, 1.043701171875, 1.3487548828125, 1.65380859375, 1.9588623046875, 2.263916015625, 2.5689697265625, 2.8740234375, 3.1790771484375, 3.484130859375, 3.7891845703125, 4.09423828125, 4.3992919921875, 4.704345703125, 5.0093994140625, 5.314453125, 5.6195068359375, 5.924560546875, 6.2296142578125, 6.53466796875, 6.8397216796875, 7.144775390625, 7.4498291015625, 7.7548828125, 8.0599365234375, 8.364990234375, 8.6700439453125, 8.97509765625, 9.2801513671875, 9.585205078125, 9.8902587890625, 10.1953125]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 6.0, 5.0, 8.0, 3.0, 5.0, 12.0, 4.0, 13.0, 24.0, 18.0, 20.0, 32.0, 36.0, 30.0, 44.0, 45.0, 49.0, 47.0, 87.0, 254.0, 1700.0, 154.0, 61.0, 50.0, 50.0, 36.0, 44.0, 47.0, 28.0, 19.0, 27.0, 17.0, 13.0, 17.0, 10.0, 9.0, 12.0, 9.0, 3.0, 1.0, 3.0, 0.0, 4.0, 0.0, 2.0, 0.0, 3.0], "bins": [-65.375, -63.623046875, -61.87109375, -60.119140625, -58.3671875, -56.615234375, -54.86328125, -53.111328125, -51.359375, -49.607421875, -47.85546875, -46.103515625, -44.3515625, -42.599609375, -40.84765625, -39.095703125, -37.34375, -35.591796875, -33.83984375, -32.087890625, -30.3359375, -28.583984375, -26.83203125, -25.080078125, -23.328125, -21.576171875, -19.82421875, -18.072265625, -16.3203125, -14.568359375, -12.81640625, -11.064453125, -9.3125, -7.560546875, -5.80859375, -4.056640625, -2.3046875, -0.552734375, 1.19921875, 2.951171875, 4.703125, 6.455078125, 8.20703125, 9.958984375, 11.7109375, 13.462890625, 15.21484375, 16.966796875, 18.71875, 20.470703125, 22.22265625, 23.974609375, 25.7265625, 27.478515625, 29.23046875, 30.982421875, 32.734375, 34.486328125, 36.23828125, 37.990234375, 39.7421875, 41.494140625, 43.24609375, 44.998046875, 46.75]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 2.0, 5.0, 1.0, 10.0, 10.0, 18.0, 22.0, 24.0, 35.0, 36.0, 59.0, 74.0, 81.0, 122.0, 178.0, 240.0, 332.0, 596.0, 3444.0, 3056176.0, 81589.0, 1155.0, 433.0, 260.0, 226.0, 138.0, 117.0, 81.0, 59.0, 41.0, 32.0, 15.0, 25.0, 9.0, 19.0, 7.0, 12.0, 3.0, 5.0, 3.0, 6.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-129.875, -125.7890625, -121.703125, -117.6171875, -113.53125, -109.4453125, -105.359375, -101.2734375, -97.1875, -93.1015625, -89.015625, -84.9296875, -80.84375, -76.7578125, -72.671875, -68.5859375, -64.5, -60.4140625, -56.328125, -52.2421875, -48.15625, -44.0703125, -39.984375, -35.8984375, -31.8125, -27.7265625, -23.640625, -19.5546875, -15.46875, -11.3828125, -7.296875, -3.2109375, 0.875, 4.9609375, 9.046875, 13.1328125, 17.21875, 21.3046875, 25.390625, 29.4765625, 33.5625, 37.6484375, 41.734375, 45.8203125, 49.90625, 53.9921875, 58.078125, 62.1640625, 66.25, 70.3359375, 74.421875, 78.5078125, 82.59375, 86.6796875, 90.765625, 94.8515625, 98.9375, 103.0234375, 107.109375, 111.1953125, 115.28125, 119.3671875, 123.453125, 127.5390625, 131.625]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [2.0, 73.0, 758.0, 182.0, 6.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.98760986328125, -16.812795639038086, -6.637981414794922, 3.536832809448242, 13.711647033691406, 23.886459350585938, 34.061275482177734, 44.23609161376953, 54.41090393066406, 64.5857162475586, 74.76052856445312, 84.93534851074219, 95.11016082763672, 105.28497314453125, 115.45979309082031, 125.63460540771484, 135.80941772460938, 145.98423767089844, 156.15904235839844, 166.3338623046875, 176.5086669921875, 186.68348693847656, 196.85830688476562, 207.03311157226562, 217.2079315185547, 227.38275146484375, 237.55755615234375, 247.7323760986328, 257.9071960449219, 268.0820007324219, 278.2568054199219, 288.431640625, 298.6064453125, 308.78125, 318.9560852050781, 329.1308898925781, 339.3056945800781, 349.48052978515625, 359.65533447265625, 369.83013916015625, 380.00494384765625, 390.17974853515625, 400.3545837402344, 410.5293884277344, 420.7041931152344, 430.8790283203125, 441.0538330078125, 451.2286376953125, 461.4034729003906, 471.5782775878906, 481.75311279296875, 491.92791748046875, 502.10272216796875, 512.2775268554688, 522.4523315429688, 532.627197265625, 542.802001953125, 552.976806640625, 563.151611328125, 573.326416015625, 583.5012817382812, 593.6760864257812, 603.8508911132812, 614.0256958007812, 624.2005004882812]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 6.0, 4.0, 4.0, 2.0, 12.0, 19.0, 9.0, 6.0, 11.0, 14.0, 18.0, 21.0, 32.0, 24.0, 29.0, 34.0, 25.0, 36.0, 37.0, 44.0, 42.0, 35.0, 42.0, 29.0, 42.0, 42.0, 42.0, 37.0, 43.0, 26.0, 30.0, 19.0, 22.0, 28.0, 22.0, 16.0, 17.0, 14.0, 16.0, 12.0, 14.0, 7.0, 7.0, 8.0, 4.0, 2.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.138427734375, -121.9851303100586, -117.83183288574219, -113.67853546142578, -109.52523803710938, -105.37193298339844, -101.21863555908203, -97.06533813476562, -92.91204071044922, -88.75874328613281, -84.6054458618164, -80.4521484375, -76.29884338378906, -72.14555358886719, -67.99224853515625, -63.838951110839844, -59.68565368652344, -55.53235626220703, -51.379058837890625, -47.22575759887695, -43.07246017456055, -38.91916275024414, -34.76586151123047, -30.612564086914062, -26.459266662597656, -22.30596923828125, -18.15266990661621, -13.999371528625488, -9.846073150634766, -5.692775726318359, -1.5394763946533203, 2.6138229370117188, 6.7671051025390625, 10.920403480529785, 15.073701858520508, 19.227001190185547, 23.380298614501953, 27.53359603881836, 31.6868953704834, 35.84019470214844, 39.993492126464844, 44.14678955078125, 48.300086975097656, 52.45338821411133, 56.606685638427734, 60.75998306274414, 64.91328430175781, 69.06658172607422, 73.21987915039062, 77.37317657470703, 81.52647399902344, 85.67977142333984, 89.83306884765625, 93.98637390136719, 98.1396713256836, 102.29296875, 106.4462661743164, 110.59956359863281, 114.75286102294922, 118.90615844726562, 123.05946350097656, 127.21275329589844, 131.36605834960938, 135.51934814453125, 139.6726531982422]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 9.0, 10.0, 7.0, 9.0, 22.0, 14.0, 16.0, 24.0, 32.0, 28.0, 31.0, 34.0, 31.0, 42.0, 42.0, 34.0, 45.0, 41.0, 39.0, 47.0, 57.0, 35.0, 41.0, 40.0, 31.0, 36.0, 23.0, 25.0, 24.0, 21.0, 21.0, 15.0, 15.0, 9.0, 10.0, 7.0, 8.0, 5.0, 6.0, 3.0, 5.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.9921875, -15.4837646484375, -14.975341796875, -14.4669189453125, -13.95849609375, -13.4500732421875, -12.941650390625, -12.4332275390625, -11.9248046875, -11.4163818359375, -10.907958984375, -10.3995361328125, -9.89111328125, -9.3826904296875, -8.874267578125, -8.3658447265625, -7.857421875, -7.3489990234375, -6.840576171875, -6.3321533203125, -5.82373046875, -5.3153076171875, -4.806884765625, -4.2984619140625, -3.7900390625, -3.2816162109375, -2.773193359375, -2.2647705078125, -1.75634765625, -1.2479248046875, -0.739501953125, -0.2310791015625, 0.27734375, 0.7857666015625, 1.294189453125, 1.8026123046875, 2.31103515625, 2.8194580078125, 3.327880859375, 3.8363037109375, 4.3447265625, 4.8531494140625, 5.361572265625, 5.8699951171875, 6.37841796875, 6.8868408203125, 7.395263671875, 7.9036865234375, 8.412109375, 8.9205322265625, 9.428955078125, 9.9373779296875, 10.44580078125, 10.9542236328125, 11.462646484375, 11.9710693359375, 12.4794921875, 12.9879150390625, 13.496337890625, 14.0047607421875, 14.51318359375, 15.0216064453125, 15.530029296875, 16.0384521484375, 16.546875]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 6.0, 4.0, 5.0, 5.0, 9.0, 6.0, 14.0, 11.0, 11.0, 21.0, 16.0, 23.0, 22.0, 36.0, 40.0, 68.0, 77.0, 133.0, 206.0, 408.0, 1220.0, 6642.0, 111779.0, 2119935.0, 1861383.0, 84605.0, 5467.0, 1103.0, 372.0, 189.0, 112.0, 70.0, 51.0, 50.0, 36.0, 22.0, 17.0, 19.0, 20.0, 18.0, 11.0, 6.0, 3.0, 5.0, 7.0, 10.0, 5.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-39.125, -37.90087890625, -36.6767578125, -35.45263671875, -34.228515625, -33.00439453125, -31.7802734375, -30.55615234375, -29.33203125, -28.10791015625, -26.8837890625, -25.65966796875, -24.435546875, -23.21142578125, -21.9873046875, -20.76318359375, -19.5390625, -18.31494140625, -17.0908203125, -15.86669921875, -14.642578125, -13.41845703125, -12.1943359375, -10.97021484375, -9.74609375, -8.52197265625, -7.2978515625, -6.07373046875, -4.849609375, -3.62548828125, -2.4013671875, -1.17724609375, 0.046875, 1.27099609375, 2.4951171875, 3.71923828125, 4.943359375, 6.16748046875, 7.3916015625, 8.61572265625, 9.83984375, 11.06396484375, 12.2880859375, 13.51220703125, 14.736328125, 15.96044921875, 17.1845703125, 18.40869140625, 19.6328125, 20.85693359375, 22.0810546875, 23.30517578125, 24.529296875, 25.75341796875, 26.9775390625, 28.20166015625, 29.42578125, 30.64990234375, 31.8740234375, 33.09814453125, 34.322265625, 35.54638671875, 36.7705078125, 37.99462890625, 39.21875]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 7.0, 1.0, 5.0, 6.0, 6.0, 3.0, 12.0, 13.0, 24.0, 33.0, 28.0, 36.0, 50.0, 58.0, 84.0, 92.0, 126.0, 199.0, 235.0, 314.0, 368.0, 449.0, 460.0, 355.0, 286.0, 193.0, 145.0, 120.0, 95.0, 66.0, 59.0, 39.0, 26.0, 17.0, 20.0, 17.0, 12.0, 5.0, 3.0, 6.0, 3.0, 7.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0], "bins": [-31.71875, -30.87939453125, -30.0400390625, -29.20068359375, -28.361328125, -27.52197265625, -26.6826171875, -25.84326171875, -25.00390625, -24.16455078125, -23.3251953125, -22.48583984375, -21.646484375, -20.80712890625, -19.9677734375, -19.12841796875, -18.2890625, -17.44970703125, -16.6103515625, -15.77099609375, -14.931640625, -14.09228515625, -13.2529296875, -12.41357421875, -11.57421875, -10.73486328125, -9.8955078125, -9.05615234375, -8.216796875, -7.37744140625, -6.5380859375, -5.69873046875, -4.859375, -4.02001953125, -3.1806640625, -2.34130859375, -1.501953125, -0.66259765625, 0.1767578125, 1.01611328125, 1.85546875, 2.69482421875, 3.5341796875, 4.37353515625, 5.212890625, 6.05224609375, 6.8916015625, 7.73095703125, 8.5703125, 9.40966796875, 10.2490234375, 11.08837890625, 11.927734375, 12.76708984375, 13.6064453125, 14.44580078125, 15.28515625, 16.12451171875, 16.9638671875, 17.80322265625, 18.642578125, 19.48193359375, 20.3212890625, 21.16064453125, 22.0]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 3.0, 3.0, 6.0, 6.0, 14.0, 6.0, 14.0, 18.0, 26.0, 31.0, 32.0, 49.0, 67.0, 59.0, 88.0, 119.0, 173.0, 233.0, 365.0, 638.0, 5810.0, 4096374.0, 87466.0, 1041.0, 468.0, 272.0, 185.0, 134.0, 125.0, 89.0, 82.0, 58.0, 53.0, 33.0, 31.0, 23.0, 25.0, 15.0, 16.0, 2.0, 3.0, 4.0, 10.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-145.875, -140.962890625, -136.05078125, -131.138671875, -126.2265625, -121.314453125, -116.40234375, -111.490234375, -106.578125, -101.666015625, -96.75390625, -91.841796875, -86.9296875, -82.017578125, -77.10546875, -72.193359375, -67.28125, -62.369140625, -57.45703125, -52.544921875, -47.6328125, -42.720703125, -37.80859375, -32.896484375, -27.984375, -23.072265625, -18.16015625, -13.248046875, -8.3359375, -3.423828125, 1.48828125, 6.400390625, 11.3125, 16.224609375, 21.13671875, 26.048828125, 30.9609375, 35.873046875, 40.78515625, 45.697265625, 50.609375, 55.521484375, 60.43359375, 65.345703125, 70.2578125, 75.169921875, 80.08203125, 84.994140625, 89.90625, 94.818359375, 99.73046875, 104.642578125, 109.5546875, 114.466796875, 119.37890625, 124.291015625, 129.203125, 134.115234375, 139.02734375, 143.939453125, 148.8515625, 153.763671875, 158.67578125, 163.587890625, 168.5]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 11.0, 11.0, 18.0, 38.0, 70.0, 81.0, 122.0, 148.0, 143.0, 130.0, 111.0, 61.0, 35.0, 13.0, 8.0, 3.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.38042449951172, -71.58676147460938, -67.79310607910156, -63.99944305419922, -60.205780029296875, -56.4121208190918, -52.61846160888672, -48.824798583984375, -45.0311393737793, -41.23748016357422, -37.443817138671875, -33.6501579284668, -29.856496810913086, -26.062835693359375, -22.269176483154297, -18.475515365600586, -14.681854248046875, -10.888193130493164, -7.0945329666137695, -3.300872802734375, 0.49278831481933594, 4.286449432373047, 8.080108642578125, 11.873769760131836, 15.667430877685547, 19.461091995239258, 23.25475311279297, 27.048412322998047, 30.842073440551758, 34.63573455810547, 38.42939376831055, 42.223052978515625, 46.0167236328125, 49.81038284301758, 53.60404586791992, 57.397705078125, 61.191368103027344, 64.98503112792969, 68.7786865234375, 72.57234954833984, 76.36601257324219, 80.15967559814453, 83.95333099365234, 87.74699401855469, 91.54065704345703, 95.33432006835938, 99.12797546386719, 102.92163848876953, 106.71529388427734, 110.50895690917969, 114.3026123046875, 118.09627532958984, 121.88993835449219, 125.68359375, 129.47726440429688, 133.2709197998047, 137.0645751953125, 140.8582305908203, 144.6519012451172, 148.445556640625, 152.2392120361328, 156.0328826904297, 159.8265380859375, 163.6201934814453, 167.4138641357422]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 9.0, 3.0, 12.0, 14.0, 12.0, 27.0, 26.0, 15.0, 33.0, 35.0, 23.0, 27.0, 33.0, 42.0, 30.0, 40.0, 49.0, 47.0, 36.0, 33.0, 35.0, 36.0, 43.0, 36.0, 37.0, 27.0, 29.0, 30.0, 28.0, 24.0, 11.0, 20.0, 18.0, 9.0, 12.0, 9.0, 11.0, 7.0, 8.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-90.218505859375, -87.36639404296875, -84.51427459716797, -81.66216278076172, -78.81005096435547, -75.95793151855469, -73.10581970214844, -70.25370788574219, -67.40159606933594, -64.54948425292969, -61.69736862182617, -58.845252990722656, -55.993141174316406, -53.14102554321289, -50.288909912109375, -47.436798095703125, -44.584678649902344, -41.73256301879883, -38.88045120239258, -36.02833557128906, -33.17622375488281, -30.324108123779297, -27.47199249267578, -24.6198787689209, -21.767765045166016, -18.915651321411133, -16.06353759765625, -13.211421966552734, -10.359308242797852, -7.507194519042969, -4.655078887939453, -1.8029651641845703, 1.0491485595703125, 3.9012627601623535, 6.7533769607543945, 9.605491638183594, 12.457605361938477, 15.30971908569336, 18.161834716796875, 21.013948440551758, 23.86606216430664, 26.718175888061523, 29.570289611816406, 32.42240524291992, 35.27452087402344, 38.12663269042969, 40.9787483215332, 43.83086395263672, 46.68297576904297, 49.535091400146484, 52.387203216552734, 55.23931884765625, 58.0914306640625, 60.943546295166016, 63.79566192626953, 66.64777374267578, 69.49989318847656, 72.35200500488281, 75.2041244506836, 78.05623626708984, 80.9083480834961, 83.76046752929688, 86.61257934570312, 89.46469116210938, 92.31680297851562]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 9.0, 5.0, 7.0, 9.0, 14.0, 15.0, 11.0, 13.0, 26.0, 25.0, 25.0, 29.0, 38.0, 31.0, 31.0, 33.0, 37.0, 35.0, 54.0, 44.0, 50.0, 48.0, 37.0, 32.0, 24.0, 36.0, 37.0, 36.0, 32.0, 28.0, 21.0, 13.0, 20.0, 14.0, 17.0, 9.0, 5.0, 16.0, 9.0, 11.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.328125, -14.85302734375, -14.3779296875, -13.90283203125, -13.427734375, -12.95263671875, -12.4775390625, -12.00244140625, -11.52734375, -11.05224609375, -10.5771484375, -10.10205078125, -9.626953125, -9.15185546875, -8.6767578125, -8.20166015625, -7.7265625, -7.25146484375, -6.7763671875, -6.30126953125, -5.826171875, -5.35107421875, -4.8759765625, -4.40087890625, -3.92578125, -3.45068359375, -2.9755859375, -2.50048828125, -2.025390625, -1.55029296875, -1.0751953125, -0.60009765625, -0.125, 0.35009765625, 0.8251953125, 1.30029296875, 1.775390625, 2.25048828125, 2.7255859375, 3.20068359375, 3.67578125, 4.15087890625, 4.6259765625, 5.10107421875, 5.576171875, 6.05126953125, 6.5263671875, 7.00146484375, 7.4765625, 7.95166015625, 8.4267578125, 8.90185546875, 9.376953125, 9.85205078125, 10.3271484375, 10.80224609375, 11.27734375, 11.75244140625, 12.2275390625, 12.70263671875, 13.177734375, 13.65283203125, 14.1279296875, 14.60302734375, 15.078125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 6.0, 11.0, 11.0, 19.0, 26.0, 37.0, 65.0, 83.0, 128.0, 214.0, 314.0, 500.0, 800.0, 1268.0, 1958.0, 3064.0, 4967.0, 7666.0, 12303.0, 19924.0, 32926.0, 55481.0, 97264.0, 238872.0, 308044.0, 107981.0, 60699.0, 36277.0, 21597.0, 13148.0, 8229.0, 5181.0, 3439.0, 2173.0, 1381.0, 883.0, 574.0, 361.0, 247.0, 148.0, 91.0, 70.0, 39.0, 31.0, 21.0, 15.0, 10.0, 6.0, 5.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-3.642578125, -3.529052734375, -3.41552734375, -3.302001953125, -3.1884765625, -3.074951171875, -2.96142578125, -2.847900390625, -2.734375, -2.620849609375, -2.50732421875, -2.393798828125, -2.2802734375, -2.166748046875, -2.05322265625, -1.939697265625, -1.826171875, -1.712646484375, -1.59912109375, -1.485595703125, -1.3720703125, -1.258544921875, -1.14501953125, -1.031494140625, -0.91796875, -0.804443359375, -0.69091796875, -0.577392578125, -0.4638671875, -0.350341796875, -0.23681640625, -0.123291015625, -0.009765625, 0.103759765625, 0.21728515625, 0.330810546875, 0.4443359375, 0.557861328125, 0.67138671875, 0.784912109375, 0.8984375, 1.011962890625, 1.12548828125, 1.239013671875, 1.3525390625, 1.466064453125, 1.57958984375, 1.693115234375, 1.806640625, 1.920166015625, 2.03369140625, 2.147216796875, 2.2607421875, 2.374267578125, 2.48779296875, 2.601318359375, 2.71484375, 2.828369140625, 2.94189453125, 3.055419921875, 3.1689453125, 3.282470703125, 3.39599609375, 3.509521484375, 3.623046875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 3.0, 7.0, 9.0, 6.0, 9.0, 10.0, 13.0, 14.0, 20.0, 22.0, 23.0, 23.0, 32.0, 29.0, 31.0, 33.0, 31.0, 27.0, 44.0, 33.0, 52.0, 1063.0, 51.0, 35.0, 23.0, 52.0, 45.0, 29.0, 23.0, 31.0, 31.0, 30.0, 30.0, 20.0, 21.0, 18.0, 12.0, 5.0, 9.0, 9.0, 7.0, 3.0, 4.0, 3.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-10.2734375, -9.9771728515625, -9.680908203125, -9.3846435546875, -9.08837890625, -8.7921142578125, -8.495849609375, -8.1995849609375, -7.9033203125, -7.6070556640625, -7.310791015625, -7.0145263671875, -6.71826171875, -6.4219970703125, -6.125732421875, -5.8294677734375, -5.533203125, -5.2369384765625, -4.940673828125, -4.6444091796875, -4.34814453125, -4.0518798828125, -3.755615234375, -3.4593505859375, -3.1630859375, -2.8668212890625, -2.570556640625, -2.2742919921875, -1.97802734375, -1.6817626953125, -1.385498046875, -1.0892333984375, -0.79296875, -0.4967041015625, -0.200439453125, 0.0958251953125, 0.39208984375, 0.6883544921875, 0.984619140625, 1.2808837890625, 1.5771484375, 1.8734130859375, 2.169677734375, 2.4659423828125, 2.76220703125, 3.0584716796875, 3.354736328125, 3.6510009765625, 3.947265625, 4.2435302734375, 4.539794921875, 4.8360595703125, 5.13232421875, 5.4285888671875, 5.724853515625, 6.0211181640625, 6.3173828125, 6.6136474609375, 6.909912109375, 7.2061767578125, 7.50244140625, 7.7987060546875, 8.094970703125, 8.3912353515625, 8.6875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 3.0, 0.0, 4.0, 13.0, 5.0, 14.0, 24.0, 38.0, 57.0, 77.0, 106.0, 168.0, 228.0, 371.0, 530.0, 801.0, 1191.0, 1822.0, 2562.0, 3922.0, 5722.0, 8615.0, 12974.0, 19898.0, 30176.0, 47269.0, 77619.0, 136638.0, 1353636.0, 157677.0, 85909.0, 52162.0, 32826.0, 21343.0, 14326.0, 9276.0, 6288.0, 4170.0, 2842.0, 1873.0, 1287.0, 852.0, 617.0, 389.0, 296.0, 182.0, 131.0, 77.0, 47.0, 43.0, 18.0, 10.0, 9.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.70703125, -2.615570068359375, -2.52410888671875, -2.432647705078125, -2.3411865234375, -2.249725341796875, -2.15826416015625, -2.066802978515625, -1.975341796875, -1.883880615234375, -1.79241943359375, -1.700958251953125, -1.6094970703125, -1.518035888671875, -1.42657470703125, -1.335113525390625, -1.24365234375, -1.152191162109375, -1.06072998046875, -0.969268798828125, -0.8778076171875, -0.786346435546875, -0.69488525390625, -0.603424072265625, -0.511962890625, -0.420501708984375, -0.32904052734375, -0.237579345703125, -0.1461181640625, -0.054656982421875, 0.03680419921875, 0.128265380859375, 0.2197265625, 0.311187744140625, 0.40264892578125, 0.494110107421875, 0.5855712890625, 0.677032470703125, 0.76849365234375, 0.859954833984375, 0.951416015625, 1.042877197265625, 1.13433837890625, 1.225799560546875, 1.3172607421875, 1.408721923828125, 1.50018310546875, 1.591644287109375, 1.68310546875, 1.774566650390625, 1.86602783203125, 1.957489013671875, 2.0489501953125, 2.140411376953125, 2.23187255859375, 2.323333740234375, 2.414794921875, 2.506256103515625, 2.59771728515625, 2.689178466796875, 2.7806396484375, 2.872100830078125, 2.96356201171875, 3.055023193359375, 3.146484375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 11.0, 11.0, 15.0, 14.0, 27.0, 26.0, 32.0, 51.0, 57.0, 50.0, 63.0, 69.0, 63.0, 88.0, 51.0, 59.0, 66.0, 44.0, 38.0, 25.0, 34.0, 18.0, 16.0, 14.0, 10.0, 8.0, 12.0, 6.0, 3.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.002552032470703125, -0.002484947443008423, -0.0024178624153137207, -0.0023507773876190186, -0.0022836923599243164, -0.0022166073322296143, -0.002149522304534912, -0.00208243727684021, -0.002015352249145508, -0.0019482672214508057, -0.0018811821937561035, -0.0018140971660614014, -0.0017470121383666992, -0.001679927110671997, -0.001612842082977295, -0.0015457570552825928, -0.0014786720275878906, -0.0014115869998931885, -0.0013445019721984863, -0.0012774169445037842, -0.001210331916809082, -0.0011432468891143799, -0.0010761618614196777, -0.0010090768337249756, -0.0009419918060302734, -0.0008749067783355713, -0.0008078217506408691, -0.000740736722946167, -0.0006736516952514648, -0.0006065666675567627, -0.0005394816398620605, -0.0004723966121673584, -0.00040531158447265625, -0.0003382265567779541, -0.00027114152908325195, -0.0002040565013885498, -0.00013697147369384766, -6.988644599914551e-05, -2.8014183044433594e-06, 6.428360939025879e-05, 0.00013136863708496094, 0.00019845366477966309, 0.00026553869247436523, 0.0003326237201690674, 0.00039970874786376953, 0.0004667937755584717, 0.0005338788032531738, 0.000600963830947876, 0.0006680488586425781, 0.0007351338863372803, 0.0008022189140319824, 0.0008693039417266846, 0.0009363889694213867, 0.0010034739971160889, 0.001070559024810791, 0.0011376440525054932, 0.0012047290802001953, 0.0012718141078948975, 0.0013388991355895996, 0.0014059841632843018, 0.001473069190979004, 0.001540154218673706, 0.0016072392463684082, 0.0016743242740631104, 0.0017414093017578125]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 5.0, 5.0, 7.0, 6.0, 11.0, 10.0, 12.0, 10.0, 21.0, 25.0, 30.0, 31.0, 44.0, 60.0, 88.0, 172.0, 493.0, 20491.0, 1025077.0, 1228.0, 280.0, 120.0, 77.0, 63.0, 37.0, 39.0, 24.0, 13.0, 15.0, 10.0, 19.0, 10.0, 8.0, 5.0, 2.0, 4.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04345703125, -0.041800498962402344, -0.04014396667480469, -0.03848743438720703, -0.036830902099609375, -0.03517436981201172, -0.03351783752441406, -0.031861305236816406, -0.03020477294921875, -0.028548240661621094, -0.026891708374023438, -0.02523517608642578, -0.023578643798828125, -0.02192211151123047, -0.020265579223632812, -0.018609046936035156, -0.0169525146484375, -0.015295982360839844, -0.013639450073242188, -0.011982917785644531, -0.010326385498046875, -0.008669853210449219, -0.0070133209228515625, -0.005356788635253906, -0.00370025634765625, -0.0020437240600585938, -0.0003871917724609375, 0.0012693405151367188, 0.002925872802734375, 0.004582405090332031, 0.0062389373779296875, 0.007895469665527344, 0.009552001953125, 0.011208534240722656, 0.012865066528320312, 0.014521598815917969, 0.016178131103515625, 0.01783466339111328, 0.019491195678710938, 0.021147727966308594, 0.02280426025390625, 0.024460792541503906, 0.026117324829101562, 0.02777385711669922, 0.029430389404296875, 0.03108692169189453, 0.03274345397949219, 0.034399986267089844, 0.0360565185546875, 0.037713050842285156, 0.03936958312988281, 0.04102611541748047, 0.042682647705078125, 0.04433917999267578, 0.04599571228027344, 0.047652244567871094, 0.04930877685546875, 0.050965309143066406, 0.05262184143066406, 0.05427837371826172, 0.055934906005859375, 0.05759143829345703, 0.05924797058105469, 0.060904502868652344, 0.06256103515625]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 131.0, 557.0, 300.0, 20.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.00871509499847889, -0.008552760817110538, -0.008390425704419613, -0.008228091523051262, -0.008065757341682911, -0.00790342316031456, -0.007741088513284922, -0.007578753866255283, -0.007416419684886932, -0.007254085037857294, -0.007091750856488943, -0.006929416209459305, -0.006767082028090954, -0.0066047473810613155, -0.0064424131996929646, -0.006280078552663326, -0.006117744371294975, -0.005955409724265337, -0.005793075542896986, -0.005630740895867348, -0.005468406714498997, -0.0053060720674693584, -0.0051437378861010075, -0.004981403239071369, -0.004819068592041731, -0.004656733945012093, -0.004494399763643742, -0.004332065116614103, -0.004169730935245752, -0.004007396288216114, -0.003845062106847763, -0.0036827274598181248, -0.0035203928127884865, -0.003358058398589492, -0.003195723984390497, -0.0030333895701915026, -0.002871055155992508, -0.0027087207417935133, -0.0025463863275945187, -0.0023840516805648804, -0.0022217174991965294, -0.0020593830849975348, -0.0018970486707985401, -0.0017347142565995455, -0.0015723798424005508, -0.0014100454282015562, -0.0012477108975872397, -0.001085376483388245, -0.0009230420691892505, -0.0007607076549902558, -0.0005983732407912612, -0.00043603876838460565, -0.000273704354185611, -0.00011136993998661637, 5.096453242003918e-05, 0.0002132989466190338, 0.00037563336081802845, 0.0005379677750170231, 0.0007003021892160177, 0.0008626366616226733, 0.001024971017614007, 0.0011873054318130016, 0.001349639962427318, 0.0015119743766263127, 0.0016743087908253074]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 6.0, 1.0, 6.0, 9.0, 7.0, 14.0, 16.0, 17.0, 16.0, 19.0, 18.0, 13.0, 31.0, 27.0, 29.0, 42.0, 30.0, 32.0, 40.0, 32.0, 33.0, 31.0, 43.0, 42.0, 34.0, 38.0, 31.0, 43.0, 32.0, 35.0, 28.0, 28.0, 19.0, 21.0, 19.0, 25.0, 16.0, 15.0, 10.0, 8.0, 13.0, 12.0, 7.0, 3.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0008792877197265625, -0.0008515045046806335, -0.0008237212896347046, -0.0007959380745887756, -0.0007681548595428467, -0.0007403716444969177, -0.0007125884294509888, -0.0006848052144050598, -0.0006570219993591309, -0.0006292387843132019, -0.000601455569267273, -0.000573672354221344, -0.000545889139175415, -0.0005181059241294861, -0.0004903227090835571, -0.0004625394940376282, -0.0004347562789916992, -0.00040697306394577026, -0.0003791898488998413, -0.00035140663385391235, -0.0003236234188079834, -0.00029584020376205444, -0.0002680569887161255, -0.00024027377367019653, -0.00021249055862426758, -0.00018470734357833862, -0.00015692412853240967, -0.0001291409134864807, -0.00010135769844055176, -7.35744833946228e-05, -4.579126834869385e-05, -1.8008053302764893e-05, 9.775161743164062e-06, 3.755837678909302e-05, 6.534159183502197e-05, 9.312480688095093e-05, 0.00012090802192687988, 0.00014869123697280884, 0.0001764744520187378, 0.00020425766706466675, 0.0002320408821105957, 0.00025982409715652466, 0.0002876073122024536, 0.00031539052724838257, 0.0003431737422943115, 0.0003709569573402405, 0.00039874017238616943, 0.0004265233874320984, 0.00045430660247802734, 0.0004820898175239563, 0.0005098730325698853, 0.0005376562476158142, 0.0005654394626617432, 0.0005932226777076721, 0.0006210058927536011, 0.00064878910779953, 0.000676572322845459, 0.0007043555378913879, 0.0007321387529373169, 0.0007599219679832458, 0.0007877051830291748, 0.0008154883980751038, 0.0008432716131210327, 0.0008710548281669617, 0.0008988380432128906]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 9.0, 5.0, 7.0, 9.0, 14.0, 15.0, 11.0, 13.0, 26.0, 25.0, 25.0, 29.0, 38.0, 31.0, 31.0, 33.0, 37.0, 35.0, 55.0, 43.0, 50.0, 48.0, 37.0, 32.0, 24.0, 36.0, 37.0, 36.0, 32.0, 28.0, 21.0, 13.0, 20.0, 14.0, 17.0, 9.0, 5.0, 16.0, 9.0, 11.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-15.328125, -14.85302734375, -14.3779296875, -13.90283203125, -13.427734375, -12.95263671875, -12.4775390625, -12.00244140625, -11.52734375, -11.05224609375, -10.5771484375, -10.10205078125, -9.626953125, -9.15185546875, -8.6767578125, -8.20166015625, -7.7265625, -7.25146484375, -6.7763671875, -6.30126953125, -5.826171875, -5.35107421875, -4.8759765625, -4.40087890625, -3.92578125, -3.45068359375, -2.9755859375, -2.50048828125, -2.025390625, -1.55029296875, -1.0751953125, -0.60009765625, -0.125, 0.35009765625, 0.8251953125, 1.30029296875, 1.775390625, 2.25048828125, 2.7255859375, 3.20068359375, 3.67578125, 4.15087890625, 4.6259765625, 5.10107421875, 5.576171875, 6.05126953125, 6.5263671875, 7.00146484375, 7.4765625, 7.95166015625, 8.4267578125, 8.90185546875, 9.376953125, 9.85205078125, 10.3271484375, 10.80224609375, 11.27734375, 11.75244140625, 12.2275390625, 12.70263671875, 13.177734375, 13.65283203125, 14.1279296875, 14.60302734375, 15.078125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 3.0, 10.0, 7.0, 7.0, 12.0, 17.0, 21.0, 22.0, 28.0, 52.0, 58.0, 93.0, 133.0, 245.0, 369.0, 764.0, 1666.0, 4687.0, 14263.0, 51005.0, 249468.0, 571683.0, 113478.0, 26814.0, 8264.0, 2868.0, 1145.0, 523.0, 295.0, 171.0, 100.0, 68.0, 52.0, 37.0, 26.0, 27.0, 13.0, 8.0, 16.0, 10.0, 12.0, 6.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-14.8828125, -14.4215087890625, -13.960205078125, -13.4989013671875, -13.03759765625, -12.5762939453125, -12.114990234375, -11.6536865234375, -11.1923828125, -10.7310791015625, -10.269775390625, -9.8084716796875, -9.34716796875, -8.8858642578125, -8.424560546875, -7.9632568359375, -7.501953125, -7.0406494140625, -6.579345703125, -6.1180419921875, -5.65673828125, -5.1954345703125, -4.734130859375, -4.2728271484375, -3.8115234375, -3.3502197265625, -2.888916015625, -2.4276123046875, -1.96630859375, -1.5050048828125, -1.043701171875, -0.5823974609375, -0.12109375, 0.3402099609375, 0.801513671875, 1.2628173828125, 1.72412109375, 2.1854248046875, 2.646728515625, 3.1080322265625, 3.5693359375, 4.0306396484375, 4.491943359375, 4.9532470703125, 5.41455078125, 5.8758544921875, 6.337158203125, 6.7984619140625, 7.259765625, 7.7210693359375, 8.182373046875, 8.6436767578125, 9.10498046875, 9.5662841796875, 10.027587890625, 10.4888916015625, 10.9501953125, 11.4114990234375, 11.872802734375, 12.3341064453125, 12.79541015625, 13.2567138671875, 13.718017578125, 14.1793212890625, 14.640625]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 8.0, 4.0, 4.0, 5.0, 6.0, 12.0, 16.0, 15.0, 16.0, 17.0, 37.0, 42.0, 25.0, 32.0, 43.0, 48.0, 29.0, 47.0, 99.0, 1869.0, 211.0, 71.0, 57.0, 41.0, 47.0, 40.0, 31.0, 33.0, 29.0, 25.0, 19.0, 14.0, 13.0, 9.0, 6.0, 9.0, 7.0, 9.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-47.59375, -45.81103515625, -44.0283203125, -42.24560546875, -40.462890625, -38.68017578125, -36.8974609375, -35.11474609375, -33.33203125, -31.54931640625, -29.7666015625, -27.98388671875, -26.201171875, -24.41845703125, -22.6357421875, -20.85302734375, -19.0703125, -17.28759765625, -15.5048828125, -13.72216796875, -11.939453125, -10.15673828125, -8.3740234375, -6.59130859375, -4.80859375, -3.02587890625, -1.2431640625, 0.53955078125, 2.322265625, 4.10498046875, 5.8876953125, 7.67041015625, 9.453125, 11.23583984375, 13.0185546875, 14.80126953125, 16.583984375, 18.36669921875, 20.1494140625, 21.93212890625, 23.71484375, 25.49755859375, 27.2802734375, 29.06298828125, 30.845703125, 32.62841796875, 34.4111328125, 36.19384765625, 37.9765625, 39.75927734375, 41.5419921875, 43.32470703125, 45.107421875, 46.89013671875, 48.6728515625, 50.45556640625, 52.23828125, 54.02099609375, 55.8037109375, 57.58642578125, 59.369140625, 61.15185546875, 62.9345703125, 64.71728515625, 66.5]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 3.0, 4.0, 7.0, 9.0, 12.0, 8.0, 12.0, 13.0, 13.0, 25.0, 40.0, 37.0, 68.0, 79.0, 103.0, 155.0, 241.0, 361.0, 888.0, 11592.0, 3124031.0, 6149.0, 740.0, 325.0, 230.0, 153.0, 97.0, 80.0, 62.0, 47.0, 26.0, 21.0, 20.0, 15.0, 8.0, 6.0, 5.0, 4.0, 13.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-147.5, -143.3369140625, -139.173828125, -135.0107421875, -130.84765625, -126.6845703125, -122.521484375, -118.3583984375, -114.1953125, -110.0322265625, -105.869140625, -101.7060546875, -97.54296875, -93.3798828125, -89.216796875, -85.0537109375, -80.890625, -76.7275390625, -72.564453125, -68.4013671875, -64.23828125, -60.0751953125, -55.912109375, -51.7490234375, -47.5859375, -43.4228515625, -39.259765625, -35.0966796875, -30.93359375, -26.7705078125, -22.607421875, -18.4443359375, -14.28125, -10.1181640625, -5.955078125, -1.7919921875, 2.37109375, 6.5341796875, 10.697265625, 14.8603515625, 19.0234375, 23.1865234375, 27.349609375, 31.5126953125, 35.67578125, 39.8388671875, 44.001953125, 48.1650390625, 52.328125, 56.4912109375, 60.654296875, 64.8173828125, 68.98046875, 73.1435546875, 77.306640625, 81.4697265625, 85.6328125, 89.7958984375, 93.958984375, 98.1220703125, 102.28515625, 106.4482421875, 110.611328125, 114.7744140625, 118.9375]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 101.0, 908.0, 11.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-700.9904174804688, -687.8353881835938, -674.6802978515625, -661.5252685546875, -648.3702392578125, -635.2152099609375, -622.0601196289062, -608.9050903320312, -595.7500610351562, -582.5950317382812, -569.43994140625, -556.284912109375, -543.1298828125, -529.974853515625, -516.8197631835938, -503.66473388671875, -490.5096435546875, -477.3545837402344, -464.1995544433594, -451.04449462890625, -437.88946533203125, -424.7344055175781, -411.579345703125, -398.42431640625, -385.269287109375, -372.1142272949219, -358.9591979980469, -345.80413818359375, -332.64910888671875, -319.4940490722656, -306.3389892578125, -293.1839599609375, -280.0289001464844, -266.87384033203125, -253.71881103515625, -240.56375122070312, -227.40870666503906, -214.253662109375, -201.09861755371094, -187.94357299804688, -174.78851318359375, -161.6334686279297, -148.47842407226562, -135.3233642578125, -122.16831970214844, -109.01327514648438, -95.85823059082031, -82.70317840576172, -69.54814147949219, -56.39309310913086, -43.23804473876953, -30.08300018310547, -16.92795181274414, -3.7729034423828125, 9.38214111328125, 22.537193298339844, 35.692237854003906, 48.847286224365234, 62.00233459472656, 75.15737915039062, 88.31242370605469, 101.46747589111328, 114.62252044677734, 127.77757263183594, 140.9326171875]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 4.0, 0.0, 1.0, 2.0, 7.0, 7.0, 11.0, 15.0, 12.0, 13.0, 20.0, 20.0, 26.0, 19.0, 21.0, 20.0, 30.0, 32.0, 50.0, 42.0, 44.0, 37.0, 43.0, 38.0, 44.0, 48.0, 39.0, 31.0, 38.0, 31.0, 33.0, 39.0, 19.0, 25.0, 19.0, 23.0, 23.0, 9.0, 15.0, 9.0, 9.0, 10.0, 11.0, 4.0, 8.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0], "bins": [-132.06719970703125, -128.21533203125, -124.36345672607422, -120.51158905029297, -116.65972137451172, -112.80784606933594, -108.95597839355469, -105.10411071777344, -101.25224304199219, -97.40037536621094, -93.54850006103516, -89.6966323852539, -85.84476470947266, -81.99288940429688, -78.14102172851562, -74.28915405273438, -70.4372787475586, -66.58541107177734, -62.73353958129883, -58.88166809082031, -55.02980041503906, -51.17792892456055, -47.32605743408203, -43.47418975830078, -39.622318267822266, -35.77044677734375, -31.9185791015625, -28.066707611083984, -24.2148380279541, -20.36296844482422, -16.511096954345703, -12.65922737121582, -8.807357788085938, -4.9554877281188965, -1.1036176681518555, 2.7482528686523438, 6.600122451782227, 10.45199203491211, 14.303863525390625, 18.155733108520508, 22.00760269165039, 25.859472274780273, 29.711341857910156, 33.56321334838867, 37.41508483886719, 41.26695251464844, 45.11882400512695, 48.97069549560547, 52.82256317138672, 56.674434661865234, 60.526302337646484, 64.378173828125, 68.23004150390625, 72.0819091796875, 75.93378448486328, 79.78565216064453, 83.63752746582031, 87.48939514160156, 91.34127044677734, 95.1931381225586, 99.04500579833984, 102.89688110351562, 106.74874877929688, 110.60061645507812, 114.45248413085938]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 4.0, 7.0, 6.0, 8.0, 7.0, 17.0, 14.0, 14.0, 9.0, 28.0, 26.0, 31.0, 36.0, 33.0, 28.0, 33.0, 30.0, 40.0, 49.0, 45.0, 41.0, 38.0, 45.0, 37.0, 35.0, 25.0, 38.0, 33.0, 30.0, 32.0, 27.0, 20.0, 14.0, 17.0, 18.0, 16.0, 7.0, 11.0, 11.0, 8.0, 9.0, 10.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.28125, -14.80517578125, -14.3291015625, -13.85302734375, -13.376953125, -12.90087890625, -12.4248046875, -11.94873046875, -11.47265625, -10.99658203125, -10.5205078125, -10.04443359375, -9.568359375, -9.09228515625, -8.6162109375, -8.14013671875, -7.6640625, -7.18798828125, -6.7119140625, -6.23583984375, -5.759765625, -5.28369140625, -4.8076171875, -4.33154296875, -3.85546875, -3.37939453125, -2.9033203125, -2.42724609375, -1.951171875, -1.47509765625, -0.9990234375, -0.52294921875, -0.046875, 0.42919921875, 0.9052734375, 1.38134765625, 1.857421875, 2.33349609375, 2.8095703125, 3.28564453125, 3.76171875, 4.23779296875, 4.7138671875, 5.18994140625, 5.666015625, 6.14208984375, 6.6181640625, 7.09423828125, 7.5703125, 8.04638671875, 8.5224609375, 8.99853515625, 9.474609375, 9.95068359375, 10.4267578125, 10.90283203125, 11.37890625, 11.85498046875, 12.3310546875, 12.80712890625, 13.283203125, 13.75927734375, 14.2353515625, 14.71142578125, 15.1875]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 8.0, 6.0, 9.0, 9.0, 4.0, 7.0, 12.0, 14.0, 14.0, 21.0, 29.0, 27.0, 28.0, 39.0, 53.0, 58.0, 78.0, 90.0, 122.0, 149.0, 212.0, 320.0, 691.0, 1945.0, 10610.0, 182762.0, 2204790.0, 1685945.0, 95848.0, 7094.0, 1516.0, 547.0, 310.0, 193.0, 133.0, 86.0, 86.0, 76.0, 69.0, 46.0, 26.0, 33.0, 29.0, 19.0, 27.0, 18.0, 25.0, 10.0, 8.0, 15.0, 6.0, 6.0, 7.0, 1.0, 7.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-34.0, -32.89990234375, -31.7998046875, -30.69970703125, -29.599609375, -28.49951171875, -27.3994140625, -26.29931640625, -25.19921875, -24.09912109375, -22.9990234375, -21.89892578125, -20.798828125, -19.69873046875, -18.5986328125, -17.49853515625, -16.3984375, -15.29833984375, -14.1982421875, -13.09814453125, -11.998046875, -10.89794921875, -9.7978515625, -8.69775390625, -7.59765625, -6.49755859375, -5.3974609375, -4.29736328125, -3.197265625, -2.09716796875, -0.9970703125, 0.10302734375, 1.203125, 2.30322265625, 3.4033203125, 4.50341796875, 5.603515625, 6.70361328125, 7.8037109375, 8.90380859375, 10.00390625, 11.10400390625, 12.2041015625, 13.30419921875, 14.404296875, 15.50439453125, 16.6044921875, 17.70458984375, 18.8046875, 19.90478515625, 21.0048828125, 22.10498046875, 23.205078125, 24.30517578125, 25.4052734375, 26.50537109375, 27.60546875, 28.70556640625, 29.8056640625, 30.90576171875, 32.005859375, 33.10595703125, 34.2060546875, 35.30615234375, 36.40625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 8.0, 7.0, 9.0, 3.0, 7.0, 9.0, 20.0, 28.0, 30.0, 48.0, 71.0, 89.0, 147.0, 186.0, 244.0, 370.0, 482.0, 571.0, 484.0, 363.0, 275.0, 185.0, 148.0, 70.0, 69.0, 37.0, 41.0, 33.0, 17.0, 11.0, 8.0, 4.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.125, -32.136962890625, -31.14892578125, -30.160888671875, -29.1728515625, -28.184814453125, -27.19677734375, -26.208740234375, -25.220703125, -24.232666015625, -23.24462890625, -22.256591796875, -21.2685546875, -20.280517578125, -19.29248046875, -18.304443359375, -17.31640625, -16.328369140625, -15.34033203125, -14.352294921875, -13.3642578125, -12.376220703125, -11.38818359375, -10.400146484375, -9.412109375, -8.424072265625, -7.43603515625, -6.447998046875, -5.4599609375, -4.471923828125, -3.48388671875, -2.495849609375, -1.5078125, -0.519775390625, 0.46826171875, 1.456298828125, 2.4443359375, 3.432373046875, 4.42041015625, 5.408447265625, 6.396484375, 7.384521484375, 8.37255859375, 9.360595703125, 10.3486328125, 11.336669921875, 12.32470703125, 13.312744140625, 14.30078125, 15.288818359375, 16.27685546875, 17.264892578125, 18.2529296875, 19.240966796875, 20.22900390625, 21.217041015625, 22.205078125, 23.193115234375, 24.18115234375, 25.169189453125, 26.1572265625, 27.145263671875, 28.13330078125, 29.121337890625, 30.109375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 3.0, 6.0, 11.0, 19.0, 13.0, 36.0, 40.0, 40.0, 81.0, 89.0, 110.0, 156.0, 247.0, 322.0, 529.0, 1442.0, 1635607.0, 2552258.0, 1501.0, 503.0, 330.0, 218.0, 157.0, 116.0, 114.0, 88.0, 57.0, 45.0, 28.0, 30.0, 25.0, 12.0, 14.0, 14.0, 4.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-184.125, -178.548828125, -172.97265625, -167.396484375, -161.8203125, -156.244140625, -150.66796875, -145.091796875, -139.515625, -133.939453125, -128.36328125, -122.787109375, -117.2109375, -111.634765625, -106.05859375, -100.482421875, -94.90625, -89.330078125, -83.75390625, -78.177734375, -72.6015625, -67.025390625, -61.44921875, -55.873046875, -50.296875, -44.720703125, -39.14453125, -33.568359375, -27.9921875, -22.416015625, -16.83984375, -11.263671875, -5.6875, -0.111328125, 5.46484375, 11.041015625, 16.6171875, 22.193359375, 27.76953125, 33.345703125, 38.921875, 44.498046875, 50.07421875, 55.650390625, 61.2265625, 66.802734375, 72.37890625, 77.955078125, 83.53125, 89.107421875, 94.68359375, 100.259765625, 105.8359375, 111.412109375, 116.98828125, 122.564453125, 128.140625, 133.716796875, 139.29296875, 144.869140625, 150.4453125, 156.021484375, 161.59765625, 167.173828125, 172.75]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 10.0, 364.0, 604.0, 36.0, 2.0, 1.0], "bins": [-1339.5291748046875, -1317.2569580078125, -1294.98486328125, -1272.712646484375, -1250.4404296875, -1228.168212890625, -1205.8961181640625, -1183.6239013671875, -1161.3516845703125, -1139.0794677734375, -1116.807373046875, -1094.53515625, -1072.262939453125, -1049.99072265625, -1027.7186279296875, -1005.4464111328125, -983.17431640625, -960.9021606445312, -938.6299438476562, -916.3577880859375, -894.0855712890625, -871.8134155273438, -849.541259765625, -827.26904296875, -804.996826171875, -782.7246704101562, -760.4524536132812, -738.1802978515625, -715.9080810546875, -693.6359252929688, -671.36376953125, -649.091552734375, -626.8193969726562, -604.5472412109375, -582.2750244140625, -560.0028686523438, -537.7306518554688, -515.45849609375, -493.1863098144531, -470.91412353515625, -448.6419677734375, -426.3697814941406, -404.09759521484375, -381.825439453125, -359.5532531738281, -337.28106689453125, -315.0088806152344, -292.7366943359375, -270.46453857421875, -248.19235229492188, -225.92018127441406, -203.6479949951172, -181.37582397460938, -159.1036376953125, -136.83145141601562, -114.55928039550781, -92.28707885742188, -70.01490020751953, -47.74271774291992, -25.470535278320312, -3.1983566284179688, 19.073822021484375, 41.34600830078125, 63.61817932128906, 85.89036560058594]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 7.0, 4.0, 3.0, 5.0, 4.0, 4.0, 4.0, 8.0, 7.0, 9.0, 11.0, 20.0, 16.0, 29.0, 28.0, 33.0, 28.0, 30.0, 42.0, 56.0, 32.0, 35.0, 37.0, 45.0, 42.0, 44.0, 49.0, 32.0, 36.0, 40.0, 34.0, 27.0, 34.0, 28.0, 18.0, 27.0, 13.0, 15.0, 20.0, 13.0, 11.0, 10.0, 5.0, 4.0, 3.0, 4.0, 4.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-77.71340942382812, -74.9053726196289, -72.09733581542969, -69.28929901123047, -66.48126220703125, -63.67322540283203, -60.86518478393555, -58.05714797973633, -55.24911117553711, -52.44107437133789, -49.63303756713867, -46.82499694824219, -44.01696014404297, -41.20892333984375, -38.40088653564453, -35.59284973144531, -32.784812927246094, -29.976776123046875, -27.168739318847656, -24.360700607299805, -21.552663803100586, -18.744626998901367, -15.936588287353516, -13.128551483154297, -10.320514678955078, -7.512477397918701, -4.704440116882324, -1.896402359008789, 0.9116344451904297, 3.7196712493896484, 6.5277099609375, 9.335746765136719, 12.143783569335938, 14.951820373535156, 17.759857177734375, 20.567895889282227, 23.375932693481445, 26.183969497680664, 28.992008209228516, 31.800045013427734, 34.60808181762695, 37.41611862182617, 40.22415542602539, 43.032196044921875, 45.840232849121094, 48.64826965332031, 51.45630645751953, 54.26434326171875, 57.07238006591797, 59.88041687011719, 62.688453674316406, 65.49649047851562, 68.30452728271484, 71.11256408691406, 73.92060852050781, 76.7286376953125, 79.53668212890625, 82.34471893310547, 85.15275573730469, 87.9607925415039, 90.76882934570312, 93.57686614990234, 96.38490295410156, 99.19294738769531, 102.0009765625]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 4.0, 2.0, 10.0, 9.0, 12.0, 10.0, 14.0, 14.0, 12.0, 20.0, 26.0, 25.0, 30.0, 30.0, 37.0, 35.0, 31.0, 48.0, 41.0, 33.0, 47.0, 45.0, 53.0, 46.0, 37.0, 31.0, 29.0, 32.0, 19.0, 32.0, 27.0, 21.0, 19.0, 17.0, 21.0, 15.0, 11.0, 10.0, 8.0, 7.0, 8.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1953125, -14.7244873046875, -14.253662109375, -13.7828369140625, -13.31201171875, -12.8411865234375, -12.370361328125, -11.8995361328125, -11.4287109375, -10.9578857421875, -10.487060546875, -10.0162353515625, -9.54541015625, -9.0745849609375, -8.603759765625, -8.1329345703125, -7.662109375, -7.1912841796875, -6.720458984375, -6.2496337890625, -5.77880859375, -5.3079833984375, -4.837158203125, -4.3663330078125, -3.8955078125, -3.4246826171875, -2.953857421875, -2.4830322265625, -2.01220703125, -1.5413818359375, -1.070556640625, -0.5997314453125, -0.12890625, 0.3419189453125, 0.812744140625, 1.2835693359375, 1.75439453125, 2.2252197265625, 2.696044921875, 3.1668701171875, 3.6376953125, 4.1085205078125, 4.579345703125, 5.0501708984375, 5.52099609375, 5.9918212890625, 6.462646484375, 6.9334716796875, 7.404296875, 7.8751220703125, 8.345947265625, 8.8167724609375, 9.28759765625, 9.7584228515625, 10.229248046875, 10.7000732421875, 11.1708984375, 11.6417236328125, 12.112548828125, 12.5833740234375, 13.05419921875, 13.5250244140625, 13.995849609375, 14.4666748046875, 14.9375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 8.0, 16.0, 21.0, 22.0, 35.0, 48.0, 73.0, 99.0, 153.0, 198.0, 285.0, 381.0, 566.0, 773.0, 1174.0, 1521.0, 2210.0, 3051.0, 4445.0, 6344.0, 9197.0, 13433.0, 19858.0, 29943.0, 46262.0, 74933.0, 136637.0, 299572.0, 159939.0, 84105.0, 51155.0, 32606.0, 21733.0, 14757.0, 9956.0, 6813.0, 4814.0, 3355.0, 2377.0, 1657.0, 1174.0, 849.0, 606.0, 434.0, 301.0, 209.0, 173.0, 84.0, 86.0, 47.0, 26.0, 15.0, 13.0, 13.0, 5.0, 2.0, 2.0, 2.0, 0.0, 3.0], "bins": [-2.9765625, -2.88238525390625, -2.7882080078125, -2.69403076171875, -2.599853515625, -2.50567626953125, -2.4114990234375, -2.31732177734375, -2.22314453125, -2.12896728515625, -2.0347900390625, -1.94061279296875, -1.846435546875, -1.75225830078125, -1.6580810546875, -1.56390380859375, -1.4697265625, -1.37554931640625, -1.2813720703125, -1.18719482421875, -1.093017578125, -0.99884033203125, -0.9046630859375, -0.81048583984375, -0.71630859375, -0.62213134765625, -0.5279541015625, -0.43377685546875, -0.339599609375, -0.24542236328125, -0.1512451171875, -0.05706787109375, 0.037109375, 0.13128662109375, 0.2254638671875, 0.31964111328125, 0.413818359375, 0.50799560546875, 0.6021728515625, 0.69635009765625, 0.79052734375, 0.88470458984375, 0.9788818359375, 1.07305908203125, 1.167236328125, 1.26141357421875, 1.3555908203125, 1.44976806640625, 1.5439453125, 1.63812255859375, 1.7322998046875, 1.82647705078125, 1.920654296875, 2.01483154296875, 2.1090087890625, 2.20318603515625, 2.29736328125, 2.39154052734375, 2.4857177734375, 2.57989501953125, 2.674072265625, 2.76824951171875, 2.8624267578125, 2.95660400390625, 3.05078125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 5.0, 0.0, 5.0, 4.0, 5.0, 9.0, 5.0, 14.0, 10.0, 12.0, 21.0, 14.0, 26.0, 22.0, 35.0, 32.0, 40.0, 41.0, 43.0, 35.0, 34.0, 45.0, 47.0, 1067.0, 41.0, 47.0, 37.0, 39.0, 30.0, 38.0, 35.0, 28.0, 27.0, 24.0, 16.0, 14.0, 16.0, 20.0, 9.0, 6.0, 10.0, 5.0, 7.0, 3.0, 4.0, 4.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.8515625, -8.5306396484375, -8.209716796875, -7.8887939453125, -7.56787109375, -7.2469482421875, -6.926025390625, -6.6051025390625, -6.2841796875, -5.9632568359375, -5.642333984375, -5.3214111328125, -5.00048828125, -4.6795654296875, -4.358642578125, -4.0377197265625, -3.716796875, -3.3958740234375, -3.074951171875, -2.7540283203125, -2.43310546875, -2.1121826171875, -1.791259765625, -1.4703369140625, -1.1494140625, -0.8284912109375, -0.507568359375, -0.1866455078125, 0.13427734375, 0.4552001953125, 0.776123046875, 1.0970458984375, 1.41796875, 1.7388916015625, 2.059814453125, 2.3807373046875, 2.70166015625, 3.0225830078125, 3.343505859375, 3.6644287109375, 3.9853515625, 4.3062744140625, 4.627197265625, 4.9481201171875, 5.26904296875, 5.5899658203125, 5.910888671875, 6.2318115234375, 6.552734375, 6.8736572265625, 7.194580078125, 7.5155029296875, 7.83642578125, 8.1573486328125, 8.478271484375, 8.7991943359375, 9.1201171875, 9.4410400390625, 9.761962890625, 10.0828857421875, 10.40380859375, 10.7247314453125, 11.045654296875, 11.3665771484375, 11.6875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 2.0, 3.0, 4.0, 8.0, 16.0, 18.0, 22.0, 33.0, 67.0, 108.0, 134.0, 210.0, 320.0, 453.0, 692.0, 1034.0, 1565.0, 2342.0, 3442.0, 5163.0, 7946.0, 12207.0, 19187.0, 31040.0, 51065.0, 87595.0, 172480.0, 1367395.0, 138673.0, 74372.0, 43836.0, 26933.0, 16885.0, 10701.0, 7135.0, 4626.0, 3150.0, 2082.0, 1330.0, 956.0, 654.0, 399.0, 283.0, 205.0, 120.0, 83.0, 57.0, 39.0, 28.0, 18.0, 6.0, 5.0, 9.0, 4.0, 0.0, 2.0, 1.0], "bins": [-3.556640625, -3.453125, -3.349609375, -3.24609375, -3.142578125, -3.0390625, -2.935546875, -2.83203125, -2.728515625, -2.625, -2.521484375, -2.41796875, -2.314453125, -2.2109375, -2.107421875, -2.00390625, -1.900390625, -1.796875, -1.693359375, -1.58984375, -1.486328125, -1.3828125, -1.279296875, -1.17578125, -1.072265625, -0.96875, -0.865234375, -0.76171875, -0.658203125, -0.5546875, -0.451171875, -0.34765625, -0.244140625, -0.140625, -0.037109375, 0.06640625, 0.169921875, 0.2734375, 0.376953125, 0.48046875, 0.583984375, 0.6875, 0.791015625, 0.89453125, 0.998046875, 1.1015625, 1.205078125, 1.30859375, 1.412109375, 1.515625, 1.619140625, 1.72265625, 1.826171875, 1.9296875, 2.033203125, 2.13671875, 2.240234375, 2.34375, 2.447265625, 2.55078125, 2.654296875, 2.7578125, 2.861328125, 2.96484375, 3.068359375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 4.0, 3.0, 4.0, 7.0, 5.0, 3.0, 10.0, 13.0, 13.0, 28.0, 24.0, 24.0, 41.0, 61.0, 61.0, 87.0, 100.0, 95.0, 94.0, 64.0, 68.0, 58.0, 34.0, 24.0, 23.0, 6.0, 10.0, 11.0, 11.0, 6.0, 5.0, 5.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0024318695068359375, -0.0023487210273742676, -0.0022655725479125977, -0.0021824240684509277, -0.002099275588989258, -0.002016127109527588, -0.001932978630065918, -0.001849830150604248, -0.0017666816711425781, -0.0016835331916809082, -0.0016003847122192383, -0.0015172362327575684, -0.0014340877532958984, -0.0013509392738342285, -0.0012677907943725586, -0.0011846423149108887, -0.0011014938354492188, -0.0010183453559875488, -0.0009351968765258789, -0.000852048397064209, -0.0007688999176025391, -0.0006857514381408691, -0.0006026029586791992, -0.0005194544792175293, -0.0004363059997558594, -0.00035315752029418945, -0.00027000904083251953, -0.0001868605613708496, -0.00010371208190917969, -2.0563602447509766e-05, 6.258487701416016e-05, 0.00014573335647583008, 0.0002288818359375, 0.0003120303153991699, 0.00039517879486083984, 0.00047832727432250977, 0.0005614757537841797, 0.0006446242332458496, 0.0007277727127075195, 0.0008109211921691895, 0.0008940696716308594, 0.0009772181510925293, 0.0010603666305541992, 0.0011435151100158691, 0.001226663589477539, 0.001309812068939209, 0.001392960548400879, 0.0014761090278625488, 0.0015592575073242188, 0.0016424059867858887, 0.0017255544662475586, 0.0018087029457092285, 0.0018918514251708984, 0.0019749999046325684, 0.0020581483840942383, 0.002141296863555908, 0.002224445343017578, 0.002307593822479248, 0.002390742301940918, 0.002473890781402588, 0.002557039260864258, 0.0026401877403259277, 0.0027233362197875977, 0.0028064846992492676, 0.0028896331787109375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 8.0, 10.0, 6.0, 14.0, 13.0, 21.0, 29.0, 38.0, 72.0, 122.0, 247.0, 883.0, 619453.0, 426199.0, 814.0, 239.0, 136.0, 71.0, 45.0, 34.0, 30.0, 18.0, 11.0, 8.0, 8.0, 7.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07537841796875, -0.07322406768798828, -0.07106971740722656, -0.06891536712646484, -0.06676101684570312, -0.0646066665649414, -0.06245231628417969, -0.06029796600341797, -0.05814361572265625, -0.05598926544189453, -0.05383491516113281, -0.051680564880371094, -0.049526214599609375, -0.047371864318847656, -0.04521751403808594, -0.04306316375732422, -0.0409088134765625, -0.03875446319580078, -0.03660011291503906, -0.034445762634277344, -0.032291412353515625, -0.030137062072753906, -0.027982711791992188, -0.02582836151123047, -0.02367401123046875, -0.02151966094970703, -0.019365310668945312, -0.017210960388183594, -0.015056610107421875, -0.012902259826660156, -0.010747909545898438, -0.008593559265136719, -0.006439208984375, -0.004284858703613281, -0.0021305084228515625, 2.384185791015625e-05, 0.002178192138671875, 0.004332542419433594, 0.0064868927001953125, 0.008641242980957031, 0.01079559326171875, 0.012949943542480469, 0.015104293823242188, 0.017258644104003906, 0.019412994384765625, 0.021567344665527344, 0.023721694946289062, 0.02587604522705078, 0.0280303955078125, 0.03018474578857422, 0.03233909606933594, 0.034493446350097656, 0.036647796630859375, 0.038802146911621094, 0.04095649719238281, 0.04311084747314453, 0.04526519775390625, 0.04741954803466797, 0.04957389831542969, 0.051728248596191406, 0.053882598876953125, 0.056036949157714844, 0.05819129943847656, 0.06034564971923828, 0.0625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 9.0, 90.0, 591.0, 296.0, 27.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.009726536460220814, -0.00953865796327591, -0.009350779466331005, -0.009162900038063526, -0.008975021541118622, -0.008787143044173717, -0.008599264547228813, -0.008411385118961334, -0.00822350662201643, -0.008035628125071526, -0.007847749628126621, -0.00765987066552043, -0.007471991702914238, -0.007284113205969334, -0.007096234709024429, -0.006908355746418238, -0.006720477249473333, -0.006532598752528429, -0.006344719789922237, -0.006156841292977333, -0.0059689623303711414, -0.005781083833426237, -0.0055932048708200455, -0.005405326373875141, -0.005217447876930237, -0.0050295693799853325, -0.004841690417379141, -0.0046538119204342365, -0.004465932957828045, -0.0042780544608831406, -0.004090175963938236, -0.0039022970013320446, -0.0037144175730645657, -0.0035265388432890177, -0.0033386601135134697, -0.0031507816165685654, -0.0029629026539623737, -0.0027750241570174694, -0.0025871454272419214, -0.0023992666974663734, -0.0022113879676908255, -0.0020235092379152775, -0.0018356305081397295, -0.0016477518947795033, -0.0014598731650039554, -0.0012719944352284074, -0.0010841158218681812, -0.0008962370920926332, -0.0007083583623170853, -0.0005204796325415373, -0.0003326009609736502, -0.00014472228940576315, 4.315644036978483e-05, 0.0002310351701453328, 0.00041891378350555897, 0.000606792513281107, 0.0007946712430566549, 0.000982549972832203, 0.001170428702607751, 0.001358307315967977, 0.001546186045743525, 0.001734064775519073, 0.0019219433888792992, 0.002109822118654847, 0.002297700848430395]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 4.0, 1.0, 2.0, 5.0, 6.0, 7.0, 7.0, 10.0, 10.0, 17.0, 22.0, 11.0, 23.0, 17.0, 21.0, 32.0, 36.0, 27.0, 26.0, 20.0, 34.0, 31.0, 27.0, 28.0, 35.0, 39.0, 37.0, 36.0, 33.0, 47.0, 31.0, 29.0, 32.0, 35.0, 37.0, 29.0, 37.0, 13.0, 10.0, 13.0, 18.0, 11.0, 15.0, 8.0, 7.0, 6.0, 9.0, 6.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.000903785228729248, -0.0008736820891499519, -0.0008435789495706558, -0.0008134758099913597, -0.0007833726704120636, -0.0007532695308327675, -0.0007231663912534714, -0.0006930632516741753, -0.0006629601120948792, -0.000632856972515583, -0.0006027538329362869, -0.0005726506933569908, -0.0005425475537776947, -0.0005124444141983986, -0.0004823412746191025, -0.00045223813503980637, -0.00042213499546051025, -0.00039203185588121414, -0.00036192871630191803, -0.0003318255767226219, -0.0003017224371433258, -0.0002716192975640297, -0.00024151615798473358, -0.00021141301840543747, -0.00018130987882614136, -0.00015120673924684525, -0.00012110359966754913, -9.100046008825302e-05, -6.089732050895691e-05, -3.07941809296608e-05, -6.910413503646851e-07, 2.9412098228931427e-05, 5.951523780822754e-05, 8.961837738752365e-05, 0.00011972151696681976, 0.00014982465654611588, 0.000179927796125412, 0.0002100309357047081, 0.0002401340752840042, 0.0002702372148633003, 0.00030034035444259644, 0.00033044349402189255, 0.00036054663360118866, 0.00039064977318048477, 0.0004207529127597809, 0.000450856052339077, 0.0004809591919183731, 0.0005110623314976692, 0.0005411654710769653, 0.0005712686106562614, 0.0006013717502355576, 0.0006314748898148537, 0.0006615780293941498, 0.0006916811689734459, 0.000721784308552742, 0.0007518874481320381, 0.0007819905877113342, 0.0008120937272906303, 0.0008421968668699265, 0.0008723000064492226, 0.0009024031460285187, 0.0009325062856078148, 0.0009626094251871109, 0.000992712564766407, 0.0010228157043457031]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 7.0, 4.0, 2.0, 10.0, 9.0, 12.0, 10.0, 14.0, 14.0, 12.0, 20.0, 26.0, 25.0, 30.0, 30.0, 37.0, 35.0, 31.0, 48.0, 41.0, 33.0, 47.0, 45.0, 53.0, 46.0, 37.0, 31.0, 29.0, 32.0, 19.0, 32.0, 27.0, 21.0, 19.0, 17.0, 21.0, 15.0, 11.0, 10.0, 8.0, 7.0, 8.0, 9.0, 4.0, 2.0, 5.0, 1.0, 1.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1953125, -14.7244873046875, -14.253662109375, -13.7828369140625, -13.31201171875, -12.8411865234375, -12.370361328125, -11.8995361328125, -11.4287109375, -10.9578857421875, -10.487060546875, -10.0162353515625, -9.54541015625, -9.0745849609375, -8.603759765625, -8.1329345703125, -7.662109375, -7.1912841796875, -6.720458984375, -6.2496337890625, -5.77880859375, -5.3079833984375, -4.837158203125, -4.3663330078125, -3.8955078125, -3.4246826171875, -2.953857421875, -2.4830322265625, -2.01220703125, -1.5413818359375, -1.070556640625, -0.5997314453125, -0.12890625, 0.3419189453125, 0.812744140625, 1.2835693359375, 1.75439453125, 2.2252197265625, 2.696044921875, 3.1668701171875, 3.6376953125, 4.1085205078125, 4.579345703125, 5.0501708984375, 5.52099609375, 5.9918212890625, 6.462646484375, 6.9334716796875, 7.404296875, 7.8751220703125, 8.345947265625, 8.8167724609375, 9.28759765625, 9.7584228515625, 10.229248046875, 10.7000732421875, 11.1708984375, 11.6417236328125, 12.112548828125, 12.5833740234375, 13.05419921875, 13.5250244140625, 13.995849609375, 14.4666748046875, 14.9375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 4.0, 6.0, 5.0, 6.0, 16.0, 12.0, 14.0, 17.0, 34.0, 37.0, 64.0, 75.0, 128.0, 204.0, 370.0, 722.0, 1427.0, 2760.0, 6188.0, 12903.0, 28576.0, 70019.0, 193136.0, 423878.0, 187474.0, 68311.0, 27993.0, 12466.0, 5810.0, 2797.0, 1392.0, 662.0, 413.0, 199.0, 125.0, 86.0, 47.0, 51.0, 36.0, 15.0, 18.0, 15.0, 13.0, 9.0, 3.0, 3.0, 9.0, 5.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-8.890625, -8.616943359375, -8.34326171875, -8.069580078125, -7.7958984375, -7.522216796875, -7.24853515625, -6.974853515625, -6.701171875, -6.427490234375, -6.15380859375, -5.880126953125, -5.6064453125, -5.332763671875, -5.05908203125, -4.785400390625, -4.51171875, -4.238037109375, -3.96435546875, -3.690673828125, -3.4169921875, -3.143310546875, -2.86962890625, -2.595947265625, -2.322265625, -2.048583984375, -1.77490234375, -1.501220703125, -1.2275390625, -0.953857421875, -0.68017578125, -0.406494140625, -0.1328125, 0.140869140625, 0.41455078125, 0.688232421875, 0.9619140625, 1.235595703125, 1.50927734375, 1.782958984375, 2.056640625, 2.330322265625, 2.60400390625, 2.877685546875, 3.1513671875, 3.425048828125, 3.69873046875, 3.972412109375, 4.24609375, 4.519775390625, 4.79345703125, 5.067138671875, 5.3408203125, 5.614501953125, 5.88818359375, 6.161865234375, 6.435546875, 6.709228515625, 6.98291015625, 7.256591796875, 7.5302734375, 7.803955078125, 8.07763671875, 8.351318359375, 8.625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 6.0, 4.0, 5.0, 9.0, 6.0, 12.0, 7.0, 8.0, 17.0, 21.0, 28.0, 36.0, 32.0, 47.0, 42.0, 34.0, 53.0, 69.0, 116.0, 1660.0, 326.0, 99.0, 58.0, 50.0, 33.0, 38.0, 33.0, 39.0, 30.0, 21.0, 28.0, 22.0, 13.0, 9.0, 9.0, 1.0, 8.0, 4.0, 5.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.5, -57.626953125, -55.75390625, -53.880859375, -52.0078125, -50.134765625, -48.26171875, -46.388671875, -44.515625, -42.642578125, -40.76953125, -38.896484375, -37.0234375, -35.150390625, -33.27734375, -31.404296875, -29.53125, -27.658203125, -25.78515625, -23.912109375, -22.0390625, -20.166015625, -18.29296875, -16.419921875, -14.546875, -12.673828125, -10.80078125, -8.927734375, -7.0546875, -5.181640625, -3.30859375, -1.435546875, 0.4375, 2.310546875, 4.18359375, 6.056640625, 7.9296875, 9.802734375, 11.67578125, 13.548828125, 15.421875, 17.294921875, 19.16796875, 21.041015625, 22.9140625, 24.787109375, 26.66015625, 28.533203125, 30.40625, 32.279296875, 34.15234375, 36.025390625, 37.8984375, 39.771484375, 41.64453125, 43.517578125, 45.390625, 47.263671875, 49.13671875, 51.009765625, 52.8828125, 54.755859375, 56.62890625, 58.501953125, 60.375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 9.0, 4.0, 9.0, 9.0, 18.0, 25.0, 45.0, 37.0, 58.0, 65.0, 83.0, 130.0, 162.0, 228.0, 337.0, 784.0, 13353.0, 3123806.0, 4742.0, 653.0, 326.0, 185.0, 168.0, 103.0, 80.0, 66.0, 49.0, 39.0, 32.0, 15.0, 15.0, 16.0, 8.0, 8.0, 6.0, 5.0, 5.0, 2.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-145.25, -140.767578125, -136.28515625, -131.802734375, -127.3203125, -122.837890625, -118.35546875, -113.873046875, -109.390625, -104.908203125, -100.42578125, -95.943359375, -91.4609375, -86.978515625, -82.49609375, -78.013671875, -73.53125, -69.048828125, -64.56640625, -60.083984375, -55.6015625, -51.119140625, -46.63671875, -42.154296875, -37.671875, -33.189453125, -28.70703125, -24.224609375, -19.7421875, -15.259765625, -10.77734375, -6.294921875, -1.8125, 2.669921875, 7.15234375, 11.634765625, 16.1171875, 20.599609375, 25.08203125, 29.564453125, 34.046875, 38.529296875, 43.01171875, 47.494140625, 51.9765625, 56.458984375, 60.94140625, 65.423828125, 69.90625, 74.388671875, 78.87109375, 83.353515625, 87.8359375, 92.318359375, 96.80078125, 101.283203125, 105.765625, 110.248046875, 114.73046875, 119.212890625, 123.6953125, 128.177734375, 132.66015625, 137.142578125, 141.625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 119.0, 702.0, 187.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.55695343017578, -51.71538543701172, -44.873817443847656, -38.032249450683594, -31.1906795501709, -24.349109649658203, -17.50754165649414, -10.665973663330078, -3.8244056701660156, 3.017162799835205, 9.858731269836426, 16.700300216674805, 23.541868209838867, 30.383438110351562, 37.225006103515625, 44.06657409667969, 50.90814208984375, 57.74971008300781, 64.59127807617188, 71.43284606933594, 78.2744140625, 85.11598205566406, 91.95755004882812, 98.79911804199219, 105.64068603515625, 112.48225402832031, 119.32382202148438, 126.16539001464844, 133.0069580078125, 139.84852600097656, 146.69009399414062, 153.5316619873047, 160.3732452392578, 167.21481323242188, 174.05638122558594, 180.89794921875, 187.73951721191406, 194.58108520507812, 201.4226531982422, 208.26422119140625, 215.1057891845703, 221.94735717773438, 228.78892517089844, 235.6304931640625, 242.47206115722656, 249.31362915039062, 256.15521240234375, 262.99676513671875, 269.8383483886719, 276.679931640625, 283.521484375, 290.3630676269531, 297.2046203613281, 304.04620361328125, 310.88775634765625, 317.7293395996094, 324.5708923339844, 331.4124755859375, 338.2540283203125, 345.0956115722656, 351.9371643066406, 358.77874755859375, 365.62030029296875, 372.4618835449219, 379.3034362792969]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 2.0, 5.0, 11.0, 9.0, 9.0, 14.0, 12.0, 13.0, 11.0, 16.0, 22.0, 17.0, 30.0, 24.0, 30.0, 32.0, 42.0, 28.0, 31.0, 34.0, 34.0, 36.0, 32.0, 33.0, 47.0, 33.0, 41.0, 46.0, 28.0, 34.0, 41.0, 25.0, 24.0, 24.0, 27.0, 12.0, 16.0, 10.0, 11.0, 9.0, 8.0, 15.0, 2.0, 9.0, 6.0, 2.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-125.42848205566406, -121.53656005859375, -117.6446304321289, -113.7527084350586, -109.86078643798828, -105.96885681152344, -102.07693481445312, -98.18501281738281, -94.29308319091797, -90.40116119384766, -86.50923156738281, -82.6173095703125, -78.72538757324219, -74.83345794677734, -70.94153594970703, -67.04960632324219, -63.15768814086914, -59.26576232910156, -55.37384033203125, -51.48191452026367, -47.589988708496094, -43.69806671142578, -39.8061408996582, -35.914215087890625, -32.02229309082031, -28.130369186401367, -24.23844337463379, -20.346519470214844, -16.454593658447266, -12.56266975402832, -8.670745849609375, -4.778820037841797, -0.8868942260742188, 3.005030393600464, 6.8969550132751465, 10.78887939453125, 14.680804252624512, 18.572729110717773, 22.46465301513672, 26.356578826904297, 30.248502731323242, 34.14042663574219, 38.032352447509766, 41.924278259277344, 45.816200256347656, 49.708126068115234, 53.60005187988281, 57.491973876953125, 61.3838996887207, 65.27582550048828, 69.1677474975586, 73.05967712402344, 76.95159912109375, 80.84352111816406, 84.73544311523438, 88.62737274169922, 92.51929473876953, 96.41121673583984, 100.30314636230469, 104.195068359375, 108.08699035644531, 111.97891998291016, 115.87084197998047, 119.76277160644531, 123.65469360351562]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 3.0, 3.0, 11.0, 5.0, 17.0, 11.0, 11.0, 18.0, 18.0, 19.0, 29.0, 22.0, 24.0, 36.0, 45.0, 27.0, 39.0, 40.0, 40.0, 29.0, 54.0, 44.0, 38.0, 35.0, 40.0, 47.0, 25.0, 27.0, 32.0, 17.0, 37.0, 20.0, 19.0, 16.0, 16.0, 16.0, 9.0, 9.0, 7.0, 12.0, 6.0, 5.0, 9.0, 3.0, 3.0, 1.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-15.1796875, -14.7064208984375, -14.233154296875, -13.7598876953125, -13.28662109375, -12.8133544921875, -12.340087890625, -11.8668212890625, -11.3935546875, -10.9202880859375, -10.447021484375, -9.9737548828125, -9.50048828125, -9.0272216796875, -8.553955078125, -8.0806884765625, -7.607421875, -7.1341552734375, -6.660888671875, -6.1876220703125, -5.71435546875, -5.2410888671875, -4.767822265625, -4.2945556640625, -3.8212890625, -3.3480224609375, -2.874755859375, -2.4014892578125, -1.92822265625, -1.4549560546875, -0.981689453125, -0.5084228515625, -0.03515625, 0.4381103515625, 0.911376953125, 1.3846435546875, 1.85791015625, 2.3311767578125, 2.804443359375, 3.2777099609375, 3.7509765625, 4.2242431640625, 4.697509765625, 5.1707763671875, 5.64404296875, 6.1173095703125, 6.590576171875, 7.0638427734375, 7.537109375, 8.0103759765625, 8.483642578125, 8.9569091796875, 9.43017578125, 9.9034423828125, 10.376708984375, 10.8499755859375, 11.3232421875, 11.7965087890625, 12.269775390625, 12.7430419921875, 13.21630859375, 13.6895751953125, 14.162841796875, 14.6361083984375, 15.109375]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 3.0, 2.0, 7.0, 4.0, 5.0, 9.0, 5.0, 10.0, 10.0, 10.0, 16.0, 24.0, 15.0, 19.0, 19.0, 24.0, 34.0, 50.0, 75.0, 108.0, 194.0, 375.0, 886.0, 3457.0, 49495.0, 1931985.0, 2145744.0, 56258.0, 3478.0, 914.0, 393.0, 200.0, 103.0, 63.0, 61.0, 31.0, 27.0, 29.0, 22.0, 17.0, 12.0, 17.0, 7.0, 10.0, 6.0, 11.0, 9.0, 2.0, 6.0, 7.0, 3.0, 6.0, 2.0, 3.0, 3.0, 4.0, 2.0], "bins": [-47.53125, -46.091796875, -44.65234375, -43.212890625, -41.7734375, -40.333984375, -38.89453125, -37.455078125, -36.015625, -34.576171875, -33.13671875, -31.697265625, -30.2578125, -28.818359375, -27.37890625, -25.939453125, -24.5, -23.060546875, -21.62109375, -20.181640625, -18.7421875, -17.302734375, -15.86328125, -14.423828125, -12.984375, -11.544921875, -10.10546875, -8.666015625, -7.2265625, -5.787109375, -4.34765625, -2.908203125, -1.46875, -0.029296875, 1.41015625, 2.849609375, 4.2890625, 5.728515625, 7.16796875, 8.607421875, 10.046875, 11.486328125, 12.92578125, 14.365234375, 15.8046875, 17.244140625, 18.68359375, 20.123046875, 21.5625, 23.001953125, 24.44140625, 25.880859375, 27.3203125, 28.759765625, 30.19921875, 31.638671875, 33.078125, 34.517578125, 35.95703125, 37.396484375, 38.8359375, 40.275390625, 41.71484375, 43.154296875, 44.59375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 2.0, 2.0, 8.0, 9.0, 2.0, 8.0, 9.0, 9.0, 11.0, 19.0, 19.0, 22.0, 42.0, 62.0, 66.0, 66.0, 95.0, 138.0, 166.0, 207.0, 250.0, 339.0, 458.0, 390.0, 378.0, 290.0, 252.0, 158.0, 143.0, 102.0, 66.0, 55.0, 49.0, 43.0, 35.0, 24.0, 20.0, 14.0, 14.0, 6.0, 5.0, 6.0, 7.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-20.96875, -20.24951171875, -19.5302734375, -18.81103515625, -18.091796875, -17.37255859375, -16.6533203125, -15.93408203125, -15.21484375, -14.49560546875, -13.7763671875, -13.05712890625, -12.337890625, -11.61865234375, -10.8994140625, -10.18017578125, -9.4609375, -8.74169921875, -8.0224609375, -7.30322265625, -6.583984375, -5.86474609375, -5.1455078125, -4.42626953125, -3.70703125, -2.98779296875, -2.2685546875, -1.54931640625, -0.830078125, -0.11083984375, 0.6083984375, 1.32763671875, 2.046875, 2.76611328125, 3.4853515625, 4.20458984375, 4.923828125, 5.64306640625, 6.3623046875, 7.08154296875, 7.80078125, 8.52001953125, 9.2392578125, 9.95849609375, 10.677734375, 11.39697265625, 12.1162109375, 12.83544921875, 13.5546875, 14.27392578125, 14.9931640625, 15.71240234375, 16.431640625, 17.15087890625, 17.8701171875, 18.58935546875, 19.30859375, 20.02783203125, 20.7470703125, 21.46630859375, 22.185546875, 22.90478515625, 23.6240234375, 24.34326171875, 25.0625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 2.0, 5.0, 13.0, 8.0, 12.0, 9.0, 12.0, 12.0, 18.0, 23.0, 20.0, 35.0, 47.0, 53.0, 66.0, 65.0, 97.0, 107.0, 147.0, 200.0, 248.0, 343.0, 575.0, 2823.0, 3250990.0, 934459.0, 1824.0, 530.0, 313.0, 247.0, 160.0, 136.0, 116.0, 119.0, 85.0, 62.0, 47.0, 51.0, 38.0, 26.0, 31.0, 26.0, 16.0, 15.0, 25.0, 6.0, 8.0, 5.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-142.25, -137.9296875, -133.609375, -129.2890625, -124.96875, -120.6484375, -116.328125, -112.0078125, -107.6875, -103.3671875, -99.046875, -94.7265625, -90.40625, -86.0859375, -81.765625, -77.4453125, -73.125, -68.8046875, -64.484375, -60.1640625, -55.84375, -51.5234375, -47.203125, -42.8828125, -38.5625, -34.2421875, -29.921875, -25.6015625, -21.28125, -16.9609375, -12.640625, -8.3203125, -4.0, 0.3203125, 4.640625, 8.9609375, 13.28125, 17.6015625, 21.921875, 26.2421875, 30.5625, 34.8828125, 39.203125, 43.5234375, 47.84375, 52.1640625, 56.484375, 60.8046875, 65.125, 69.4453125, 73.765625, 78.0859375, 82.40625, 86.7265625, 91.046875, 95.3671875, 99.6875, 104.0078125, 108.328125, 112.6484375, 116.96875, 121.2890625, 125.609375, 129.9296875, 134.25]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 31.0, 248.0, 483.0, 215.0, 32.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-408.2960205078125, -396.7792053222656, -385.2624206542969, -373.74560546875, -362.2287902832031, -350.71197509765625, -339.1951904296875, -327.6783752441406, -316.16156005859375, -304.6447448730469, -293.1279602050781, -281.61114501953125, -270.0943298339844, -258.5775146484375, -247.06072998046875, -235.54391479492188, -224.02713012695312, -212.5103302001953, -200.99351501464844, -189.47671508789062, -177.95989990234375, -166.44309997558594, -154.92630004882812, -143.40948486328125, -131.89268493652344, -120.3758773803711, -108.85906982421875, -97.34226989746094, -85.8254623413086, -74.30865478515625, -62.79185485839844, -51.275047302246094, -39.75823974609375, -28.24143409729004, -16.724628448486328, -5.20782470703125, 6.308982849121094, 17.825790405273438, 29.34259033203125, 40.859397888183594, 52.37620544433594, 63.89301300048828, 75.40982055664062, 86.92662048339844, 98.44342803955078, 109.96023559570312, 121.47703552246094, 132.99383544921875, 144.51065063476562, 156.02745056152344, 167.5442657470703, 179.06106567382812, 190.577880859375, 202.0946807861328, 213.61148071289062, 225.1282958984375, 236.6450958251953, 248.16189575195312, 259.6787109375, 271.19549560546875, 282.7123107910156, 294.2291259765625, 305.74591064453125, 317.2627258300781, 328.779541015625]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 12.0, 7.0, 5.0, 9.0, 14.0, 14.0, 14.0, 17.0, 18.0, 22.0, 18.0, 15.0, 21.0, 39.0, 27.0, 35.0, 29.0, 25.0, 39.0, 42.0, 34.0, 37.0, 39.0, 34.0, 34.0, 31.0, 32.0, 36.0, 27.0, 30.0, 31.0, 27.0, 23.0, 26.0, 19.0, 19.0, 19.0, 13.0, 6.0, 12.0, 7.0, 13.0, 5.0, 7.0, 5.0, 3.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-81.31988525390625, -78.83118438720703, -76.34249114990234, -73.85379028320312, -71.3650894165039, -68.87639617919922, -66.3876953125, -63.89899826049805, -61.410301208496094, -58.92160415649414, -56.43290328979492, -53.94420623779297, -51.455509185791016, -48.96681213378906, -46.478111267089844, -43.98941421508789, -41.50071334838867, -39.01201629638672, -36.5233154296875, -34.03461837768555, -31.545921325683594, -29.057222366333008, -26.568523406982422, -24.07982635498047, -21.591127395629883, -19.102428436279297, -16.613731384277344, -14.125032424926758, -11.636334419250488, -9.147636413574219, -6.658937454223633, -4.17024040222168, -1.6815414428710938, 0.8071568012237549, 3.2958550453186035, 5.784553527832031, 8.2732515335083, 10.76194953918457, 13.250648498535156, 15.73934555053711, 18.228044509887695, 20.71674346923828, 23.205440521240234, 25.69413948059082, 28.182838439941406, 30.67153549194336, 33.16023254394531, 35.64893341064453, 38.137630462646484, 40.62632751464844, 43.115028381347656, 45.60372543334961, 48.09242248535156, 50.58112335205078, 53.069820404052734, 55.55851745605469, 58.047218322753906, 60.53591537475586, 63.02461624145508, 65.51331329345703, 68.00201416015625, 70.49070739746094, 72.97940826416016, 75.46810913085938, 77.95680236816406]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 13.0, 12.0, 14.0, 11.0, 15.0, 20.0, 23.0, 25.0, 20.0, 35.0, 30.0, 31.0, 39.0, 37.0, 38.0, 30.0, 40.0, 42.0, 49.0, 30.0, 44.0, 48.0, 40.0, 39.0, 21.0, 23.0, 27.0, 22.0, 23.0, 15.0, 17.0, 18.0, 13.0, 15.0, 2.0, 10.0, 7.0, 8.0, 9.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-14.609375, -14.1610107421875, -13.712646484375, -13.2642822265625, -12.81591796875, -12.3675537109375, -11.919189453125, -11.4708251953125, -11.0224609375, -10.5740966796875, -10.125732421875, -9.6773681640625, -9.22900390625, -8.7806396484375, -8.332275390625, -7.8839111328125, -7.435546875, -6.9871826171875, -6.538818359375, -6.0904541015625, -5.64208984375, -5.1937255859375, -4.745361328125, -4.2969970703125, -3.8486328125, -3.4002685546875, -2.951904296875, -2.5035400390625, -2.05517578125, -1.6068115234375, -1.158447265625, -0.7100830078125, -0.26171875, 0.1866455078125, 0.635009765625, 1.0833740234375, 1.53173828125, 1.9801025390625, 2.428466796875, 2.8768310546875, 3.3251953125, 3.7735595703125, 4.221923828125, 4.6702880859375, 5.11865234375, 5.5670166015625, 6.015380859375, 6.4637451171875, 6.912109375, 7.3604736328125, 7.808837890625, 8.2572021484375, 8.70556640625, 9.1539306640625, 9.602294921875, 10.0506591796875, 10.4990234375, 10.9473876953125, 11.395751953125, 11.8441162109375, 12.29248046875, 12.7408447265625, 13.189208984375, 13.6375732421875, 14.0859375]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 8.0, 14.0, 16.0, 25.0, 40.0, 55.0, 80.0, 118.0, 165.0, 228.0, 329.0, 474.0, 691.0, 953.0, 1314.0, 1863.0, 2641.0, 3787.0, 5149.0, 7456.0, 10444.0, 15258.0, 21896.0, 32380.0, 49071.0, 79341.0, 140081.0, 298927.0, 140702.0, 79820.0, 49598.0, 32218.0, 22114.0, 15097.0, 10763.0, 7472.0, 5179.0, 3753.0, 2640.0, 1825.0, 1280.0, 1015.0, 691.0, 515.0, 334.0, 223.0, 150.0, 120.0, 78.0, 58.0, 48.0, 30.0, 14.0, 11.0, 5.0, 3.0, 3.0, 2.0, 2.0], "bins": [-2.765625, -2.6805419921875, -2.595458984375, -2.5103759765625, -2.42529296875, -2.3402099609375, -2.255126953125, -2.1700439453125, -2.0849609375, -1.9998779296875, -1.914794921875, -1.8297119140625, -1.74462890625, -1.6595458984375, -1.574462890625, -1.4893798828125, -1.404296875, -1.3192138671875, -1.234130859375, -1.1490478515625, -1.06396484375, -0.9788818359375, -0.893798828125, -0.8087158203125, -0.7236328125, -0.6385498046875, -0.553466796875, -0.4683837890625, -0.38330078125, -0.2982177734375, -0.213134765625, -0.1280517578125, -0.04296875, 0.0421142578125, 0.127197265625, 0.2122802734375, 0.29736328125, 0.3824462890625, 0.467529296875, 0.5526123046875, 0.6376953125, 0.7227783203125, 0.807861328125, 0.8929443359375, 0.97802734375, 1.0631103515625, 1.148193359375, 1.2332763671875, 1.318359375, 1.4034423828125, 1.488525390625, 1.5736083984375, 1.65869140625, 1.7437744140625, 1.828857421875, 1.9139404296875, 1.9990234375, 2.0841064453125, 2.169189453125, 2.2542724609375, 2.33935546875, 2.4244384765625, 2.509521484375, 2.5946044921875, 2.6796875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 2.0, 4.0, 4.0, 7.0, 11.0, 7.0, 11.0, 15.0, 6.0, 8.0, 9.0, 10.0, 16.0, 20.0, 25.0, 41.0, 31.0, 30.0, 27.0, 33.0, 48.0, 30.0, 42.0, 40.0, 1066.0, 35.0, 28.0, 49.0, 26.0, 46.0, 41.0, 29.0, 31.0, 17.0, 24.0, 22.0, 15.0, 11.0, 13.0, 15.0, 14.0, 9.0, 13.0, 8.0, 7.0, 10.0, 4.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0], "bins": [-9.078125, -8.79931640625, -8.5205078125, -8.24169921875, -7.962890625, -7.68408203125, -7.4052734375, -7.12646484375, -6.84765625, -6.56884765625, -6.2900390625, -6.01123046875, -5.732421875, -5.45361328125, -5.1748046875, -4.89599609375, -4.6171875, -4.33837890625, -4.0595703125, -3.78076171875, -3.501953125, -3.22314453125, -2.9443359375, -2.66552734375, -2.38671875, -2.10791015625, -1.8291015625, -1.55029296875, -1.271484375, -0.99267578125, -0.7138671875, -0.43505859375, -0.15625, 0.12255859375, 0.4013671875, 0.68017578125, 0.958984375, 1.23779296875, 1.5166015625, 1.79541015625, 2.07421875, 2.35302734375, 2.6318359375, 2.91064453125, 3.189453125, 3.46826171875, 3.7470703125, 4.02587890625, 4.3046875, 4.58349609375, 4.8623046875, 5.14111328125, 5.419921875, 5.69873046875, 5.9775390625, 6.25634765625, 6.53515625, 6.81396484375, 7.0927734375, 7.37158203125, 7.650390625, 7.92919921875, 8.2080078125, 8.48681640625, 8.765625]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 6.0, 10.0, 27.0, 18.0, 54.0, 70.0, 89.0, 134.0, 201.0, 268.0, 414.0, 515.0, 767.0, 1084.0, 1537.0, 2075.0, 2817.0, 3838.0, 5205.0, 7309.0, 10140.0, 14392.0, 21465.0, 31741.0, 50009.0, 81560.0, 146504.0, 1335657.0, 144857.0, 80891.0, 49468.0, 31774.0, 21328.0, 14472.0, 10112.0, 7198.0, 5316.0, 3854.0, 2806.0, 2009.0, 1465.0, 1115.0, 772.0, 560.0, 398.0, 264.0, 177.0, 134.0, 94.0, 50.0, 45.0, 29.0, 20.0, 14.0, 9.0, 0.0, 3.0, 1.0, 3.0, 1.0], "bins": [-2.6640625, -2.5794677734375, -2.494873046875, -2.4102783203125, -2.32568359375, -2.2410888671875, -2.156494140625, -2.0718994140625, -1.9873046875, -1.9027099609375, -1.818115234375, -1.7335205078125, -1.64892578125, -1.5643310546875, -1.479736328125, -1.3951416015625, -1.310546875, -1.2259521484375, -1.141357421875, -1.0567626953125, -0.97216796875, -0.8875732421875, -0.802978515625, -0.7183837890625, -0.6337890625, -0.5491943359375, -0.464599609375, -0.3800048828125, -0.29541015625, -0.2108154296875, -0.126220703125, -0.0416259765625, 0.04296875, 0.1275634765625, 0.212158203125, 0.2967529296875, 0.38134765625, 0.4659423828125, 0.550537109375, 0.6351318359375, 0.7197265625, 0.8043212890625, 0.888916015625, 0.9735107421875, 1.05810546875, 1.1427001953125, 1.227294921875, 1.3118896484375, 1.396484375, 1.4810791015625, 1.565673828125, 1.6502685546875, 1.73486328125, 1.8194580078125, 1.904052734375, 1.9886474609375, 2.0732421875, 2.1578369140625, 2.242431640625, 2.3270263671875, 2.41162109375, 2.4962158203125, 2.580810546875, 2.6654052734375, 2.75]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 4.0, 1.0, 3.0, 12.0, 11.0, 14.0, 20.0, 25.0, 23.0, 48.0, 43.0, 61.0, 70.0, 85.0, 80.0, 79.0, 73.0, 67.0, 52.0, 43.0, 38.0, 41.0, 29.0, 22.0, 14.0, 9.0, 5.0, 9.0, 8.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0015459060668945312, -0.001486465334892273, -0.0014270246028900146, -0.0013675838708877563, -0.001308143138885498, -0.0012487024068832397, -0.0011892616748809814, -0.0011298209428787231, -0.0010703802108764648, -0.0010109394788742065, -0.0009514987468719482, -0.0008920580148696899, -0.0008326172828674316, -0.0007731765508651733, -0.000713735818862915, -0.0006542950868606567, -0.0005948543548583984, -0.0005354136228561401, -0.00047597289085388184, -0.00041653215885162354, -0.00035709142684936523, -0.00029765069484710693, -0.00023820996284484863, -0.00017876923084259033, -0.00011932849884033203, -5.988776683807373e-05, -4.470348358154297e-07, 5.899369716644287e-05, 0.00011843442916870117, 0.00017787516117095947, 0.00023731589317321777, 0.0002967566251754761, 0.0003561973571777344, 0.0004156380891799927, 0.000475078821182251, 0.0005345195531845093, 0.0005939602851867676, 0.0006534010171890259, 0.0007128417491912842, 0.0007722824811935425, 0.0008317232131958008, 0.0008911639451980591, 0.0009506046772003174, 0.0010100454092025757, 0.001069486141204834, 0.0011289268732070923, 0.0011883676052093506, 0.0012478083372116089, 0.0013072490692138672, 0.0013666898012161255, 0.0014261305332183838, 0.001485571265220642, 0.0015450119972229004, 0.0016044527292251587, 0.001663893461227417, 0.0017233341932296753, 0.0017827749252319336, 0.001842215657234192, 0.0019016563892364502, 0.0019610971212387085, 0.002020537853240967, 0.002079978585243225, 0.0021394193172454834, 0.0021988600492477417, 0.00225830078125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 7.0, 5.0, 10.0, 17.0, 24.0, 23.0, 37.0, 54.0, 69.0, 95.0, 152.0, 347.0, 1264.0, 1002562.0, 42537.0, 657.0, 263.0, 124.0, 68.0, 68.0, 48.0, 44.0, 22.0, 16.0, 9.0, 5.0, 4.0, 2.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0545654296875, -0.053082942962646484, -0.05160045623779297, -0.05011796951293945, -0.04863548278808594, -0.04715299606323242, -0.045670509338378906, -0.04418802261352539, -0.042705535888671875, -0.04122304916381836, -0.039740562438964844, -0.03825807571411133, -0.03677558898925781, -0.0352931022644043, -0.03381061553955078, -0.032328128814697266, -0.03084564208984375, -0.029363155364990234, -0.02788066864013672, -0.026398181915283203, -0.024915695190429688, -0.023433208465576172, -0.021950721740722656, -0.02046823501586914, -0.018985748291015625, -0.01750326156616211, -0.016020774841308594, -0.014538288116455078, -0.013055801391601562, -0.011573314666748047, -0.010090827941894531, -0.008608341217041016, -0.0071258544921875, -0.005643367767333984, -0.004160881042480469, -0.002678394317626953, -0.0011959075927734375, 0.0002865791320800781, 0.0017690658569335938, 0.0032515525817871094, 0.004734039306640625, 0.006216526031494141, 0.007699012756347656, 0.009181499481201172, 0.010663986206054688, 0.012146472930908203, 0.013628959655761719, 0.015111446380615234, 0.01659393310546875, 0.018076419830322266, 0.01955890655517578, 0.021041393280029297, 0.022523880004882812, 0.024006366729736328, 0.025488853454589844, 0.02697134017944336, 0.028453826904296875, 0.02993631362915039, 0.031418800354003906, 0.03290128707885742, 0.03438377380371094, 0.03586626052856445, 0.03734874725341797, 0.038831233978271484, 0.040313720703125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 19.0, 116.0, 441.0, 348.0, 80.0, 10.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019446087535470724, -0.0018292968161404133, -0.0017139847623184323, -0.0015986727084964514, -0.0014833607710897923, -0.0013680488336831331, -0.0012527367798611522, -0.0011374247260391712, -0.001022112788632512, -0.000906800793018192, -0.000791488797403872, -0.000676176801789552, -0.0005608648061752319, -0.0004455528105609119, -0.00033024081494659185, -0.00021492881933227181, -9.961682371795177e-05, 1.5695171896368265e-05, 0.0001310071675106883, 0.00024631916312500834, 0.0003616311587393284, 0.0004769431543536484, 0.0005922551499679685, 0.0007075671455822885, 0.0008228791411966085, 0.0009381911368109286, 0.0010535031324252486, 0.0011688151862472296, 0.0012841271236538887, 0.0013994390610605478, 0.0015147511148825288, 0.0016300631687045097, 0.0017453753389418125, 0.0018606872763484716, 0.0019759992137551308, 0.0020913113839924335, 0.0022066233213990927, 0.002321935258805752, 0.0024372474290430546, 0.0025525593664497137, 0.002667871303856373, 0.002783183241263032, 0.002898495178669691, 0.003013807348906994, 0.003129119286313653, 0.003244431223720312, 0.003359743393957615, 0.003475055331364274, 0.003590367268770933, 0.0037056792061775923, 0.0038209911435842514, 0.003936303313821554, 0.004051615484058857, 0.0041669271886348724, 0.004282239358872175, 0.004397551063448191, 0.0045128632336854935, 0.004628175403922796, 0.004743487108498812, 0.0048587992787361145, 0.00497411098331213, 0.005089423153549433, 0.0052047353237867355, 0.005320047028362751, 0.005435359198600054]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 8.0, 9.0, 6.0, 6.0, 7.0, 7.0, 10.0, 16.0, 13.0, 23.0, 15.0, 27.0, 26.0, 16.0, 33.0, 40.0, 34.0, 34.0, 27.0, 33.0, 55.0, 41.0, 37.0, 27.0, 47.0, 37.0, 36.0, 40.0, 36.0, 32.0, 28.0, 30.0, 27.0, 22.0, 16.0, 23.0, 17.0, 17.0, 7.0, 12.0, 9.0, 5.0, 6.0, 6.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.0008009672164916992, -0.000777791254222393, -0.0007546152919530869, -0.0007314393296837807, -0.0007082633674144745, -0.0006850874051451683, -0.0006619114428758621, -0.0006387354806065559, -0.0006155595183372498, -0.0005923835560679436, -0.0005692075937986374, -0.0005460316315293312, -0.000522855669260025, -0.0004996797069907188, -0.00047650374472141266, -0.0004533277824521065, -0.0004301518201828003, -0.0004069758579134941, -0.00038379989564418793, -0.00036062393337488174, -0.00033744797110557556, -0.0003142720088362694, -0.0002910960465669632, -0.000267920084297657, -0.00024474412202835083, -0.00022156815975904465, -0.00019839219748973846, -0.00017521623522043228, -0.0001520402729511261, -0.00012886431068181992, -0.00010568834841251373, -8.251238614320755e-05, -5.933642387390137e-05, -3.6160461604595184e-05, -1.2984499335289001e-05, 1.0191462934017181e-05, 3.3367425203323364e-05, 5.654338747262955e-05, 7.971934974193573e-05, 0.00010289531201124191, 0.0001260712742805481, 0.00014924723654985428, 0.00017242319881916046, 0.00019559916108846664, 0.00021877512335777283, 0.000241951085627079, 0.0002651270478963852, 0.0002883030101656914, 0.00031147897243499756, 0.00033465493470430374, 0.0003578308969736099, 0.0003810068592429161, 0.0004041828215122223, 0.0004273587837815285, 0.00045053474605083466, 0.00047371070832014084, 0.000496886670589447, 0.0005200626328587532, 0.0005432385951280594, 0.0005664145573973656, 0.0005895905196666718, 0.0006127664819359779, 0.0006359424442052841, 0.0006591184064745903, 0.0006822943687438965]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 3.0, 5.0, 7.0, 8.0, 11.0, 13.0, 12.0, 14.0, 11.0, 15.0, 20.0, 23.0, 25.0, 20.0, 35.0, 30.0, 31.0, 39.0, 37.0, 38.0, 30.0, 40.0, 42.0, 49.0, 30.0, 44.0, 48.0, 40.0, 39.0, 21.0, 23.0, 27.0, 22.0, 23.0, 15.0, 17.0, 18.0, 13.0, 15.0, 2.0, 10.0, 7.0, 8.0, 9.0, 5.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0], "bins": [-14.609375, -14.1610107421875, -13.712646484375, -13.2642822265625, -12.81591796875, -12.3675537109375, -11.919189453125, -11.4708251953125, -11.0224609375, -10.5740966796875, -10.125732421875, -9.6773681640625, -9.22900390625, -8.7806396484375, -8.332275390625, -7.8839111328125, -7.435546875, -6.9871826171875, -6.538818359375, -6.0904541015625, -5.64208984375, -5.1937255859375, -4.745361328125, -4.2969970703125, -3.8486328125, -3.4002685546875, -2.951904296875, -2.5035400390625, -2.05517578125, -1.6068115234375, -1.158447265625, -0.7100830078125, -0.26171875, 0.1866455078125, 0.635009765625, 1.0833740234375, 1.53173828125, 1.9801025390625, 2.428466796875, 2.8768310546875, 3.3251953125, 3.7735595703125, 4.221923828125, 4.6702880859375, 5.11865234375, 5.5670166015625, 6.015380859375, 6.4637451171875, 6.912109375, 7.3604736328125, 7.808837890625, 8.2572021484375, 8.70556640625, 9.1539306640625, 9.602294921875, 10.0506591796875, 10.4990234375, 10.9473876953125, 11.395751953125, 11.8441162109375, 12.29248046875, 12.7408447265625, 13.189208984375, 13.6375732421875, 14.0859375]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 5.0, 5.0, 6.0, 18.0, 19.0, 12.0, 20.0, 27.0, 47.0, 44.0, 70.0, 94.0, 103.0, 153.0, 193.0, 294.0, 546.0, 1092.0, 2488.0, 7239.0, 21421.0, 66410.0, 249540.0, 509072.0, 129762.0, 38812.0, 12873.0, 4400.0, 1688.0, 761.0, 398.0, 240.0, 171.0, 123.0, 103.0, 63.0, 52.0, 51.0, 34.0, 17.0, 18.0, 13.0, 16.0, 14.0, 11.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 3.0], "bins": [-15.5, -15.0196533203125, -14.539306640625, -14.0589599609375, -13.57861328125, -13.0982666015625, -12.617919921875, -12.1375732421875, -11.6572265625, -11.1768798828125, -10.696533203125, -10.2161865234375, -9.73583984375, -9.2554931640625, -8.775146484375, -8.2947998046875, -7.814453125, -7.3341064453125, -6.853759765625, -6.3734130859375, -5.89306640625, -5.4127197265625, -4.932373046875, -4.4520263671875, -3.9716796875, -3.4913330078125, -3.010986328125, -2.5306396484375, -2.05029296875, -1.5699462890625, -1.089599609375, -0.6092529296875, -0.12890625, 0.3514404296875, 0.831787109375, 1.3121337890625, 1.79248046875, 2.2728271484375, 2.753173828125, 3.2335205078125, 3.7138671875, 4.1942138671875, 4.674560546875, 5.1549072265625, 5.63525390625, 6.1156005859375, 6.595947265625, 7.0762939453125, 7.556640625, 8.0369873046875, 8.517333984375, 8.9976806640625, 9.47802734375, 9.9583740234375, 10.438720703125, 10.9190673828125, 11.3994140625, 11.8797607421875, 12.360107421875, 12.8404541015625, 13.32080078125, 13.8011474609375, 14.281494140625, 14.7618408203125, 15.2421875]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 4.0, 6.0, 4.0, 4.0, 3.0, 12.0, 5.0, 11.0, 12.0, 17.0, 21.0, 20.0, 19.0, 29.0, 27.0, 40.0, 30.0, 33.0, 43.0, 45.0, 55.0, 143.0, 1596.0, 358.0, 99.0, 53.0, 44.0, 36.0, 43.0, 32.0, 33.0, 26.0, 23.0, 27.0, 14.0, 17.0, 13.0, 7.0, 12.0, 9.0, 4.0, 8.0, 6.0, 2.0, 6.0, 2.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-51.4375, -49.9189453125, -48.400390625, -46.8818359375, -45.36328125, -43.8447265625, -42.326171875, -40.8076171875, -39.2890625, -37.7705078125, -36.251953125, -34.7333984375, -33.21484375, -31.6962890625, -30.177734375, -28.6591796875, -27.140625, -25.6220703125, -24.103515625, -22.5849609375, -21.06640625, -19.5478515625, -18.029296875, -16.5107421875, -14.9921875, -13.4736328125, -11.955078125, -10.4365234375, -8.91796875, -7.3994140625, -5.880859375, -4.3623046875, -2.84375, -1.3251953125, 0.193359375, 1.7119140625, 3.23046875, 4.7490234375, 6.267578125, 7.7861328125, 9.3046875, 10.8232421875, 12.341796875, 13.8603515625, 15.37890625, 16.8974609375, 18.416015625, 19.9345703125, 21.453125, 22.9716796875, 24.490234375, 26.0087890625, 27.52734375, 29.0458984375, 30.564453125, 32.0830078125, 33.6015625, 35.1201171875, 36.638671875, 38.1572265625, 39.67578125, 41.1943359375, 42.712890625, 44.2314453125, 45.75]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 2.0, 5.0, 6.0, 8.0, 10.0, 11.0, 13.0, 21.0, 28.0, 24.0, 35.0, 49.0, 72.0, 71.0, 108.0, 160.0, 230.0, 375.0, 866.0, 10869.0, 3117155.0, 13422.0, 850.0, 410.0, 255.0, 148.0, 135.0, 104.0, 61.0, 57.0, 35.0, 25.0, 23.0, 14.0, 12.0, 9.0, 14.0, 3.0, 4.0, 5.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-129.75, -125.759765625, -121.76953125, -117.779296875, -113.7890625, -109.798828125, -105.80859375, -101.818359375, -97.828125, -93.837890625, -89.84765625, -85.857421875, -81.8671875, -77.876953125, -73.88671875, -69.896484375, -65.90625, -61.916015625, -57.92578125, -53.935546875, -49.9453125, -45.955078125, -41.96484375, -37.974609375, -33.984375, -29.994140625, -26.00390625, -22.013671875, -18.0234375, -14.033203125, -10.04296875, -6.052734375, -2.0625, 1.927734375, 5.91796875, 9.908203125, 13.8984375, 17.888671875, 21.87890625, 25.869140625, 29.859375, 33.849609375, 37.83984375, 41.830078125, 45.8203125, 49.810546875, 53.80078125, 57.791015625, 61.78125, 65.771484375, 69.76171875, 73.751953125, 77.7421875, 81.732421875, 85.72265625, 89.712890625, 93.703125, 97.693359375, 101.68359375, 105.673828125, 109.6640625, 113.654296875, 117.64453125, 121.634765625, 125.625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 15.0, 94.0, 298.0, 361.0, 195.0, 40.0, 8.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.27523040771484, -62.64409637451172, -59.01296615600586, -55.381832122802734, -51.750701904296875, -48.11956787109375, -44.488433837890625, -40.8572998046875, -37.22616958618164, -33.595035552978516, -29.963905334472656, -26.33277130126953, -22.70163917541504, -19.070507049560547, -15.439373016357422, -11.80824089050293, -8.177108764648438, -4.545976161956787, -0.9148435592651367, 2.716289520263672, 6.347421646118164, 9.978553771972656, 13.609687805175781, 17.240819931030273, 20.871952056884766, 24.503084182739258, 28.13421630859375, 31.765350341796875, 35.396484375, 39.02761459350586, 42.658748626708984, 46.289878845214844, 49.9210205078125, 53.552154541015625, 57.183284759521484, 60.81441879272461, 64.44554901123047, 68.0766830444336, 71.70781707763672, 75.33895111083984, 78.97007751464844, 82.60121154785156, 86.23234558105469, 89.86347961425781, 93.4946060180664, 97.12574005126953, 100.75687408447266, 104.38800811767578, 108.0191421508789, 111.65027618408203, 115.28141021728516, 118.91253662109375, 122.54367065429688, 126.1748046875, 129.80593872070312, 133.43707275390625, 137.06820678710938, 140.6993408203125, 144.33047485351562, 147.96160888671875, 151.59274291992188, 155.223876953125, 158.85501098632812, 162.4861297607422, 166.1172637939453]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 3.0, 6.0, 3.0, 1.0, 7.0, 6.0, 4.0, 15.0, 18.0, 9.0, 19.0, 22.0, 19.0, 32.0, 27.0, 25.0, 42.0, 39.0, 33.0, 27.0, 38.0, 41.0, 45.0, 36.0, 38.0, 46.0, 39.0, 44.0, 39.0, 37.0, 30.0, 36.0, 25.0, 18.0, 24.0, 17.0, 22.0, 15.0, 13.0, 12.0, 8.0, 7.0, 9.0, 4.0, 3.0, 0.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-125.12220764160156, -121.20587921142578, -117.28954315185547, -113.37321472167969, -109.4568862915039, -105.54055786132812, -101.62422180175781, -97.70789337158203, -93.79156494140625, -89.87523651123047, -85.95890045166016, -82.04257202148438, -78.1262435913086, -74.20991516113281, -70.2935791015625, -66.37725067138672, -62.460914611816406, -58.54458236694336, -54.62825393676758, -50.71192169189453, -46.79559326171875, -42.8792610168457, -38.962928771972656, -35.046600341796875, -31.130268096923828, -27.213937759399414, -23.297607421875, -19.381275177001953, -15.464944839477539, -11.548614501953125, -7.632282257080078, -3.715951919555664, 0.20037841796875, 4.116709232330322, 8.033040046691895, 11.949371337890625, 15.865701675415039, 19.782032012939453, 23.6983642578125, 27.614694595336914, 31.531024932861328, 35.447357177734375, 39.363685607910156, 43.2800178527832, 47.19635009765625, 51.11267852783203, 55.02901077270508, 58.945343017578125, 62.861671447753906, 66.77799987792969, 70.6943359375, 74.61066436767578, 78.52699279785156, 82.44332885742188, 86.35965728759766, 90.27598571777344, 94.19232177734375, 98.10865020751953, 102.02498626708984, 105.94131469726562, 109.8576431274414, 113.77397155761719, 117.6903076171875, 121.60663604736328, 125.52296447753906]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 10.0, 13.0, 14.0, 12.0, 10.0, 13.0, 19.0, 17.0, 17.0, 18.0, 26.0, 28.0, 32.0, 35.0, 35.0, 27.0, 46.0, 36.0, 29.0, 35.0, 42.0, 41.0, 38.0, 42.0, 37.0, 40.0, 38.0, 33.0, 22.0, 23.0, 20.0, 20.0, 22.0, 18.0, 10.0, 12.0, 12.0, 7.0, 8.0, 8.0, 5.0, 10.0, 5.0, 2.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 0.0, 1.0], "bins": [-14.7734375, -14.3126220703125, -13.851806640625, -13.3909912109375, -12.93017578125, -12.4693603515625, -12.008544921875, -11.5477294921875, -11.0869140625, -10.6260986328125, -10.165283203125, -9.7044677734375, -9.24365234375, -8.7828369140625, -8.322021484375, -7.8612060546875, -7.400390625, -6.9395751953125, -6.478759765625, -6.0179443359375, -5.55712890625, -5.0963134765625, -4.635498046875, -4.1746826171875, -3.7138671875, -3.2530517578125, -2.792236328125, -2.3314208984375, -1.87060546875, -1.4097900390625, -0.948974609375, -0.4881591796875, -0.02734375, 0.4334716796875, 0.894287109375, 1.3551025390625, 1.81591796875, 2.2767333984375, 2.737548828125, 3.1983642578125, 3.6591796875, 4.1199951171875, 4.580810546875, 5.0416259765625, 5.50244140625, 5.9632568359375, 6.424072265625, 6.8848876953125, 7.345703125, 7.8065185546875, 8.267333984375, 8.7281494140625, 9.18896484375, 9.6497802734375, 10.110595703125, 10.5714111328125, 11.0322265625, 11.4930419921875, 11.953857421875, 12.4146728515625, 12.87548828125, 13.3363037109375, 13.797119140625, 14.2579345703125, 14.71875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 6.0, 7.0, 1.0, 7.0, 3.0, 9.0, 9.0, 7.0, 15.0, 20.0, 18.0, 17.0, 21.0, 32.0, 34.0, 47.0, 71.0, 79.0, 111.0, 152.0, 235.0, 390.0, 886.0, 4212.0, 72488.0, 2455651.0, 1618028.0, 37038.0, 2837.0, 695.0, 339.0, 199.0, 139.0, 116.0, 67.0, 62.0, 45.0, 45.0, 23.0, 23.0, 22.0, 19.0, 9.0, 7.0, 9.0, 8.0, 6.0, 6.0, 6.0, 3.0, 4.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0], "bins": [-46.9375, -45.51123046875, -44.0849609375, -42.65869140625, -41.232421875, -39.80615234375, -38.3798828125, -36.95361328125, -35.52734375, -34.10107421875, -32.6748046875, -31.24853515625, -29.822265625, -28.39599609375, -26.9697265625, -25.54345703125, -24.1171875, -22.69091796875, -21.2646484375, -19.83837890625, -18.412109375, -16.98583984375, -15.5595703125, -14.13330078125, -12.70703125, -11.28076171875, -9.8544921875, -8.42822265625, -7.001953125, -5.57568359375, -4.1494140625, -2.72314453125, -1.296875, 0.12939453125, 1.5556640625, 2.98193359375, 4.408203125, 5.83447265625, 7.2607421875, 8.68701171875, 10.11328125, 11.53955078125, 12.9658203125, 14.39208984375, 15.818359375, 17.24462890625, 18.6708984375, 20.09716796875, 21.5234375, 22.94970703125, 24.3759765625, 25.80224609375, 27.228515625, 28.65478515625, 30.0810546875, 31.50732421875, 32.93359375, 34.35986328125, 35.7861328125, 37.21240234375, 38.638671875, 40.06494140625, 41.4912109375, 42.91748046875, 44.34375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 4.0, 15.0, 14.0, 35.0, 46.0, 94.0, 139.0, 263.0, 444.0, 844.0, 936.0, 571.0, 286.0, 165.0, 75.0, 68.0, 30.0, 22.0, 13.0, 7.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.65625, -44.03564453125, -42.4150390625, -40.79443359375, -39.173828125, -37.55322265625, -35.9326171875, -34.31201171875, -32.69140625, -31.07080078125, -29.4501953125, -27.82958984375, -26.208984375, -24.58837890625, -22.9677734375, -21.34716796875, -19.7265625, -18.10595703125, -16.4853515625, -14.86474609375, -13.244140625, -11.62353515625, -10.0029296875, -8.38232421875, -6.76171875, -5.14111328125, -3.5205078125, -1.89990234375, -0.279296875, 1.34130859375, 2.9619140625, 4.58251953125, 6.203125, 7.82373046875, 9.4443359375, 11.06494140625, 12.685546875, 14.30615234375, 15.9267578125, 17.54736328125, 19.16796875, 20.78857421875, 22.4091796875, 24.02978515625, 25.650390625, 27.27099609375, 28.8916015625, 30.51220703125, 32.1328125, 33.75341796875, 35.3740234375, 36.99462890625, 38.615234375, 40.23583984375, 41.8564453125, 43.47705078125, 45.09765625, 46.71826171875, 48.3388671875, 49.95947265625, 51.580078125, 53.20068359375, 54.8212890625, 56.44189453125, 58.0625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 8.0, 5.0, 20.0, 28.0, 36.0, 77.0, 84.0, 121.0, 190.0, 286.0, 457.0, 1509.0, 4174367.0, 15291.0, 721.0, 332.0, 250.0, 163.0, 129.0, 77.0, 56.0, 33.0, 24.0, 16.0, 7.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-338.75, -329.265625, -319.78125, -310.296875, -300.8125, -291.328125, -281.84375, -272.359375, -262.875, -253.390625, -243.90625, -234.421875, -224.9375, -215.453125, -205.96875, -196.484375, -187.0, -177.515625, -168.03125, -158.546875, -149.0625, -139.578125, -130.09375, -120.609375, -111.125, -101.640625, -92.15625, -82.671875, -73.1875, -63.703125, -54.21875, -44.734375, -35.25, -25.765625, -16.28125, -6.796875, 2.6875, 12.171875, 21.65625, 31.140625, 40.625, 50.109375, 59.59375, 69.078125, 78.5625, 88.046875, 97.53125, 107.015625, 116.5, 125.984375, 135.46875, 144.953125, 154.4375, 163.921875, 173.40625, 182.890625, 192.375, 201.859375, 211.34375, 220.828125, 230.3125, 239.796875, 249.28125, 258.765625, 268.25]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 27.0, 73.0, 193.0, 299.0, 239.0, 133.0, 31.0, 14.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-105.88075256347656, -99.18383026123047, -92.48690032958984, -85.78997802734375, -79.09304809570312, -72.39612579345703, -65.69920349121094, -59.00227737426758, -52.30535125732422, -45.60842514038086, -38.9114990234375, -32.214576721191406, -25.517650604248047, -18.820724487304688, -12.123802185058594, -5.426876068115234, 1.270050048828125, 7.966975212097168, 14.663900375366211, 21.360824584960938, 28.057750701904297, 34.754676818847656, 41.45159912109375, 48.14852523803711, 54.84545135498047, 61.54237747192383, 68.23930358886719, 74.93622589111328, 81.63314819335938, 88.330078125, 95.0270004272461, 101.72392272949219, 108.42086791992188, 115.11779022216797, 121.8147201538086, 128.5116424560547, 135.2085723876953, 141.90548706054688, 148.6024169921875, 155.29934692382812, 161.99627685546875, 168.69320678710938, 175.39012145996094, 182.08705139160156, 188.7839813232422, 195.48089599609375, 202.17782592773438, 208.874755859375, 215.57167053222656, 222.2686004638672, 228.96551513671875, 235.66244506835938, 242.359375, 249.05630493164062, 255.7532196044922, 262.45013427734375, 269.1470642089844, 275.843994140625, 282.5409240722656, 289.23785400390625, 295.93475341796875, 302.6316833496094, 309.32861328125, 316.0255432128906, 322.72247314453125]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 4.0, 3.0, 4.0, 6.0, 14.0, 8.0, 10.0, 10.0, 29.0, 24.0, 32.0, 19.0, 34.0, 27.0, 32.0, 40.0, 49.0, 43.0, 45.0, 41.0, 45.0, 43.0, 39.0, 35.0, 40.0, 35.0, 39.0, 49.0, 27.0, 25.0, 39.0, 22.0, 12.0, 19.0, 15.0, 8.0, 7.0, 8.0, 4.0, 4.0, 11.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-84.56769561767578, -81.64826202392578, -78.72882080078125, -75.80938720703125, -72.88995361328125, -69.97052001953125, -67.05108642578125, -64.13164520263672, -61.21221160888672, -58.29277801513672, -55.37334060668945, -52.45390319824219, -49.53446960449219, -46.61503601074219, -43.69559860229492, -40.776161193847656, -37.856727600097656, -34.937294006347656, -32.01785659790039, -29.098421096801758, -26.178985595703125, -23.259550094604492, -20.34011459350586, -17.420679092407227, -14.501243591308594, -11.581808090209961, -8.662372589111328, -5.742937088012695, -2.8235015869140625, 0.09593391418457031, 3.015369415283203, 5.934804916381836, 8.854248046875, 11.773683547973633, 14.693119049072266, 17.6125545501709, 20.53199005126953, 23.451425552368164, 26.370861053466797, 29.29029655456543, 32.20973205566406, 35.12916564941406, 38.04860305786133, 40.968040466308594, 43.887474060058594, 46.806907653808594, 49.72634506225586, 52.645782470703125, 55.565216064453125, 58.484649658203125, 61.40408706665039, 64.32352447509766, 67.24295806884766, 70.16239166259766, 73.08183288574219, 76.00126647949219, 78.92070007324219, 81.84013366699219, 84.75956726074219, 87.67900848388672, 90.59844207763672, 93.51787567138672, 96.43731689453125, 99.35675048828125, 102.27618408203125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 6.0, 9.0, 9.0, 9.0, 17.0, 21.0, 23.0, 18.0, 27.0, 22.0, 27.0, 27.0, 31.0, 41.0, 48.0, 51.0, 40.0, 31.0, 49.0, 44.0, 39.0, 55.0, 47.0, 27.0, 27.0, 36.0, 29.0, 30.0, 24.0, 22.0, 26.0, 16.0, 15.0, 9.0, 6.0, 9.0, 8.0, 6.0, 8.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.872802734375, -15.35498046875, -14.837158203125, -14.3193359375, -13.801513671875, -13.28369140625, -12.765869140625, -12.248046875, -11.730224609375, -11.21240234375, -10.694580078125, -10.1767578125, -9.658935546875, -9.14111328125, -8.623291015625, -8.10546875, -7.587646484375, -7.06982421875, -6.552001953125, -6.0341796875, -5.516357421875, -4.99853515625, -4.480712890625, -3.962890625, -3.445068359375, -2.92724609375, -2.409423828125, -1.8916015625, -1.373779296875, -0.85595703125, -0.338134765625, 0.1796875, 0.697509765625, 1.21533203125, 1.733154296875, 2.2509765625, 2.768798828125, 3.28662109375, 3.804443359375, 4.322265625, 4.840087890625, 5.35791015625, 5.875732421875, 6.3935546875, 6.911376953125, 7.42919921875, 7.947021484375, 8.46484375, 8.982666015625, 9.50048828125, 10.018310546875, 10.5361328125, 11.053955078125, 11.57177734375, 12.089599609375, 12.607421875, 13.125244140625, 13.64306640625, 14.160888671875, 14.6787109375, 15.196533203125, 15.71435546875, 16.232177734375, 16.75]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 8.0, 3.0, 10.0, 19.0, 31.0, 33.0, 59.0, 79.0, 109.0, 145.0, 236.0, 390.0, 606.0, 891.0, 1376.0, 2000.0, 3273.0, 5333.0, 8329.0, 13372.0, 21924.0, 35932.0, 63522.0, 122738.0, 326449.0, 215134.0, 95713.0, 51425.0, 30174.0, 18380.0, 11271.0, 7135.0, 4419.0, 2780.0, 1831.0, 1136.0, 824.0, 494.0, 334.0, 187.0, 129.0, 92.0, 69.0, 57.0, 40.0, 26.0, 16.0, 9.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0], "bins": [-3.724609375, -3.607574462890625, -3.49053955078125, -3.373504638671875, -3.2564697265625, -3.139434814453125, -3.02239990234375, -2.905364990234375, -2.788330078125, -2.671295166015625, -2.55426025390625, -2.437225341796875, -2.3201904296875, -2.203155517578125, -2.08612060546875, -1.969085693359375, -1.85205078125, -1.735015869140625, -1.61798095703125, -1.500946044921875, -1.3839111328125, -1.266876220703125, -1.14984130859375, -1.032806396484375, -0.915771484375, -0.798736572265625, -0.68170166015625, -0.564666748046875, -0.4476318359375, -0.330596923828125, -0.21356201171875, -0.096527099609375, 0.0205078125, 0.137542724609375, 0.25457763671875, 0.371612548828125, 0.4886474609375, 0.605682373046875, 0.72271728515625, 0.839752197265625, 0.956787109375, 1.073822021484375, 1.19085693359375, 1.307891845703125, 1.4249267578125, 1.541961669921875, 1.65899658203125, 1.776031494140625, 1.89306640625, 2.010101318359375, 2.12713623046875, 2.244171142578125, 2.3612060546875, 2.478240966796875, 2.59527587890625, 2.712310791015625, 2.829345703125, 2.946380615234375, 3.06341552734375, 3.180450439453125, 3.2974853515625, 3.414520263671875, 3.53155517578125, 3.648590087890625, 3.765625]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 4.0, 1.0, 13.0, 8.0, 10.0, 9.0, 17.0, 12.0, 14.0, 21.0, 29.0, 25.0, 37.0, 37.0, 35.0, 31.0, 25.0, 48.0, 40.0, 46.0, 1066.0, 49.0, 44.0, 42.0, 49.0, 46.0, 34.0, 36.0, 24.0, 28.0, 22.0, 18.0, 17.0, 14.0, 23.0, 9.0, 11.0, 10.0, 2.0, 5.0, 3.0, 4.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-9.3203125, -9.0050048828125, -8.689697265625, -8.3743896484375, -8.05908203125, -7.7437744140625, -7.428466796875, -7.1131591796875, -6.7978515625, -6.4825439453125, -6.167236328125, -5.8519287109375, -5.53662109375, -5.2213134765625, -4.906005859375, -4.5906982421875, -4.275390625, -3.9600830078125, -3.644775390625, -3.3294677734375, -3.01416015625, -2.6988525390625, -2.383544921875, -2.0682373046875, -1.7529296875, -1.4376220703125, -1.122314453125, -0.8070068359375, -0.49169921875, -0.1763916015625, 0.138916015625, 0.4542236328125, 0.76953125, 1.0848388671875, 1.400146484375, 1.7154541015625, 2.03076171875, 2.3460693359375, 2.661376953125, 2.9766845703125, 3.2919921875, 3.6072998046875, 3.922607421875, 4.2379150390625, 4.55322265625, 4.8685302734375, 5.183837890625, 5.4991455078125, 5.814453125, 6.1297607421875, 6.445068359375, 6.7603759765625, 7.07568359375, 7.3909912109375, 7.706298828125, 8.0216064453125, 8.3369140625, 8.6522216796875, 8.967529296875, 9.2828369140625, 9.59814453125, 9.9134521484375, 10.228759765625, 10.5440673828125, 10.859375]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 9.0, 9.0, 4.0, 12.0, 11.0, 19.0, 35.0, 27.0, 50.0, 78.0, 146.0, 177.0, 280.0, 359.0, 588.0, 845.0, 1271.0, 1818.0, 2735.0, 3948.0, 5911.0, 8788.0, 13442.0, 20440.0, 32518.0, 52382.0, 90476.0, 179551.0, 1356463.0, 131594.0, 71735.0, 42863.0, 26926.0, 17084.0, 11329.0, 7468.0, 5021.0, 3482.0, 2334.0, 1530.0, 1108.0, 703.0, 496.0, 355.0, 245.0, 128.0, 118.0, 73.0, 53.0, 31.0, 17.0, 14.0, 19.0, 13.0, 4.0, 2.0, 4.0, 3.0], "bins": [-3.296875, -3.20074462890625, -3.1046142578125, -3.00848388671875, -2.912353515625, -2.81622314453125, -2.7200927734375, -2.62396240234375, -2.52783203125, -2.43170166015625, -2.3355712890625, -2.23944091796875, -2.143310546875, -2.04718017578125, -1.9510498046875, -1.85491943359375, -1.7587890625, -1.66265869140625, -1.5665283203125, -1.47039794921875, -1.374267578125, -1.27813720703125, -1.1820068359375, -1.08587646484375, -0.98974609375, -0.89361572265625, -0.7974853515625, -0.70135498046875, -0.605224609375, -0.50909423828125, -0.4129638671875, -0.31683349609375, -0.220703125, -0.12457275390625, -0.0284423828125, 0.06768798828125, 0.163818359375, 0.25994873046875, 0.3560791015625, 0.45220947265625, 0.54833984375, 0.64447021484375, 0.7406005859375, 0.83673095703125, 0.932861328125, 1.02899169921875, 1.1251220703125, 1.22125244140625, 1.3173828125, 1.41351318359375, 1.5096435546875, 1.60577392578125, 1.701904296875, 1.79803466796875, 1.8941650390625, 1.99029541015625, 2.08642578125, 2.18255615234375, 2.2786865234375, 2.37481689453125, 2.470947265625, 2.56707763671875, 2.6632080078125, 2.75933837890625, 2.85546875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 2.0, 8.0, 3.0, 5.0, 6.0, 6.0, 9.0, 15.0, 10.0, 13.0, 14.0, 24.0, 21.0, 26.0, 27.0, 39.0, 51.0, 63.0, 68.0, 70.0, 75.0, 67.0, 67.0, 52.0, 45.0, 35.0, 39.0, 15.0, 18.0, 15.0, 11.0, 15.0, 11.0, 11.0, 4.0, 13.0, 7.0, 3.0, 5.0, 6.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.002166748046875, -0.0021068304777145386, -0.002046912908554077, -0.0019869953393936157, -0.0019270777702331543, -0.0018671602010726929, -0.0018072426319122314, -0.00174732506275177, -0.0016874074935913086, -0.0016274899244308472, -0.0015675723552703857, -0.0015076547861099243, -0.0014477372169494629, -0.0013878196477890015, -0.00132790207862854, -0.0012679845094680786, -0.0012080669403076172, -0.0011481493711471558, -0.0010882318019866943, -0.001028314232826233, -0.0009683966636657715, -0.0009084790945053101, -0.0008485615253448486, -0.0007886439561843872, -0.0007287263870239258, -0.0006688088178634644, -0.0006088912487030029, -0.0005489736795425415, -0.0004890561103820801, -0.00042913854122161865, -0.0003692209720611572, -0.0003093034029006958, -0.0002493858337402344, -0.00018946826457977295, -0.00012955069541931152, -6.96331262588501e-05, -9.715557098388672e-06, 5.0202012062072754e-05, 0.00011011958122253418, 0.0001700371503829956, 0.00022995471954345703, 0.00028987228870391846, 0.0003497898578643799, 0.0004097074270248413, 0.00046962499618530273, 0.0005295425653457642, 0.0005894601345062256, 0.000649377703666687, 0.0007092952728271484, 0.0007692128419876099, 0.0008291304111480713, 0.0008890479803085327, 0.0009489655494689941, 0.0010088831186294556, 0.001068800687789917, 0.0011287182569503784, 0.0011886358261108398, 0.0012485533952713013, 0.0013084709644317627, 0.0013683885335922241, 0.0014283061027526855, 0.001488223671913147, 0.0015481412410736084, 0.0016080588102340698, 0.0016679763793945312]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 6.0, 4.0, 12.0, 14.0, 15.0, 12.0, 11.0, 15.0, 26.0, 25.0, 36.0, 53.0, 62.0, 99.0, 171.0, 352.0, 1300.0, 993364.0, 51493.0, 726.0, 249.0, 134.0, 87.0, 52.0, 52.0, 30.0, 33.0, 20.0, 12.0, 14.0, 8.0, 10.0, 9.0, 7.0, 8.0, 7.0, 7.0, 1.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046112060546875, -0.04456615447998047, -0.04302024841308594, -0.041474342346191406, -0.039928436279296875, -0.038382530212402344, -0.03683662414550781, -0.03529071807861328, -0.03374481201171875, -0.03219890594482422, -0.030652999877929688, -0.029107093811035156, -0.027561187744140625, -0.026015281677246094, -0.024469375610351562, -0.02292346954345703, -0.0213775634765625, -0.01983165740966797, -0.018285751342773438, -0.016739845275878906, -0.015193939208984375, -0.013648033142089844, -0.012102127075195312, -0.010556221008300781, -0.00901031494140625, -0.007464408874511719, -0.0059185028076171875, -0.004372596740722656, -0.002826690673828125, -0.0012807846069335938, 0.0002651214599609375, 0.0018110275268554688, 0.00335693359375, 0.004902839660644531, 0.0064487457275390625, 0.007994651794433594, 0.009540557861328125, 0.011086463928222656, 0.012632369995117188, 0.014178276062011719, 0.01572418212890625, 0.01727008819580078, 0.018815994262695312, 0.020361900329589844, 0.021907806396484375, 0.023453712463378906, 0.024999618530273438, 0.02654552459716797, 0.0280914306640625, 0.02963733673095703, 0.031183242797851562, 0.032729148864746094, 0.034275054931640625, 0.035820960998535156, 0.03736686706542969, 0.03891277313232422, 0.04045867919921875, 0.04200458526611328, 0.04355049133300781, 0.045096397399902344, 0.046642303466796875, 0.048188209533691406, 0.04973411560058594, 0.05128002166748047, 0.052825927734375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 6.0, 46.0, 206.0, 465.0, 221.0, 63.0, 7.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0050995489582419395, -0.004989993292838335, -0.0048804376274347305, -0.004770882427692413, -0.004661326762288809, -0.004551771096885204, -0.0044422154314816, -0.004332659766077995, -0.004223104100674391, -0.004113548435270786, -0.004003992769867182, -0.003894437337294221, -0.0037848816718906164, -0.0036753262393176556, -0.003565770573914051, -0.0034562149085104465, -0.0033466597087681293, -0.003237104043364525, -0.003127548610791564, -0.0030179929453879595, -0.002908437279984355, -0.002798881847411394, -0.0026893261820077896, -0.002579770516604185, -0.0024702148512005806, -0.002360659185796976, -0.0022511037532240152, -0.0021415480878204107, -0.0020319924224168062, -0.0019224369898438454, -0.0018128813244402409, -0.0017033257754519582, -0.0015937702264636755, -0.0014842146774753928, -0.0013746590120717883, -0.0012651034630835056, -0.001155547914095223, -0.0010459923651069403, -0.0009364366997033358, -0.0008268811507150531, -0.0007173255435191095, -0.0006077699363231659, -0.0004982143873348832, -0.0003886587801389396, -0.0002791032020468265, -0.00016954762395471334, -5.999201675876975e-05, 4.956353222951293e-05, 0.00015911913942545652, 0.00026867471751756966, 0.0003782302956096828, 0.0004877859028056264, 0.0005973414517939091, 0.0007068970589898527, 0.0008164526661857963, 0.0009260082151740789, 0.0010355638805776834, 0.0011451194295659661, 0.0012546750949695706, 0.0013642306439578533, 0.001473786192946136, 0.0015833417419344187, 0.0016928974073380232, 0.0018024529563263059, 0.0019120085053145885]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 1.0, 3.0, 7.0, 11.0, 8.0, 8.0, 12.0, 18.0, 11.0, 17.0, 25.0, 26.0, 29.0, 32.0, 37.0, 34.0, 46.0, 40.0, 45.0, 48.0, 42.0, 40.0, 30.0, 35.0, 48.0, 35.0, 32.0, 29.0, 30.0, 39.0, 25.0, 22.0, 33.0, 18.0, 13.0, 13.0, 16.0, 8.0, 5.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009604096412658691, -0.000928487628698349, -0.0008965656161308289, -0.0008646436035633087, -0.0008327215909957886, -0.0008007995784282684, -0.0007688775658607483, -0.0007369555532932281, -0.000705033540725708, -0.0006731115281581879, -0.0006411895155906677, -0.0006092675030231476, -0.0005773454904556274, -0.0005454234778881073, -0.0005135014653205872, -0.000481579452753067, -0.0004496574401855469, -0.00041773542761802673, -0.0003858134150505066, -0.00035389140248298645, -0.0003219693899154663, -0.00029004737734794617, -0.000258125364780426, -0.00022620335221290588, -0.00019428133964538574, -0.0001623593270778656, -0.00013043731451034546, -9.851530194282532e-05, -6.659328937530518e-05, -3.4671276807785034e-05, -2.7492642402648926e-06, 2.917274832725525e-05, 6.109476089477539e-05, 9.301677346229553e-05, 0.00012493878602981567, 0.00015686079859733582, 0.00018878281116485596, 0.0002207048237323761, 0.00025262683629989624, 0.0002845488488674164, 0.0003164708614349365, 0.00034839287400245667, 0.0003803148865699768, 0.00041223689913749695, 0.0004441589117050171, 0.00047608092427253723, 0.0005080029368400574, 0.0005399249494075775, 0.0005718469619750977, 0.0006037689745426178, 0.0006356909871101379, 0.0006676129996776581, 0.0006995350122451782, 0.0007314570248126984, 0.0007633790373802185, 0.0007953010499477386, 0.0008272230625152588, 0.0008591450750827789, 0.0008910670876502991, 0.0009229891002178192, 0.0009549111127853394, 0.0009868331253528595, 0.0010187551379203796, 0.0010506771504878998, 0.00108259916305542]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 6.0, 9.0, 9.0, 9.0, 17.0, 21.0, 23.0, 18.0, 27.0, 22.0, 27.0, 27.0, 31.0, 41.0, 48.0, 51.0, 40.0, 31.0, 49.0, 44.0, 39.0, 55.0, 47.0, 27.0, 27.0, 36.0, 29.0, 30.0, 24.0, 22.0, 26.0, 16.0, 15.0, 9.0, 6.0, 9.0, 8.0, 6.0, 8.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.872802734375, -15.35498046875, -14.837158203125, -14.3193359375, -13.801513671875, -13.28369140625, -12.765869140625, -12.248046875, -11.730224609375, -11.21240234375, -10.694580078125, -10.1767578125, -9.658935546875, -9.14111328125, -8.623291015625, -8.10546875, -7.587646484375, -7.06982421875, -6.552001953125, -6.0341796875, -5.516357421875, -4.99853515625, -4.480712890625, -3.962890625, -3.445068359375, -2.92724609375, -2.409423828125, -1.8916015625, -1.373779296875, -0.85595703125, -0.338134765625, 0.1796875, 0.697509765625, 1.21533203125, 1.733154296875, 2.2509765625, 2.768798828125, 3.28662109375, 3.804443359375, 4.322265625, 4.840087890625, 5.35791015625, 5.875732421875, 6.3935546875, 6.911376953125, 7.42919921875, 7.947021484375, 8.46484375, 8.982666015625, 9.50048828125, 10.018310546875, 10.5361328125, 11.053955078125, 11.57177734375, 12.089599609375, 12.607421875, 13.125244140625, 13.64306640625, 14.160888671875, 14.6787109375, 15.196533203125, 15.71435546875, 16.232177734375, 16.75]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 6.0, 5.0, 9.0, 11.0, 13.0, 27.0, 28.0, 42.0, 46.0, 59.0, 78.0, 119.0, 155.0, 227.0, 367.0, 641.0, 1276.0, 4108.0, 34898.0, 674295.0, 307184.0, 19402.0, 2911.0, 984.0, 558.0, 330.0, 209.0, 149.0, 113.0, 66.0, 51.0, 51.0, 37.0, 30.0, 11.0, 14.0, 6.0, 13.0, 5.0, 12.0, 4.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.703125, -29.739990234375, -28.77685546875, -27.813720703125, -26.8505859375, -25.887451171875, -24.92431640625, -23.961181640625, -22.998046875, -22.034912109375, -21.07177734375, -20.108642578125, -19.1455078125, -18.182373046875, -17.21923828125, -16.256103515625, -15.29296875, -14.329833984375, -13.36669921875, -12.403564453125, -11.4404296875, -10.477294921875, -9.51416015625, -8.551025390625, -7.587890625, -6.624755859375, -5.66162109375, -4.698486328125, -3.7353515625, -2.772216796875, -1.80908203125, -0.845947265625, 0.1171875, 1.080322265625, 2.04345703125, 3.006591796875, 3.9697265625, 4.932861328125, 5.89599609375, 6.859130859375, 7.822265625, 8.785400390625, 9.74853515625, 10.711669921875, 11.6748046875, 12.637939453125, 13.60107421875, 14.564208984375, 15.52734375, 16.490478515625, 17.45361328125, 18.416748046875, 19.3798828125, 20.343017578125, 21.30615234375, 22.269287109375, 23.232421875, 24.195556640625, 25.15869140625, 26.121826171875, 27.0849609375, 28.048095703125, 29.01123046875, 29.974365234375, 30.9375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 6.0, 5.0, 1.0, 4.0, 4.0, 4.0, 14.0, 14.0, 10.0, 11.0, 19.0, 28.0, 21.0, 37.0, 28.0, 39.0, 36.0, 43.0, 49.0, 66.0, 134.0, 1761.0, 248.0, 60.0, 58.0, 43.0, 40.0, 43.0, 32.0, 33.0, 33.0, 21.0, 21.0, 21.0, 21.0, 10.0, 10.0, 9.0, 8.0, 1.0, 5.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-60.5, -58.708984375, -56.91796875, -55.126953125, -53.3359375, -51.544921875, -49.75390625, -47.962890625, -46.171875, -44.380859375, -42.58984375, -40.798828125, -39.0078125, -37.216796875, -35.42578125, -33.634765625, -31.84375, -30.052734375, -28.26171875, -26.470703125, -24.6796875, -22.888671875, -21.09765625, -19.306640625, -17.515625, -15.724609375, -13.93359375, -12.142578125, -10.3515625, -8.560546875, -6.76953125, -4.978515625, -3.1875, -1.396484375, 0.39453125, 2.185546875, 3.9765625, 5.767578125, 7.55859375, 9.349609375, 11.140625, 12.931640625, 14.72265625, 16.513671875, 18.3046875, 20.095703125, 21.88671875, 23.677734375, 25.46875, 27.259765625, 29.05078125, 30.841796875, 32.6328125, 34.423828125, 36.21484375, 38.005859375, 39.796875, 41.587890625, 43.37890625, 45.169921875, 46.9609375, 48.751953125, 50.54296875, 52.333984375, 54.125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 5.0, 1.0, 9.0, 9.0, 10.0, 9.0, 20.0, 29.0, 21.0, 21.0, 33.0, 36.0, 53.0, 58.0, 90.0, 166.0, 363.0, 723.0, 29168.0, 3112118.0, 1599.0, 452.0, 218.0, 129.0, 73.0, 59.0, 45.0, 41.0, 28.0, 26.0, 22.0, 10.0, 7.0, 14.0, 17.0, 4.0, 6.0, 1.0, 2.0, 5.0, 4.0, 4.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-163.125, -157.7265625, -152.328125, -146.9296875, -141.53125, -136.1328125, -130.734375, -125.3359375, -119.9375, -114.5390625, -109.140625, -103.7421875, -98.34375, -92.9453125, -87.546875, -82.1484375, -76.75, -71.3515625, -65.953125, -60.5546875, -55.15625, -49.7578125, -44.359375, -38.9609375, -33.5625, -28.1640625, -22.765625, -17.3671875, -11.96875, -6.5703125, -1.171875, 4.2265625, 9.625, 15.0234375, 20.421875, 25.8203125, 31.21875, 36.6171875, 42.015625, 47.4140625, 52.8125, 58.2109375, 63.609375, 69.0078125, 74.40625, 79.8046875, 85.203125, 90.6015625, 96.0, 101.3984375, 106.796875, 112.1953125, 117.59375, 122.9921875, 128.390625, 133.7890625, 139.1875, 144.5859375, 149.984375, 155.3828125, 160.78125, 166.1796875, 171.578125, 176.9765625, 182.375]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 9.0, 21.0, 77.0, 172.0, 252.0, 218.0, 144.0, 75.0, 36.0, 7.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.911794662475586, -20.988351821899414, -19.06490707397461, -17.141464233398438, -15.218021392822266, -13.294578552246094, -11.371134757995605, -9.447690963745117, -7.524248123168945, -5.600804805755615, -3.677361488342285, -1.753918170928955, 0.169525146484375, 2.092967987060547, 4.016411781311035, 5.939855575561523, 7.863298416137695, 9.786741256713867, 11.710185050964355, 13.633628845214844, 15.557071685791016, 17.480514526367188, 19.40395736694336, 21.327402114868164, 23.250844955444336, 25.174287796020508, 27.097732543945312, 29.021175384521484, 30.944618225097656, 32.86806106567383, 34.79150390625, 36.71495056152344, 38.638389587402344, 40.561832427978516, 42.48527526855469, 44.40871810913086, 46.33216094970703, 48.25560760498047, 50.17905044555664, 52.10249328613281, 54.025936126708984, 55.949378967285156, 57.87282180786133, 59.7962646484375, 61.71971130371094, 63.643150329589844, 65.56659698486328, 67.49003601074219, 69.41348266601562, 71.33692932128906, 73.26036834716797, 75.1838150024414, 77.10725402832031, 79.03070068359375, 80.95413970947266, 82.8775863647461, 84.801025390625, 86.72447204589844, 88.64791107177734, 90.57135772705078, 92.49479675292969, 94.41824340820312, 96.34168243408203, 98.26512908935547, 100.1885757446289]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 5.0, 3.0, 12.0, 10.0, 8.0, 6.0, 18.0, 19.0, 21.0, 16.0, 27.0, 25.0, 18.0, 26.0, 33.0, 33.0, 49.0, 34.0, 46.0, 45.0, 35.0, 36.0, 44.0, 41.0, 35.0, 31.0, 34.0, 35.0, 32.0, 39.0, 20.0, 30.0, 19.0, 24.0, 16.0, 21.0, 14.0, 6.0, 8.0, 5.0, 11.0, 5.0, 6.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-141.3252410888672, -136.6411590576172, -131.9570770263672, -127.27298736572266, -122.58890533447266, -117.90481567382812, -113.22073364257812, -108.53665161132812, -103.85256958007812, -99.16848754882812, -94.4843978881836, -89.8003158569336, -85.1162338256836, -80.43214416503906, -75.74806213378906, -71.06398010253906, -66.37989044189453, -61.695804595947266, -57.011722564697266, -52.32763671875, -47.6435546875, -42.959468841552734, -38.27538299560547, -33.59130096435547, -28.907215118408203, -24.22313117980957, -19.539047241210938, -14.854961395263672, -10.170877456665039, -5.486793518066406, -0.8027076721191406, 3.8813743591308594, 8.565460205078125, 13.249544143676758, 17.93362808227539, 22.617713928222656, 27.30179786682129, 31.985881805419922, 36.66996765136719, 41.35404968261719, 46.03813552856445, 50.72222137451172, 55.40630340576172, 60.090389251708984, 64.77447509765625, 69.45855712890625, 74.14263916015625, 78.82672119140625, 83.51081085205078, 88.19489288330078, 92.87898254394531, 97.56306457519531, 102.24714660644531, 106.93122863769531, 111.61531829833984, 116.29940032958984, 120.98348999023438, 125.66757202148438, 130.35165405273438, 135.03573608398438, 139.71983337402344, 144.40391540527344, 149.08799743652344, 153.77207946777344, 158.45616149902344]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 8.0, 5.0, 5.0, 14.0, 6.0, 11.0, 22.0, 16.0, 28.0, 21.0, 23.0, 25.0, 29.0, 26.0, 35.0, 35.0, 51.0, 43.0, 43.0, 35.0, 43.0, 40.0, 37.0, 52.0, 34.0, 39.0, 27.0, 29.0, 33.0, 23.0, 24.0, 24.0, 22.0, 19.0, 20.0, 12.0, 5.0, 9.0, 7.0, 6.0, 6.0, 3.0, 7.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.390625, -15.87109375, -15.3515625, -14.83203125, -14.3125, -13.79296875, -13.2734375, -12.75390625, -12.234375, -11.71484375, -11.1953125, -10.67578125, -10.15625, -9.63671875, -9.1171875, -8.59765625, -8.078125, -7.55859375, -7.0390625, -6.51953125, -6.0, -5.48046875, -4.9609375, -4.44140625, -3.921875, -3.40234375, -2.8828125, -2.36328125, -1.84375, -1.32421875, -0.8046875, -0.28515625, 0.234375, 0.75390625, 1.2734375, 1.79296875, 2.3125, 2.83203125, 3.3515625, 3.87109375, 4.390625, 4.91015625, 5.4296875, 5.94921875, 6.46875, 6.98828125, 7.5078125, 8.02734375, 8.546875, 9.06640625, 9.5859375, 10.10546875, 10.625, 11.14453125, 11.6640625, 12.18359375, 12.703125, 13.22265625, 13.7421875, 14.26171875, 14.78125, 15.30078125, 15.8203125, 16.33984375, 16.859375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 4.0, 7.0, 7.0, 14.0, 15.0, 22.0, 28.0, 18.0, 50.0, 50.0, 79.0, 91.0, 130.0, 196.0, 281.0, 488.0, 859.0, 1766.0, 4163.0, 12019.0, 47977.0, 230180.0, 887019.0, 1619703.0, 1019746.0, 286778.0, 59489.0, 14215.0, 4590.0, 1908.0, 900.0, 519.0, 290.0, 156.0, 138.0, 100.0, 67.0, 72.0, 40.0, 32.0, 14.0, 25.0, 11.0, 8.0, 6.0, 5.0, 2.0, 9.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-19.1875, -18.598388671875, -18.00927734375, -17.420166015625, -16.8310546875, -16.241943359375, -15.65283203125, -15.063720703125, -14.474609375, -13.885498046875, -13.29638671875, -12.707275390625, -12.1181640625, -11.529052734375, -10.93994140625, -10.350830078125, -9.76171875, -9.172607421875, -8.58349609375, -7.994384765625, -7.4052734375, -6.816162109375, -6.22705078125, -5.637939453125, -5.048828125, -4.459716796875, -3.87060546875, -3.281494140625, -2.6923828125, -2.103271484375, -1.51416015625, -0.925048828125, -0.3359375, 0.253173828125, 0.84228515625, 1.431396484375, 2.0205078125, 2.609619140625, 3.19873046875, 3.787841796875, 4.376953125, 4.966064453125, 5.55517578125, 6.144287109375, 6.7333984375, 7.322509765625, 7.91162109375, 8.500732421875, 9.08984375, 9.678955078125, 10.26806640625, 10.857177734375, 11.4462890625, 12.035400390625, 12.62451171875, 13.213623046875, 13.802734375, 14.391845703125, 14.98095703125, 15.570068359375, 16.1591796875, 16.748291015625, 17.33740234375, 17.926513671875, 18.515625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 7.0, 10.0, 17.0, 19.0, 34.0, 32.0, 63.0, 100.0, 106.0, 181.0, 212.0, 341.0, 452.0, 634.0, 525.0, 432.0, 270.0, 171.0, 152.0, 104.0, 61.0, 64.0, 27.0, 23.0, 14.0, 10.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-46.15625, -44.93505859375, -43.7138671875, -42.49267578125, -41.271484375, -40.05029296875, -38.8291015625, -37.60791015625, -36.38671875, -35.16552734375, -33.9443359375, -32.72314453125, -31.501953125, -30.28076171875, -29.0595703125, -27.83837890625, -26.6171875, -25.39599609375, -24.1748046875, -22.95361328125, -21.732421875, -20.51123046875, -19.2900390625, -18.06884765625, -16.84765625, -15.62646484375, -14.4052734375, -13.18408203125, -11.962890625, -10.74169921875, -9.5205078125, -8.29931640625, -7.078125, -5.85693359375, -4.6357421875, -3.41455078125, -2.193359375, -0.97216796875, 0.2490234375, 1.47021484375, 2.69140625, 3.91259765625, 5.1337890625, 6.35498046875, 7.576171875, 8.79736328125, 10.0185546875, 11.23974609375, 12.4609375, 13.68212890625, 14.9033203125, 16.12451171875, 17.345703125, 18.56689453125, 19.7880859375, 21.00927734375, 22.23046875, 23.45166015625, 24.6728515625, 25.89404296875, 27.115234375, 28.33642578125, 29.5576171875, 30.77880859375, 32.0]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 4.0, 12.0, 9.0, 15.0, 19.0, 25.0, 35.0, 44.0, 36.0, 67.0, 85.0, 107.0, 121.0, 168.0, 205.0, 239.0, 364.0, 683.0, 2757.0, 1971648.0, 2212522.0, 2740.0, 695.0, 369.0, 262.0, 206.0, 170.0, 134.0, 107.0, 98.0, 74.0, 59.0, 34.0, 41.0, 27.0, 19.0, 22.0, 16.0, 17.0, 7.0, 8.0, 7.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-135.625, -130.94921875, -126.2734375, -121.59765625, -116.921875, -112.24609375, -107.5703125, -102.89453125, -98.21875, -93.54296875, -88.8671875, -84.19140625, -79.515625, -74.83984375, -70.1640625, -65.48828125, -60.8125, -56.13671875, -51.4609375, -46.78515625, -42.109375, -37.43359375, -32.7578125, -28.08203125, -23.40625, -18.73046875, -14.0546875, -9.37890625, -4.703125, -0.02734375, 4.6484375, 9.32421875, 14.0, 18.67578125, 23.3515625, 28.02734375, 32.703125, 37.37890625, 42.0546875, 46.73046875, 51.40625, 56.08203125, 60.7578125, 65.43359375, 70.109375, 74.78515625, 79.4609375, 84.13671875, 88.8125, 93.48828125, 98.1640625, 102.83984375, 107.515625, 112.19140625, 116.8671875, 121.54296875, 126.21875, 130.89453125, 135.5703125, 140.24609375, 144.921875, 149.59765625, 154.2734375, 158.94921875, 163.625]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 18.0, 192.0, 593.0, 202.0, 8.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-695.6502685546875, -681.0103759765625, -666.3705444335938, -651.7306518554688, -637.0907592773438, -622.450927734375, -607.81103515625, -593.171142578125, -578.53125, -563.891357421875, -549.2515258789062, -534.6116333007812, -519.9717407226562, -505.3318786621094, -490.6920166015625, -476.0521240234375, -461.41229248046875, -446.7724304199219, -432.1325378417969, -417.49267578125, -402.852783203125, -388.2129211425781, -373.57305908203125, -358.93316650390625, -344.2933044433594, -329.6534423828125, -315.0135498046875, -300.3736877441406, -285.73382568359375, -271.09393310546875, -256.4540710449219, -241.81419372558594, -227.17433166503906, -212.53445434570312, -197.89459228515625, -183.2547149658203, -168.61483764648438, -153.97496032714844, -139.3350830078125, -124.69522094726562, -110.05534362792969, -95.41546630859375, -80.77559661865234, -66.13572692871094, -51.495849609375, -36.85597229003906, -22.216102600097656, -7.57623291015625, 7.0636444091796875, 21.70351791381836, 36.34339141845703, 50.9832649230957, 65.62313842773438, 80.26301574707031, 94.90288543701172, 109.54275512695312, 124.18263244628906, 138.822509765625, 153.46237182617188, 168.1022491455078, 182.74212646484375, 197.3820037841797, 212.02188110351562, 226.6617431640625, 241.30162048339844]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 10.0, 6.0, 10.0, 14.0, 15.0, 20.0, 18.0, 16.0, 22.0, 16.0, 28.0, 21.0, 36.0, 40.0, 37.0, 46.0, 33.0, 44.0, 45.0, 46.0, 50.0, 47.0, 48.0, 47.0, 31.0, 35.0, 33.0, 29.0, 33.0, 22.0, 24.0, 18.0, 8.0, 13.0, 9.0, 9.0, 11.0, 6.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-123.20047760009766, -119.50052642822266, -115.80057525634766, -112.10062408447266, -108.40067291259766, -104.70072174072266, -101.00077056884766, -97.30081939697266, -93.60086822509766, -89.90091705322266, -86.20096588134766, -82.50101470947266, -78.80106353759766, -75.10111236572266, -71.40116119384766, -67.70121002197266, -64.00125885009766, -60.301307678222656, -56.601356506347656, -52.901405334472656, -49.201454162597656, -45.501502990722656, -41.801551818847656, -38.101600646972656, -34.401649475097656, -30.701698303222656, -27.001747131347656, -23.301795959472656, -19.601844787597656, -15.901893615722656, -12.201942443847656, -8.501991271972656, -4.8020477294921875, -1.1020965576171875, 2.5978546142578125, 6.2978057861328125, 9.997756958007812, 13.697708129882812, 17.397659301757812, 21.097610473632812, 24.797561645507812, 28.497512817382812, 32.19746398925781, 35.89741516113281, 39.59736633300781, 43.29731750488281, 46.99726867675781, 50.69721984863281, 54.39717102050781, 58.09712219238281, 61.79707336425781, 65.49702453613281, 69.19697570800781, 72.89692687988281, 76.59687805175781, 80.29682922363281, 83.99678039550781, 87.69673156738281, 91.39668273925781, 95.09663391113281, 98.79658508300781, 102.49653625488281, 106.19648742675781, 109.89643859863281, 113.59638977050781]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 5.0, 4.0, 6.0, 5.0, 9.0, 7.0, 12.0, 16.0, 17.0, 10.0, 30.0, 29.0, 29.0, 34.0, 30.0, 34.0, 46.0, 42.0, 47.0, 33.0, 33.0, 50.0, 37.0, 38.0, 40.0, 48.0, 34.0, 29.0, 46.0, 30.0, 26.0, 20.0, 22.0, 19.0, 13.0, 17.0, 14.0, 13.0, 13.0, 7.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.8125, -16.29443359375, -15.7763671875, -15.25830078125, -14.740234375, -14.22216796875, -13.7041015625, -13.18603515625, -12.66796875, -12.14990234375, -11.6318359375, -11.11376953125, -10.595703125, -10.07763671875, -9.5595703125, -9.04150390625, -8.5234375, -8.00537109375, -7.4873046875, -6.96923828125, -6.451171875, -5.93310546875, -5.4150390625, -4.89697265625, -4.37890625, -3.86083984375, -3.3427734375, -2.82470703125, -2.306640625, -1.78857421875, -1.2705078125, -0.75244140625, -0.234375, 0.28369140625, 0.8017578125, 1.31982421875, 1.837890625, 2.35595703125, 2.8740234375, 3.39208984375, 3.91015625, 4.42822265625, 4.9462890625, 5.46435546875, 5.982421875, 6.50048828125, 7.0185546875, 7.53662109375, 8.0546875, 8.57275390625, 9.0908203125, 9.60888671875, 10.126953125, 10.64501953125, 11.1630859375, 11.68115234375, 12.19921875, 12.71728515625, 13.2353515625, 13.75341796875, 14.271484375, 14.78955078125, 15.3076171875, 15.82568359375, 16.34375]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 3.0, 2.0, 0.0, 11.0, 12.0, 18.0, 18.0, 42.0, 36.0, 64.0, 103.0, 142.0, 196.0, 299.0, 432.0, 631.0, 883.0, 1341.0, 2003.0, 2974.0, 4455.0, 6890.0, 10937.0, 17342.0, 27411.0, 44719.0, 77015.0, 144386.0, 326866.0, 163517.0, 84826.0, 49118.0, 29424.0, 18435.0, 11716.0, 7526.0, 4890.0, 3240.0, 2112.0, 1498.0, 918.0, 669.0, 428.0, 324.0, 227.0, 136.0, 108.0, 63.0, 53.0, 32.0, 26.0, 17.0, 15.0, 8.0, 3.0, 3.0, 4.0, 0.0, 1.0, 2.0, 1.0], "bins": [-3.40234375, -3.29461669921875, -3.1868896484375, -3.07916259765625, -2.971435546875, -2.86370849609375, -2.7559814453125, -2.64825439453125, -2.54052734375, -2.43280029296875, -2.3250732421875, -2.21734619140625, -2.109619140625, -2.00189208984375, -1.8941650390625, -1.78643798828125, -1.6787109375, -1.57098388671875, -1.4632568359375, -1.35552978515625, -1.247802734375, -1.14007568359375, -1.0323486328125, -0.92462158203125, -0.81689453125, -0.70916748046875, -0.6014404296875, -0.49371337890625, -0.385986328125, -0.27825927734375, -0.1705322265625, -0.06280517578125, 0.044921875, 0.15264892578125, 0.2603759765625, 0.36810302734375, 0.475830078125, 0.58355712890625, 0.6912841796875, 0.79901123046875, 0.90673828125, 1.01446533203125, 1.1221923828125, 1.22991943359375, 1.337646484375, 1.44537353515625, 1.5531005859375, 1.66082763671875, 1.7685546875, 1.87628173828125, 1.9840087890625, 2.09173583984375, 2.199462890625, 2.30718994140625, 2.4149169921875, 2.52264404296875, 2.63037109375, 2.73809814453125, 2.8458251953125, 2.95355224609375, 3.061279296875, 3.16900634765625, 3.2767333984375, 3.38446044921875, 3.4921875]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 2.0, 5.0, 7.0, 8.0, 6.0, 5.0, 9.0, 9.0, 18.0, 24.0, 23.0, 21.0, 17.0, 24.0, 28.0, 39.0, 22.0, 28.0, 44.0, 46.0, 44.0, 49.0, 1060.0, 40.0, 42.0, 44.0, 41.0, 34.0, 28.0, 28.0, 25.0, 42.0, 36.0, 25.0, 18.0, 16.0, 15.0, 5.0, 9.0, 4.0, 8.0, 7.0, 12.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-10.2421875, -9.9300537109375, -9.617919921875, -9.3057861328125, -8.99365234375, -8.6815185546875, -8.369384765625, -8.0572509765625, -7.7451171875, -7.4329833984375, -7.120849609375, -6.8087158203125, -6.49658203125, -6.1844482421875, -5.872314453125, -5.5601806640625, -5.248046875, -4.9359130859375, -4.623779296875, -4.3116455078125, -3.99951171875, -3.6873779296875, -3.375244140625, -3.0631103515625, -2.7509765625, -2.4388427734375, -2.126708984375, -1.8145751953125, -1.50244140625, -1.1903076171875, -0.878173828125, -0.5660400390625, -0.25390625, 0.0582275390625, 0.370361328125, 0.6824951171875, 0.99462890625, 1.3067626953125, 1.618896484375, 1.9310302734375, 2.2431640625, 2.5552978515625, 2.867431640625, 3.1795654296875, 3.49169921875, 3.8038330078125, 4.115966796875, 4.4281005859375, 4.740234375, 5.0523681640625, 5.364501953125, 5.6766357421875, 5.98876953125, 6.3009033203125, 6.613037109375, 6.9251708984375, 7.2373046875, 7.5494384765625, 7.861572265625, 8.1737060546875, 8.48583984375, 8.7979736328125, 9.110107421875, 9.4222412109375, 9.734375]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 3.0, 9.0, 13.0, 17.0, 25.0, 44.0, 55.0, 92.0, 143.0, 176.0, 258.0, 389.0, 551.0, 754.0, 1035.0, 1522.0, 2249.0, 3127.0, 4655.0, 6647.0, 9794.0, 14773.0, 22234.0, 33857.0, 53286.0, 90228.0, 179861.0, 1339944.0, 130153.0, 71667.0, 43739.0, 27989.0, 18696.0, 12443.0, 8289.0, 5643.0, 3795.0, 2649.0, 1913.0, 1312.0, 940.0, 671.0, 472.0, 309.0, 235.0, 146.0, 103.0, 75.0, 60.0, 35.0, 21.0, 15.0, 12.0, 11.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-2.96484375, -2.870086669921875, -2.77532958984375, -2.680572509765625, -2.5858154296875, -2.491058349609375, -2.39630126953125, -2.301544189453125, -2.206787109375, -2.112030029296875, -2.01727294921875, -1.922515869140625, -1.8277587890625, -1.733001708984375, -1.63824462890625, -1.543487548828125, -1.44873046875, -1.353973388671875, -1.25921630859375, -1.164459228515625, -1.0697021484375, -0.974945068359375, -0.88018798828125, -0.785430908203125, -0.690673828125, -0.595916748046875, -0.50115966796875, -0.406402587890625, -0.3116455078125, -0.216888427734375, -0.12213134765625, -0.027374267578125, 0.0673828125, 0.162139892578125, 0.25689697265625, 0.351654052734375, 0.4464111328125, 0.541168212890625, 0.63592529296875, 0.730682373046875, 0.825439453125, 0.920196533203125, 1.01495361328125, 1.109710693359375, 1.2044677734375, 1.299224853515625, 1.39398193359375, 1.488739013671875, 1.58349609375, 1.678253173828125, 1.77301025390625, 1.867767333984375, 1.9625244140625, 2.057281494140625, 2.15203857421875, 2.246795654296875, 2.341552734375, 2.436309814453125, 2.53106689453125, 2.625823974609375, 2.7205810546875, 2.815338134765625, 2.91009521484375, 3.004852294921875, 3.099609375]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 7.0, 2.0, 5.0, 5.0, 4.0, 13.0, 12.0, 16.0, 11.0, 20.0, 31.0, 51.0, 61.0, 68.0, 105.0, 106.0, 105.0, 93.0, 54.0, 56.0, 35.0, 29.0, 18.0, 18.0, 14.0, 19.0, 9.0, 6.0, 10.0, 3.0, 4.0, 5.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030059814453125, -0.002906113862991333, -0.002806246280670166, -0.002706378698348999, -0.002606511116027832, -0.002506643533706665, -0.002406775951385498, -0.002306908369064331, -0.002207040786743164, -0.002107173204421997, -0.00200730562210083, -0.001907438039779663, -0.001807570457458496, -0.001707702875137329, -0.0016078352928161621, -0.0015079677104949951, -0.0014081001281738281, -0.0013082325458526611, -0.0012083649635314941, -0.0011084973812103271, -0.0010086297988891602, -0.0009087622165679932, -0.0008088946342468262, -0.0007090270519256592, -0.0006091594696044922, -0.0005092918872833252, -0.0004094243049621582, -0.0003095567226409912, -0.00020968914031982422, -0.00010982155799865723, -9.953975677490234e-06, 8.991360664367676e-05, 0.00018978118896484375, 0.00028964877128601074, 0.00038951635360717773, 0.0004893839359283447, 0.0005892515182495117, 0.0006891191005706787, 0.0007889866828918457, 0.0008888542652130127, 0.0009887218475341797, 0.0010885894298553467, 0.0011884570121765137, 0.0012883245944976807, 0.0013881921768188477, 0.0014880597591400146, 0.0015879273414611816, 0.0016877949237823486, 0.0017876625061035156, 0.0018875300884246826, 0.0019873976707458496, 0.0020872652530670166, 0.0021871328353881836, 0.0022870004177093506, 0.0023868680000305176, 0.0024867355823516846, 0.0025866031646728516, 0.0026864707469940186, 0.0027863383293151855, 0.0028862059116363525, 0.0029860734939575195, 0.0030859410762786865, 0.0031858086585998535, 0.0032856762409210205, 0.0033855438232421875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 2.0, 4.0, 5.0, 2.0, 8.0, 12.0, 13.0, 21.0, 21.0, 23.0, 36.0, 64.0, 94.0, 185.0, 713.0, 1021963.0, 24435.0, 501.0, 169.0, 97.0, 56.0, 32.0, 18.0, 23.0, 13.0, 12.0, 11.0, 4.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0943603515625, -0.09157371520996094, -0.08878707885742188, -0.08600044250488281, -0.08321380615234375, -0.08042716979980469, -0.07764053344726562, -0.07485389709472656, -0.0720672607421875, -0.06928062438964844, -0.06649398803710938, -0.06370735168457031, -0.06092071533203125, -0.05813407897949219, -0.055347442626953125, -0.05256080627441406, -0.049774169921875, -0.04698753356933594, -0.044200897216796875, -0.04141426086425781, -0.03862762451171875, -0.03584098815917969, -0.033054351806640625, -0.030267715454101562, -0.0274810791015625, -0.024694442749023438, -0.021907806396484375, -0.019121170043945312, -0.01633453369140625, -0.013547897338867188, -0.010761260986328125, -0.007974624633789062, -0.00518798828125, -0.0024013519287109375, 0.000385284423828125, 0.0031719207763671875, 0.00595855712890625, 0.008745193481445312, 0.011531829833984375, 0.014318466186523438, 0.0171051025390625, 0.019891738891601562, 0.022678375244140625, 0.025465011596679688, 0.02825164794921875, 0.031038284301757812, 0.033824920654296875, 0.03661155700683594, 0.039398193359375, 0.04218482971191406, 0.044971466064453125, 0.04775810241699219, 0.05054473876953125, 0.05333137512207031, 0.056118011474609375, 0.05890464782714844, 0.0616912841796875, 0.06447792053222656, 0.06726455688476562, 0.07005119323730469, 0.07283782958984375, 0.07562446594238281, 0.07841110229492188, 0.08119773864746094, 0.083984375]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 13.0, 276.0, 614.0, 105.0, 8.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00866528507322073, -0.008485988713800907, -0.00830669142305851, -0.008127395063638687, -0.007948098704218864, -0.0077688018791377544, -0.007589505519717932, -0.007410208694636822, -0.007230912335216999, -0.007051615510135889, -0.006872319150716066, -0.006693022325634956, -0.006513725966215134, -0.006334429141134024, -0.006155132781714201, -0.005975835956633091, -0.005796539597213268, -0.005617242772132158, -0.005437946412712336, -0.005258649587631226, -0.005079353228211403, -0.004900056403130293, -0.00472076004371047, -0.00454146321862936, -0.00436216639354825, -0.00418286956846714, -0.0040035732090473175, -0.003824276616796851, -0.003644980024546385, -0.0034656834322959185, -0.003286386840045452, -0.003107090014964342, -0.0029277936555445194, -0.002748497063294053, -0.0025692004710435867, -0.0023899038787931204, -0.002210607286542654, -0.0020313106942921877, -0.0018520139856263995, -0.0016727173933759332, -0.0014934208011254668, -0.0013141242088750005, -0.0011348276166245341, -0.0009555309661664069, -0.0007762343739159405, -0.0005969377816654742, -0.0004176411312073469, -0.00023834453895688057, -5.904794670641422e-05, 0.00012024866009596735, 0.00029954526689834893, 0.00047884188825264573, 0.0006581384805031121, 0.0008374350727535784, 0.0010167317232117057, 0.001196028315462172, 0.0013753249077126384, 0.0015546214999631047, 0.001733918092213571, 0.0019132148008793592, 0.0020925113931298256, 0.002271807985380292, 0.0024511045776307583, 0.0026304011698812246, 0.002809697762131691]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 5.0, 1.0, 4.0, 8.0, 3.0, 14.0, 16.0, 11.0, 21.0, 30.0, 28.0, 26.0, 43.0, 28.0, 39.0, 36.0, 50.0, 50.0, 43.0, 46.0, 29.0, 45.0, 35.0, 34.0, 39.0, 52.0, 42.0, 24.0, 32.0, 35.0, 23.0, 24.0, 14.0, 12.0, 13.0, 13.0, 12.0, 10.0, 2.0, 5.0, 5.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014861822128295898, -0.0014415578916668892, -0.0013969335705041885, -0.0013523092493414879, -0.0013076849281787872, -0.0012630606070160866, -0.001218436285853386, -0.0011738119646906853, -0.0011291876435279846, -0.001084563322365284, -0.0010399390012025833, -0.0009953146800398827, -0.000950690358877182, -0.0009060660377144814, -0.0008614417165517807, -0.00081681739538908, -0.0007721930742263794, -0.0007275687530636787, -0.0006829444319009781, -0.0006383201107382774, -0.0005936957895755768, -0.0005490714684128761, -0.0005044471472501755, -0.0004598228260874748, -0.00041519850492477417, -0.0003705741837620735, -0.00032594986259937286, -0.0002813255414366722, -0.00023670122027397156, -0.0001920768991112709, -0.00014745257794857025, -0.0001028282567858696, -5.8203935623168945e-05, -1.3579614460468292e-05, 3.104470670223236e-05, 7.566902786493301e-05, 0.00012029334902763367, 0.00016491767019033432, 0.00020954199135303497, 0.0002541663125157356, 0.0002987906336784363, 0.00034341495484113693, 0.0003880392760038376, 0.00043266359716653824, 0.0004772879183292389, 0.0005219122394919395, 0.0005665365606546402, 0.0006111608818173409, 0.0006557852029800415, 0.0007004095241427422, 0.0007450338453054428, 0.0007896581664681435, 0.0008342824876308441, 0.0008789068087935448, 0.0009235311299562454, 0.0009681554511189461, 0.0010127797722816467, 0.0010574040934443474, 0.001102028414607048, 0.0011466527357697487, 0.0011912770569324493, 0.00123590137809515, 0.0012805256992578506, 0.0013251500204205513, 0.001369774341583252]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 0.0, 5.0, 4.0, 6.0, 5.0, 9.0, 7.0, 12.0, 16.0, 17.0, 10.0, 30.0, 29.0, 29.0, 34.0, 30.0, 34.0, 46.0, 42.0, 47.0, 33.0, 33.0, 50.0, 37.0, 38.0, 40.0, 48.0, 34.0, 29.0, 46.0, 30.0, 26.0, 20.0, 22.0, 19.0, 13.0, 17.0, 14.0, 13.0, 12.0, 8.0, 2.0, 5.0, 2.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.8125, -16.29443359375, -15.7763671875, -15.25830078125, -14.740234375, -14.22216796875, -13.7041015625, -13.18603515625, -12.66796875, -12.14990234375, -11.6318359375, -11.11376953125, -10.595703125, -10.07763671875, -9.5595703125, -9.04150390625, -8.5234375, -8.00537109375, -7.4873046875, -6.96923828125, -6.451171875, -5.93310546875, -5.4150390625, -4.89697265625, -4.37890625, -3.86083984375, -3.3427734375, -2.82470703125, -2.306640625, -1.78857421875, -1.2705078125, -0.75244140625, -0.234375, 0.28369140625, 0.8017578125, 1.31982421875, 1.837890625, 2.35595703125, 2.8740234375, 3.39208984375, 3.91015625, 4.42822265625, 4.9462890625, 5.46435546875, 5.982421875, 6.50048828125, 7.0185546875, 7.53662109375, 8.0546875, 8.57275390625, 9.0908203125, 9.60888671875, 10.126953125, 10.64501953125, 11.1630859375, 11.68115234375, 12.19921875, 12.71728515625, 13.2353515625, 13.75341796875, 14.271484375, 14.78955078125, 15.3076171875, 15.82568359375, 16.34375]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 7.0, 1.0, 4.0, 8.0, 10.0, 10.0, 8.0, 18.0, 17.0, 24.0, 28.0, 29.0, 68.0, 122.0, 185.0, 357.0, 710.0, 1521.0, 3493.0, 8606.0, 21505.0, 57832.0, 177042.0, 440536.0, 222716.0, 70164.0, 25704.0, 10100.0, 4185.0, 1781.0, 828.0, 369.0, 200.0, 103.0, 62.0, 56.0, 32.0, 32.0, 30.0, 18.0, 13.0, 10.0, 5.0, 3.0, 8.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.1796875, -13.74462890625, -13.3095703125, -12.87451171875, -12.439453125, -12.00439453125, -11.5693359375, -11.13427734375, -10.69921875, -10.26416015625, -9.8291015625, -9.39404296875, -8.958984375, -8.52392578125, -8.0888671875, -7.65380859375, -7.21875, -6.78369140625, -6.3486328125, -5.91357421875, -5.478515625, -5.04345703125, -4.6083984375, -4.17333984375, -3.73828125, -3.30322265625, -2.8681640625, -2.43310546875, -1.998046875, -1.56298828125, -1.1279296875, -0.69287109375, -0.2578125, 0.17724609375, 0.6123046875, 1.04736328125, 1.482421875, 1.91748046875, 2.3525390625, 2.78759765625, 3.22265625, 3.65771484375, 4.0927734375, 4.52783203125, 4.962890625, 5.39794921875, 5.8330078125, 6.26806640625, 6.703125, 7.13818359375, 7.5732421875, 8.00830078125, 8.443359375, 8.87841796875, 9.3134765625, 9.74853515625, 10.18359375, 10.61865234375, 11.0537109375, 11.48876953125, 11.923828125, 12.35888671875, 12.7939453125, 13.22900390625, 13.6640625]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 4.0, 9.0, 2.0, 7.0, 8.0, 10.0, 7.0, 11.0, 11.0, 20.0, 21.0, 22.0, 31.0, 24.0, 22.0, 27.0, 35.0, 45.0, 43.0, 50.0, 81.0, 354.0, 1646.0, 118.0, 51.0, 38.0, 44.0, 28.0, 45.0, 30.0, 29.0, 29.0, 22.0, 26.0, 17.0, 16.0, 14.0, 9.0, 10.0, 7.0, 7.0, 6.0, 5.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 3.0], "bins": [-56.1875, -54.6357421875, -53.083984375, -51.5322265625, -49.98046875, -48.4287109375, -46.876953125, -45.3251953125, -43.7734375, -42.2216796875, -40.669921875, -39.1181640625, -37.56640625, -36.0146484375, -34.462890625, -32.9111328125, -31.359375, -29.8076171875, -28.255859375, -26.7041015625, -25.15234375, -23.6005859375, -22.048828125, -20.4970703125, -18.9453125, -17.3935546875, -15.841796875, -14.2900390625, -12.73828125, -11.1865234375, -9.634765625, -8.0830078125, -6.53125, -4.9794921875, -3.427734375, -1.8759765625, -0.32421875, 1.2275390625, 2.779296875, 4.3310546875, 5.8828125, 7.4345703125, 8.986328125, 10.5380859375, 12.08984375, 13.6416015625, 15.193359375, 16.7451171875, 18.296875, 19.8486328125, 21.400390625, 22.9521484375, 24.50390625, 26.0556640625, 27.607421875, 29.1591796875, 30.7109375, 32.2626953125, 33.814453125, 35.3662109375, 36.91796875, 38.4697265625, 40.021484375, 41.5732421875, 43.125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 3.0, 7.0, 6.0, 7.0, 4.0, 9.0, 13.0, 15.0, 18.0, 37.0, 27.0, 53.0, 56.0, 70.0, 110.0, 129.0, 185.0, 253.0, 439.0, 1002.0, 15709.0, 3075453.0, 49127.0, 1453.0, 485.0, 288.0, 188.0, 147.0, 81.0, 60.0, 68.0, 57.0, 32.0, 29.0, 19.0, 14.0, 15.0, 10.0, 7.0, 6.0, 6.0, 7.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-88.3125, -85.5185546875, -82.724609375, -79.9306640625, -77.13671875, -74.3427734375, -71.548828125, -68.7548828125, -65.9609375, -63.1669921875, -60.373046875, -57.5791015625, -54.78515625, -51.9912109375, -49.197265625, -46.4033203125, -43.609375, -40.8154296875, -38.021484375, -35.2275390625, -32.43359375, -29.6396484375, -26.845703125, -24.0517578125, -21.2578125, -18.4638671875, -15.669921875, -12.8759765625, -10.08203125, -7.2880859375, -4.494140625, -1.7001953125, 1.09375, 3.8876953125, 6.681640625, 9.4755859375, 12.26953125, 15.0634765625, 17.857421875, 20.6513671875, 23.4453125, 26.2392578125, 29.033203125, 31.8271484375, 34.62109375, 37.4150390625, 40.208984375, 43.0029296875, 45.796875, 48.5908203125, 51.384765625, 54.1787109375, 56.97265625, 59.7666015625, 62.560546875, 65.3544921875, 68.1484375, 70.9423828125, 73.736328125, 76.5302734375, 79.32421875, 82.1181640625, 84.912109375, 87.7060546875, 90.5]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [2.0, 4.0, 197.0, 629.0, 180.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.44273567199707, -17.408714294433594, -10.374692916870117, -3.3406715393066406, 3.693349838256836, 10.72736930847168, 17.76139259338379, 24.7954158782959, 31.829435348510742, 38.86345672607422, 45.89747619628906, 52.93149948120117, 59.96552276611328, 66.99954223632812, 74.03356170654297, 81.06758880615234, 88.10160827636719, 95.13562774658203, 102.16964721679688, 109.20367431640625, 116.2376937866211, 123.27171325683594, 130.3057403564453, 137.33975219726562, 144.373779296875, 151.40780639648438, 158.4418182373047, 165.47584533691406, 172.50985717773438, 179.54388427734375, 186.57791137695312, 193.6119384765625, 200.64593505859375, 207.67996215820312, 214.71397399902344, 221.7480010986328, 228.78201293945312, 235.8160400390625, 242.85006713867188, 249.88409423828125, 256.9180908203125, 263.9521179199219, 270.98614501953125, 278.0201416015625, 285.0541687011719, 292.08819580078125, 299.1222229003906, 306.15625, 313.1902770996094, 320.22430419921875, 327.2583312988281, 334.2923278808594, 341.32635498046875, 348.3603820800781, 355.3944091796875, 362.4284362792969, 369.46246337890625, 376.4964904785156, 383.530517578125, 390.56451416015625, 397.5985412597656, 404.632568359375, 411.6665954589844, 418.70062255859375, 425.734619140625]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 8.0, 6.0, 10.0, 8.0, 9.0, 12.0, 17.0, 24.0, 29.0, 30.0, 25.0, 38.0, 38.0, 43.0, 47.0, 54.0, 58.0, 51.0, 55.0, 44.0, 60.0, 32.0, 50.0, 44.0, 40.0, 33.0, 19.0, 18.0, 17.0, 16.0, 13.0, 13.0, 17.0, 7.0, 5.0, 5.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-157.65243530273438, -153.06541442871094, -148.47837829589844, -143.891357421875, -139.3043212890625, -134.71730041503906, -130.13027954101562, -125.54325103759766, -120.95622253417969, -116.36919403076172, -111.78216552734375, -107.19514465332031, -102.60811614990234, -98.02108764648438, -93.43406677246094, -88.84703826904297, -84.260009765625, -79.67298126220703, -75.08595275878906, -70.49893188476562, -65.91190338134766, -61.32487487792969, -56.737850189208984, -52.15082550048828, -47.56379699707031, -42.976768493652344, -38.38974380493164, -33.80271911621094, -29.21569061279297, -24.628664016723633, -20.041637420654297, -15.454612731933594, -10.867584228515625, -6.280557632446289, -1.6935310363769531, 2.893495559692383, 7.480522155761719, 12.067548751831055, 16.65457534790039, 21.241600036621094, 25.828628540039062, 30.4156551361084, 35.002681732177734, 39.58970642089844, 44.176734924316406, 48.763763427734375, 53.35078811645508, 57.93781280517578, 62.52484130859375, 67.11186981201172, 71.69889831542969, 76.28591918945312, 80.8729476928711, 85.45997619628906, 90.0469970703125, 94.63402557373047, 99.22105407714844, 103.8080825805664, 108.39511108398438, 112.98213195800781, 117.56916046142578, 122.15618896484375, 126.74320983886719, 131.33023071289062, 135.91726684570312]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 5.0, 11.0, 8.0, 9.0, 14.0, 16.0, 15.0, 21.0, 23.0, 33.0, 28.0, 31.0, 35.0, 48.0, 41.0, 31.0, 50.0, 31.0, 48.0, 40.0, 36.0, 42.0, 39.0, 46.0, 35.0, 36.0, 36.0, 36.0, 20.0, 23.0, 14.0, 15.0, 14.0, 15.0, 13.0, 14.0, 7.0, 5.0, 9.0, 2.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.140625, -16.6044921875, -16.068359375, -15.5322265625, -14.99609375, -14.4599609375, -13.923828125, -13.3876953125, -12.8515625, -12.3154296875, -11.779296875, -11.2431640625, -10.70703125, -10.1708984375, -9.634765625, -9.0986328125, -8.5625, -8.0263671875, -7.490234375, -6.9541015625, -6.41796875, -5.8818359375, -5.345703125, -4.8095703125, -4.2734375, -3.7373046875, -3.201171875, -2.6650390625, -2.12890625, -1.5927734375, -1.056640625, -0.5205078125, 0.015625, 0.5517578125, 1.087890625, 1.6240234375, 2.16015625, 2.6962890625, 3.232421875, 3.7685546875, 4.3046875, 4.8408203125, 5.376953125, 5.9130859375, 6.44921875, 6.9853515625, 7.521484375, 8.0576171875, 8.59375, 9.1298828125, 9.666015625, 10.2021484375, 10.73828125, 11.2744140625, 11.810546875, 12.3466796875, 12.8828125, 13.4189453125, 13.955078125, 14.4912109375, 15.02734375, 15.5634765625, 16.099609375, 16.6357421875, 17.171875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 6.0, 3.0, 6.0, 5.0, 5.0, 6.0, 10.0, 9.0, 16.0, 15.0, 17.0, 35.0, 40.0, 45.0, 54.0, 56.0, 67.0, 90.0, 147.0, 395.0, 1258.0, 12134.0, 1088410.0, 3038372.0, 49555.0, 2253.0, 535.0, 205.0, 137.0, 77.0, 58.0, 54.0, 45.0, 29.0, 27.0, 27.0, 16.0, 10.0, 11.0, 10.0, 8.0, 10.0, 5.0, 7.0, 5.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-58.0, -56.1396484375, -54.279296875, -52.4189453125, -50.55859375, -48.6982421875, -46.837890625, -44.9775390625, -43.1171875, -41.2568359375, -39.396484375, -37.5361328125, -35.67578125, -33.8154296875, -31.955078125, -30.0947265625, -28.234375, -26.3740234375, -24.513671875, -22.6533203125, -20.79296875, -18.9326171875, -17.072265625, -15.2119140625, -13.3515625, -11.4912109375, -9.630859375, -7.7705078125, -5.91015625, -4.0498046875, -2.189453125, -0.3291015625, 1.53125, 3.3916015625, 5.251953125, 7.1123046875, 8.97265625, 10.8330078125, 12.693359375, 14.5537109375, 16.4140625, 18.2744140625, 20.134765625, 21.9951171875, 23.85546875, 25.7158203125, 27.576171875, 29.4365234375, 31.296875, 33.1572265625, 35.017578125, 36.8779296875, 38.73828125, 40.5986328125, 42.458984375, 44.3193359375, 46.1796875, 48.0400390625, 49.900390625, 51.7607421875, 53.62109375, 55.4814453125, 57.341796875, 59.2021484375, 61.0625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 3.0, 8.0, 2.0, 6.0, 10.0, 15.0, 17.0, 20.0, 36.0, 26.0, 37.0, 52.0, 68.0, 68.0, 111.0, 135.0, 182.0, 277.0, 380.0, 408.0, 478.0, 452.0, 323.0, 237.0, 165.0, 126.0, 110.0, 84.0, 47.0, 39.0, 32.0, 25.0, 24.0, 27.0, 8.0, 6.0, 8.0, 0.0, 3.0, 8.0, 3.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-27.453125, -26.62939453125, -25.8056640625, -24.98193359375, -24.158203125, -23.33447265625, -22.5107421875, -21.68701171875, -20.86328125, -20.03955078125, -19.2158203125, -18.39208984375, -17.568359375, -16.74462890625, -15.9208984375, -15.09716796875, -14.2734375, -13.44970703125, -12.6259765625, -11.80224609375, -10.978515625, -10.15478515625, -9.3310546875, -8.50732421875, -7.68359375, -6.85986328125, -6.0361328125, -5.21240234375, -4.388671875, -3.56494140625, -2.7412109375, -1.91748046875, -1.09375, -0.27001953125, 0.5537109375, 1.37744140625, 2.201171875, 3.02490234375, 3.8486328125, 4.67236328125, 5.49609375, 6.31982421875, 7.1435546875, 7.96728515625, 8.791015625, 9.61474609375, 10.4384765625, 11.26220703125, 12.0859375, 12.90966796875, 13.7333984375, 14.55712890625, 15.380859375, 16.20458984375, 17.0283203125, 17.85205078125, 18.67578125, 19.49951171875, 20.3232421875, 21.14697265625, 21.970703125, 22.79443359375, 23.6181640625, 24.44189453125, 25.265625]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 7.0, 8.0, 8.0, 14.0, 11.0, 17.0, 22.0, 33.0, 55.0, 71.0, 92.0, 119.0, 165.0, 239.0, 341.0, 742.0, 9495.0, 4173600.0, 7315.0, 697.0, 335.0, 231.0, 145.0, 110.0, 108.0, 71.0, 63.0, 37.0, 24.0, 23.0, 19.0, 11.0, 12.0, 16.0, 5.0, 4.0, 7.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-219.75, -213.185546875, -206.62109375, -200.056640625, -193.4921875, -186.927734375, -180.36328125, -173.798828125, -167.234375, -160.669921875, -154.10546875, -147.541015625, -140.9765625, -134.412109375, -127.84765625, -121.283203125, -114.71875, -108.154296875, -101.58984375, -95.025390625, -88.4609375, -81.896484375, -75.33203125, -68.767578125, -62.203125, -55.638671875, -49.07421875, -42.509765625, -35.9453125, -29.380859375, -22.81640625, -16.251953125, -9.6875, -3.123046875, 3.44140625, 10.005859375, 16.5703125, 23.134765625, 29.69921875, 36.263671875, 42.828125, 49.392578125, 55.95703125, 62.521484375, 69.0859375, 75.650390625, 82.21484375, 88.779296875, 95.34375, 101.908203125, 108.47265625, 115.037109375, 121.6015625, 128.166015625, 134.73046875, 141.294921875, 147.859375, 154.423828125, 160.98828125, 167.552734375, 174.1171875, 180.681640625, 187.24609375, 193.810546875, 200.375]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 185.0, 575.0, 226.0, 27.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-354.30059814453125, -341.4563903808594, -328.6121826171875, -315.7679748535156, -302.92376708984375, -290.0795593261719, -277.2353515625, -264.39117431640625, -251.5469512939453, -238.70274353027344, -225.85853576660156, -213.01434326171875, -200.17013549804688, -187.325927734375, -174.48171997070312, -161.63751220703125, -148.79330444335938, -135.9490966796875, -123.10488891601562, -110.26068878173828, -97.4164810180664, -84.57227325439453, -71.72807312011719, -58.88386535644531, -46.03965759277344, -33.19544982910156, -20.351245880126953, -7.507041931152344, 5.337165832519531, 18.181373596191406, 31.02557373046875, 43.869781494140625, 56.7139892578125, 69.55819702148438, 82.40240478515625, 95.2466049194336, 108.09081268310547, 120.93502044677734, 133.7792205810547, 146.62342834472656, 159.46763610839844, 172.3118438720703, 185.1560516357422, 198.000244140625, 210.84445190429688, 223.68865966796875, 236.53286743164062, 249.3770751953125, 262.2212829589844, 275.06549072265625, 287.9096984863281, 300.75390625, 313.5981140136719, 326.44232177734375, 339.2864990234375, 352.1307373046875, 364.97491455078125, 377.8191223144531, 390.663330078125, 403.5075378417969, 416.35174560546875, 429.1959533691406, 442.0401611328125, 454.88433837890625, 467.72857666015625]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 1.0, 6.0, 3.0, 4.0, 6.0, 5.0, 10.0, 12.0, 15.0, 16.0, 16.0, 30.0, 29.0, 28.0, 48.0, 31.0, 34.0, 46.0, 51.0, 49.0, 42.0, 56.0, 34.0, 41.0, 39.0, 35.0, 39.0, 46.0, 38.0, 24.0, 24.0, 23.0, 30.0, 21.0, 19.0, 9.0, 15.0, 11.0, 4.0, 4.0, 9.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-117.321044921875, -113.70855712890625, -110.0960693359375, -106.48357391357422, -102.87108612060547, -99.25859832763672, -95.64610290527344, -92.03361511230469, -88.42112731933594, -84.80863952636719, -81.19615173339844, -77.58365631103516, -73.9711685180664, -70.35868072509766, -66.74618530273438, -63.133697509765625, -59.521209716796875, -55.908721923828125, -52.29623031616211, -48.683738708496094, -45.071250915527344, -41.458763122558594, -37.84627151489258, -34.23377990722656, -30.621292114257812, -27.00880241394043, -23.396312713623047, -19.783823013305664, -16.17133331298828, -12.558843612670898, -8.946353912353516, -5.333864212036133, -1.72137451171875, 1.8911151885986328, 5.503604888916016, 9.116094589233398, 12.728584289550781, 16.341073989868164, 19.953563690185547, 23.56605339050293, 27.178543090820312, 30.791032791137695, 34.40352249145508, 38.016014099121094, 41.628501892089844, 45.240989685058594, 48.85348129272461, 52.465972900390625, 56.078460693359375, 59.690948486328125, 63.30344009399414, 66.91593170166016, 70.5284194946289, 74.14090728759766, 77.75340270996094, 81.36589050292969, 84.97837829589844, 88.59086608886719, 92.20335388183594, 95.81584930419922, 99.42833709716797, 103.04082489013672, 106.6533203125, 110.26580810546875, 113.8782958984375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 11.0, 6.0, 13.0, 13.0, 10.0, 17.0, 21.0, 18.0, 23.0, 23.0, 34.0, 33.0, 42.0, 37.0, 35.0, 30.0, 32.0, 51.0, 48.0, 40.0, 34.0, 36.0, 44.0, 44.0, 38.0, 33.0, 23.0, 21.0, 30.0, 27.0, 25.0, 13.0, 14.0, 16.0, 11.0, 9.0, 10.0, 8.0, 7.0, 6.0, 7.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.546875, -16.0458984375, -15.544921875, -15.0439453125, -14.54296875, -14.0419921875, -13.541015625, -13.0400390625, -12.5390625, -12.0380859375, -11.537109375, -11.0361328125, -10.53515625, -10.0341796875, -9.533203125, -9.0322265625, -8.53125, -8.0302734375, -7.529296875, -7.0283203125, -6.52734375, -6.0263671875, -5.525390625, -5.0244140625, -4.5234375, -4.0224609375, -3.521484375, -3.0205078125, -2.51953125, -2.0185546875, -1.517578125, -1.0166015625, -0.515625, -0.0146484375, 0.486328125, 0.9873046875, 1.48828125, 1.9892578125, 2.490234375, 2.9912109375, 3.4921875, 3.9931640625, 4.494140625, 4.9951171875, 5.49609375, 5.9970703125, 6.498046875, 6.9990234375, 7.5, 8.0009765625, 8.501953125, 9.0029296875, 9.50390625, 10.0048828125, 10.505859375, 11.0068359375, 11.5078125, 12.0087890625, 12.509765625, 13.0107421875, 13.51171875, 14.0126953125, 14.513671875, 15.0146484375, 15.515625]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 3.0, 3.0, 13.0, 19.0, 18.0, 31.0, 41.0, 61.0, 98.0, 111.0, 161.0, 263.0, 359.0, 548.0, 797.0, 1133.0, 1713.0, 2445.0, 3577.0, 5437.0, 7941.0, 11955.0, 18022.0, 27633.0, 42781.0, 69018.0, 120856.0, 297951.0, 185528.0, 92205.0, 54982.0, 34595.0, 22583.0, 14898.0, 9970.0, 6709.0, 4450.0, 3003.0, 2093.0, 1466.0, 984.0, 664.0, 475.0, 315.0, 187.0, 146.0, 108.0, 59.0, 54.0, 28.0, 23.0, 16.0, 13.0, 10.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0], "bins": [-3.125, -3.0234375, -2.921875, -2.8203125, -2.71875, -2.6171875, -2.515625, -2.4140625, -2.3125, -2.2109375, -2.109375, -2.0078125, -1.90625, -1.8046875, -1.703125, -1.6015625, -1.5, -1.3984375, -1.296875, -1.1953125, -1.09375, -0.9921875, -0.890625, -0.7890625, -0.6875, -0.5859375, -0.484375, -0.3828125, -0.28125, -0.1796875, -0.078125, 0.0234375, 0.125, 0.2265625, 0.328125, 0.4296875, 0.53125, 0.6328125, 0.734375, 0.8359375, 0.9375, 1.0390625, 1.140625, 1.2421875, 1.34375, 1.4453125, 1.546875, 1.6484375, 1.75, 1.8515625, 1.953125, 2.0546875, 2.15625, 2.2578125, 2.359375, 2.4609375, 2.5625, 2.6640625, 2.765625, 2.8671875, 2.96875, 3.0703125, 3.171875, 3.2734375, 3.375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 5.0, 6.0, 3.0, 6.0, 7.0, 8.0, 9.0, 8.0, 19.0, 14.0, 16.0, 10.0, 26.0, 33.0, 31.0, 32.0, 41.0, 34.0, 35.0, 30.0, 43.0, 45.0, 1056.0, 45.0, 47.0, 47.0, 43.0, 28.0, 35.0, 37.0, 30.0, 27.0, 25.0, 30.0, 22.0, 16.0, 9.0, 13.0, 15.0, 6.0, 10.0, 9.0, 6.0, 3.0, 4.0, 2.0, 2.0, 6.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-10.1875, -9.8668212890625, -9.546142578125, -9.2254638671875, -8.90478515625, -8.5841064453125, -8.263427734375, -7.9427490234375, -7.6220703125, -7.3013916015625, -6.980712890625, -6.6600341796875, -6.33935546875, -6.0186767578125, -5.697998046875, -5.3773193359375, -5.056640625, -4.7359619140625, -4.415283203125, -4.0946044921875, -3.77392578125, -3.4532470703125, -3.132568359375, -2.8118896484375, -2.4912109375, -2.1705322265625, -1.849853515625, -1.5291748046875, -1.20849609375, -0.8878173828125, -0.567138671875, -0.2464599609375, 0.07421875, 0.3948974609375, 0.715576171875, 1.0362548828125, 1.35693359375, 1.6776123046875, 1.998291015625, 2.3189697265625, 2.6396484375, 2.9603271484375, 3.281005859375, 3.6016845703125, 3.92236328125, 4.2430419921875, 4.563720703125, 4.8843994140625, 5.205078125, 5.5257568359375, 5.846435546875, 6.1671142578125, 6.48779296875, 6.8084716796875, 7.129150390625, 7.4498291015625, 7.7705078125, 8.0911865234375, 8.411865234375, 8.7325439453125, 9.05322265625, 9.3739013671875, 9.694580078125, 10.0152587890625, 10.3359375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 19.0, 18.0, 18.0, 36.0, 62.0, 96.0, 123.0, 154.0, 240.0, 416.0, 495.0, 709.0, 1134.0, 1538.0, 2144.0, 3207.0, 4456.0, 6664.0, 9518.0, 14716.0, 22148.0, 34587.0, 54920.0, 92597.0, 184540.0, 1335566.0, 127505.0, 71426.0, 43835.0, 28050.0, 18122.0, 11876.0, 8093.0, 5637.0, 3740.0, 2634.0, 1918.0, 1170.0, 950.0, 659.0, 430.0, 280.0, 242.0, 159.0, 85.0, 66.0, 48.0, 34.0, 22.0, 11.0, 10.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-3.154296875, -3.0565185546875, -2.958740234375, -2.8609619140625, -2.76318359375, -2.6654052734375, -2.567626953125, -2.4698486328125, -2.3720703125, -2.2742919921875, -2.176513671875, -2.0787353515625, -1.98095703125, -1.8831787109375, -1.785400390625, -1.6876220703125, -1.58984375, -1.4920654296875, -1.394287109375, -1.2965087890625, -1.19873046875, -1.1009521484375, -1.003173828125, -0.9053955078125, -0.8076171875, -0.7098388671875, -0.612060546875, -0.5142822265625, -0.41650390625, -0.3187255859375, -0.220947265625, -0.1231689453125, -0.025390625, 0.0723876953125, 0.170166015625, 0.2679443359375, 0.36572265625, 0.4635009765625, 0.561279296875, 0.6590576171875, 0.7568359375, 0.8546142578125, 0.952392578125, 1.0501708984375, 1.14794921875, 1.2457275390625, 1.343505859375, 1.4412841796875, 1.5390625, 1.6368408203125, 1.734619140625, 1.8323974609375, 1.93017578125, 2.0279541015625, 2.125732421875, 2.2235107421875, 2.3212890625, 2.4190673828125, 2.516845703125, 2.6146240234375, 2.71240234375, 2.8101806640625, 2.907958984375, 3.0057373046875, 3.103515625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 3.0, 2.0, 9.0, 7.0, 9.0, 12.0, 5.0, 14.0, 24.0, 22.0, 21.0, 25.0, 31.0, 43.0, 40.0, 59.0, 64.0, 65.0, 81.0, 76.0, 62.0, 64.0, 38.0, 43.0, 29.0, 31.0, 29.0, 18.0, 8.0, 18.0, 10.0, 11.0, 5.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.001903533935546875, -0.0018429756164550781, -0.0017824172973632812, -0.0017218589782714844, -0.0016613006591796875, -0.0016007423400878906, -0.0015401840209960938, -0.0014796257019042969, -0.0014190673828125, -0.0013585090637207031, -0.0012979507446289062, -0.0012373924255371094, -0.0011768341064453125, -0.0011162757873535156, -0.0010557174682617188, -0.0009951591491699219, -0.000934600830078125, -0.0008740425109863281, -0.0008134841918945312, -0.0007529258728027344, -0.0006923675537109375, -0.0006318092346191406, -0.0005712509155273438, -0.0005106925964355469, -0.00045013427734375, -0.0003895759582519531, -0.00032901763916015625, -0.0002684593200683594, -0.0002079010009765625, -0.00014734268188476562, -8.678436279296875e-05, -2.6226043701171875e-05, 3.4332275390625e-05, 9.489059448242188e-05, 0.00015544891357421875, 0.00021600723266601562, 0.0002765655517578125, 0.0003371238708496094, 0.00039768218994140625, 0.0004582405090332031, 0.000518798828125, 0.0005793571472167969, 0.0006399154663085938, 0.0007004737854003906, 0.0007610321044921875, 0.0008215904235839844, 0.0008821487426757812, 0.0009427070617675781, 0.001003265380859375, 0.0010638236999511719, 0.0011243820190429688, 0.0011849403381347656, 0.0012454986572265625, 0.0013060569763183594, 0.0013666152954101562, 0.0014271736145019531, 0.00148773193359375, 0.0015482902526855469, 0.0016088485717773438, 0.0016694068908691406, 0.0017299652099609375, 0.0017905235290527344, 0.0018510818481445312, 0.0019116401672363281, 0.001972198486328125]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 5.0, 8.0, 6.0, 9.0, 15.0, 11.0, 20.0, 18.0, 44.0, 45.0, 55.0, 74.0, 150.0, 218.0, 428.0, 1295.0, 930897.0, 113304.0, 908.0, 376.0, 195.0, 124.0, 82.0, 54.0, 33.0, 39.0, 25.0, 18.0, 21.0, 15.0, 15.0, 7.0, 4.0, 8.0, 4.0, 2.0, 3.0, 4.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04437255859375, -0.04293537139892578, -0.04149818420410156, -0.040060997009277344, -0.038623809814453125, -0.037186622619628906, -0.03574943542480469, -0.03431224822998047, -0.03287506103515625, -0.03143787384033203, -0.030000686645507812, -0.028563499450683594, -0.027126312255859375, -0.025689125061035156, -0.024251937866210938, -0.02281475067138672, -0.0213775634765625, -0.01994037628173828, -0.018503189086914062, -0.017066001892089844, -0.015628814697265625, -0.014191627502441406, -0.012754440307617188, -0.011317253112792969, -0.00988006591796875, -0.008442878723144531, -0.0070056915283203125, -0.005568504333496094, -0.004131317138671875, -0.0026941299438476562, -0.0012569427490234375, 0.00018024444580078125, 0.001617431640625, 0.0030546188354492188, 0.0044918060302734375, 0.005928993225097656, 0.007366180419921875, 0.008803367614746094, 0.010240554809570312, 0.011677742004394531, 0.01311492919921875, 0.014552116394042969, 0.015989303588867188, 0.017426490783691406, 0.018863677978515625, 0.020300865173339844, 0.021738052368164062, 0.02317523956298828, 0.0246124267578125, 0.02604961395263672, 0.027486801147460938, 0.028923988342285156, 0.030361175537109375, 0.031798362731933594, 0.03323554992675781, 0.03467273712158203, 0.03610992431640625, 0.03754711151123047, 0.03898429870605469, 0.040421485900878906, 0.041858673095703125, 0.043295860290527344, 0.04473304748535156, 0.04617023468017578, 0.047607421875]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 4.0, 12.0, 57.0, 216.0, 405.0, 244.0, 66.0, 8.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014150834176689386, -0.0013105401303619146, -0.0012059968430548906, -0.0011014534393325448, -0.0009969101520255208, -0.0008923668647184968, -0.0007878235192038119, -0.000683280173689127, -0.000578736886382103, -0.0004741935699712485, -0.00036965025356039405, -0.0002651069371495396, -0.00016056362073868513, -5.602033343166113e-05, 4.8523012083023787e-05, 0.0001530663575977087, 0.0002576096449047327, 0.00036215296131558716, 0.0004666962777264416, 0.0005712396232411265, 0.0006757829105481505, 0.0007803261978551745, 0.0008848695433698595, 0.0009894128888845444, 0.0010939561761915684, 0.0011984994634985924, 0.0013030427508056164, 0.0014075861545279622, 0.0015121294418349862, 0.0016166727291420102, 0.001721216132864356, 0.00182575942017138, 0.0019303024746477604, 0.0020348457619547844, 0.0021393890492618084, 0.0022439323365688324, 0.0023484756238758564, 0.0024530189111828804, 0.002557562431320548, 0.002662105718627572, 0.002766649005934596, 0.00287119229324162, 0.002975735580548644, 0.003080278867855668, 0.0031848223879933357, 0.0032893656753003597, 0.0033939089626073837, 0.0034984522499144077, 0.0036029955372214317, 0.0037075388245284557, 0.0038120821118354797, 0.003916625399142504, 0.004021168686449528, 0.004125711973756552, 0.004230255261063576, 0.004334799014031887, 0.004439341835677624, 0.004543885122984648, 0.004648428410291672, 0.004752971697598696, 0.00485751498490572, 0.004962058272212744, 0.005066601559519768, 0.005171145312488079, 0.005275688599795103]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 11.0, 10.0, 13.0, 19.0, 8.0, 20.0, 19.0, 24.0, 27.0, 24.0, 29.0, 21.0, 32.0, 32.0, 38.0, 42.0, 47.0, 27.0, 35.0, 40.0, 42.0, 50.0, 44.0, 38.0, 29.0, 36.0, 30.0, 32.0, 29.0, 29.0, 17.0, 16.0, 22.0, 11.0, 4.0, 7.0, 11.0, 9.0, 4.0, 4.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0009923577308654785, -0.0009615933522582054, -0.0009308289736509323, -0.0009000645950436592, -0.0008693002164363861, -0.000838535837829113, -0.0008077714592218399, -0.0007770070806145668, -0.0007462427020072937, -0.0007154783234000206, -0.0006847139447927475, -0.0006539495661854744, -0.0006231851875782013, -0.0005924208089709282, -0.0005616564303636551, -0.000530892051756382, -0.0005001276731491089, -0.0004693632945418358, -0.0004385989159345627, -0.0004078345373272896, -0.0003770701587200165, -0.0003463057801127434, -0.0003155414015054703, -0.0002847770228981972, -0.00025401264429092407, -0.00022324826568365097, -0.00019248388707637787, -0.00016171950846910477, -0.00013095512986183167, -0.00010019075125455856, -6.942637264728546e-05, -3.866199404001236e-05, -7.897615432739258e-06, 2.2866763174533844e-05, 5.3631141781806946e-05, 8.439552038908005e-05, 0.00011515989899635315, 0.00014592427760362625, 0.00017668865621089935, 0.00020745303481817245, 0.00023821741342544556, 0.00026898179203271866, 0.00029974617063999176, 0.00033051054924726486, 0.00036127492785453796, 0.00039203930646181107, 0.00042280368506908417, 0.00045356806367635727, 0.00048433244228363037, 0.0005150968208909035, 0.0005458611994981766, 0.0005766255781054497, 0.0006073899567127228, 0.0006381543353199959, 0.000668918713927269, 0.0006996830925345421, 0.0007304474711418152, 0.0007612118497490883, 0.0007919762283563614, 0.0008227406069636345, 0.0008535049855709076, 0.0008842693641781807, 0.0009150337427854538, 0.0009457981213927269, 0.0009765625]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 8.0, 11.0, 6.0, 13.0, 13.0, 11.0, 16.0, 21.0, 18.0, 23.0, 23.0, 34.0, 33.0, 42.0, 37.0, 34.0, 31.0, 32.0, 51.0, 48.0, 40.0, 34.0, 36.0, 44.0, 44.0, 38.0, 33.0, 23.0, 21.0, 30.0, 27.0, 25.0, 13.0, 14.0, 16.0, 11.0, 9.0, 10.0, 8.0, 7.0, 6.0, 7.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.546875, -16.0458984375, -15.544921875, -15.0439453125, -14.54296875, -14.0419921875, -13.541015625, -13.0400390625, -12.5390625, -12.0380859375, -11.537109375, -11.0361328125, -10.53515625, -10.0341796875, -9.533203125, -9.0322265625, -8.53125, -8.0302734375, -7.529296875, -7.0283203125, -6.52734375, -6.0263671875, -5.525390625, -5.0244140625, -4.5234375, -4.0224609375, -3.521484375, -3.0205078125, -2.51953125, -2.0185546875, -1.517578125, -1.0166015625, -0.515625, -0.0146484375, 0.486328125, 0.9873046875, 1.48828125, 1.9892578125, 2.490234375, 2.9912109375, 3.4921875, 3.9931640625, 4.494140625, 4.9951171875, 5.49609375, 5.9970703125, 6.498046875, 6.9990234375, 7.5, 8.0009765625, 8.501953125, 9.0029296875, 9.50390625, 10.0048828125, 10.505859375, 11.0068359375, 11.5078125, 12.0087890625, 12.509765625, 13.0107421875, 13.51171875, 14.0126953125, 14.513671875, 15.0146484375, 15.515625]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 8.0, 11.0, 9.0, 13.0, 16.0, 22.0, 24.0, 43.0, 37.0, 46.0, 66.0, 98.0, 149.0, 238.0, 315.0, 571.0, 1531.0, 7568.0, 56325.0, 593391.0, 346329.0, 34154.0, 4920.0, 1153.0, 535.0, 264.0, 212.0, 113.0, 89.0, 66.0, 50.0, 45.0, 30.0, 17.0, 22.0, 13.0, 9.0, 13.0, 8.0, 8.0, 6.0, 7.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-31.78125, -30.814697265625, -29.84814453125, -28.881591796875, -27.9150390625, -26.948486328125, -25.98193359375, -25.015380859375, -24.048828125, -23.082275390625, -22.11572265625, -21.149169921875, -20.1826171875, -19.216064453125, -18.24951171875, -17.282958984375, -16.31640625, -15.349853515625, -14.38330078125, -13.416748046875, -12.4501953125, -11.483642578125, -10.51708984375, -9.550537109375, -8.583984375, -7.617431640625, -6.65087890625, -5.684326171875, -4.7177734375, -3.751220703125, -2.78466796875, -1.818115234375, -0.8515625, 0.114990234375, 1.08154296875, 2.048095703125, 3.0146484375, 3.981201171875, 4.94775390625, 5.914306640625, 6.880859375, 7.847412109375, 8.81396484375, 9.780517578125, 10.7470703125, 11.713623046875, 12.68017578125, 13.646728515625, 14.61328125, 15.579833984375, 16.54638671875, 17.512939453125, 18.4794921875, 19.446044921875, 20.41259765625, 21.379150390625, 22.345703125, 23.312255859375, 24.27880859375, 25.245361328125, 26.2119140625, 27.178466796875, 28.14501953125, 29.111572265625, 30.078125]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 6.0, 6.0, 5.0, 11.0, 7.0, 13.0, 10.0, 17.0, 14.0, 19.0, 25.0, 30.0, 38.0, 43.0, 50.0, 66.0, 58.0, 74.0, 176.0, 1643.0, 274.0, 77.0, 55.0, 25.0, 38.0, 39.0, 34.0, 31.0, 27.0, 35.0, 23.0, 15.0, 11.0, 15.0, 6.0, 14.0, 6.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.65625, -43.87646484375, -42.0966796875, -40.31689453125, -38.537109375, -36.75732421875, -34.9775390625, -33.19775390625, -31.41796875, -29.63818359375, -27.8583984375, -26.07861328125, -24.298828125, -22.51904296875, -20.7392578125, -18.95947265625, -17.1796875, -15.39990234375, -13.6201171875, -11.84033203125, -10.060546875, -8.28076171875, -6.5009765625, -4.72119140625, -2.94140625, -1.16162109375, 0.6181640625, 2.39794921875, 4.177734375, 5.95751953125, 7.7373046875, 9.51708984375, 11.296875, 13.07666015625, 14.8564453125, 16.63623046875, 18.416015625, 20.19580078125, 21.9755859375, 23.75537109375, 25.53515625, 27.31494140625, 29.0947265625, 30.87451171875, 32.654296875, 34.43408203125, 36.2138671875, 37.99365234375, 39.7734375, 41.55322265625, 43.3330078125, 45.11279296875, 46.892578125, 48.67236328125, 50.4521484375, 52.23193359375, 54.01171875, 55.79150390625, 57.5712890625, 59.35107421875, 61.130859375, 62.91064453125, 64.6904296875, 66.47021484375, 68.25]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 8.0, 9.0, 14.0, 13.0, 17.0, 25.0, 30.0, 52.0, 53.0, 78.0, 105.0, 151.0, 355.0, 958.0, 15016.0, 3119053.0, 8004.0, 853.0, 321.0, 179.0, 111.0, 82.0, 53.0, 46.0, 23.0, 22.0, 13.0, 15.0, 12.0, 7.0, 10.0, 5.0, 3.0, 3.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-158.75, -153.85546875, -148.9609375, -144.06640625, -139.171875, -134.27734375, -129.3828125, -124.48828125, -119.59375, -114.69921875, -109.8046875, -104.91015625, -100.015625, -95.12109375, -90.2265625, -85.33203125, -80.4375, -75.54296875, -70.6484375, -65.75390625, -60.859375, -55.96484375, -51.0703125, -46.17578125, -41.28125, -36.38671875, -31.4921875, -26.59765625, -21.703125, -16.80859375, -11.9140625, -7.01953125, -2.125, 2.76953125, 7.6640625, 12.55859375, 17.453125, 22.34765625, 27.2421875, 32.13671875, 37.03125, 41.92578125, 46.8203125, 51.71484375, 56.609375, 61.50390625, 66.3984375, 71.29296875, 76.1875, 81.08203125, 85.9765625, 90.87109375, 95.765625, 100.66015625, 105.5546875, 110.44921875, 115.34375, 120.23828125, 125.1328125, 130.02734375, 134.921875, 139.81640625, 144.7109375, 149.60546875, 154.5]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 47.0, 900.0, 67.0], "bins": [-1061.2073974609375, -1044.218505859375, -1027.229736328125, -1010.2409057617188, -993.2520751953125, -976.2632446289062, -959.2744140625, -942.2855834960938, -925.2967529296875, -908.3079223632812, -891.319091796875, -874.3302612304688, -857.3414306640625, -840.3526000976562, -823.36376953125, -806.3749389648438, -789.3861083984375, -772.3972778320312, -755.408447265625, -738.4196166992188, -721.4307861328125, -704.4419555664062, -687.453125, -670.4642944335938, -653.4754638671875, -636.4866333007812, -619.497802734375, -602.5089721679688, -585.5201416015625, -568.5313110351562, -551.54248046875, -534.5536499023438, -517.5647583007812, -500.575927734375, -483.58709716796875, -466.5982666015625, -449.60943603515625, -432.62060546875, -415.63177490234375, -398.6429443359375, -381.65411376953125, -364.665283203125, -347.67645263671875, -330.6876220703125, -313.69879150390625, -296.7099609375, -279.72113037109375, -262.7322998046875, -245.74346923828125, -228.754638671875, -211.76580810546875, -194.7769775390625, -177.78814697265625, -160.79931640625, -143.81048583984375, -126.8216552734375, -109.83282470703125, -92.843994140625, -75.85516357421875, -58.8663330078125, -41.87750244140625, -24.888671875, -7.89984130859375, 9.0889892578125, 26.077817916870117]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 12.0, 6.0, 5.0, 6.0, 12.0, 9.0, 6.0, 19.0, 13.0, 13.0, 16.0, 26.0, 19.0, 27.0, 26.0, 36.0, 35.0, 42.0, 35.0, 40.0, 56.0, 42.0, 52.0, 50.0, 48.0, 36.0, 34.0, 34.0, 35.0, 28.0, 18.0, 21.0, 23.0, 13.0, 18.0, 16.0, 9.0, 16.0, 11.0, 9.0, 8.0, 6.0, 7.0, 2.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-132.7777557373047, -128.6074981689453, -124.43724822998047, -120.26699829101562, -116.09674072265625, -111.92648315429688, -107.75623321533203, -103.58598327636719, -99.41572570800781, -95.24546813964844, -91.0752182006836, -86.90496826171875, -82.73471069335938, -78.564453125, -74.39420318603516, -70.22395324707031, -66.05369567871094, -61.88344192504883, -57.71318817138672, -53.54293441772461, -49.3726806640625, -45.20242691040039, -41.03217315673828, -36.86191940307617, -32.69166564941406, -28.521411895751953, -24.351158142089844, -20.180904388427734, -16.010650634765625, -11.840396881103516, -7.670143127441406, -3.499889373779297, 0.670379638671875, 4.840633392333984, 9.010887145996094, 13.181140899658203, 17.351394653320312, 21.521648406982422, 25.69190216064453, 29.86215591430664, 34.03240966796875, 38.20266342163086, 42.37291717529297, 46.54317092895508, 50.71342468261719, 54.8836784362793, 59.053932189941406, 63.224185943603516, 67.39443969726562, 71.564697265625, 75.73494720458984, 79.90519714355469, 84.07545471191406, 88.24571228027344, 92.41596221923828, 96.58621215820312, 100.7564697265625, 104.92672729492188, 109.09697723388672, 113.26722717285156, 117.43748474121094, 121.60774230957031, 125.77799224853516, 129.9482421875, 134.11849975585938]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 5.0, 2.0, 3.0, 4.0, 5.0, 9.0, 8.0, 6.0, 10.0, 11.0, 13.0, 14.0, 19.0, 31.0, 22.0, 22.0, 22.0, 27.0, 26.0, 28.0, 42.0, 34.0, 45.0, 41.0, 35.0, 38.0, 32.0, 38.0, 44.0, 35.0, 27.0, 42.0, 33.0, 25.0, 25.0, 21.0, 24.0, 18.0, 20.0, 19.0, 11.0, 9.0, 12.0, 8.0, 8.0, 9.0, 10.0, 5.0, 3.0, 6.0, 2.0, 0.0, 1.0, 2.0, 3.0], "bins": [-16.546875, -16.0677490234375, -15.588623046875, -15.1094970703125, -14.63037109375, -14.1512451171875, -13.672119140625, -13.1929931640625, -12.7138671875, -12.2347412109375, -11.755615234375, -11.2764892578125, -10.79736328125, -10.3182373046875, -9.839111328125, -9.3599853515625, -8.880859375, -8.4017333984375, -7.922607421875, -7.4434814453125, -6.96435546875, -6.4852294921875, -6.006103515625, -5.5269775390625, -5.0478515625, -4.5687255859375, -4.089599609375, -3.6104736328125, -3.13134765625, -2.6522216796875, -2.173095703125, -1.6939697265625, -1.21484375, -0.7357177734375, -0.256591796875, 0.2225341796875, 0.70166015625, 1.1807861328125, 1.659912109375, 2.1390380859375, 2.6181640625, 3.0972900390625, 3.576416015625, 4.0555419921875, 4.53466796875, 5.0137939453125, 5.492919921875, 5.9720458984375, 6.451171875, 6.9302978515625, 7.409423828125, 7.8885498046875, 8.36767578125, 8.8468017578125, 9.325927734375, 9.8050537109375, 10.2841796875, 10.7633056640625, 11.242431640625, 11.7215576171875, 12.20068359375, 12.6798095703125, 13.158935546875, 13.6380615234375, 14.1171875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [4.0, 1.0, 3.0, 3.0, 3.0, 0.0, 3.0, 6.0, 4.0, 3.0, 6.0, 9.0, 8.0, 16.0, 9.0, 19.0, 15.0, 26.0, 30.0, 35.0, 49.0, 65.0, 80.0, 116.0, 163.0, 229.0, 442.0, 1089.0, 5440.0, 125983.0, 2815712.0, 1210363.0, 30048.0, 2533.0, 695.0, 310.0, 180.0, 151.0, 88.0, 73.0, 65.0, 40.0, 36.0, 30.0, 15.0, 14.0, 17.0, 14.0, 10.0, 7.0, 9.0, 7.0, 10.0, 7.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-45.46875, -43.99267578125, -42.5166015625, -41.04052734375, -39.564453125, -38.08837890625, -36.6123046875, -35.13623046875, -33.66015625, -32.18408203125, -30.7080078125, -29.23193359375, -27.755859375, -26.27978515625, -24.8037109375, -23.32763671875, -21.8515625, -20.37548828125, -18.8994140625, -17.42333984375, -15.947265625, -14.47119140625, -12.9951171875, -11.51904296875, -10.04296875, -8.56689453125, -7.0908203125, -5.61474609375, -4.138671875, -2.66259765625, -1.1865234375, 0.28955078125, 1.765625, 3.24169921875, 4.7177734375, 6.19384765625, 7.669921875, 9.14599609375, 10.6220703125, 12.09814453125, 13.57421875, 15.05029296875, 16.5263671875, 18.00244140625, 19.478515625, 20.95458984375, 22.4306640625, 23.90673828125, 25.3828125, 26.85888671875, 28.3349609375, 29.81103515625, 31.287109375, 32.76318359375, 34.2392578125, 35.71533203125, 37.19140625, 38.66748046875, 40.1435546875, 41.61962890625, 43.095703125, 44.57177734375, 46.0478515625, 47.52392578125, 49.0]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 2.0, 2.0, 0.0, 10.0, 7.0, 10.0, 15.0, 22.0, 24.0, 48.0, 61.0, 85.0, 118.0, 185.0, 264.0, 419.0, 584.0, 644.0, 549.0, 379.0, 225.0, 150.0, 99.0, 67.0, 41.0, 25.0, 18.0, 9.0, 3.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.625, -38.43505859375, -37.2451171875, -36.05517578125, -34.865234375, -33.67529296875, -32.4853515625, -31.29541015625, -30.10546875, -28.91552734375, -27.7255859375, -26.53564453125, -25.345703125, -24.15576171875, -22.9658203125, -21.77587890625, -20.5859375, -19.39599609375, -18.2060546875, -17.01611328125, -15.826171875, -14.63623046875, -13.4462890625, -12.25634765625, -11.06640625, -9.87646484375, -8.6865234375, -7.49658203125, -6.306640625, -5.11669921875, -3.9267578125, -2.73681640625, -1.546875, -0.35693359375, 0.8330078125, 2.02294921875, 3.212890625, 4.40283203125, 5.5927734375, 6.78271484375, 7.97265625, 9.16259765625, 10.3525390625, 11.54248046875, 12.732421875, 13.92236328125, 15.1123046875, 16.30224609375, 17.4921875, 18.68212890625, 19.8720703125, 21.06201171875, 22.251953125, 23.44189453125, 24.6318359375, 25.82177734375, 27.01171875, 28.20166015625, 29.3916015625, 30.58154296875, 31.771484375, 32.96142578125, 34.1513671875, 35.34130859375, 36.53125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 6.0, 3.0, 5.0, 5.0, 4.0, 7.0, 9.0, 20.0, 18.0, 19.0, 27.0, 26.0, 31.0, 50.0, 48.0, 89.0, 117.0, 166.0, 191.0, 381.0, 773.0, 3862.0, 2603855.0, 1579261.0, 3295.0, 768.0, 319.0, 209.0, 163.0, 127.0, 79.0, 73.0, 44.0, 44.0, 45.0, 26.0, 29.0, 27.0, 14.0, 15.0, 9.0, 8.0, 4.0, 8.0, 5.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-129.875, -125.232421875, -120.58984375, -115.947265625, -111.3046875, -106.662109375, -102.01953125, -97.376953125, -92.734375, -88.091796875, -83.44921875, -78.806640625, -74.1640625, -69.521484375, -64.87890625, -60.236328125, -55.59375, -50.951171875, -46.30859375, -41.666015625, -37.0234375, -32.380859375, -27.73828125, -23.095703125, -18.453125, -13.810546875, -9.16796875, -4.525390625, 0.1171875, 4.759765625, 9.40234375, 14.044921875, 18.6875, 23.330078125, 27.97265625, 32.615234375, 37.2578125, 41.900390625, 46.54296875, 51.185546875, 55.828125, 60.470703125, 65.11328125, 69.755859375, 74.3984375, 79.041015625, 83.68359375, 88.326171875, 92.96875, 97.611328125, 102.25390625, 106.896484375, 111.5390625, 116.181640625, 120.82421875, 125.466796875, 130.109375, 134.751953125, 139.39453125, 144.037109375, 148.6796875, 153.322265625, 157.96484375, 162.607421875, 167.25]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 19.0, 698.0, 295.0, 4.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-933.2070922851562, -909.7885131835938, -886.3699951171875, -862.951416015625, -839.5328369140625, -816.1143188476562, -792.6957397460938, -769.2772216796875, -745.858642578125, -722.4400634765625, -699.0215454101562, -675.6029663085938, -652.1844482421875, -628.765869140625, -605.3472900390625, -581.9287109375, -558.5101928710938, -535.0916137695312, -511.673095703125, -488.2545166015625, -464.8359680175781, -441.41741943359375, -417.99884033203125, -394.5802917480469, -371.1617431640625, -347.7431945800781, -324.32464599609375, -300.90606689453125, -277.4875183105469, -254.0689697265625, -230.65040588378906, -207.23184204101562, -183.8133544921875, -160.39480590820312, -136.9762420654297, -113.55768585205078, -90.13912963867188, -66.72057342529297, -43.30201721191406, -19.883453369140625, 3.53509521484375, 26.953651428222656, 50.37220764160156, 73.79076385498047, 97.20932006835938, 120.62787628173828, 144.0464324951172, 167.46499633789062, 190.883544921875, 214.30209350585938, 237.7206573486328, 261.13922119140625, 284.5577697753906, 307.976318359375, 331.3948974609375, 354.8134460449219, 378.23199462890625, 401.6505432128906, 425.069091796875, 448.4876708984375, 471.9062194824219, 495.32476806640625, 518.7433471679688, 542.161865234375, 565.5804443359375]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 0.0, 2.0, 7.0, 9.0, 1.0, 11.0, 11.0, 11.0, 12.0, 19.0, 25.0, 22.0, 25.0, 22.0, 31.0, 36.0, 33.0, 43.0, 44.0, 36.0, 36.0, 47.0, 42.0, 55.0, 46.0, 56.0, 31.0, 21.0, 36.0, 31.0, 34.0, 21.0, 32.0, 18.0, 23.0, 13.0, 17.0, 12.0, 9.0, 12.0, 5.0, 7.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-117.49139404296875, -114.28168487548828, -111.07197570800781, -107.86226654052734, -104.65255737304688, -101.4428482055664, -98.23313903808594, -95.02342987060547, -91.813720703125, -88.60401153564453, -85.39430236816406, -82.1845932006836, -78.97488403320312, -75.76517486572266, -72.55546569824219, -69.34575653076172, -66.13604736328125, -62.92633819580078, -59.71662902832031, -56.506919860839844, -53.297210693359375, -50.087501525878906, -46.87779235839844, -43.66808319091797, -40.4583740234375, -37.24866485595703, -34.03895568847656, -30.829246520996094, -27.619537353515625, -24.409828186035156, -21.200119018554688, -17.99040985107422, -14.78070068359375, -11.570991516113281, -8.361282348632812, -5.151573181152344, -1.941864013671875, 1.2678451538085938, 4.4775543212890625, 7.687263488769531, 10.89697265625, 14.106681823730469, 17.316390991210938, 20.526100158691406, 23.735809326171875, 26.945518493652344, 30.155227661132812, 33.36493682861328, 36.57464599609375, 39.78435516357422, 42.99406433105469, 46.203773498535156, 49.413482666015625, 52.623191833496094, 55.83290100097656, 59.04261016845703, 62.2523193359375, 65.46202850341797, 68.67173767089844, 71.8814468383789, 75.09115600585938, 78.30086517333984, 81.51057434082031, 84.72028350830078, 87.92999267578125]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 3.0, 2.0, 6.0, 6.0, 9.0, 16.0, 11.0, 11.0, 23.0, 23.0, 22.0, 28.0, 21.0, 31.0, 43.0, 29.0, 41.0, 40.0, 39.0, 37.0, 47.0, 51.0, 54.0, 34.0, 43.0, 40.0, 48.0, 33.0, 25.0, 27.0, 32.0, 23.0, 14.0, 19.0, 15.0, 18.0, 9.0, 7.0, 4.0, 8.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.617919921875, -17.04833984375, -16.478759765625, -15.9091796875, -15.339599609375, -14.77001953125, -14.200439453125, -13.630859375, -13.061279296875, -12.49169921875, -11.922119140625, -11.3525390625, -10.782958984375, -10.21337890625, -9.643798828125, -9.07421875, -8.504638671875, -7.93505859375, -7.365478515625, -6.7958984375, -6.226318359375, -5.65673828125, -5.087158203125, -4.517578125, -3.947998046875, -3.37841796875, -2.808837890625, -2.2392578125, -1.669677734375, -1.10009765625, -0.530517578125, 0.0390625, 0.608642578125, 1.17822265625, 1.747802734375, 2.3173828125, 2.886962890625, 3.45654296875, 4.026123046875, 4.595703125, 5.165283203125, 5.73486328125, 6.304443359375, 6.8740234375, 7.443603515625, 8.01318359375, 8.582763671875, 9.15234375, 9.721923828125, 10.29150390625, 10.861083984375, 11.4306640625, 12.000244140625, 12.56982421875, 13.139404296875, 13.708984375, 14.278564453125, 14.84814453125, 15.417724609375, 15.9873046875, 16.556884765625, 17.12646484375, 17.696044921875, 18.265625]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 3.0, 7.0, 5.0, 6.0, 11.0, 24.0, 25.0, 29.0, 42.0, 68.0, 100.0, 151.0, 213.0, 338.0, 443.0, 793.0, 1008.0, 1619.0, 2401.0, 3666.0, 5617.0, 8559.0, 13536.0, 21580.0, 35927.0, 61216.0, 110630.0, 302842.0, 234410.0, 99027.0, 55642.0, 32910.0, 20108.0, 12216.0, 8080.0, 5125.0, 3417.0, 2250.0, 1478.0, 977.0, 659.0, 472.0, 307.0, 221.0, 131.0, 77.0, 66.0, 35.0, 31.0, 25.0, 20.0, 7.0, 4.0, 6.0, 7.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.990234375, -3.865203857421875, -3.74017333984375, -3.615142822265625, -3.4901123046875, -3.365081787109375, -3.24005126953125, -3.115020751953125, -2.989990234375, -2.864959716796875, -2.73992919921875, -2.614898681640625, -2.4898681640625, -2.364837646484375, -2.23980712890625, -2.114776611328125, -1.98974609375, -1.864715576171875, -1.73968505859375, -1.614654541015625, -1.4896240234375, -1.364593505859375, -1.23956298828125, -1.114532470703125, -0.989501953125, -0.864471435546875, -0.73944091796875, -0.614410400390625, -0.4893798828125, -0.364349365234375, -0.23931884765625, -0.114288330078125, 0.0107421875, 0.135772705078125, 0.26080322265625, 0.385833740234375, 0.5108642578125, 0.635894775390625, 0.76092529296875, 0.885955810546875, 1.010986328125, 1.136016845703125, 1.26104736328125, 1.386077880859375, 1.5111083984375, 1.636138916015625, 1.76116943359375, 1.886199951171875, 2.01123046875, 2.136260986328125, 2.26129150390625, 2.386322021484375, 2.5113525390625, 2.636383056640625, 2.76141357421875, 2.886444091796875, 3.011474609375, 3.136505126953125, 3.26153564453125, 3.386566162109375, 3.5115966796875, 3.636627197265625, 3.76165771484375, 3.886688232421875, 4.01171875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 9.0, 6.0, 7.0, 9.0, 13.0, 11.0, 18.0, 18.0, 15.0, 18.0, 23.0, 28.0, 38.0, 32.0, 33.0, 38.0, 35.0, 31.0, 34.0, 41.0, 34.0, 1053.0, 31.0, 41.0, 34.0, 23.0, 38.0, 30.0, 41.0, 34.0, 30.0, 20.0, 16.0, 12.0, 22.0, 20.0, 16.0, 13.0, 9.0, 13.0, 8.0, 5.0, 6.0, 5.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0], "bins": [-11.140625, -10.817138671875, -10.49365234375, -10.170166015625, -9.8466796875, -9.523193359375, -9.19970703125, -8.876220703125, -8.552734375, -8.229248046875, -7.90576171875, -7.582275390625, -7.2587890625, -6.935302734375, -6.61181640625, -6.288330078125, -5.96484375, -5.641357421875, -5.31787109375, -4.994384765625, -4.6708984375, -4.347412109375, -4.02392578125, -3.700439453125, -3.376953125, -3.053466796875, -2.72998046875, -2.406494140625, -2.0830078125, -1.759521484375, -1.43603515625, -1.112548828125, -0.7890625, -0.465576171875, -0.14208984375, 0.181396484375, 0.5048828125, 0.828369140625, 1.15185546875, 1.475341796875, 1.798828125, 2.122314453125, 2.44580078125, 2.769287109375, 3.0927734375, 3.416259765625, 3.73974609375, 4.063232421875, 4.38671875, 4.710205078125, 5.03369140625, 5.357177734375, 5.6806640625, 6.004150390625, 6.32763671875, 6.651123046875, 6.974609375, 7.298095703125, 7.62158203125, 7.945068359375, 8.2685546875, 8.592041015625, 8.91552734375, 9.239013671875, 9.5625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 6.0, 15.0, 15.0, 23.0, 35.0, 52.0, 82.0, 120.0, 173.0, 244.0, 360.0, 555.0, 785.0, 1162.0, 1677.0, 2405.0, 3339.0, 4814.0, 6833.0, 9881.0, 14309.0, 21149.0, 32139.0, 49070.0, 77689.0, 131929.0, 1313205.0, 164042.0, 90619.0, 56694.0, 36654.0, 24177.0, 16206.0, 11003.0, 7802.0, 5385.0, 3878.0, 2647.0, 1872.0, 1295.0, 891.0, 586.0, 457.0, 296.0, 207.0, 128.0, 77.0, 51.0, 42.0, 21.0, 14.0, 11.0, 7.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-2.947265625, -2.847900390625, -2.74853515625, -2.649169921875, -2.5498046875, -2.450439453125, -2.35107421875, -2.251708984375, -2.15234375, -2.052978515625, -1.95361328125, -1.854248046875, -1.7548828125, -1.655517578125, -1.55615234375, -1.456787109375, -1.357421875, -1.258056640625, -1.15869140625, -1.059326171875, -0.9599609375, -0.860595703125, -0.76123046875, -0.661865234375, -0.5625, -0.463134765625, -0.36376953125, -0.264404296875, -0.1650390625, -0.065673828125, 0.03369140625, 0.133056640625, 0.232421875, 0.331787109375, 0.43115234375, 0.530517578125, 0.6298828125, 0.729248046875, 0.82861328125, 0.927978515625, 1.02734375, 1.126708984375, 1.22607421875, 1.325439453125, 1.4248046875, 1.524169921875, 1.62353515625, 1.722900390625, 1.822265625, 1.921630859375, 2.02099609375, 2.120361328125, 2.2197265625, 2.319091796875, 2.41845703125, 2.517822265625, 2.6171875, 2.716552734375, 2.81591796875, 2.915283203125, 3.0146484375, 3.114013671875, 3.21337890625, 3.312744140625, 3.412109375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 4.0, 0.0, 4.0, 5.0, 7.0, 7.0, 11.0, 9.0, 15.0, 16.0, 21.0, 13.0, 19.0, 31.0, 35.0, 49.0, 44.0, 57.0, 78.0, 61.0, 85.0, 78.0, 60.0, 43.0, 46.0, 34.0, 25.0, 21.0, 22.0, 24.0, 21.0, 13.0, 6.0, 10.0, 4.0, 9.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0018939971923828125, -0.0018333792686462402, -0.001772761344909668, -0.0017121434211730957, -0.0016515254974365234, -0.0015909075736999512, -0.001530289649963379, -0.0014696717262268066, -0.0014090538024902344, -0.0013484358787536621, -0.0012878179550170898, -0.0012272000312805176, -0.0011665821075439453, -0.001105964183807373, -0.0010453462600708008, -0.0009847283363342285, -0.0009241104125976562, -0.000863492488861084, -0.0008028745651245117, -0.0007422566413879395, -0.0006816387176513672, -0.0006210207939147949, -0.0005604028701782227, -0.0004997849464416504, -0.0004391670227050781, -0.00037854909896850586, -0.0003179311752319336, -0.00025731325149536133, -0.00019669532775878906, -0.0001360774040222168, -7.545948028564453e-05, -1.4841556549072266e-05, 4.57763671875e-05, 0.00010639429092407227, 0.00016701221466064453, 0.0002276301383972168, 0.00028824806213378906, 0.00034886598587036133, 0.0004094839096069336, 0.00047010183334350586, 0.0005307197570800781, 0.0005913376808166504, 0.0006519556045532227, 0.0007125735282897949, 0.0007731914520263672, 0.0008338093757629395, 0.0008944272994995117, 0.000955045223236084, 0.0010156631469726562, 0.0010762810707092285, 0.0011368989944458008, 0.001197516918182373, 0.0012581348419189453, 0.0013187527656555176, 0.0013793706893920898, 0.0014399886131286621, 0.0015006065368652344, 0.0015612244606018066, 0.001621842384338379, 0.0016824603080749512, 0.0017430782318115234, 0.0018036961555480957, 0.001864314079284668, 0.0019249320030212402, 0.0019855499267578125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 5.0, 9.0, 10.0, 10.0, 11.0, 8.0, 19.0, 26.0, 29.0, 28.0, 42.0, 42.0, 85.0, 102.0, 213.0, 394.0, 1506.0, 1030443.0, 14170.0, 620.0, 266.0, 151.0, 84.0, 55.0, 57.0, 26.0, 20.0, 31.0, 19.0, 13.0, 16.0, 5.0, 9.0, 6.0, 6.0, 4.0, 2.0, 6.0, 2.0, 2.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.048797607421875, -0.047304630279541016, -0.04581165313720703, -0.04431867599487305, -0.04282569885253906, -0.04133272171020508, -0.039839744567871094, -0.03834676742553711, -0.036853790283203125, -0.03536081314086914, -0.033867835998535156, -0.03237485885620117, -0.030881881713867188, -0.029388904571533203, -0.02789592742919922, -0.026402950286865234, -0.02490997314453125, -0.023416996002197266, -0.02192401885986328, -0.020431041717529297, -0.018938064575195312, -0.017445087432861328, -0.015952110290527344, -0.01445913314819336, -0.012966156005859375, -0.01147317886352539, -0.009980201721191406, -0.008487224578857422, -0.0069942474365234375, -0.005501270294189453, -0.004008293151855469, -0.0025153160095214844, -0.0010223388671875, 0.0004706382751464844, 0.0019636154174804688, 0.003456592559814453, 0.0049495697021484375, 0.006442546844482422, 0.007935523986816406, 0.00942850112915039, 0.010921478271484375, 0.01241445541381836, 0.013907432556152344, 0.015400409698486328, 0.016893386840820312, 0.018386363983154297, 0.01987934112548828, 0.021372318267822266, 0.02286529541015625, 0.024358272552490234, 0.02585124969482422, 0.027344226837158203, 0.028837203979492188, 0.030330181121826172, 0.031823158264160156, 0.03331613540649414, 0.034809112548828125, 0.03630208969116211, 0.037795066833496094, 0.03928804397583008, 0.04078102111816406, 0.04227399826049805, 0.04376697540283203, 0.045259952545166016, 0.0467529296875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 28.0, 201.0, 538.0, 226.0, 18.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006039888132363558, -0.005897787865251303, -0.00575568713247776, -0.005613586865365505, -0.00547148659825325, -0.005329386331140995, -0.00518728606402874, -0.0050451853312551975, -0.004903085064142942, -0.004760984797030687, -0.004618884064257145, -0.00447678379714489, -0.004334683530032635, -0.00419258326292038, -0.0040504829958081245, -0.003908382263034582, -0.003766281995922327, -0.003624181728810072, -0.003482081228867173, -0.0033399807289242744, -0.0031978804618120193, -0.0030557801946997643, -0.0029136796947568655, -0.0027715791948139668, -0.0026294789277017117, -0.0024873786605894566, -0.002345278160646558, -0.002203177660703659, -0.002061077393591404, -0.001918977010063827, -0.0017768766265362501, -0.0016347762430086732, -0.0014926756266504526, -0.0013505752431228757, -0.0012084748595952988, -0.0010663744760677218, -0.0009242740925401449, -0.000782173709012568, -0.0006400733254849911, -0.0004979729419574142, -0.0003558725584298372, -0.0002137721749022603, -7.167179137468338e-05, 7.042859215289354e-05, 0.00021252897568047047, 0.0003546293592080474, 0.0004967297427356243, 0.0006388301262632012, 0.0007809305097907782, 0.0009230308933183551, 0.001065131276845932, 0.001207231660373509, 0.0013493320439010859, 0.0014914324274286628, 0.0016335328109562397, 0.0017756331944838166, 0.0019177335780113935, 0.0020598340779542923, 0.0022019343450665474, 0.0023440346121788025, 0.0024861351121217012, 0.0026282356120646, 0.002770335879176855, 0.00291243614628911, 0.003054536646232009]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 9.0, 9.0, 12.0, 12.0, 19.0, 22.0, 18.0, 23.0, 24.0, 26.0, 33.0, 41.0, 35.0, 26.0, 39.0, 41.0, 42.0, 46.0, 31.0, 42.0, 42.0, 36.0, 49.0, 45.0, 26.0, 45.0, 28.0, 27.0, 26.0, 21.0, 18.0, 20.0, 18.0, 15.0, 10.0, 10.0, 7.0, 1.0, 2.0, 7.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008946061134338379, -0.0008631432428956032, -0.0008316803723573685, -0.0008002175018191338, -0.000768754631280899, -0.0007372917607426643, -0.0007058288902044296, -0.0006743660196661949, -0.0006429031491279602, -0.0006114402785897255, -0.0005799774080514908, -0.0005485145375132561, -0.0005170516669750214, -0.00048558879643678665, -0.00045412592589855194, -0.00042266305536031723, -0.0003912001848220825, -0.0003597373142838478, -0.0003282744437456131, -0.0002968115732073784, -0.0002653487026691437, -0.00023388583213090897, -0.00020242296159267426, -0.00017096009105443954, -0.00013949722051620483, -0.00010803434997797012, -7.657147943973541e-05, -4.51086089015007e-05, -1.3645738363265991e-05, 1.781713217496872e-05, 4.928000271320343e-05, 8.074287325143814e-05, 0.00011220574378967285, 0.00014366861432790756, 0.00017513148486614227, 0.00020659435540437698, 0.0002380572259426117, 0.0002695200964808464, 0.0003009829670190811, 0.0003324458375573158, 0.00036390870809555054, 0.00039537157863378525, 0.00042683444917201996, 0.00045829731971025467, 0.0004897601902484894, 0.0005212230607867241, 0.0005526859313249588, 0.0005841488018631935, 0.0006156116724014282, 0.0006470745429396629, 0.0006785374134778976, 0.0007100002840161324, 0.0007414631545543671, 0.0007729260250926018, 0.0008043888956308365, 0.0008358517661690712, 0.0008673146367073059, 0.0008987775072455406, 0.0009302403777837753, 0.00096170324832201, 0.0009931661188602448, 0.0010246289893984795, 0.0010560918599367142, 0.0010875547304749489, 0.0011190176010131836]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 7.0, 3.0, 2.0, 6.0, 6.0, 9.0, 16.0, 11.0, 11.0, 23.0, 23.0, 22.0, 28.0, 21.0, 31.0, 43.0, 29.0, 41.0, 40.0, 39.0, 37.0, 47.0, 51.0, 54.0, 34.0, 43.0, 40.0, 49.0, 32.0, 25.0, 27.0, 32.0, 23.0, 14.0, 19.0, 15.0, 18.0, 9.0, 7.0, 4.0, 8.0, 5.0, 5.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.1875, -17.617919921875, -17.04833984375, -16.478759765625, -15.9091796875, -15.339599609375, -14.77001953125, -14.200439453125, -13.630859375, -13.061279296875, -12.49169921875, -11.922119140625, -11.3525390625, -10.782958984375, -10.21337890625, -9.643798828125, -9.07421875, -8.504638671875, -7.93505859375, -7.365478515625, -6.7958984375, -6.226318359375, -5.65673828125, -5.087158203125, -4.517578125, -3.947998046875, -3.37841796875, -2.808837890625, -2.2392578125, -1.669677734375, -1.10009765625, -0.530517578125, 0.0390625, 0.608642578125, 1.17822265625, 1.747802734375, 2.3173828125, 2.886962890625, 3.45654296875, 4.026123046875, 4.595703125, 5.165283203125, 5.73486328125, 6.304443359375, 6.8740234375, 7.443603515625, 8.01318359375, 8.582763671875, 9.15234375, 9.721923828125, 10.29150390625, 10.861083984375, 11.4306640625, 12.000244140625, 12.56982421875, 13.139404296875, 13.708984375, 14.278564453125, 14.84814453125, 15.417724609375, 15.9873046875, 16.556884765625, 17.12646484375, 17.696044921875, 18.265625]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 11.0, 4.0, 9.0, 10.0, 10.0, 15.0, 29.0, 38.0, 34.0, 60.0, 60.0, 106.0, 125.0, 150.0, 262.0, 327.0, 464.0, 646.0, 1027.0, 3028.0, 24242.0, 738913.0, 260792.0, 13053.0, 2065.0, 873.0, 631.0, 443.0, 294.0, 214.0, 159.0, 118.0, 95.0, 41.0, 45.0, 43.0, 31.0, 28.0, 16.0, 7.0, 16.0, 9.0, 10.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-45.875, -44.435546875, -42.99609375, -41.556640625, -40.1171875, -38.677734375, -37.23828125, -35.798828125, -34.359375, -32.919921875, -31.48046875, -30.041015625, -28.6015625, -27.162109375, -25.72265625, -24.283203125, -22.84375, -21.404296875, -19.96484375, -18.525390625, -17.0859375, -15.646484375, -14.20703125, -12.767578125, -11.328125, -9.888671875, -8.44921875, -7.009765625, -5.5703125, -4.130859375, -2.69140625, -1.251953125, 0.1875, 1.626953125, 3.06640625, 4.505859375, 5.9453125, 7.384765625, 8.82421875, 10.263671875, 11.703125, 13.142578125, 14.58203125, 16.021484375, 17.4609375, 18.900390625, 20.33984375, 21.779296875, 23.21875, 24.658203125, 26.09765625, 27.537109375, 28.9765625, 30.416015625, 31.85546875, 33.294921875, 34.734375, 36.173828125, 37.61328125, 39.052734375, 40.4921875, 41.931640625, 43.37109375, 44.810546875, 46.25]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 5.0, 8.0, 6.0, 8.0, 12.0, 13.0, 16.0, 22.0, 12.0, 33.0, 27.0, 27.0, 30.0, 37.0, 36.0, 40.0, 42.0, 45.0, 63.0, 211.0, 1722.0, 165.0, 57.0, 48.0, 38.0, 43.0, 45.0, 33.0, 31.0, 18.0, 32.0, 22.0, 13.0, 16.0, 16.0, 14.0, 7.0, 8.0, 6.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-52.3125, -50.74658203125, -49.1806640625, -47.61474609375, -46.048828125, -44.48291015625, -42.9169921875, -41.35107421875, -39.78515625, -38.21923828125, -36.6533203125, -35.08740234375, -33.521484375, -31.95556640625, -30.3896484375, -28.82373046875, -27.2578125, -25.69189453125, -24.1259765625, -22.56005859375, -20.994140625, -19.42822265625, -17.8623046875, -16.29638671875, -14.73046875, -13.16455078125, -11.5986328125, -10.03271484375, -8.466796875, -6.90087890625, -5.3349609375, -3.76904296875, -2.203125, -0.63720703125, 0.9287109375, 2.49462890625, 4.060546875, 5.62646484375, 7.1923828125, 8.75830078125, 10.32421875, 11.89013671875, 13.4560546875, 15.02197265625, 16.587890625, 18.15380859375, 19.7197265625, 21.28564453125, 22.8515625, 24.41748046875, 25.9833984375, 27.54931640625, 29.115234375, 30.68115234375, 32.2470703125, 33.81298828125, 35.37890625, 36.94482421875, 38.5107421875, 40.07666015625, 41.642578125, 43.20849609375, 44.7744140625, 46.34033203125, 47.90625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 4.0, 4.0, 8.0, 6.0, 9.0, 11.0, 11.0, 18.0, 17.0, 17.0, 28.0, 24.0, 24.0, 38.0, 49.0, 69.0, 103.0, 144.0, 261.0, 752.0, 6941.0, 3122762.0, 12632.0, 846.0, 314.0, 150.0, 101.0, 63.0, 53.0, 42.0, 32.0, 30.0, 31.0, 16.0, 20.0, 18.0, 9.0, 8.0, 12.0, 5.0, 11.0, 5.0, 2.0, 0.0, 5.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-135.25, -130.82421875, -126.3984375, -121.97265625, -117.546875, -113.12109375, -108.6953125, -104.26953125, -99.84375, -95.41796875, -90.9921875, -86.56640625, -82.140625, -77.71484375, -73.2890625, -68.86328125, -64.4375, -60.01171875, -55.5859375, -51.16015625, -46.734375, -42.30859375, -37.8828125, -33.45703125, -29.03125, -24.60546875, -20.1796875, -15.75390625, -11.328125, -6.90234375, -2.4765625, 1.94921875, 6.375, 10.80078125, 15.2265625, 19.65234375, 24.078125, 28.50390625, 32.9296875, 37.35546875, 41.78125, 46.20703125, 50.6328125, 55.05859375, 59.484375, 63.91015625, 68.3359375, 72.76171875, 77.1875, 81.61328125, 86.0390625, 90.46484375, 94.890625, 99.31640625, 103.7421875, 108.16796875, 112.59375, 117.01953125, 121.4453125, 125.87109375, 130.296875, 134.72265625, 139.1484375, 143.57421875, 148.0]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 6.0, 86.0, 439.0, 391.0, 82.0, 12.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.44284057617188, -87.07295227050781, -82.70305633544922, -78.33316802978516, -73.96327209472656, -69.5933837890625, -65.22349548339844, -60.853599548339844, -56.483707427978516, -52.11381530761719, -47.74392318725586, -43.37403106689453, -39.00414276123047, -34.634246826171875, -30.264358520507812, -25.894466400146484, -21.524574279785156, -17.154682159423828, -12.784790992736816, -8.414899826049805, -4.045007705688477, 0.32488441467285156, 4.694774627685547, 9.064666748046875, 13.434558868408203, 17.80445098876953, 22.17434310913086, 26.544233322143555, 30.914125442504883, 35.284019470214844, 39.653907775878906, 44.023799896240234, 48.39369201660156, 52.76358413696289, 57.13347625732422, 61.50336456298828, 65.87326049804688, 70.24314880371094, 74.613037109375, 78.9829330444336, 83.35282897949219, 87.72271728515625, 92.09261322021484, 96.4625015258789, 100.8323974609375, 105.20228576660156, 109.57217407226562, 113.94207000732422, 118.31195831298828, 122.68184661865234, 127.05174255371094, 131.421630859375, 135.79151916503906, 140.1614227294922, 144.53131103515625, 148.9011993408203, 153.27108764648438, 157.64097595214844, 162.0108642578125, 166.38076782226562, 170.7506561279297, 175.12054443359375, 179.4904327392578, 183.86032104492188, 188.230224609375]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 3.0, 3.0, 5.0, 6.0, 12.0, 11.0, 14.0, 19.0, 12.0, 21.0, 29.0, 14.0, 14.0, 26.0, 26.0, 30.0, 41.0, 29.0, 22.0, 30.0, 49.0, 34.0, 39.0, 36.0, 31.0, 40.0, 29.0, 42.0, 36.0, 33.0, 32.0, 26.0, 25.0, 26.0, 29.0, 11.0, 19.0, 13.0, 16.0, 10.0, 8.0, 8.0, 9.0, 4.0, 10.0, 5.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0], "bins": [-116.16033935546875, -112.47026062011719, -108.78018188476562, -105.09010314941406, -101.4000244140625, -97.70994567871094, -94.01986694335938, -90.32978820800781, -86.63970947265625, -82.94963073730469, -79.25955200195312, -75.56947326660156, -71.87939453125, -68.18931579589844, -64.49923706054688, -60.80915832519531, -57.11907958984375, -53.42900085449219, -49.738922119140625, -46.04884338378906, -42.3587646484375, -38.66868591308594, -34.978607177734375, -31.288528442382812, -27.59844970703125, -23.908370971679688, -20.218292236328125, -16.528213500976562, -12.838134765625, -9.148056030273438, -5.457977294921875, -1.7678985595703125, 1.92218017578125, 5.6122589111328125, 9.302337646484375, 12.992416381835938, 16.6824951171875, 20.372573852539062, 24.062652587890625, 27.752731323242188, 31.44281005859375, 35.13288879394531, 38.822967529296875, 42.51304626464844, 46.203125, 49.89320373535156, 53.583282470703125, 57.27336120605469, 60.96343994140625, 64.65351867675781, 68.34359741210938, 72.03367614746094, 75.7237548828125, 79.41383361816406, 83.10391235351562, 86.79399108886719, 90.48406982421875, 94.17414855957031, 97.86422729492188, 101.55430603027344, 105.244384765625, 108.93446350097656, 112.62454223632812, 116.31462097167969, 120.00469970703125]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 2.0, 5.0, 7.0, 8.0, 11.0, 21.0, 13.0, 12.0, 24.0, 19.0, 23.0, 21.0, 23.0, 40.0, 38.0, 37.0, 31.0, 39.0, 36.0, 42.0, 46.0, 51.0, 46.0, 51.0, 35.0, 43.0, 33.0, 24.0, 41.0, 31.0, 26.0, 19.0, 8.0, 22.0, 15.0, 19.0, 8.0, 7.0, 3.0, 5.0, 8.0, 4.0, 2.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-18.203125, -17.64501953125, -17.0869140625, -16.52880859375, -15.970703125, -15.41259765625, -14.8544921875, -14.29638671875, -13.73828125, -13.18017578125, -12.6220703125, -12.06396484375, -11.505859375, -10.94775390625, -10.3896484375, -9.83154296875, -9.2734375, -8.71533203125, -8.1572265625, -7.59912109375, -7.041015625, -6.48291015625, -5.9248046875, -5.36669921875, -4.80859375, -4.25048828125, -3.6923828125, -3.13427734375, -2.576171875, -2.01806640625, -1.4599609375, -0.90185546875, -0.34375, 0.21435546875, 0.7724609375, 1.33056640625, 1.888671875, 2.44677734375, 3.0048828125, 3.56298828125, 4.12109375, 4.67919921875, 5.2373046875, 5.79541015625, 6.353515625, 6.91162109375, 7.4697265625, 8.02783203125, 8.5859375, 9.14404296875, 9.7021484375, 10.26025390625, 10.818359375, 11.37646484375, 11.9345703125, 12.49267578125, 13.05078125, 13.60888671875, 14.1669921875, 14.72509765625, 15.283203125, 15.84130859375, 16.3994140625, 16.95751953125, 17.515625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 6.0, 8.0, 9.0, 14.0, 14.0, 14.0, 23.0, 18.0, 38.0, 35.0, 50.0, 72.0, 97.0, 96.0, 137.0, 158.0, 245.0, 302.0, 546.0, 839.0, 1748.0, 6461.0, 73858.0, 1635330.0, 2313167.0, 146530.0, 9346.0, 2174.0, 949.0, 569.0, 374.0, 226.0, 206.0, 144.0, 104.0, 84.0, 50.0, 43.0, 35.0, 29.0, 36.0, 16.0, 22.0, 9.0, 15.0, 10.0, 6.0, 4.0, 4.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 3.0], "bins": [-40.875, -39.6015625, -38.328125, -37.0546875, -35.78125, -34.5078125, -33.234375, -31.9609375, -30.6875, -29.4140625, -28.140625, -26.8671875, -25.59375, -24.3203125, -23.046875, -21.7734375, -20.5, -19.2265625, -17.953125, -16.6796875, -15.40625, -14.1328125, -12.859375, -11.5859375, -10.3125, -9.0390625, -7.765625, -6.4921875, -5.21875, -3.9453125, -2.671875, -1.3984375, -0.125, 1.1484375, 2.421875, 3.6953125, 4.96875, 6.2421875, 7.515625, 8.7890625, 10.0625, 11.3359375, 12.609375, 13.8828125, 15.15625, 16.4296875, 17.703125, 18.9765625, 20.25, 21.5234375, 22.796875, 24.0703125, 25.34375, 26.6171875, 27.890625, 29.1640625, 30.4375, 31.7109375, 32.984375, 34.2578125, 35.53125, 36.8046875, 38.078125, 39.3515625, 40.625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 7.0, 22.0, 33.0, 31.0, 54.0, 103.0, 171.0, 288.0, 482.0, 771.0, 843.0, 565.0, 295.0, 167.0, 85.0, 67.0, 33.0, 27.0, 11.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-48.28125, -46.81884765625, -45.3564453125, -43.89404296875, -42.431640625, -40.96923828125, -39.5068359375, -38.04443359375, -36.58203125, -35.11962890625, -33.6572265625, -32.19482421875, -30.732421875, -29.27001953125, -27.8076171875, -26.34521484375, -24.8828125, -23.42041015625, -21.9580078125, -20.49560546875, -19.033203125, -17.57080078125, -16.1083984375, -14.64599609375, -13.18359375, -11.72119140625, -10.2587890625, -8.79638671875, -7.333984375, -5.87158203125, -4.4091796875, -2.94677734375, -1.484375, -0.02197265625, 1.4404296875, 2.90283203125, 4.365234375, 5.82763671875, 7.2900390625, 8.75244140625, 10.21484375, 11.67724609375, 13.1396484375, 14.60205078125, 16.064453125, 17.52685546875, 18.9892578125, 20.45166015625, 21.9140625, 23.37646484375, 24.8388671875, 26.30126953125, 27.763671875, 29.22607421875, 30.6884765625, 32.15087890625, 33.61328125, 35.07568359375, 36.5380859375, 38.00048828125, 39.462890625, 40.92529296875, 42.3876953125, 43.85009765625, 45.3125]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 6.0, 9.0, 11.0, 17.0, 14.0, 20.0, 34.0, 46.0, 63.0, 106.0, 144.0, 214.0, 375.0, 980.0, 4481.0, 3854960.0, 328764.0, 2433.0, 640.0, 304.0, 183.0, 118.0, 90.0, 74.0, 49.0, 37.0, 26.0, 21.0, 15.0, 12.0, 11.0, 3.0, 4.0, 4.0, 4.0, 3.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-168.0, -162.88671875, -157.7734375, -152.66015625, -147.546875, -142.43359375, -137.3203125, -132.20703125, -127.09375, -121.98046875, -116.8671875, -111.75390625, -106.640625, -101.52734375, -96.4140625, -91.30078125, -86.1875, -81.07421875, -75.9609375, -70.84765625, -65.734375, -60.62109375, -55.5078125, -50.39453125, -45.28125, -40.16796875, -35.0546875, -29.94140625, -24.828125, -19.71484375, -14.6015625, -9.48828125, -4.375, 0.73828125, 5.8515625, 10.96484375, 16.078125, 21.19140625, 26.3046875, 31.41796875, 36.53125, 41.64453125, 46.7578125, 51.87109375, 56.984375, 62.09765625, 67.2109375, 72.32421875, 77.4375, 82.55078125, 87.6640625, 92.77734375, 97.890625, 103.00390625, 108.1171875, 113.23046875, 118.34375, 123.45703125, 128.5703125, 133.68359375, 138.796875, 143.91015625, 149.0234375, 154.13671875, 159.25]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 35.0, 328.0, 527.0, 112.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-441.8778991699219, -429.6914978027344, -417.5050964355469, -405.31866455078125, -393.13226318359375, -380.94586181640625, -368.75946044921875, -356.57305908203125, -344.38665771484375, -332.20025634765625, -320.01385498046875, -307.82745361328125, -295.6410217285156, -283.4546203613281, -271.2682189941406, -259.0818176269531, -246.8953857421875, -234.708984375, -222.52256774902344, -210.33616638183594, -198.14974975585938, -185.96334838867188, -173.77694702148438, -161.59054565429688, -149.4041290283203, -137.2177276611328, -125.03131103515625, -112.84490966796875, -100.65850067138672, -88.47209167480469, -76.28569030761719, -64.09928131103516, -51.912872314453125, -39.726463317871094, -27.540058135986328, -15.353652954101562, -3.1672439575195312, 9.0191650390625, 21.20556640625, 33.39197540283203, 45.57838439941406, 57.764793395996094, 69.95120239257812, 82.13760375976562, 94.32401275634766, 106.51042175292969, 118.69682312011719, 130.88323974609375, 143.06964111328125, 155.25604248046875, 167.4424591064453, 179.6288604736328, 191.81527709960938, 204.00167846679688, 216.18807983398438, 228.37448120117188, 240.56089782714844, 252.74729919433594, 264.9337158203125, 277.1201171875, 289.3065185546875, 301.492919921875, 313.6793212890625, 325.8657531738281, 338.0521545410156]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 7.0, 10.0, 12.0, 17.0, 18.0, 20.0, 18.0, 31.0, 27.0, 33.0, 47.0, 44.0, 54.0, 55.0, 60.0, 47.0, 63.0, 52.0, 47.0, 56.0, 33.0, 42.0, 39.0, 32.0, 29.0, 21.0, 19.0, 16.0, 18.0, 10.0, 11.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-126.52395629882812, -122.45703887939453, -118.39012145996094, -114.32319641113281, -110.25627899169922, -106.18936157226562, -102.1224365234375, -98.0555191040039, -93.98860168457031, -89.92168426513672, -85.85476684570312, -81.787841796875, -77.7209243774414, -73.65400695800781, -69.58708190917969, -65.5201644897461, -61.4532470703125, -57.386329650878906, -53.31940841674805, -49.25248718261719, -45.185569763183594, -41.11865234375, -37.05173110961914, -32.98480987548828, -28.917892456054688, -24.85097312927246, -20.784053802490234, -16.717134475708008, -12.650215148925781, -8.583295822143555, -4.516376495361328, -0.44945716857910156, 3.617462158203125, 7.684381484985352, 11.751300811767578, 15.818220138549805, 19.88513946533203, 23.952058792114258, 28.018978118896484, 32.085899353027344, 36.15281677246094, 40.21973419189453, 44.28665542602539, 48.35357666015625, 52.420494079589844, 56.48741149902344, 60.5543327331543, 64.62125396728516, 68.68817138671875, 72.75508880615234, 76.82200622558594, 80.88893127441406, 84.95584869384766, 89.02276611328125, 93.08969116210938, 97.15660858154297, 101.22352600097656, 105.29044342041016, 109.35736083984375, 113.42428588867188, 117.49120330810547, 121.55812072753906, 125.62504577636719, 129.69195556640625, 133.75888061523438]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 4.0, 4.0, 7.0, 5.0, 7.0, 15.0, 12.0, 17.0, 20.0, 27.0, 29.0, 21.0, 26.0, 34.0, 34.0, 38.0, 35.0, 35.0, 45.0, 45.0, 54.0, 48.0, 40.0, 44.0, 36.0, 33.0, 40.0, 31.0, 38.0, 26.0, 28.0, 25.0, 28.0, 19.0, 7.0, 9.0, 8.0, 10.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.734375, -17.1552734375, -16.576171875, -15.9970703125, -15.41796875, -14.8388671875, -14.259765625, -13.6806640625, -13.1015625, -12.5224609375, -11.943359375, -11.3642578125, -10.78515625, -10.2060546875, -9.626953125, -9.0478515625, -8.46875, -7.8896484375, -7.310546875, -6.7314453125, -6.15234375, -5.5732421875, -4.994140625, -4.4150390625, -3.8359375, -3.2568359375, -2.677734375, -2.0986328125, -1.51953125, -0.9404296875, -0.361328125, 0.2177734375, 0.796875, 1.3759765625, 1.955078125, 2.5341796875, 3.11328125, 3.6923828125, 4.271484375, 4.8505859375, 5.4296875, 6.0087890625, 6.587890625, 7.1669921875, 7.74609375, 8.3251953125, 8.904296875, 9.4833984375, 10.0625, 10.6416015625, 11.220703125, 11.7998046875, 12.37890625, 12.9580078125, 13.537109375, 14.1162109375, 14.6953125, 15.2744140625, 15.853515625, 16.4326171875, 17.01171875, 17.5908203125, 18.169921875, 18.7490234375, 19.328125]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 7.0, 9.0, 16.0, 34.0, 53.0, 57.0, 66.0, 107.0, 180.0, 281.0, 395.0, 577.0, 809.0, 1235.0, 1896.0, 2802.0, 4397.0, 6613.0, 10346.0, 16264.0, 25805.0, 41750.0, 69968.0, 130622.0, 335628.0, 177368.0, 86210.0, 50163.0, 30590.0, 19288.0, 12004.0, 7965.0, 5133.0, 3271.0, 2235.0, 1455.0, 921.0, 659.0, 470.0, 293.0, 183.0, 123.0, 84.0, 71.0, 48.0, 30.0, 24.0, 17.0, 10.0, 7.0, 6.0, 3.0, 3.0, 1.0, 2.0, 2.0, 1.0], "bins": [-3.806640625, -3.686492919921875, -3.56634521484375, -3.446197509765625, -3.3260498046875, -3.205902099609375, -3.08575439453125, -2.965606689453125, -2.845458984375, -2.725311279296875, -2.60516357421875, -2.485015869140625, -2.3648681640625, -2.244720458984375, -2.12457275390625, -2.004425048828125, -1.88427734375, -1.764129638671875, -1.64398193359375, -1.523834228515625, -1.4036865234375, -1.283538818359375, -1.16339111328125, -1.043243408203125, -0.923095703125, -0.802947998046875, -0.68280029296875, -0.562652587890625, -0.4425048828125, -0.322357177734375, -0.20220947265625, -0.082061767578125, 0.0380859375, 0.158233642578125, 0.27838134765625, 0.398529052734375, 0.5186767578125, 0.638824462890625, 0.75897216796875, 0.879119873046875, 0.999267578125, 1.119415283203125, 1.23956298828125, 1.359710693359375, 1.4798583984375, 1.600006103515625, 1.72015380859375, 1.840301513671875, 1.96044921875, 2.080596923828125, 2.20074462890625, 2.320892333984375, 2.4410400390625, 2.561187744140625, 2.68133544921875, 2.801483154296875, 2.921630859375, 3.041778564453125, 3.16192626953125, 3.282073974609375, 3.4022216796875, 3.522369384765625, 3.64251708984375, 3.762664794921875, 3.8828125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 4.0, 0.0, 3.0, 8.0, 9.0, 11.0, 9.0, 11.0, 12.0, 13.0, 23.0, 25.0, 25.0, 21.0, 24.0, 31.0, 32.0, 36.0, 32.0, 40.0, 46.0, 32.0, 40.0, 49.0, 1054.0, 26.0, 31.0, 43.0, 37.0, 37.0, 30.0, 26.0, 29.0, 28.0, 22.0, 17.0, 24.0, 17.0, 14.0, 16.0, 9.0, 4.0, 9.0, 6.0, 9.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.0234375, -10.703369140625, -10.38330078125, -10.063232421875, -9.7431640625, -9.423095703125, -9.10302734375, -8.782958984375, -8.462890625, -8.142822265625, -7.82275390625, -7.502685546875, -7.1826171875, -6.862548828125, -6.54248046875, -6.222412109375, -5.90234375, -5.582275390625, -5.26220703125, -4.942138671875, -4.6220703125, -4.302001953125, -3.98193359375, -3.661865234375, -3.341796875, -3.021728515625, -2.70166015625, -2.381591796875, -2.0615234375, -1.741455078125, -1.42138671875, -1.101318359375, -0.78125, -0.461181640625, -0.14111328125, 0.178955078125, 0.4990234375, 0.819091796875, 1.13916015625, 1.459228515625, 1.779296875, 2.099365234375, 2.41943359375, 2.739501953125, 3.0595703125, 3.379638671875, 3.69970703125, 4.019775390625, 4.33984375, 4.659912109375, 4.97998046875, 5.300048828125, 5.6201171875, 5.940185546875, 6.26025390625, 6.580322265625, 6.900390625, 7.220458984375, 7.54052734375, 7.860595703125, 8.1806640625, 8.500732421875, 8.82080078125, 9.140869140625, 9.4609375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 5.0, 10.0, 10.0, 19.0, 26.0, 31.0, 57.0, 101.0, 156.0, 194.0, 312.0, 510.0, 722.0, 986.0, 1465.0, 2238.0, 3199.0, 4627.0, 6684.0, 9771.0, 14363.0, 21221.0, 31597.0, 49082.0, 79216.0, 139455.0, 1325552.0, 158896.0, 87574.0, 53525.0, 34247.0, 22724.0, 15283.0, 10495.0, 7023.0, 4975.0, 3414.0, 2366.0, 1566.0, 1131.0, 763.0, 481.0, 357.0, 263.0, 137.0, 94.0, 72.0, 55.0, 28.0, 18.0, 12.0, 17.0, 5.0, 6.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-2.876953125, -2.779754638671875, -2.68255615234375, -2.585357666015625, -2.4881591796875, -2.390960693359375, -2.29376220703125, -2.196563720703125, -2.099365234375, -2.002166748046875, -1.90496826171875, -1.807769775390625, -1.7105712890625, -1.613372802734375, -1.51617431640625, -1.418975830078125, -1.32177734375, -1.224578857421875, -1.12738037109375, -1.030181884765625, -0.9329833984375, -0.835784912109375, -0.73858642578125, -0.641387939453125, -0.544189453125, -0.446990966796875, -0.34979248046875, -0.252593994140625, -0.1553955078125, -0.058197021484375, 0.03900146484375, 0.136199951171875, 0.2333984375, 0.330596923828125, 0.42779541015625, 0.524993896484375, 0.6221923828125, 0.719390869140625, 0.81658935546875, 0.913787841796875, 1.010986328125, 1.108184814453125, 1.20538330078125, 1.302581787109375, 1.3997802734375, 1.496978759765625, 1.59417724609375, 1.691375732421875, 1.78857421875, 1.885772705078125, 1.98297119140625, 2.080169677734375, 2.1773681640625, 2.274566650390625, 2.37176513671875, 2.468963623046875, 2.566162109375, 2.663360595703125, 2.76055908203125, 2.857757568359375, 2.9549560546875, 3.052154541015625, 3.14935302734375, 3.246551513671875, 3.34375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 2.0, 3.0, 0.0, 3.0, 8.0, 5.0, 6.0, 9.0, 13.0, 19.0, 35.0, 28.0, 32.0, 53.0, 72.0, 76.0, 97.0, 117.0, 84.0, 80.0, 68.0, 36.0, 29.0, 30.0, 17.0, 20.0, 12.0, 7.0, 11.0, 7.0, 4.0, 4.0, 8.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0022182464599609375, -0.0021470189094543457, -0.002075791358947754, -0.002004563808441162, -0.0019333362579345703, -0.0018621087074279785, -0.0017908811569213867, -0.001719653606414795, -0.0016484260559082031, -0.0015771985054016113, -0.0015059709548950195, -0.0014347434043884277, -0.001363515853881836, -0.0012922883033752441, -0.0012210607528686523, -0.0011498332023620605, -0.0010786056518554688, -0.001007378101348877, -0.0009361505508422852, -0.0008649230003356934, -0.0007936954498291016, -0.0007224678993225098, -0.000651240348815918, -0.0005800127983093262, -0.0005087852478027344, -0.0004375576972961426, -0.0003663301467895508, -0.000295102596282959, -0.0002238750457763672, -0.0001526474952697754, -8.14199447631836e-05, -1.0192394256591797e-05, 6.103515625e-05, 0.0001322627067565918, 0.0002034902572631836, 0.0002747178077697754, 0.0003459453582763672, 0.000417172908782959, 0.0004884004592895508, 0.0005596280097961426, 0.0006308555603027344, 0.0007020831108093262, 0.000773310661315918, 0.0008445382118225098, 0.0009157657623291016, 0.0009869933128356934, 0.0010582208633422852, 0.001129448413848877, 0.0012006759643554688, 0.0012719035148620605, 0.0013431310653686523, 0.0014143586158752441, 0.001485586166381836, 0.0015568137168884277, 0.0016280412673950195, 0.0016992688179016113, 0.0017704963684082031, 0.001841723918914795, 0.0019129514694213867, 0.0019841790199279785, 0.0020554065704345703, 0.002126634120941162, 0.002197861671447754, 0.0022690892219543457, 0.0023403167724609375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 4.0, 10.0, 7.0, 14.0, 15.0, 14.0, 14.0, 17.0, 40.0, 47.0, 52.0, 86.0, 126.0, 208.0, 413.0, 924.0, 51404.0, 992102.0, 1744.0, 545.0, 255.0, 153.0, 97.0, 63.0, 35.0, 31.0, 30.0, 26.0, 15.0, 10.0, 6.0, 10.0, 2.0, 6.0, 4.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.047821044921875, -0.04633617401123047, -0.04485130310058594, -0.043366432189941406, -0.041881561279296875, -0.040396690368652344, -0.03891181945800781, -0.03742694854736328, -0.03594207763671875, -0.03445720672607422, -0.03297233581542969, -0.031487464904785156, -0.030002593994140625, -0.028517723083496094, -0.027032852172851562, -0.02554798126220703, -0.0240631103515625, -0.02257823944091797, -0.021093368530273438, -0.019608497619628906, -0.018123626708984375, -0.016638755798339844, -0.015153884887695312, -0.013669013977050781, -0.01218414306640625, -0.010699272155761719, -0.009214401245117188, -0.007729530334472656, -0.006244659423828125, -0.004759788513183594, -0.0032749176025390625, -0.0017900466918945312, -0.00030517578125, 0.0011796951293945312, 0.0026645660400390625, 0.004149436950683594, 0.005634307861328125, 0.007119178771972656, 0.008604049682617188, 0.010088920593261719, 0.01157379150390625, 0.013058662414550781, 0.014543533325195312, 0.016028404235839844, 0.017513275146484375, 0.018998146057128906, 0.020483016967773438, 0.02196788787841797, 0.0234527587890625, 0.02493762969970703, 0.026422500610351562, 0.027907371520996094, 0.029392242431640625, 0.030877113342285156, 0.03236198425292969, 0.03384685516357422, 0.03533172607421875, 0.03681659698486328, 0.03830146789550781, 0.039786338806152344, 0.041271209716796875, 0.042756080627441406, 0.04424095153808594, 0.04572582244873047, 0.047210693359375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 11.0, 54.0, 211.0, 391.0, 247.0, 83.0, 10.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005578490439802408, -0.005470382981002331, -0.005362275522202253, -0.005254167597740889, -0.005146060138940811, -0.005037952680140734, -0.004929845221340656, -0.004821737762540579, -0.004713630303740501, -0.004605522844940424, -0.0044974153861403465, -0.004389307461678982, -0.004281200002878904, -0.004173092544078827, -0.0040649850852787495, -0.003956877626478672, -0.0038487697020173073, -0.00374066224321723, -0.0036325545515865088, -0.0035244470927864313, -0.0034163394011557102, -0.0033082319423556328, -0.0032001244835555553, -0.003092017024755478, -0.002983909333124757, -0.0028758018743246794, -0.0027676941826939583, -0.002659586723893881, -0.0025514792650938034, -0.0024433715734630823, -0.002335264114663005, -0.0022271564230322838, -0.0021190489642322063, -0.002010941505432129, -0.0019028338138014078, -0.0017947263550013304, -0.0016866187797859311, -0.0015785112045705318, -0.0014704037457704544, -0.0013622961705550551, -0.001254188478924334, -0.0011460809037089348, -0.0010379734449088573, -0.0009298658696934581, -0.0008217582944780588, -0.0007136507192626595, -0.0006055432022549212, -0.0004974356852471828, -0.0003893281100317836, -0.00028122056392021477, -0.00017311301780864596, -6.500547169707716e-05, 4.3102074414491653e-05, 0.00015120964962989092, 0.00025931716663762927, 0.0003674246836453676, 0.0004755322588607669, 0.0005836398340761662, 0.0006917473510839045, 0.0007998548680916429, 0.0009079624433070421, 0.0010160700185224414, 0.0011241775937378407, 0.001232285052537918, 0.0013403926277533174]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 4.0, 1.0, 7.0, 2.0, 8.0, 7.0, 8.0, 12.0, 10.0, 11.0, 13.0, 15.0, 29.0, 30.0, 25.0, 28.0, 26.0, 42.0, 39.0, 34.0, 40.0, 37.0, 40.0, 47.0, 47.0, 50.0, 39.0, 36.0, 22.0, 31.0, 32.0, 34.0, 28.0, 20.0, 25.0, 24.0, 15.0, 14.0, 14.0, 11.0, 17.0, 7.0, 7.0, 8.0, 3.0, 9.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0008451342582702637, -0.0008164467290043831, -0.0007877591997385025, -0.0007590716704726219, -0.0007303841412067413, -0.0007016966119408607, -0.0006730090826749802, -0.0006443215534090996, -0.000615634024143219, -0.0005869464948773384, -0.0005582589656114578, -0.0005295714363455772, -0.0005008839070796967, -0.00047219637781381607, -0.0004435088485479355, -0.0004148213192820549, -0.0003861337900161743, -0.00035744626075029373, -0.00032875873148441315, -0.00030007120221853256, -0.000271383672952652, -0.0002426961436867714, -0.0002140086144208908, -0.00018532108515501022, -0.00015663355588912964, -0.00012794602662324905, -9.925849735736847e-05, -7.057096809148788e-05, -4.18834388256073e-05, -1.3195909559726715e-05, 1.549161970615387e-05, 4.4179148972034454e-05, 7.286667823791504e-05, 0.00010155420750379562, 0.0001302417367696762, 0.0001589292660355568, 0.00018761679530143738, 0.00021630432456731796, 0.00024499185383319855, 0.00027367938309907913, 0.0003023669123649597, 0.0003310544416308403, 0.0003597419708967209, 0.00038842950016260147, 0.00041711702942848206, 0.00044580455869436264, 0.0004744920879602432, 0.0005031796172261238, 0.0005318671464920044, 0.000560554675757885, 0.0005892422050237656, 0.0006179297342896461, 0.0006466172635555267, 0.0006753047928214073, 0.0007039923220872879, 0.0007326798513531685, 0.0007613673806190491, 0.0007900549098849297, 0.0008187424391508102, 0.0008474299684166908, 0.0008761174976825714, 0.000904805026948452, 0.0009334925562143326, 0.0009621800854802132, 0.0009908676147460938]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 10.0, 4.0, 4.0, 7.0, 5.0, 7.0, 15.0, 12.0, 17.0, 20.0, 27.0, 29.0, 21.0, 26.0, 34.0, 34.0, 38.0, 35.0, 35.0, 46.0, 44.0, 54.0, 48.0, 40.0, 44.0, 36.0, 33.0, 40.0, 31.0, 38.0, 26.0, 28.0, 25.0, 28.0, 19.0, 7.0, 9.0, 8.0, 10.0, 4.0, 5.0, 3.0, 1.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-17.734375, -17.1552734375, -16.576171875, -15.9970703125, -15.41796875, -14.8388671875, -14.259765625, -13.6806640625, -13.1015625, -12.5224609375, -11.943359375, -11.3642578125, -10.78515625, -10.2060546875, -9.626953125, -9.0478515625, -8.46875, -7.8896484375, -7.310546875, -6.7314453125, -6.15234375, -5.5732421875, -4.994140625, -4.4150390625, -3.8359375, -3.2568359375, -2.677734375, -2.0986328125, -1.51953125, -0.9404296875, -0.361328125, 0.2177734375, 0.796875, 1.3759765625, 1.955078125, 2.5341796875, 3.11328125, 3.6923828125, 4.271484375, 4.8505859375, 5.4296875, 6.0087890625, 6.587890625, 7.1669921875, 7.74609375, 8.3251953125, 8.904296875, 9.4833984375, 10.0625, 10.6416015625, 11.220703125, 11.7998046875, 12.37890625, 12.9580078125, 13.537109375, 14.1162109375, 14.6953125, 15.2744140625, 15.853515625, 16.4326171875, 17.01171875, 17.5908203125, 18.169921875, 18.7490234375, 19.328125]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 9.0, 5.0, 6.0, 16.0, 18.0, 26.0, 24.0, 37.0, 44.0, 69.0, 86.0, 104.0, 144.0, 182.0, 332.0, 662.0, 1579.0, 4449.0, 15261.0, 60801.0, 268870.0, 513162.0, 136456.0, 32337.0, 8686.0, 2797.0, 972.0, 492.0, 272.0, 171.0, 120.0, 103.0, 63.0, 47.0, 47.0, 26.0, 11.0, 18.0, 19.0, 10.0, 8.0, 4.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-22.625, -21.877685546875, -21.13037109375, -20.383056640625, -19.6357421875, -18.888427734375, -18.14111328125, -17.393798828125, -16.646484375, -15.899169921875, -15.15185546875, -14.404541015625, -13.6572265625, -12.909912109375, -12.16259765625, -11.415283203125, -10.66796875, -9.920654296875, -9.17333984375, -8.426025390625, -7.6787109375, -6.931396484375, -6.18408203125, -5.436767578125, -4.689453125, -3.942138671875, -3.19482421875, -2.447509765625, -1.7001953125, -0.952880859375, -0.20556640625, 0.541748046875, 1.2890625, 2.036376953125, 2.78369140625, 3.531005859375, 4.2783203125, 5.025634765625, 5.77294921875, 6.520263671875, 7.267578125, 8.014892578125, 8.76220703125, 9.509521484375, 10.2568359375, 11.004150390625, 11.75146484375, 12.498779296875, 13.24609375, 13.993408203125, 14.74072265625, 15.488037109375, 16.2353515625, 16.982666015625, 17.72998046875, 18.477294921875, 19.224609375, 19.971923828125, 20.71923828125, 21.466552734375, 22.2138671875, 22.961181640625, 23.70849609375, 24.455810546875, 25.203125]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 3.0, 3.0, 6.0, 11.0, 6.0, 7.0, 11.0, 10.0, 15.0, 19.0, 20.0, 23.0, 27.0, 29.0, 33.0, 35.0, 29.0, 36.0, 52.0, 63.0, 84.0, 142.0, 1516.0, 276.0, 94.0, 66.0, 51.0, 52.0, 40.0, 47.0, 34.0, 38.0, 30.0, 32.0, 20.0, 24.0, 11.0, 7.0, 15.0, 7.0, 8.0, 5.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-40.375, -38.87060546875, -37.3662109375, -35.86181640625, -34.357421875, -32.85302734375, -31.3486328125, -29.84423828125, -28.33984375, -26.83544921875, -25.3310546875, -23.82666015625, -22.322265625, -20.81787109375, -19.3134765625, -17.80908203125, -16.3046875, -14.80029296875, -13.2958984375, -11.79150390625, -10.287109375, -8.78271484375, -7.2783203125, -5.77392578125, -4.26953125, -2.76513671875, -1.2607421875, 0.24365234375, 1.748046875, 3.25244140625, 4.7568359375, 6.26123046875, 7.765625, 9.27001953125, 10.7744140625, 12.27880859375, 13.783203125, 15.28759765625, 16.7919921875, 18.29638671875, 19.80078125, 21.30517578125, 22.8095703125, 24.31396484375, 25.818359375, 27.32275390625, 28.8271484375, 30.33154296875, 31.8359375, 33.34033203125, 34.8447265625, 36.34912109375, 37.853515625, 39.35791015625, 40.8623046875, 42.36669921875, 43.87109375, 45.37548828125, 46.8798828125, 48.38427734375, 49.888671875, 51.39306640625, 52.8974609375, 54.40185546875, 55.90625]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 10.0, 4.0, 12.0, 7.0, 22.0, 15.0, 36.0, 48.0, 67.0, 91.0, 176.0, 251.0, 396.0, 966.0, 5474.0, 1763107.0, 1367822.0, 5187.0, 941.0, 367.0, 244.0, 148.0, 90.0, 72.0, 52.0, 25.0, 30.0, 18.0, 15.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-84.5625, -81.4296875, -78.296875, -75.1640625, -72.03125, -68.8984375, -65.765625, -62.6328125, -59.5, -56.3671875, -53.234375, -50.1015625, -46.96875, -43.8359375, -40.703125, -37.5703125, -34.4375, -31.3046875, -28.171875, -25.0390625, -21.90625, -18.7734375, -15.640625, -12.5078125, -9.375, -6.2421875, -3.109375, 0.0234375, 3.15625, 6.2890625, 9.421875, 12.5546875, 15.6875, 18.8203125, 21.953125, 25.0859375, 28.21875, 31.3515625, 34.484375, 37.6171875, 40.75, 43.8828125, 47.015625, 50.1484375, 53.28125, 56.4140625, 59.546875, 62.6796875, 65.8125, 68.9453125, 72.078125, 75.2109375, 78.34375, 81.4765625, 84.609375, 87.7421875, 90.875, 94.0078125, 97.140625, 100.2734375, 103.40625, 106.5390625, 109.671875, 112.8046875, 115.9375]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 35.0, 247.0, 516.0, 178.0, 34.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-154.77093505859375, -148.67889404296875, -142.58685302734375, -136.49481201171875, -130.40277099609375, -124.31072998046875, -118.21868896484375, -112.12664794921875, -106.03460693359375, -99.94256591796875, -93.85052490234375, -87.75848388671875, -81.66644287109375, -75.57440185546875, -69.48236083984375, -63.39031982421875, -57.29827880859375, -51.20623779296875, -45.11419677734375, -39.02215576171875, -32.93011474609375, -26.83807373046875, -20.74603271484375, -14.65399169921875, -8.56195068359375, -2.46990966796875, 3.62213134765625, 9.71417236328125, 15.80621337890625, 21.89825439453125, 27.99029541015625, 34.08233642578125, 40.17436218261719, 46.26640319824219, 52.35844421386719, 58.45048522949219, 64.54252624511719, 70.63456726074219, 76.72660827636719, 82.81864929199219, 88.91069030761719, 95.00273132324219, 101.09477233886719, 107.18681335449219, 113.27885437011719, 119.37089538574219, 125.46293640136719, 131.5549774169922, 137.6470184326172, 143.7390594482422, 149.8311004638672, 155.9231414794922, 162.0151824951172, 168.1072235107422, 174.1992645263672, 180.2913055419922, 186.3833465576172, 192.4753875732422, 198.5674285888672, 204.6594696044922, 210.7515106201172, 216.8435516357422, 222.9355926513672, 229.0276336669922, 235.1196746826172]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 5.0, 3.0, 5.0, 9.0, 12.0, 11.0, 7.0, 14.0, 19.0, 19.0, 20.0, 23.0, 28.0, 33.0, 27.0, 35.0, 37.0, 45.0, 50.0, 54.0, 33.0, 44.0, 42.0, 45.0, 39.0, 45.0, 27.0, 35.0, 30.0, 26.0, 38.0, 30.0, 17.0, 29.0, 15.0, 7.0, 15.0, 12.0, 6.0, 3.0, 1.0, 4.0, 4.0, 1.0, 2.0, 4.0, 2.0, 3.0], "bins": [-147.73855590820312, -143.81414794921875, -139.8897247314453, -135.96531677246094, -132.04090881347656, -128.11648559570312, -124.19207763671875, -120.26766204833984, -116.34324645996094, -112.41883087158203, -108.49442291259766, -104.57000732421875, -100.64559173583984, -96.72117614746094, -92.79676818847656, -88.87235260009766, -84.94794464111328, -81.02352905273438, -77.09912109375, -73.1747055053711, -69.25028991699219, -65.32588195800781, -61.401466369628906, -57.47705078125, -53.55263900756836, -49.62822723388672, -45.70381164550781, -41.77939987182617, -37.85498809814453, -33.930572509765625, -30.006160736083984, -26.08174705505371, -22.157333374023438, -18.232919692993164, -14.308506965637207, -10.38409423828125, -6.459680557250977, -2.535266876220703, 1.3891448974609375, 5.313558578491211, 9.237972259521484, 13.162385940551758, 17.08679962158203, 21.011211395263672, 24.935625076293945, 28.86003875732422, 32.78445053100586, 36.7088623046875, 40.633277893066406, 44.55768966674805, 48.48210525512695, 52.406517028808594, 56.3309326171875, 60.25534439086914, 64.17975616455078, 68.10417175292969, 72.02857971191406, 75.95299530029297, 79.87740325927734, 83.80181884765625, 87.72623443603516, 91.65065002441406, 95.57505798339844, 99.49947357177734, 103.42388916015625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 8.0, 4.0, 7.0, 8.0, 6.0, 15.0, 9.0, 20.0, 25.0, 24.0, 31.0, 20.0, 24.0, 18.0, 39.0, 36.0, 27.0, 48.0, 33.0, 48.0, 48.0, 41.0, 48.0, 31.0, 41.0, 31.0, 39.0, 29.0, 31.0, 23.0, 32.0, 35.0, 26.0, 15.0, 22.0, 10.0, 11.0, 9.0, 5.0, 7.0, 6.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.21875, -15.6591796875, -15.099609375, -14.5400390625, -13.98046875, -13.4208984375, -12.861328125, -12.3017578125, -11.7421875, -11.1826171875, -10.623046875, -10.0634765625, -9.50390625, -8.9443359375, -8.384765625, -7.8251953125, -7.265625, -6.7060546875, -6.146484375, -5.5869140625, -5.02734375, -4.4677734375, -3.908203125, -3.3486328125, -2.7890625, -2.2294921875, -1.669921875, -1.1103515625, -0.55078125, 0.0087890625, 0.568359375, 1.1279296875, 1.6875, 2.2470703125, 2.806640625, 3.3662109375, 3.92578125, 4.4853515625, 5.044921875, 5.6044921875, 6.1640625, 6.7236328125, 7.283203125, 7.8427734375, 8.40234375, 8.9619140625, 9.521484375, 10.0810546875, 10.640625, 11.2001953125, 11.759765625, 12.3193359375, 12.87890625, 13.4384765625, 13.998046875, 14.5576171875, 15.1171875, 15.6767578125, 16.236328125, 16.7958984375, 17.35546875, 17.9150390625, 18.474609375, 19.0341796875, 19.59375]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 3.0, 5.0, 6.0, 12.0, 13.0, 7.0, 7.0, 8.0, 14.0, 17.0, 20.0, 22.0, 35.0, 28.0, 25.0, 38.0, 69.0, 75.0, 156.0, 373.0, 990.0, 5401.0, 517172.0, 3588280.0, 77582.0, 2519.0, 624.0, 264.0, 136.0, 81.0, 53.0, 40.0, 37.0, 28.0, 27.0, 20.0, 9.0, 8.0, 13.0, 14.0, 7.0, 11.0, 6.0, 6.0, 7.0, 5.0, 2.0, 4.0, 4.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-70.3125, -68.1376953125, -65.962890625, -63.7880859375, -61.61328125, -59.4384765625, -57.263671875, -55.0888671875, -52.9140625, -50.7392578125, -48.564453125, -46.3896484375, -44.21484375, -42.0400390625, -39.865234375, -37.6904296875, -35.515625, -33.3408203125, -31.166015625, -28.9912109375, -26.81640625, -24.6416015625, -22.466796875, -20.2919921875, -18.1171875, -15.9423828125, -13.767578125, -11.5927734375, -9.41796875, -7.2431640625, -5.068359375, -2.8935546875, -0.71875, 1.4560546875, 3.630859375, 5.8056640625, 7.98046875, 10.1552734375, 12.330078125, 14.5048828125, 16.6796875, 18.8544921875, 21.029296875, 23.2041015625, 25.37890625, 27.5537109375, 29.728515625, 31.9033203125, 34.078125, 36.2529296875, 38.427734375, 40.6025390625, 42.77734375, 44.9521484375, 47.126953125, 49.3017578125, 51.4765625, 53.6513671875, 55.826171875, 58.0009765625, 60.17578125, 62.3505859375, 64.525390625, 66.7001953125, 68.875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 1.0, 4.0, 3.0, 11.0, 12.0, 16.0, 30.0, 51.0, 77.0, 140.0, 251.0, 432.0, 608.0, 769.0, 645.0, 419.0, 224.0, 163.0, 69.0, 48.0, 33.0, 27.0, 11.0, 6.0, 6.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-31.578125, -30.504638671875, -29.43115234375, -28.357666015625, -27.2841796875, -26.210693359375, -25.13720703125, -24.063720703125, -22.990234375, -21.916748046875, -20.84326171875, -19.769775390625, -18.6962890625, -17.622802734375, -16.54931640625, -15.475830078125, -14.40234375, -13.328857421875, -12.25537109375, -11.181884765625, -10.1083984375, -9.034912109375, -7.96142578125, -6.887939453125, -5.814453125, -4.740966796875, -3.66748046875, -2.593994140625, -1.5205078125, -0.447021484375, 0.62646484375, 1.699951171875, 2.7734375, 3.846923828125, 4.92041015625, 5.993896484375, 7.0673828125, 8.140869140625, 9.21435546875, 10.287841796875, 11.361328125, 12.434814453125, 13.50830078125, 14.581787109375, 15.6552734375, 16.728759765625, 17.80224609375, 18.875732421875, 19.94921875, 21.022705078125, 22.09619140625, 23.169677734375, 24.2431640625, 25.316650390625, 26.39013671875, 27.463623046875, 28.537109375, 29.610595703125, 30.68408203125, 31.757568359375, 32.8310546875, 33.904541015625, 34.97802734375, 36.051513671875, 37.125]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 5.0, 5.0, 6.0, 8.0, 8.0, 16.0, 12.0, 12.0, 33.0, 43.0, 57.0, 78.0, 136.0, 276.0, 627.0, 1672.0, 12946.0, 1607111.0, 2551085.0, 16972.0, 1752.0, 638.0, 329.0, 162.0, 91.0, 40.0, 31.0, 31.0, 21.0, 16.0, 14.0, 11.0, 5.0, 6.0, 7.0, 6.0, 4.0, 6.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-73.0, -70.396484375, -67.79296875, -65.189453125, -62.5859375, -59.982421875, -57.37890625, -54.775390625, -52.171875, -49.568359375, -46.96484375, -44.361328125, -41.7578125, -39.154296875, -36.55078125, -33.947265625, -31.34375, -28.740234375, -26.13671875, -23.533203125, -20.9296875, -18.326171875, -15.72265625, -13.119140625, -10.515625, -7.912109375, -5.30859375, -2.705078125, -0.1015625, 2.501953125, 5.10546875, 7.708984375, 10.3125, 12.916015625, 15.51953125, 18.123046875, 20.7265625, 23.330078125, 25.93359375, 28.537109375, 31.140625, 33.744140625, 36.34765625, 38.951171875, 41.5546875, 44.158203125, 46.76171875, 49.365234375, 51.96875, 54.572265625, 57.17578125, 59.779296875, 62.3828125, 64.986328125, 67.58984375, 70.193359375, 72.796875, 75.400390625, 78.00390625, 80.607421875, 83.2109375, 85.814453125, 88.41796875, 91.021484375, 93.625]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 17.0, 338.0, 602.0, 56.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-723.6837158203125, -708.3331909179688, -692.9826049804688, -677.632080078125, -662.281494140625, -646.9309692382812, -631.5804443359375, -616.2298583984375, -600.8793334960938, -585.52880859375, -570.17822265625, -554.8276977539062, -539.4771118164062, -524.1265869140625, -508.7760314941406, -493.42547607421875, -478.0749206542969, -462.724365234375, -447.3738098144531, -432.02325439453125, -416.6727294921875, -401.3221740722656, -385.97161865234375, -370.6210632324219, -355.2705078125, -339.9199523925781, -324.56939697265625, -309.2188720703125, -293.8683166503906, -278.51776123046875, -263.1672058105469, -247.816650390625, -232.46615600585938, -217.1156005859375, -201.7650604248047, -186.4145050048828, -171.06396484375, -155.71340942382812, -140.36285400390625, -125.0123062133789, -109.66175842285156, -94.31121063232422, -78.96066284179688, -63.610107421875, -48.259559631347656, -32.90901184082031, -17.558456420898438, -2.2079086303710938, 13.14263916015625, 28.493188858032227, 43.8437385559082, 59.19429016113281, 74.54483795166016, 89.8953857421875, 105.24594116210938, 120.59648895263672, 135.94703674316406, 151.29759216308594, 166.64813232421875, 181.99868774414062, 197.3492431640625, 212.6997833251953, 228.0503387451172, 243.40087890625, 258.7514343261719]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 4.0, 9.0, 8.0, 7.0, 6.0, 10.0, 8.0, 12.0, 11.0, 21.0, 23.0, 26.0, 35.0, 36.0, 41.0, 46.0, 42.0, 40.0, 52.0, 41.0, 39.0, 42.0, 36.0, 48.0, 40.0, 36.0, 40.0, 41.0, 30.0, 23.0, 30.0, 24.0, 19.0, 18.0, 12.0, 12.0, 12.0, 6.0, 4.0, 6.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-80.699951171875, -77.84577941894531, -74.9916000366211, -72.13742065429688, -69.28324890136719, -66.4290771484375, -63.57489776611328, -60.72072219848633, -57.866546630859375, -55.01237106323242, -52.15819549560547, -49.304019927978516, -46.44984436035156, -43.59566879272461, -40.741493225097656, -37.8873176574707, -35.03314208984375, -32.1789665222168, -29.324790954589844, -26.47061538696289, -23.616439819335938, -20.762264251708984, -17.90808868408203, -15.053913116455078, -12.199737548828125, -9.345561981201172, -6.491386413574219, -3.6372108459472656, -0.7830352783203125, 2.0711402893066406, 4.925315856933594, 7.779491424560547, 10.633659362792969, 13.487834930419922, 16.342010498046875, 19.196186065673828, 22.05036163330078, 24.904537200927734, 27.758712768554688, 30.61288833618164, 33.467063903808594, 36.32123947143555, 39.1754150390625, 42.02959060668945, 44.883766174316406, 47.73794174194336, 50.59211730957031, 53.446292877197266, 56.30046844482422, 59.15464401245117, 62.008819580078125, 64.86299133300781, 67.71717071533203, 70.57135009765625, 73.42552185058594, 76.27969360351562, 79.13387298583984, 81.98805236816406, 84.84222412109375, 87.69639587402344, 90.55057525634766, 93.40475463867188, 96.25892639160156, 99.11309814453125, 101.96727752685547]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 2.0, 5.0, 10.0, 3.0, 17.0, 9.0, 20.0, 31.0, 13.0, 14.0, 35.0, 31.0, 34.0, 42.0, 39.0, 33.0, 45.0, 45.0, 49.0, 58.0, 38.0, 63.0, 36.0, 39.0, 35.0, 34.0, 40.0, 37.0, 20.0, 19.0, 20.0, 20.0, 15.0, 13.0, 13.0, 8.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.78125, -17.147705078125, -16.51416015625, -15.880615234375, -15.2470703125, -14.613525390625, -13.97998046875, -13.346435546875, -12.712890625, -12.079345703125, -11.44580078125, -10.812255859375, -10.1787109375, -9.545166015625, -8.91162109375, -8.278076171875, -7.64453125, -7.010986328125, -6.37744140625, -5.743896484375, -5.1103515625, -4.476806640625, -3.84326171875, -3.209716796875, -2.576171875, -1.942626953125, -1.30908203125, -0.675537109375, -0.0419921875, 0.591552734375, 1.22509765625, 1.858642578125, 2.4921875, 3.125732421875, 3.75927734375, 4.392822265625, 5.0263671875, 5.659912109375, 6.29345703125, 6.927001953125, 7.560546875, 8.194091796875, 8.82763671875, 9.461181640625, 10.0947265625, 10.728271484375, 11.36181640625, 11.995361328125, 12.62890625, 13.262451171875, 13.89599609375, 14.529541015625, 15.1630859375, 15.796630859375, 16.43017578125, 17.063720703125, 17.697265625, 18.330810546875, 18.96435546875, 19.597900390625, 20.2314453125, 20.864990234375, 21.49853515625, 22.132080078125, 22.765625]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 8.0, 15.0, 17.0, 23.0, 45.0, 67.0, 90.0, 159.0, 282.0, 463.0, 815.0, 1241.0, 2170.0, 3626.0, 6176.0, 10383.0, 17473.0, 30151.0, 52710.0, 96977.0, 241584.0, 332035.0, 111762.0, 59069.0, 33553.0, 19291.0, 11532.0, 6840.0, 4046.0, 2289.0, 1435.0, 848.0, 510.0, 334.0, 187.0, 140.0, 80.0, 33.0, 43.0, 15.0, 16.0, 7.0, 4.0, 4.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.73046875, -4.57330322265625, -4.4161376953125, -4.25897216796875, -4.101806640625, -3.94464111328125, -3.7874755859375, -3.63031005859375, -3.47314453125, -3.31597900390625, -3.1588134765625, -3.00164794921875, -2.844482421875, -2.68731689453125, -2.5301513671875, -2.37298583984375, -2.2158203125, -2.05865478515625, -1.9014892578125, -1.74432373046875, -1.587158203125, -1.42999267578125, -1.2728271484375, -1.11566162109375, -0.95849609375, -0.80133056640625, -0.6441650390625, -0.48699951171875, -0.329833984375, -0.17266845703125, -0.0155029296875, 0.14166259765625, 0.298828125, 0.45599365234375, 0.6131591796875, 0.77032470703125, 0.927490234375, 1.08465576171875, 1.2418212890625, 1.39898681640625, 1.55615234375, 1.71331787109375, 1.8704833984375, 2.02764892578125, 2.184814453125, 2.34197998046875, 2.4991455078125, 2.65631103515625, 2.8134765625, 2.97064208984375, 3.1278076171875, 3.28497314453125, 3.442138671875, 3.59930419921875, 3.7564697265625, 3.91363525390625, 4.07080078125, 4.22796630859375, 4.3851318359375, 4.54229736328125, 4.699462890625, 4.85662841796875, 5.0137939453125, 5.17095947265625, 5.328125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 7.0, 2.0, 4.0, 4.0, 9.0, 10.0, 9.0, 6.0, 8.0, 7.0, 19.0, 13.0, 21.0, 12.0, 31.0, 25.0, 21.0, 40.0, 29.0, 23.0, 32.0, 31.0, 32.0, 37.0, 46.0, 1068.0, 38.0, 31.0, 37.0, 34.0, 33.0, 47.0, 29.0, 41.0, 23.0, 28.0, 23.0, 21.0, 18.0, 11.0, 10.0, 11.0, 11.0, 10.0, 7.0, 4.0, 3.0, 4.0, 6.0, 2.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-10.53125, -10.198974609375, -9.86669921875, -9.534423828125, -9.2021484375, -8.869873046875, -8.53759765625, -8.205322265625, -7.873046875, -7.540771484375, -7.20849609375, -6.876220703125, -6.5439453125, -6.211669921875, -5.87939453125, -5.547119140625, -5.21484375, -4.882568359375, -4.55029296875, -4.218017578125, -3.8857421875, -3.553466796875, -3.22119140625, -2.888916015625, -2.556640625, -2.224365234375, -1.89208984375, -1.559814453125, -1.2275390625, -0.895263671875, -0.56298828125, -0.230712890625, 0.1015625, 0.433837890625, 0.76611328125, 1.098388671875, 1.4306640625, 1.762939453125, 2.09521484375, 2.427490234375, 2.759765625, 3.092041015625, 3.42431640625, 3.756591796875, 4.0888671875, 4.421142578125, 4.75341796875, 5.085693359375, 5.41796875, 5.750244140625, 6.08251953125, 6.414794921875, 6.7470703125, 7.079345703125, 7.41162109375, 7.743896484375, 8.076171875, 8.408447265625, 8.74072265625, 9.072998046875, 9.4052734375, 9.737548828125, 10.06982421875, 10.402099609375, 10.734375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 6.0, 12.0, 11.0, 13.0, 38.0, 38.0, 93.0, 102.0, 145.0, 251.0, 337.0, 482.0, 705.0, 956.0, 1346.0, 1893.0, 2661.0, 3525.0, 5164.0, 7287.0, 10475.0, 15366.0, 22791.0, 34476.0, 52831.0, 85241.0, 153231.0, 1336765.0, 134233.0, 78018.0, 48681.0, 31822.0, 20856.0, 14098.0, 9738.0, 6810.0, 4701.0, 3416.0, 2527.0, 1716.0, 1272.0, 911.0, 627.0, 463.0, 329.0, 227.0, 152.0, 111.0, 72.0, 44.0, 33.0, 19.0, 11.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0], "bins": [-3.27734375, -3.17620849609375, -3.0750732421875, -2.97393798828125, -2.872802734375, -2.77166748046875, -2.6705322265625, -2.56939697265625, -2.46826171875, -2.36712646484375, -2.2659912109375, -2.16485595703125, -2.063720703125, -1.96258544921875, -1.8614501953125, -1.76031494140625, -1.6591796875, -1.55804443359375, -1.4569091796875, -1.35577392578125, -1.254638671875, -1.15350341796875, -1.0523681640625, -0.95123291015625, -0.85009765625, -0.74896240234375, -0.6478271484375, -0.54669189453125, -0.445556640625, -0.34442138671875, -0.2432861328125, -0.14215087890625, -0.041015625, 0.06011962890625, 0.1612548828125, 0.26239013671875, 0.363525390625, 0.46466064453125, 0.5657958984375, 0.66693115234375, 0.76806640625, 0.86920166015625, 0.9703369140625, 1.07147216796875, 1.172607421875, 1.27374267578125, 1.3748779296875, 1.47601318359375, 1.5771484375, 1.67828369140625, 1.7794189453125, 1.88055419921875, 1.981689453125, 2.08282470703125, 2.1839599609375, 2.28509521484375, 2.38623046875, 2.48736572265625, 2.5885009765625, 2.68963623046875, 2.790771484375, 2.89190673828125, 2.9930419921875, 3.09417724609375, 3.1953125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 2.0, 2.0, 6.0, 6.0, 6.0, 12.0, 11.0, 12.0, 21.0, 17.0, 26.0, 41.0, 55.0, 54.0, 84.0, 105.0, 95.0, 86.0, 67.0, 51.0, 49.0, 39.0, 35.0, 22.0, 20.0, 11.0, 14.0, 10.0, 11.0, 6.0, 10.0, 8.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.003314971923828125, -0.00321274995803833, -0.003110527992248535, -0.0030083060264587402, -0.0029060840606689453, -0.0028038620948791504, -0.0027016401290893555, -0.0025994181632995605, -0.0024971961975097656, -0.0023949742317199707, -0.0022927522659301758, -0.002190530300140381, -0.002088308334350586, -0.001986086368560791, -0.001883864402770996, -0.0017816424369812012, -0.0016794204711914062, -0.0015771985054016113, -0.0014749765396118164, -0.0013727545738220215, -0.0012705326080322266, -0.0011683106422424316, -0.0010660886764526367, -0.0009638667106628418, -0.0008616447448730469, -0.000759422779083252, -0.000657200813293457, -0.0005549788475036621, -0.0004527568817138672, -0.00035053491592407227, -0.00024831295013427734, -0.00014609098434448242, -4.38690185546875e-05, 5.835294723510742e-05, 0.00016057491302490234, 0.00026279687881469727, 0.0003650188446044922, 0.0004672408103942871, 0.000569462776184082, 0.000671684741973877, 0.0007739067077636719, 0.0008761286735534668, 0.0009783506393432617, 0.0010805726051330566, 0.0011827945709228516, 0.0012850165367126465, 0.0013872385025024414, 0.0014894604682922363, 0.0015916824340820312, 0.0016939043998718262, 0.001796126365661621, 0.001898348331451416, 0.002000570297241211, 0.002102792263031006, 0.0022050142288208008, 0.0023072361946105957, 0.0024094581604003906, 0.0025116801261901855, 0.0026139020919799805, 0.0027161240577697754, 0.0028183460235595703, 0.0029205679893493652, 0.00302278995513916, 0.003125011920928955, 0.00322723388671875]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 7.0, 11.0, 11.0, 12.0, 11.0, 18.0, 25.0, 27.0, 30.0, 61.0, 58.0, 86.0, 113.0, 206.0, 333.0, 697.0, 30867.0, 1013551.0, 1271.0, 414.0, 252.0, 158.0, 75.0, 61.0, 42.0, 31.0, 25.0, 25.0, 22.0, 8.0, 9.0, 8.0, 4.0, 6.0, 6.0, 5.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0631103515625, -0.061087608337402344, -0.05906486511230469, -0.05704212188720703, -0.055019378662109375, -0.05299663543701172, -0.05097389221191406, -0.048951148986816406, -0.04692840576171875, -0.044905662536621094, -0.04288291931152344, -0.04086017608642578, -0.038837432861328125, -0.03681468963623047, -0.03479194641113281, -0.032769203186035156, -0.0307464599609375, -0.028723716735839844, -0.026700973510742188, -0.02467823028564453, -0.022655487060546875, -0.02063274383544922, -0.018610000610351562, -0.016587257385253906, -0.01456451416015625, -0.012541770935058594, -0.010519027709960938, -0.008496284484863281, -0.006473541259765625, -0.004450798034667969, -0.0024280548095703125, -0.00040531158447265625, 0.001617431640625, 0.0036401748657226562, 0.0056629180908203125, 0.007685661315917969, 0.009708404541015625, 0.011731147766113281, 0.013753890991210938, 0.015776634216308594, 0.01779937744140625, 0.019822120666503906, 0.021844863891601562, 0.02386760711669922, 0.025890350341796875, 0.02791309356689453, 0.029935836791992188, 0.031958580017089844, 0.0339813232421875, 0.036004066467285156, 0.03802680969238281, 0.04004955291748047, 0.042072296142578125, 0.04409503936767578, 0.04611778259277344, 0.048140525817871094, 0.05016326904296875, 0.052186012268066406, 0.05420875549316406, 0.05623149871826172, 0.058254241943359375, 0.06027698516845703, 0.06229972839355469, 0.06432247161865234, 0.06634521484375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 165.0, 751.0, 88.0, 5.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00444948673248291, -0.004178408533334732, -0.003907330334186554, -0.0036362523678690195, -0.0033651741687208414, -0.0030940959695726633, -0.002823018003255129, -0.0025519398041069508, -0.0022808616049587727, -0.0020097834058105946, -0.0017387053230777383, -0.001467627240344882, -0.001196549041196704, -0.0009254708420485258, -0.0006543927593156695, -0.00038331467658281326, -0.00011223647743463516, 0.00015884166350588202, 0.0004299198044463992, 0.0007009979453869164, 0.0009720760863274336, 0.0012431542854756117, 0.001514232368208468, 0.0017853104509413242, 0.0020563886500895023, 0.0023274668492376804, 0.0025985450483858585, 0.002869623014703393, 0.003140701213851571, 0.003411779412999749, 0.0036828573793172836, 0.003953935578465462, 0.004225012846291065, 0.004496091045439243, 0.004767169244587421, 0.0050382474437355995, 0.005309325642883778, 0.005580403842031956, 0.0058514815755188465, 0.006122559774667025, 0.006393637973815203, 0.006664716172963381, 0.006935794372111559, 0.007206872571259737, 0.007477950304746628, 0.007749028503894806, 0.008020106703042984, 0.008291184902191162, 0.00856226310133934, 0.008833341300487518, 0.009104419499635696, 0.009375497698783875, 0.009646575897932053, 0.00991765409708023, 0.010188732296228409, 0.010459810495376587, 0.010730888694524765, 0.011001966893672943, 0.011273045092821121, 0.0115441232919693, 0.011815201491117477, 0.012086279690265656, 0.012357357889413834, 0.012628436088562012, 0.012899513356387615]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 6.0, 0.0, 3.0, 4.0, 11.0, 8.0, 5.0, 15.0, 16.0, 10.0, 22.0, 21.0, 27.0, 29.0, 21.0, 31.0, 30.0, 21.0, 42.0, 43.0, 47.0, 39.0, 29.0, 40.0, 36.0, 36.0, 51.0, 33.0, 36.0, 24.0, 23.0, 27.0, 25.0, 43.0, 23.0, 26.0, 18.0, 18.0, 11.0, 16.0, 4.0, 12.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0012633204460144043, -0.0012222891673445702, -0.001181257888674736, -0.0011402266100049019, -0.0010991953313350677, -0.0010581640526652336, -0.0010171327739953995, -0.0009761014953255653, -0.0009350702166557312, -0.0008940389379858971, -0.0008530076593160629, -0.0008119763806462288, -0.0007709451019763947, -0.0007299138233065605, -0.0006888825446367264, -0.0006478512659668922, -0.0006068199872970581, -0.000565788708627224, -0.0005247574299573898, -0.0004837261512875557, -0.00044269487261772156, -0.0004016635939478874, -0.0003606323152780533, -0.00031960103660821915, -0.000278569757938385, -0.00023753847926855087, -0.00019650720059871674, -0.0001554759219288826, -0.00011444464325904846, -7.341336458921432e-05, -3.238208591938019e-05, 8.649192750453949e-06, 4.9680471420288086e-05, 9.071175009012222e-05, 0.00013174302875995636, 0.0001727743074297905, 0.00021380558609962463, 0.00025483686476945877, 0.0002958681434392929, 0.00033689942210912704, 0.0003779307007789612, 0.0004189619794487953, 0.00045999325811862946, 0.0005010245367884636, 0.0005420558154582977, 0.0005830870941281319, 0.000624118372797966, 0.0006651496514678001, 0.0007061809301376343, 0.0007472122088074684, 0.0007882434874773026, 0.0008292747661471367, 0.0008703060448169708, 0.000911337323486805, 0.0009523686021566391, 0.0009933998808264732, 0.0010344311594963074, 0.0010754624381661415, 0.0011164937168359756, 0.0011575249955058098, 0.001198556274175644, 0.001239587552845478, 0.0012806188315153122, 0.0013216501101851463, 0.0013626813888549805]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 3.0, 2.0, 5.0, 10.0, 3.0, 17.0, 9.0, 20.0, 31.0, 13.0, 14.0, 35.0, 31.0, 34.0, 42.0, 39.0, 33.0, 45.0, 45.0, 49.0, 58.0, 38.0, 63.0, 36.0, 39.0, 35.0, 34.0, 40.0, 37.0, 20.0, 19.0, 20.0, 20.0, 15.0, 13.0, 13.0, 8.0, 4.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.78125, -17.147705078125, -16.51416015625, -15.880615234375, -15.2470703125, -14.613525390625, -13.97998046875, -13.346435546875, -12.712890625, -12.079345703125, -11.44580078125, -10.812255859375, -10.1787109375, -9.545166015625, -8.91162109375, -8.278076171875, -7.64453125, -7.010986328125, -6.37744140625, -5.743896484375, -5.1103515625, -4.476806640625, -3.84326171875, -3.209716796875, -2.576171875, -1.942626953125, -1.30908203125, -0.675537109375, -0.0419921875, 0.591552734375, 1.22509765625, 1.858642578125, 2.4921875, 3.125732421875, 3.75927734375, 4.392822265625, 5.0263671875, 5.659912109375, 6.29345703125, 6.927001953125, 7.560546875, 8.194091796875, 8.82763671875, 9.461181640625, 10.0947265625, 10.728271484375, 11.36181640625, 11.995361328125, 12.62890625, 13.262451171875, 13.89599609375, 14.529541015625, 15.1630859375, 15.796630859375, 16.43017578125, 17.063720703125, 17.697265625, 18.330810546875, 18.96435546875, 19.597900390625, 20.2314453125, 20.864990234375, 21.49853515625, 22.132080078125, 22.765625]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 4.0, 8.0, 11.0, 9.0, 17.0, 20.0, 25.0, 49.0, 67.0, 95.0, 128.0, 157.0, 245.0, 349.0, 502.0, 814.0, 1577.0, 3899.0, 13620.0, 63315.0, 306604.0, 491246.0, 127926.0, 25996.0, 6537.0, 2278.0, 1048.0, 620.0, 412.0, 282.0, 203.0, 141.0, 106.0, 76.0, 59.0, 37.0, 18.0, 18.0, 16.0, 10.0, 10.0, 2.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.3125, -24.57275390625, -23.8330078125, -23.09326171875, -22.353515625, -21.61376953125, -20.8740234375, -20.13427734375, -19.39453125, -18.65478515625, -17.9150390625, -17.17529296875, -16.435546875, -15.69580078125, -14.9560546875, -14.21630859375, -13.4765625, -12.73681640625, -11.9970703125, -11.25732421875, -10.517578125, -9.77783203125, -9.0380859375, -8.29833984375, -7.55859375, -6.81884765625, -6.0791015625, -5.33935546875, -4.599609375, -3.85986328125, -3.1201171875, -2.38037109375, -1.640625, -0.90087890625, -0.1611328125, 0.57861328125, 1.318359375, 2.05810546875, 2.7978515625, 3.53759765625, 4.27734375, 5.01708984375, 5.7568359375, 6.49658203125, 7.236328125, 7.97607421875, 8.7158203125, 9.45556640625, 10.1953125, 10.93505859375, 11.6748046875, 12.41455078125, 13.154296875, 13.89404296875, 14.6337890625, 15.37353515625, 16.11328125, 16.85302734375, 17.5927734375, 18.33251953125, 19.072265625, 19.81201171875, 20.5517578125, 21.29150390625, 22.03125]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 5.0, 10.0, 8.0, 12.0, 17.0, 21.0, 13.0, 19.0, 34.0, 38.0, 52.0, 51.0, 61.0, 91.0, 152.0, 1645.0, 362.0, 94.0, 74.0, 46.0, 50.0, 41.0, 39.0, 35.0, 24.0, 12.0, 14.0, 12.0, 7.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-81.3125, -79.041015625, -76.76953125, -74.498046875, -72.2265625, -69.955078125, -67.68359375, -65.412109375, -63.140625, -60.869140625, -58.59765625, -56.326171875, -54.0546875, -51.783203125, -49.51171875, -47.240234375, -44.96875, -42.697265625, -40.42578125, -38.154296875, -35.8828125, -33.611328125, -31.33984375, -29.068359375, -26.796875, -24.525390625, -22.25390625, -19.982421875, -17.7109375, -15.439453125, -13.16796875, -10.896484375, -8.625, -6.353515625, -4.08203125, -1.810546875, 0.4609375, 2.732421875, 5.00390625, 7.275390625, 9.546875, 11.818359375, 14.08984375, 16.361328125, 18.6328125, 20.904296875, 23.17578125, 25.447265625, 27.71875, 29.990234375, 32.26171875, 34.533203125, 36.8046875, 39.076171875, 41.34765625, 43.619140625, 45.890625, 48.162109375, 50.43359375, 52.705078125, 54.9765625, 57.248046875, 59.51953125, 61.791015625, 64.0625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 4.0, 6.0, 6.0, 14.0, 15.0, 22.0, 29.0, 47.0, 60.0, 113.0, 112.0, 151.0, 285.0, 481.0, 1156.0, 21891.0, 3085875.0, 32665.0, 1291.0, 515.0, 308.0, 181.0, 141.0, 85.0, 71.0, 47.0, 33.0, 30.0, 27.0, 14.0, 12.0, 8.0, 9.0, 4.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-87.25, -84.1923828125, -81.134765625, -78.0771484375, -75.01953125, -71.9619140625, -68.904296875, -65.8466796875, -62.7890625, -59.7314453125, -56.673828125, -53.6162109375, -50.55859375, -47.5009765625, -44.443359375, -41.3857421875, -38.328125, -35.2705078125, -32.212890625, -29.1552734375, -26.09765625, -23.0400390625, -19.982421875, -16.9248046875, -13.8671875, -10.8095703125, -7.751953125, -4.6943359375, -1.63671875, 1.4208984375, 4.478515625, 7.5361328125, 10.59375, 13.6513671875, 16.708984375, 19.7666015625, 22.82421875, 25.8818359375, 28.939453125, 31.9970703125, 35.0546875, 38.1123046875, 41.169921875, 44.2275390625, 47.28515625, 50.3427734375, 53.400390625, 56.4580078125, 59.515625, 62.5732421875, 65.630859375, 68.6884765625, 71.74609375, 74.8037109375, 77.861328125, 80.9189453125, 83.9765625, 87.0341796875, 90.091796875, 93.1494140625, 96.20703125, 99.2646484375, 102.322265625, 105.3798828125, 108.4375]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 58.0, 951.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-373.25146484375, -353.9856872558594, -334.71990966796875, -315.4541320800781, -296.1883544921875, -276.9225769042969, -257.65679931640625, -238.39102172851562, -219.125244140625, -199.85946655273438, -180.59368896484375, -161.32791137695312, -142.0621337890625, -122.79635620117188, -103.53057861328125, -84.26480102539062, -64.9990234375, -45.733245849609375, -26.46746826171875, -7.201690673828125, 12.0640869140625, 31.329864501953125, 50.59564208984375, 69.86141967773438, 89.127197265625, 108.39297485351562, 127.65875244140625, 146.92453002929688, 166.1903076171875, 185.45608520507812, 204.72186279296875, 223.98764038085938, 243.25341796875, 262.5191955566406, 281.78497314453125, 301.0507507324219, 320.3165283203125, 339.5823059082031, 358.84808349609375, 378.1138610839844, 397.379638671875, 416.6454162597656, 435.91119384765625, 455.1769714355469, 474.4427490234375, 493.7085266113281, 512.9743041992188, 532.2401123046875, 551.505859375, 570.7716064453125, 590.0374145507812, 609.30322265625, 628.5689697265625, 647.834716796875, 667.1005249023438, 686.3663330078125, 705.632080078125, 724.8978271484375, 744.1636352539062, 763.429443359375, 782.6951904296875, 801.9609375, 821.2267456054688, 840.4925537109375, 859.75830078125]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 9.0, 14.0, 16.0, 14.0, 24.0, 25.0, 28.0, 30.0, 27.0, 35.0, 39.0, 48.0, 33.0, 53.0, 45.0, 51.0, 51.0, 42.0, 45.0, 47.0, 42.0, 36.0, 33.0, 30.0, 29.0, 27.0, 27.0, 28.0, 11.0, 11.0, 13.0, 8.0, 9.0, 8.0, 5.0, 9.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-172.25927734375, -167.64524841308594, -163.03121948242188, -158.4171905517578, -153.80316162109375, -149.18914794921875, -144.57510375976562, -139.96109008789062, -135.34706115722656, -130.7330322265625, -126.11900329589844, -121.50497436523438, -116.89095306396484, -112.27692413330078, -107.66289520263672, -103.04887390136719, -98.4348373413086, -93.82080841064453, -89.20677947998047, -84.59275817871094, -79.97872924804688, -75.36470031738281, -70.75067138671875, -66.13664245605469, -61.52261734008789, -56.90858840942383, -52.29456329345703, -47.68053436279297, -43.066505432128906, -38.45248031616211, -33.83845138549805, -29.22442626953125, -24.610397338867188, -19.996370315551758, -15.382342338562012, -10.768314361572266, -6.154287338256836, -1.5402603149414062, 3.0737686157226562, 7.687793731689453, 12.301822662353516, 16.915849685668945, 21.529876708984375, 26.143905639648438, 30.757932662963867, 35.3719596862793, 39.98598861694336, 44.600013732910156, 49.21404266357422, 53.82807159423828, 58.44209671020508, 63.05612564086914, 67.67015075683594, 72.2841796875, 76.89820861816406, 81.51223754882812, 86.12626647949219, 90.74029541015625, 95.35432434082031, 99.96835327148438, 104.5823745727539, 109.19640350341797, 113.81043243408203, 118.42445373535156, 123.03848266601562]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 5.0, 7.0, 3.0, 7.0, 5.0, 16.0, 21.0, 15.0, 15.0, 21.0, 19.0, 15.0, 30.0, 30.0, 29.0, 39.0, 38.0, 28.0, 55.0, 42.0, 51.0, 50.0, 52.0, 48.0, 34.0, 37.0, 51.0, 29.0, 31.0, 24.0, 28.0, 16.0, 23.0, 23.0, 11.0, 16.0, 8.0, 11.0, 8.0, 2.0, 3.0, 2.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.546875, -16.939208984375, -16.33154296875, -15.723876953125, -15.1162109375, -14.508544921875, -13.90087890625, -13.293212890625, -12.685546875, -12.077880859375, -11.47021484375, -10.862548828125, -10.2548828125, -9.647216796875, -9.03955078125, -8.431884765625, -7.82421875, -7.216552734375, -6.60888671875, -6.001220703125, -5.3935546875, -4.785888671875, -4.17822265625, -3.570556640625, -2.962890625, -2.355224609375, -1.74755859375, -1.139892578125, -0.5322265625, 0.075439453125, 0.68310546875, 1.290771484375, 1.8984375, 2.506103515625, 3.11376953125, 3.721435546875, 4.3291015625, 4.936767578125, 5.54443359375, 6.152099609375, 6.759765625, 7.367431640625, 7.97509765625, 8.582763671875, 9.1904296875, 9.798095703125, 10.40576171875, 11.013427734375, 11.62109375, 12.228759765625, 12.83642578125, 13.444091796875, 14.0517578125, 14.659423828125, 15.26708984375, 15.874755859375, 16.482421875, 17.090087890625, 17.69775390625, 18.305419921875, 18.9130859375, 19.520751953125, 20.12841796875, 20.736083984375, 21.34375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 6.0, 5.0, 9.0, 13.0, 12.0, 12.0, 6.0, 11.0, 23.0, 24.0, 52.0, 50.0, 39.0, 56.0, 78.0, 150.0, 154.0, 184.0, 310.0, 313.0, 420.0, 1429.0, 4187265.0, 1672.0, 465.0, 353.0, 264.0, 190.0, 159.0, 130.0, 88.0, 76.0, 54.0, 41.0, 34.0, 22.0, 10.0, 24.0, 17.0, 11.0, 10.0, 10.0, 8.0, 8.0, 5.0, 0.0, 7.0, 1.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0], "bins": [-597.5, -579.140625, -560.78125, -542.421875, -524.0625, -505.703125, -487.34375, -468.984375, -450.625, -432.265625, -413.90625, -395.546875, -377.1875, -358.828125, -340.46875, -322.109375, -303.75, -285.390625, -267.03125, -248.671875, -230.3125, -211.953125, -193.59375, -175.234375, -156.875, -138.515625, -120.15625, -101.796875, -83.4375, -65.078125, -46.71875, -28.359375, -10.0, 8.359375, 26.71875, 45.078125, 63.4375, 81.796875, 100.15625, 118.515625, 136.875, 155.234375, 173.59375, 191.953125, 210.3125, 228.671875, 247.03125, 265.390625, 283.75, 302.109375, 320.46875, 338.828125, 357.1875, 375.546875, 393.90625, 412.265625, 430.625, 448.984375, 467.34375, 485.703125, 504.0625, 522.421875, 540.78125, 559.140625, 577.5]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 0.0, 6.0, 2.0, 2.0, 5.0, 7.0, 10.0, 12.0, 13.0, 13.0, 28.0, 36.0, 49.0, 62.0, 91.0, 101.0, 169.0, 240.0, 389.0, 579.0, 660.0, 531.0, 341.0, 203.0, 149.0, 93.0, 71.0, 47.0, 44.0, 27.0, 27.0, 9.0, 14.0, 8.0, 10.0, 7.0, 5.0, 4.0, 1.0, 4.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.5, -27.58935546875, -26.6787109375, -25.76806640625, -24.857421875, -23.94677734375, -23.0361328125, -22.12548828125, -21.21484375, -20.30419921875, -19.3935546875, -18.48291015625, -17.572265625, -16.66162109375, -15.7509765625, -14.84033203125, -13.9296875, -13.01904296875, -12.1083984375, -11.19775390625, -10.287109375, -9.37646484375, -8.4658203125, -7.55517578125, -6.64453125, -5.73388671875, -4.8232421875, -3.91259765625, -3.001953125, -2.09130859375, -1.1806640625, -0.27001953125, 0.640625, 1.55126953125, 2.4619140625, 3.37255859375, 4.283203125, 5.19384765625, 6.1044921875, 7.01513671875, 7.92578125, 8.83642578125, 9.7470703125, 10.65771484375, 11.568359375, 12.47900390625, 13.3896484375, 14.30029296875, 15.2109375, 16.12158203125, 17.0322265625, 17.94287109375, 18.853515625, 19.76416015625, 20.6748046875, 21.58544921875, 22.49609375, 23.40673828125, 24.3173828125, 25.22802734375, 26.138671875, 27.04931640625, 27.9599609375, 28.87060546875, 29.78125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 3.0, 4.0, 3.0, 4.0, 6.0, 8.0, 11.0, 10.0, 14.0, 10.0, 24.0, 20.0, 28.0, 43.0, 49.0, 57.0, 53.0, 67.0, 140.0, 431.0, 69987.0, 4121653.0, 993.0, 174.0, 105.0, 59.0, 53.0, 39.0, 39.0, 39.0, 25.0, 25.0, 21.0, 19.0, 9.0, 14.0, 8.0, 8.0, 8.0, 5.0, 3.0, 1.0, 2.0, 3.0, 3.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-302.5, -292.796875, -283.09375, -273.390625, -263.6875, -253.984375, -244.28125, -234.578125, -224.875, -215.171875, -205.46875, -195.765625, -186.0625, -176.359375, -166.65625, -156.953125, -147.25, -137.546875, -127.84375, -118.140625, -108.4375, -98.734375, -89.03125, -79.328125, -69.625, -59.921875, -50.21875, -40.515625, -30.8125, -21.109375, -11.40625, -1.703125, 8.0, 17.703125, 27.40625, 37.109375, 46.8125, 56.515625, 66.21875, 75.921875, 85.625, 95.328125, 105.03125, 114.734375, 124.4375, 134.140625, 143.84375, 153.546875, 163.25, 172.953125, 182.65625, 192.359375, 202.0625, 211.765625, 221.46875, 231.171875, 240.875, 250.578125, 260.28125, 269.984375, 279.6875, 289.390625, 299.09375, 308.796875, 318.5]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 66.0, 873.0, 78.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1340.907958984375, -1315.3824462890625, -1289.85693359375, -1264.3314208984375, -1238.805908203125, -1213.280517578125, -1187.7550048828125, -1162.2294921875, -1136.7039794921875, -1111.178466796875, -1085.6529541015625, -1060.12744140625, -1034.60205078125, -1009.0764770507812, -983.551025390625, -958.0255126953125, -932.5, -906.9744873046875, -881.448974609375, -855.9235229492188, -830.3980102539062, -804.8724975585938, -779.3470458984375, -753.821533203125, -728.2960205078125, -702.7705078125, -677.2449951171875, -651.7195434570312, -626.1940307617188, -600.6685180664062, -575.14306640625, -549.6175537109375, -524.092041015625, -498.5665283203125, -473.0410461425781, -447.51556396484375, -421.99005126953125, -396.46453857421875, -370.9390563964844, -345.41357421875, -319.8880310058594, -294.362548828125, -268.8370361328125, -243.31153869628906, -217.78604125976562, -192.2605438232422, -166.73504638671875, -141.2095489501953, -115.68405151367188, -90.15855407714844, -64.633056640625, -39.10755920410156, -13.582061767578125, 11.943435668945312, 37.46893310546875, 62.99443054199219, 88.51992797851562, 114.04542541503906, 139.5709228515625, 165.09642028808594, 190.62191772460938, 216.1474151611328, 241.67291259765625, 267.19842529296875, 292.7239074707031]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 1.0, 6.0, 3.0, 8.0, 5.0, 13.0, 13.0, 17.0, 23.0, 20.0, 21.0, 22.0, 33.0, 35.0, 30.0, 25.0, 39.0, 44.0, 34.0, 38.0, 46.0, 44.0, 47.0, 33.0, 45.0, 33.0, 33.0, 28.0, 40.0, 35.0, 27.0, 29.0, 25.0, 14.0, 23.0, 12.0, 9.0, 7.0, 17.0, 7.0, 5.0, 6.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-93.65692901611328, -90.480224609375, -87.30351257324219, -84.1268081665039, -80.95010375976562, -77.77339172363281, -74.59668731689453, -71.41998291015625, -68.24327087402344, -65.06656646728516, -61.889854431152344, -58.71315002441406, -55.536441802978516, -52.35973358154297, -49.18302917480469, -46.00632095336914, -42.829612731933594, -39.65290451049805, -36.4761962890625, -33.29949188232422, -30.122783660888672, -26.946075439453125, -23.76936912536621, -20.592662811279297, -17.41595458984375, -14.23924732208252, -11.062540054321289, -7.885832786560059, -4.709125518798828, -1.5324182510375977, 1.6442890167236328, 4.820995330810547, 7.997711181640625, 11.174418449401855, 14.351125717163086, 17.52783203125, 20.704540252685547, 23.881248474121094, 27.057954788208008, 30.234661102294922, 33.41136932373047, 36.588077545166016, 39.76478576660156, 42.941490173339844, 46.11819839477539, 49.29490661621094, 52.47161102294922, 55.648319244384766, 58.82502746582031, 62.00173568725586, 65.1784439086914, 68.35514831542969, 71.5318603515625, 74.70856475830078, 77.88526916503906, 81.06198120117188, 84.23868560791016, 87.41539001464844, 90.59210205078125, 93.76880645751953, 96.94551086425781, 100.12222290039062, 103.2989273071289, 106.47563171386719, 109.65234375]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 14.0, 12.0, 11.0, 15.0, 19.0, 21.0, 25.0, 28.0, 22.0, 28.0, 39.0, 33.0, 38.0, 32.0, 45.0, 48.0, 53.0, 46.0, 51.0, 44.0, 44.0, 42.0, 42.0, 32.0, 21.0, 29.0, 19.0, 27.0, 20.0, 16.0, 23.0, 13.0, 6.0, 5.0, 3.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.60546875, -16.9921875, -16.37890625, -15.765625, -15.15234375, -14.5390625, -13.92578125, -13.3125, -12.69921875, -12.0859375, -11.47265625, -10.859375, -10.24609375, -9.6328125, -9.01953125, -8.40625, -7.79296875, -7.1796875, -6.56640625, -5.953125, -5.33984375, -4.7265625, -4.11328125, -3.5, -2.88671875, -2.2734375, -1.66015625, -1.046875, -0.43359375, 0.1796875, 0.79296875, 1.40625, 2.01953125, 2.6328125, 3.24609375, 3.859375, 4.47265625, 5.0859375, 5.69921875, 6.3125, 6.92578125, 7.5390625, 8.15234375, 8.765625, 9.37890625, 9.9921875, 10.60546875, 11.21875, 11.83203125, 12.4453125, 13.05859375, 13.671875, 14.28515625, 14.8984375, 15.51171875, 16.125, 16.73828125, 17.3515625, 17.96484375, 18.578125, 19.19140625, 19.8046875, 20.41796875, 21.03125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 9.0, 7.0, 13.0, 15.0, 17.0, 32.0, 45.0, 85.0, 105.0, 153.0, 185.0, 310.0, 418.0, 638.0, 978.0, 1434.0, 2057.0, 3191.0, 4891.0, 7720.0, 11685.0, 18668.0, 30611.0, 52324.0, 92705.0, 215785.0, 331876.0, 114703.0, 62069.0, 35678.0, 21551.0, 13562.0, 8591.0, 5486.0, 3665.0, 2457.0, 1533.0, 1032.0, 701.0, 511.0, 331.0, 202.0, 174.0, 99.0, 78.0, 52.0, 42.0, 36.0, 16.0, 18.0, 5.0, 5.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-4.5625, -4.42059326171875, -4.2786865234375, -4.13677978515625, -3.994873046875, -3.85296630859375, -3.7110595703125, -3.56915283203125, -3.42724609375, -3.28533935546875, -3.1434326171875, -3.00152587890625, -2.859619140625, -2.71771240234375, -2.5758056640625, -2.43389892578125, -2.2919921875, -2.15008544921875, -2.0081787109375, -1.86627197265625, -1.724365234375, -1.58245849609375, -1.4405517578125, -1.29864501953125, -1.15673828125, -1.01483154296875, -0.8729248046875, -0.73101806640625, -0.589111328125, -0.44720458984375, -0.3052978515625, -0.16339111328125, -0.021484375, 0.12042236328125, 0.2623291015625, 0.40423583984375, 0.546142578125, 0.68804931640625, 0.8299560546875, 0.97186279296875, 1.11376953125, 1.25567626953125, 1.3975830078125, 1.53948974609375, 1.681396484375, 1.82330322265625, 1.9652099609375, 2.10711669921875, 2.2490234375, 2.39093017578125, 2.5328369140625, 2.67474365234375, 2.816650390625, 2.95855712890625, 3.1004638671875, 3.24237060546875, 3.38427734375, 3.52618408203125, 3.6680908203125, 3.80999755859375, 3.951904296875, 4.09381103515625, 4.2357177734375, 4.37762451171875, 4.51953125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 3.0, 1.0, 7.0, 7.0, 12.0, 12.0, 15.0, 12.0, 12.0, 21.0, 21.0, 24.0, 32.0, 33.0, 29.0, 40.0, 39.0, 44.0, 35.0, 41.0, 45.0, 1066.0, 42.0, 32.0, 40.0, 32.0, 37.0, 37.0, 36.0, 29.0, 32.0, 20.0, 27.0, 22.0, 24.0, 10.0, 16.0, 8.0, 9.0, 5.0, 6.0, 3.0, 5.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-13.5, -13.119873046875, -12.73974609375, -12.359619140625, -11.9794921875, -11.599365234375, -11.21923828125, -10.839111328125, -10.458984375, -10.078857421875, -9.69873046875, -9.318603515625, -8.9384765625, -8.558349609375, -8.17822265625, -7.798095703125, -7.41796875, -7.037841796875, -6.65771484375, -6.277587890625, -5.8974609375, -5.517333984375, -5.13720703125, -4.757080078125, -4.376953125, -3.996826171875, -3.61669921875, -3.236572265625, -2.8564453125, -2.476318359375, -2.09619140625, -1.716064453125, -1.3359375, -0.955810546875, -0.57568359375, -0.195556640625, 0.1845703125, 0.564697265625, 0.94482421875, 1.324951171875, 1.705078125, 2.085205078125, 2.46533203125, 2.845458984375, 3.2255859375, 3.605712890625, 3.98583984375, 4.365966796875, 4.74609375, 5.126220703125, 5.50634765625, 5.886474609375, 6.2666015625, 6.646728515625, 7.02685546875, 7.406982421875, 7.787109375, 8.167236328125, 8.54736328125, 8.927490234375, 9.3076171875, 9.687744140625, 10.06787109375, 10.447998046875, 10.828125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 3.0, 11.0, 10.0, 11.0, 28.0, 39.0, 52.0, 79.0, 109.0, 149.0, 239.0, 324.0, 441.0, 737.0, 1075.0, 1555.0, 2459.0, 3486.0, 5209.0, 8022.0, 12120.0, 18602.0, 29228.0, 46832.0, 78175.0, 141544.0, 1356161.0, 161196.0, 86702.0, 51482.0, 31801.0, 20340.0, 13003.0, 8684.0, 5694.0, 3845.0, 2442.0, 1708.0, 1150.0, 752.0, 524.0, 375.0, 224.0, 166.0, 118.0, 65.0, 59.0, 35.0, 22.0, 19.0, 14.0, 10.0, 3.0, 4.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.517578125, -3.398712158203125, -3.27984619140625, -3.160980224609375, -3.0421142578125, -2.923248291015625, -2.80438232421875, -2.685516357421875, -2.566650390625, -2.447784423828125, -2.32891845703125, -2.210052490234375, -2.0911865234375, -1.972320556640625, -1.85345458984375, -1.734588623046875, -1.61572265625, -1.496856689453125, -1.37799072265625, -1.259124755859375, -1.1402587890625, -1.021392822265625, -0.90252685546875, -0.783660888671875, -0.664794921875, -0.545928955078125, -0.42706298828125, -0.308197021484375, -0.1893310546875, -0.070465087890625, 0.04840087890625, 0.167266845703125, 0.2861328125, 0.404998779296875, 0.52386474609375, 0.642730712890625, 0.7615966796875, 0.880462646484375, 0.99932861328125, 1.118194580078125, 1.237060546875, 1.355926513671875, 1.47479248046875, 1.593658447265625, 1.7125244140625, 1.831390380859375, 1.95025634765625, 2.069122314453125, 2.18798828125, 2.306854248046875, 2.42572021484375, 2.544586181640625, 2.6634521484375, 2.782318115234375, 2.90118408203125, 3.020050048828125, 3.138916015625, 3.257781982421875, 3.37664794921875, 3.495513916015625, 3.6143798828125, 3.733245849609375, 3.85211181640625, 3.970977783203125, 4.08984375]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 0.0, 4.0, 10.0, 14.0, 11.0, 11.0, 15.0, 19.0, 21.0, 36.0, 47.0, 35.0, 54.0, 66.0, 81.0, 79.0, 85.0, 76.0, 64.0, 50.0, 45.0, 32.0, 44.0, 22.0, 20.0, 17.0, 9.0, 5.0, 9.0, 6.0, 5.0, 5.0, 5.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0034503936767578125, -0.0033597350120544434, -0.0032690763473510742, -0.003178417682647705, -0.003087759017944336, -0.002997100353240967, -0.0029064416885375977, -0.0028157830238342285, -0.0027251243591308594, -0.0026344656944274902, -0.002543807029724121, -0.002453148365020752, -0.002362489700317383, -0.0022718310356140137, -0.0021811723709106445, -0.0020905137062072754, -0.0019998550415039062, -0.0019091963768005371, -0.001818537712097168, -0.0017278790473937988, -0.0016372203826904297, -0.0015465617179870605, -0.0014559030532836914, -0.0013652443885803223, -0.0012745857238769531, -0.001183927059173584, -0.0010932683944702148, -0.0010026097297668457, -0.0009119510650634766, -0.0008212924003601074, -0.0007306337356567383, -0.0006399750709533691, -0.00054931640625, -0.00045865774154663086, -0.0003679990768432617, -0.0002773404121398926, -0.00018668174743652344, -9.60230827331543e-05, -5.364418029785156e-06, 8.529424667358398e-05, 0.00017595291137695312, 0.00026661157608032227, 0.0003572702407836914, 0.00044792890548706055, 0.0005385875701904297, 0.0006292462348937988, 0.000719904899597168, 0.0008105635643005371, 0.0009012222290039062, 0.0009918808937072754, 0.0010825395584106445, 0.0011731982231140137, 0.0012638568878173828, 0.001354515552520752, 0.001445174217224121, 0.0015358328819274902, 0.0016264915466308594, 0.0017171502113342285, 0.0018078088760375977, 0.0018984675407409668, 0.001989126205444336, 0.002079784870147705, 0.0021704435348510742, 0.0022611021995544434, 0.0023517608642578125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 10.0, 13.0, 13.0, 16.0, 18.0, 33.0, 37.0, 52.0, 80.0, 117.0, 181.0, 245.0, 439.0, 910.0, 31873.0, 1011346.0, 1607.0, 567.0, 335.0, 203.0, 122.0, 78.0, 59.0, 55.0, 36.0, 34.0, 21.0, 15.0, 18.0, 8.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.047698974609375, -0.04587984085083008, -0.044060707092285156, -0.042241573333740234, -0.04042243957519531, -0.03860330581665039, -0.03678417205810547, -0.03496503829956055, -0.033145904541015625, -0.0313267707824707, -0.02950763702392578, -0.02768850326538086, -0.025869369506835938, -0.024050235748291016, -0.022231101989746094, -0.020411968231201172, -0.01859283447265625, -0.016773700714111328, -0.014954566955566406, -0.013135433197021484, -0.011316299438476562, -0.00949716567993164, -0.007678031921386719, -0.005858898162841797, -0.004039764404296875, -0.002220630645751953, -0.00040149688720703125, 0.0014176368713378906, 0.0032367706298828125, 0.005055904388427734, 0.006875038146972656, 0.008694171905517578, 0.0105133056640625, 0.012332439422607422, 0.014151573181152344, 0.015970706939697266, 0.017789840698242188, 0.01960897445678711, 0.02142810821533203, 0.023247241973876953, 0.025066375732421875, 0.026885509490966797, 0.02870464324951172, 0.03052377700805664, 0.03234291076660156, 0.034162044525146484, 0.035981178283691406, 0.03780031204223633, 0.03961944580078125, 0.04143857955932617, 0.043257713317871094, 0.045076847076416016, 0.04689598083496094, 0.04871511459350586, 0.05053424835205078, 0.0523533821105957, 0.054172515869140625, 0.05599164962768555, 0.05781078338623047, 0.05962991714477539, 0.06144905090332031, 0.06326818466186523, 0.06508731842041016, 0.06690645217895508, 0.0687255859375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 159.0, 603.0, 224.0, 20.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007966863922774792, -0.007770548574626446, -0.007574233692139387, -0.0073779188096523285, -0.0071816034615039825, -0.006985288113355637, -0.006788973230868578, -0.006592658348381519, -0.006396343000233173, -0.006200027652084827, -0.006003712769597769, -0.00580739788711071, -0.005611082538962364, -0.005414767190814018, -0.00521845230832696, -0.005022137425839901, -0.004825822077691555, -0.004629506729543209, -0.0044331918470561504, -0.004236876964569092, -0.004040561616420746, -0.0038442465011030436, -0.0036479313857853413, -0.003451616270467639, -0.0032553011551499367, -0.0030589860398322344, -0.002862670924514532, -0.00266635580919683, -0.0024700406938791275, -0.002273725578561425, -0.002077410463243723, -0.0018810953479260206, -0.0016847806982696056, -0.0014884655829519033, -0.001292150467634201, -0.0010958353523164988, -0.0008995202369987965, -0.0007032051216810942, -0.0005068900063633919, -0.0003105748910456896, -0.00011425977572798729, 8.2055339589715e-05, 0.0002783704549074173, 0.0004746855702251196, 0.0006710006855428219, 0.0008673158008605242, 0.0010636309161782265, 0.0012599460314959288, 0.001456261146813631, 0.0016525762621313334, 0.0018488913774490356, 0.002045206492766738, 0.0022415216080844402, 0.0024378367234021425, 0.002634151838719845, 0.002830466954037547, 0.0030267820693552494, 0.0032230971846729517, 0.003419412299990654, 0.0036157274153083563, 0.0038120425306260586, 0.004008357413113117, 0.004204672761261463, 0.004400988109409809, 0.004597302991896868]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 7.0, 4.0, 7.0, 6.0, 4.0, 14.0, 19.0, 12.0, 17.0, 21.0, 16.0, 19.0, 22.0, 25.0, 32.0, 48.0, 35.0, 40.0, 41.0, 38.0, 51.0, 45.0, 35.0, 55.0, 38.0, 34.0, 31.0, 36.0, 35.0, 28.0, 25.0, 25.0, 21.0, 20.0, 26.0, 15.0, 14.0, 9.0, 7.0, 8.0, 2.0, 5.0, 8.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0010946989059448242, -0.0010558608919382095, -0.0010170228779315948, -0.0009781848639249802, -0.0009393468499183655, -0.0009005088359117508, -0.0008616708219051361, -0.0008228328078985214, -0.0007839947938919067, -0.000745156779885292, -0.0007063187658786774, -0.0006674807518720627, -0.000628642737865448, -0.0005898047238588333, -0.0005509667098522186, -0.0005121286958456039, -0.00047329068183898926, -0.00043445266783237457, -0.0003956146538257599, -0.0003567766398191452, -0.0003179386258125305, -0.00027910061180591583, -0.00024026259779930115, -0.00020142458379268646, -0.00016258656978607178, -0.0001237485557794571, -8.491054177284241e-05, -4.607252776622772e-05, -7.234513759613037e-06, 3.160350024700165e-05, 7.044151425361633e-05, 0.00010927952826023102, 0.0001481175422668457, 0.0001869555562734604, 0.00022579357028007507, 0.00026463158428668976, 0.00030346959829330444, 0.00034230761229991913, 0.0003811456263065338, 0.0004199836403131485, 0.0004588216543197632, 0.0004976596683263779, 0.0005364976823329926, 0.0005753356963396072, 0.0006141737103462219, 0.0006530117243528366, 0.0006918497383594513, 0.000730687752366066, 0.0007695257663726807, 0.0008083637803792953, 0.00084720179438591, 0.0008860398083925247, 0.0009248778223991394, 0.0009637158364057541, 0.0010025538504123688, 0.0010413918644189835, 0.0010802298784255981, 0.0011190678924322128, 0.0011579059064388275, 0.0011967439204454422, 0.0012355819344520569, 0.0012744199484586716, 0.0013132579624652863, 0.001352095976471901, 0.0013909339904785156]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 5.0, 7.0, 14.0, 12.0, 11.0, 15.0, 19.0, 21.0, 25.0, 28.0, 22.0, 28.0, 39.0, 33.0, 38.0, 32.0, 45.0, 48.0, 53.0, 46.0, 51.0, 44.0, 44.0, 42.0, 42.0, 32.0, 21.0, 29.0, 19.0, 27.0, 20.0, 16.0, 23.0, 13.0, 6.0, 5.0, 3.0, 2.0, 7.0, 3.0, 1.0, 1.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-18.21875, -17.60546875, -16.9921875, -16.37890625, -15.765625, -15.15234375, -14.5390625, -13.92578125, -13.3125, -12.69921875, -12.0859375, -11.47265625, -10.859375, -10.24609375, -9.6328125, -9.01953125, -8.40625, -7.79296875, -7.1796875, -6.56640625, -5.953125, -5.33984375, -4.7265625, -4.11328125, -3.5, -2.88671875, -2.2734375, -1.66015625, -1.046875, -0.43359375, 0.1796875, 0.79296875, 1.40625, 2.01953125, 2.6328125, 3.24609375, 3.859375, 4.47265625, 5.0859375, 5.69921875, 6.3125, 6.92578125, 7.5390625, 8.15234375, 8.765625, 9.37890625, 9.9921875, 10.60546875, 11.21875, 11.83203125, 12.4453125, 13.05859375, 13.671875, 14.28515625, 14.8984375, 15.51171875, 16.125, 16.73828125, 17.3515625, 17.96484375, 18.578125, 19.19140625, 19.8046875, 20.41796875, 21.03125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 7.0, 7.0, 7.0, 14.0, 16.0, 20.0, 27.0, 42.0, 44.0, 72.0, 93.0, 140.0, 160.0, 193.0, 315.0, 434.0, 568.0, 725.0, 873.0, 1255.0, 2073.0, 5424.0, 27878.0, 224211.0, 627788.0, 129413.0, 16494.0, 3820.0, 1811.0, 1143.0, 835.0, 652.0, 535.0, 396.0, 279.0, 206.0, 139.0, 126.0, 101.0, 67.0, 32.0, 26.0, 28.0, 25.0, 14.0, 7.0, 10.0, 4.0, 3.0, 1.0, 7.0, 0.0, 3.0, 1.0, 1.0, 1.0], "bins": [-30.390625, -29.45166015625, -28.5126953125, -27.57373046875, -26.634765625, -25.69580078125, -24.7568359375, -23.81787109375, -22.87890625, -21.93994140625, -21.0009765625, -20.06201171875, -19.123046875, -18.18408203125, -17.2451171875, -16.30615234375, -15.3671875, -14.42822265625, -13.4892578125, -12.55029296875, -11.611328125, -10.67236328125, -9.7333984375, -8.79443359375, -7.85546875, -6.91650390625, -5.9775390625, -5.03857421875, -4.099609375, -3.16064453125, -2.2216796875, -1.28271484375, -0.34375, 0.59521484375, 1.5341796875, 2.47314453125, 3.412109375, 4.35107421875, 5.2900390625, 6.22900390625, 7.16796875, 8.10693359375, 9.0458984375, 9.98486328125, 10.923828125, 11.86279296875, 12.8017578125, 13.74072265625, 14.6796875, 15.61865234375, 16.5576171875, 17.49658203125, 18.435546875, 19.37451171875, 20.3134765625, 21.25244140625, 22.19140625, 23.13037109375, 24.0693359375, 25.00830078125, 25.947265625, 26.88623046875, 27.8251953125, 28.76416015625, 29.703125]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 6.0, 7.0, 8.0, 10.0, 12.0, 6.0, 13.0, 22.0, 17.0, 20.0, 23.0, 35.0, 28.0, 35.0, 39.0, 30.0, 80.0, 66.0, 109.0, 1454.0, 470.0, 139.0, 59.0, 44.0, 48.0, 34.0, 32.0, 31.0, 34.0, 18.0, 20.0, 20.0, 16.0, 13.0, 13.0, 5.0, 8.0, 5.0, 4.0, 4.0, 4.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.96875, -44.32666015625, -42.6845703125, -41.04248046875, -39.400390625, -37.75830078125, -36.1162109375, -34.47412109375, -32.83203125, -31.18994140625, -29.5478515625, -27.90576171875, -26.263671875, -24.62158203125, -22.9794921875, -21.33740234375, -19.6953125, -18.05322265625, -16.4111328125, -14.76904296875, -13.126953125, -11.48486328125, -9.8427734375, -8.20068359375, -6.55859375, -4.91650390625, -3.2744140625, -1.63232421875, 0.009765625, 1.65185546875, 3.2939453125, 4.93603515625, 6.578125, 8.22021484375, 9.8623046875, 11.50439453125, 13.146484375, 14.78857421875, 16.4306640625, 18.07275390625, 19.71484375, 21.35693359375, 22.9990234375, 24.64111328125, 26.283203125, 27.92529296875, 29.5673828125, 31.20947265625, 32.8515625, 34.49365234375, 36.1357421875, 37.77783203125, 39.419921875, 41.06201171875, 42.7041015625, 44.34619140625, 45.98828125, 47.63037109375, 49.2724609375, 50.91455078125, 52.556640625, 54.19873046875, 55.8408203125, 57.48291015625, 59.125]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 4.0, 5.0, 6.0, 5.0, 5.0, 13.0, 11.0, 6.0, 13.0, 16.0, 19.0, 27.0, 26.0, 45.0, 48.0, 68.0, 74.0, 97.0, 152.0, 253.0, 465.0, 1150.0, 8116.0, 3126578.0, 6034.0, 1048.0, 466.0, 278.0, 170.0, 120.0, 64.0, 75.0, 56.0, 41.0, 32.0, 32.0, 26.0, 15.0, 13.0, 12.0, 8.0, 5.0, 3.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0], "bins": [-158.375, -154.0322265625, -149.689453125, -145.3466796875, -141.00390625, -136.6611328125, -132.318359375, -127.9755859375, -123.6328125, -119.2900390625, -114.947265625, -110.6044921875, -106.26171875, -101.9189453125, -97.576171875, -93.2333984375, -88.890625, -84.5478515625, -80.205078125, -75.8623046875, -71.51953125, -67.1767578125, -62.833984375, -58.4912109375, -54.1484375, -49.8056640625, -45.462890625, -41.1201171875, -36.77734375, -32.4345703125, -28.091796875, -23.7490234375, -19.40625, -15.0634765625, -10.720703125, -6.3779296875, -2.03515625, 2.3076171875, 6.650390625, 10.9931640625, 15.3359375, 19.6787109375, 24.021484375, 28.3642578125, 32.70703125, 37.0498046875, 41.392578125, 45.7353515625, 50.078125, 54.4208984375, 58.763671875, 63.1064453125, 67.44921875, 71.7919921875, 76.134765625, 80.4775390625, 84.8203125, 89.1630859375, 93.505859375, 97.8486328125, 102.19140625, 106.5341796875, 110.876953125, 115.2197265625, 119.5625]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 170.0, 801.0, 42.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.3962631225586, -51.85700607299805, -36.3177490234375, -20.778488159179688, -5.239231109619141, 10.300025939941406, 25.83928680419922, 41.3785400390625, 56.91780090332031, 72.45706176757812, 87.9963150024414, 103.53557586669922, 119.0748291015625, 134.6140899658203, 150.15335083007812, 165.69259643554688, 181.23187255859375, 196.77113342285156, 212.31039428710938, 227.84963989257812, 243.38890075683594, 258.92816162109375, 274.4674072265625, 290.0066833496094, 305.5459289550781, 321.0851745605469, 336.62445068359375, 352.1636962890625, 367.7029724121094, 383.2422180175781, 398.781494140625, 414.32073974609375, 429.8600158691406, 445.3992614746094, 460.93853759765625, 476.477783203125, 492.0170593261719, 507.5563049316406, 523.0955810546875, 538.6348266601562, 554.174072265625, 569.7133178710938, 585.2525634765625, 600.7918701171875, 616.3311157226562, 631.870361328125, 647.4096069335938, 662.9488525390625, 678.4881591796875, 694.0274047851562, 709.566650390625, 725.10595703125, 740.6452026367188, 756.1844482421875, 771.7236938476562, 787.262939453125, 802.8021850585938, 818.3414306640625, 833.8806762695312, 849.4199829101562, 864.959228515625, 880.4984741210938, 896.0377197265625, 911.5769653320312, 927.1162719726562]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 1.0, 0.0, 6.0, 9.0, 7.0, 9.0, 6.0, 15.0, 12.0, 21.0, 16.0, 24.0, 32.0, 26.0, 27.0, 36.0, 37.0, 45.0, 45.0, 43.0, 64.0, 44.0, 50.0, 50.0, 42.0, 32.0, 38.0, 26.0, 33.0, 30.0, 22.0, 24.0, 23.0, 21.0, 19.0, 17.0, 8.0, 11.0, 8.0, 7.0, 7.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-155.98114013671875, -151.36285400390625, -146.7445526123047, -142.1262664794922, -137.5079803466797, -132.88967895507812, -128.27139282226562, -123.65310668945312, -119.0348129272461, -114.41651916503906, -109.79823303222656, -105.17993927001953, -100.5616455078125, -95.943359375, -91.32506561279297, -86.70677185058594, -82.08848571777344, -77.4701919555664, -72.8519058227539, -68.23361206054688, -63.61532211303711, -58.997032165527344, -54.37873840332031, -49.76044845581055, -45.14215850830078, -40.523868560791016, -35.90557861328125, -31.28728485107422, -26.668994903564453, -22.050704956054688, -17.43241310119629, -12.81412124633789, -8.195831298828125, -3.577540397644043, 1.040750503540039, 5.659041404724121, 10.277332305908203, 14.895622253417969, 19.513914108276367, 24.132205963134766, 28.75049591064453, 33.3687858581543, 37.98707580566406, 42.605369567871094, 47.22365951538086, 51.841949462890625, 56.460243225097656, 61.07853317260742, 65.69682312011719, 70.31511688232422, 74.93340301513672, 79.55169677734375, 84.16998291015625, 88.78827667236328, 93.40657043457031, 98.02485656738281, 102.64315032958984, 107.26144409179688, 111.87973022460938, 116.4980239868164, 121.11631774902344, 125.73460388183594, 130.35289001464844, 134.97119140625, 139.5894775390625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 4.0, 2.0, 2.0, 5.0, 10.0, 9.0, 5.0, 13.0, 17.0, 10.0, 15.0, 16.0, 23.0, 20.0, 23.0, 29.0, 36.0, 25.0, 27.0, 40.0, 49.0, 44.0, 43.0, 43.0, 51.0, 45.0, 46.0, 53.0, 39.0, 30.0, 29.0, 26.0, 36.0, 23.0, 20.0, 19.0, 12.0, 19.0, 10.0, 15.0, 7.0, 3.0, 4.0, 6.0, 3.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-16.28125, -15.69287109375, -15.1044921875, -14.51611328125, -13.927734375, -13.33935546875, -12.7509765625, -12.16259765625, -11.57421875, -10.98583984375, -10.3974609375, -9.80908203125, -9.220703125, -8.63232421875, -8.0439453125, -7.45556640625, -6.8671875, -6.27880859375, -5.6904296875, -5.10205078125, -4.513671875, -3.92529296875, -3.3369140625, -2.74853515625, -2.16015625, -1.57177734375, -0.9833984375, -0.39501953125, 0.193359375, 0.78173828125, 1.3701171875, 1.95849609375, 2.546875, 3.13525390625, 3.7236328125, 4.31201171875, 4.900390625, 5.48876953125, 6.0771484375, 6.66552734375, 7.25390625, 7.84228515625, 8.4306640625, 9.01904296875, 9.607421875, 10.19580078125, 10.7841796875, 11.37255859375, 11.9609375, 12.54931640625, 13.1376953125, 13.72607421875, 14.314453125, 14.90283203125, 15.4912109375, 16.07958984375, 16.66796875, 17.25634765625, 17.8447265625, 18.43310546875, 19.021484375, 19.60986328125, 20.1982421875, 20.78662109375, 21.375]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 1.0, 8.0, 7.0, 8.0, 6.0, 18.0, 14.0, 18.0, 27.0, 31.0, 32.0, 53.0, 57.0, 75.0, 79.0, 96.0, 123.0, 158.0, 214.0, 320.0, 723.0, 2752.0, 26891.0, 1599153.0, 2513216.0, 44080.0, 3859.0, 874.0, 361.0, 206.0, 143.0, 116.0, 97.0, 87.0, 68.0, 67.0, 57.0, 36.0, 39.0, 22.0, 22.0, 14.0, 13.0, 12.0, 8.0, 6.0, 7.0, 3.0, 6.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-62.53125, -60.45263671875, -58.3740234375, -56.29541015625, -54.216796875, -52.13818359375, -50.0595703125, -47.98095703125, -45.90234375, -43.82373046875, -41.7451171875, -39.66650390625, -37.587890625, -35.50927734375, -33.4306640625, -31.35205078125, -29.2734375, -27.19482421875, -25.1162109375, -23.03759765625, -20.958984375, -18.88037109375, -16.8017578125, -14.72314453125, -12.64453125, -10.56591796875, -8.4873046875, -6.40869140625, -4.330078125, -2.25146484375, -0.1728515625, 1.90576171875, 3.984375, 6.06298828125, 8.1416015625, 10.22021484375, 12.298828125, 14.37744140625, 16.4560546875, 18.53466796875, 20.61328125, 22.69189453125, 24.7705078125, 26.84912109375, 28.927734375, 31.00634765625, 33.0849609375, 35.16357421875, 37.2421875, 39.32080078125, 41.3994140625, 43.47802734375, 45.556640625, 47.63525390625, 49.7138671875, 51.79248046875, 53.87109375, 55.94970703125, 58.0283203125, 60.10693359375, 62.185546875, 64.26416015625, 66.3427734375, 68.42138671875, 70.5]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 5.0, 0.0, 3.0, 5.0, 1.0, 4.0, 2.0, 2.0, 6.0, 5.0, 8.0, 18.0, 21.0, 21.0, 30.0, 34.0, 35.0, 55.0, 70.0, 96.0, 126.0, 182.0, 179.0, 276.0, 398.0, 486.0, 447.0, 385.0, 303.0, 194.0, 132.0, 113.0, 93.0, 87.0, 57.0, 56.0, 34.0, 23.0, 30.0, 13.0, 6.0, 13.0, 13.0, 4.0, 3.0, 4.0, 6.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.15625, -23.291259765625, -22.42626953125, -21.561279296875, -20.6962890625, -19.831298828125, -18.96630859375, -18.101318359375, -17.236328125, -16.371337890625, -15.50634765625, -14.641357421875, -13.7763671875, -12.911376953125, -12.04638671875, -11.181396484375, -10.31640625, -9.451416015625, -8.58642578125, -7.721435546875, -6.8564453125, -5.991455078125, -5.12646484375, -4.261474609375, -3.396484375, -2.531494140625, -1.66650390625, -0.801513671875, 0.0634765625, 0.928466796875, 1.79345703125, 2.658447265625, 3.5234375, 4.388427734375, 5.25341796875, 6.118408203125, 6.9833984375, 7.848388671875, 8.71337890625, 9.578369140625, 10.443359375, 11.308349609375, 12.17333984375, 13.038330078125, 13.9033203125, 14.768310546875, 15.63330078125, 16.498291015625, 17.36328125, 18.228271484375, 19.09326171875, 19.958251953125, 20.8232421875, 21.688232421875, 22.55322265625, 23.418212890625, 24.283203125, 25.148193359375, 26.01318359375, 26.878173828125, 27.7431640625, 28.608154296875, 29.47314453125, 30.338134765625, 31.203125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 5.0, 4.0, 6.0, 8.0, 25.0, 32.0, 37.0, 46.0, 52.0, 97.0, 179.0, 300.0, 725.0, 2836.0, 127075.0, 4046221.0, 13956.0, 1541.0, 511.0, 227.0, 118.0, 80.0, 61.0, 37.0, 22.0, 22.0, 15.0, 15.0, 7.0, 10.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-160.5, -156.310546875, -152.12109375, -147.931640625, -143.7421875, -139.552734375, -135.36328125, -131.173828125, -126.984375, -122.794921875, -118.60546875, -114.416015625, -110.2265625, -106.037109375, -101.84765625, -97.658203125, -93.46875, -89.279296875, -85.08984375, -80.900390625, -76.7109375, -72.521484375, -68.33203125, -64.142578125, -59.953125, -55.763671875, -51.57421875, -47.384765625, -43.1953125, -39.005859375, -34.81640625, -30.626953125, -26.4375, -22.248046875, -18.05859375, -13.869140625, -9.6796875, -5.490234375, -1.30078125, 2.888671875, 7.078125, 11.267578125, 15.45703125, 19.646484375, 23.8359375, 28.025390625, 32.21484375, 36.404296875, 40.59375, 44.783203125, 48.97265625, 53.162109375, 57.3515625, 61.541015625, 65.73046875, 69.919921875, 74.109375, 78.298828125, 82.48828125, 86.677734375, 90.8671875, 95.056640625, 99.24609375, 103.435546875, 107.625]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 13.0, 304.0, 656.0, 39.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-693.0784912109375, -670.8988037109375, -648.7191162109375, -626.5393676757812, -604.3596801757812, -582.1799926757812, -560.000244140625, -537.820556640625, -515.640869140625, -493.461181640625, -471.2814636230469, -449.10174560546875, -426.92205810546875, -404.74237060546875, -382.5626525878906, -360.3829345703125, -338.2032470703125, -316.0235595703125, -293.8438415527344, -271.66412353515625, -249.48443603515625, -227.3047332763672, -205.12503051757812, -182.94532775878906, -160.765625, -138.58592224121094, -116.40621948242188, -94.22651672363281, -72.04681396484375, -49.86711120605469, -27.687408447265625, -5.5077056884765625, 16.6719970703125, 38.85169982910156, 61.031402587890625, 83.21110534667969, 105.39080810546875, 127.57051086425781, 149.75021362304688, 171.92991638183594, 194.109619140625, 216.28932189941406, 238.46902465820312, 260.64874267578125, 282.82843017578125, 305.00811767578125, 327.1878356933594, 349.3675537109375, 371.5472412109375, 393.7269287109375, 415.9066467285156, 438.08636474609375, 460.26605224609375, 482.44573974609375, 504.6254577636719, 526.80517578125, 548.98486328125, 571.16455078125, 593.34423828125, 615.5239868164062, 637.7036743164062, 659.8833618164062, 682.0631103515625, 704.2427978515625, 726.4224853515625]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 5.0, 0.0, 6.0, 6.0, 11.0, 14.0, 8.0, 16.0, 13.0, 22.0, 13.0, 24.0, 22.0, 32.0, 27.0, 38.0, 26.0, 33.0, 43.0, 44.0, 29.0, 45.0, 41.0, 50.0, 38.0, 36.0, 34.0, 45.0, 34.0, 37.0, 28.0, 32.0, 27.0, 14.0, 16.0, 15.0, 13.0, 9.0, 10.0, 8.0, 8.0, 9.0, 8.0, 5.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-112.80072021484375, -109.21649932861328, -105.63227844238281, -102.04806518554688, -98.4638442993164, -94.87962341308594, -91.29541015625, -87.71118927001953, -84.12696838378906, -80.5427474975586, -76.95852661132812, -73.37431335449219, -69.79009246826172, -66.20587158203125, -62.62165451049805, -59.037437438964844, -55.453216552734375, -51.868995666503906, -48.2847785949707, -44.7005615234375, -41.11634063720703, -37.53211975097656, -33.94790267944336, -30.363683700561523, -26.779464721679688, -23.19524574279785, -19.611026763916016, -16.02680778503418, -12.442588806152344, -8.858369827270508, -5.274150848388672, -1.689931869506836, 1.894287109375, 5.478506088256836, 9.062725067138672, 12.646944046020508, 16.231163024902344, 19.81538200378418, 23.399600982666016, 26.98381996154785, 30.568038940429688, 34.152259826660156, 37.73647689819336, 41.32069396972656, 44.90491485595703, 48.4891357421875, 52.0733528137207, 55.657569885253906, 59.241790771484375, 62.826011657714844, 66.41023254394531, 69.99444580078125, 73.57866668701172, 77.16288757324219, 80.74710083007812, 84.3313217163086, 87.91554260253906, 91.49976348876953, 95.083984375, 98.66819763183594, 102.2524185180664, 105.83663940429688, 109.42085266113281, 113.00507354736328, 116.58929443359375]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 6.0, 6.0, 6.0, 8.0, 21.0, 13.0, 23.0, 20.0, 21.0, 18.0, 20.0, 37.0, 34.0, 38.0, 46.0, 41.0, 41.0, 39.0, 54.0, 44.0, 46.0, 41.0, 35.0, 41.0, 36.0, 37.0, 26.0, 17.0, 24.0, 20.0, 24.0, 20.0, 25.0, 16.0, 12.0, 7.0, 8.0, 7.0, 6.0, 7.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.5703125, -15.0743408203125, -14.578369140625, -14.0823974609375, -13.58642578125, -13.0904541015625, -12.594482421875, -12.0985107421875, -11.6025390625, -11.1065673828125, -10.610595703125, -10.1146240234375, -9.61865234375, -9.1226806640625, -8.626708984375, -8.1307373046875, -7.634765625, -7.1387939453125, -6.642822265625, -6.1468505859375, -5.65087890625, -5.1549072265625, -4.658935546875, -4.1629638671875, -3.6669921875, -3.1710205078125, -2.675048828125, -2.1790771484375, -1.68310546875, -1.1871337890625, -0.691162109375, -0.1951904296875, 0.30078125, 0.7967529296875, 1.292724609375, 1.7886962890625, 2.28466796875, 2.7806396484375, 3.276611328125, 3.7725830078125, 4.2685546875, 4.7645263671875, 5.260498046875, 5.7564697265625, 6.25244140625, 6.7484130859375, 7.244384765625, 7.7403564453125, 8.236328125, 8.7322998046875, 9.228271484375, 9.7242431640625, 10.22021484375, 10.7161865234375, 11.212158203125, 11.7081298828125, 12.2041015625, 12.7000732421875, 13.196044921875, 13.6920166015625, 14.18798828125, 14.6839599609375, 15.179931640625, 15.6759033203125, 16.171875]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 4.0, 5.0, 16.0, 17.0, 28.0, 41.0, 55.0, 100.0, 130.0, 195.0, 314.0, 436.0, 697.0, 1007.0, 1552.0, 2274.0, 3579.0, 5476.0, 8002.0, 12105.0, 18647.0, 30417.0, 51436.0, 90080.0, 188544.0, 325076.0, 129515.0, 69317.0, 40566.0, 24239.0, 14905.0, 10081.0, 6689.0, 4473.0, 2897.0, 1899.0, 1271.0, 816.0, 563.0, 327.0, 246.0, 169.0, 104.0, 83.0, 66.0, 46.0, 16.0, 10.0, 7.0, 8.0, 9.0, 4.0, 2.0, 0.0, 1.0, 2.0, 2.0, 1.0], "bins": [-3.43359375, -3.32379150390625, -3.2139892578125, -3.10418701171875, -2.994384765625, -2.88458251953125, -2.7747802734375, -2.66497802734375, -2.55517578125, -2.44537353515625, -2.3355712890625, -2.22576904296875, -2.115966796875, -2.00616455078125, -1.8963623046875, -1.78656005859375, -1.6767578125, -1.56695556640625, -1.4571533203125, -1.34735107421875, -1.237548828125, -1.12774658203125, -1.0179443359375, -0.90814208984375, -0.79833984375, -0.68853759765625, -0.5787353515625, -0.46893310546875, -0.359130859375, -0.24932861328125, -0.1395263671875, -0.02972412109375, 0.080078125, 0.18988037109375, 0.2996826171875, 0.40948486328125, 0.519287109375, 0.62908935546875, 0.7388916015625, 0.84869384765625, 0.95849609375, 1.06829833984375, 1.1781005859375, 1.28790283203125, 1.397705078125, 1.50750732421875, 1.6173095703125, 1.72711181640625, 1.8369140625, 1.94671630859375, 2.0565185546875, 2.16632080078125, 2.276123046875, 2.38592529296875, 2.4957275390625, 2.60552978515625, 2.71533203125, 2.82513427734375, 2.9349365234375, 3.04473876953125, 3.154541015625, 3.26434326171875, 3.3741455078125, 3.48394775390625, 3.59375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 3.0, 6.0, 5.0, 7.0, 9.0, 10.0, 14.0, 15.0, 16.0, 17.0, 13.0, 21.0, 33.0, 34.0, 33.0, 41.0, 35.0, 38.0, 30.0, 44.0, 48.0, 1059.0, 35.0, 53.0, 40.0, 40.0, 36.0, 35.0, 31.0, 29.0, 32.0, 24.0, 18.0, 22.0, 22.0, 11.0, 13.0, 8.0, 7.0, 5.0, 9.0, 9.0, 5.0, 8.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.3359375, -9.026611328125, -8.71728515625, -8.407958984375, -8.0986328125, -7.789306640625, -7.47998046875, -7.170654296875, -6.861328125, -6.552001953125, -6.24267578125, -5.933349609375, -5.6240234375, -5.314697265625, -5.00537109375, -4.696044921875, -4.38671875, -4.077392578125, -3.76806640625, -3.458740234375, -3.1494140625, -2.840087890625, -2.53076171875, -2.221435546875, -1.912109375, -1.602783203125, -1.29345703125, -0.984130859375, -0.6748046875, -0.365478515625, -0.05615234375, 0.253173828125, 0.5625, 0.871826171875, 1.18115234375, 1.490478515625, 1.7998046875, 2.109130859375, 2.41845703125, 2.727783203125, 3.037109375, 3.346435546875, 3.65576171875, 3.965087890625, 4.2744140625, 4.583740234375, 4.89306640625, 5.202392578125, 5.51171875, 5.821044921875, 6.13037109375, 6.439697265625, 6.7490234375, 7.058349609375, 7.36767578125, 7.677001953125, 7.986328125, 8.295654296875, 8.60498046875, 8.914306640625, 9.2236328125, 9.532958984375, 9.84228515625, 10.151611328125, 10.4609375]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 5.0, 4.0, 7.0, 16.0, 13.0, 36.0, 40.0, 88.0, 90.0, 145.0, 222.0, 353.0, 422.0, 598.0, 966.0, 1341.0, 1918.0, 2837.0, 4055.0, 5696.0, 8345.0, 12238.0, 18832.0, 28624.0, 45152.0, 74203.0, 133788.0, 1344248.0, 170697.0, 88800.0, 53231.0, 33416.0, 21439.0, 14297.0, 9697.0, 6528.0, 4539.0, 3097.0, 2189.0, 1520.0, 1059.0, 759.0, 556.0, 336.0, 227.0, 177.0, 107.0, 61.0, 41.0, 35.0, 17.0, 14.0, 14.0, 4.0, 2.0, 3.0, 3.0, 1.0], "bins": [-3.16015625, -3.0662841796875, -2.972412109375, -2.8785400390625, -2.78466796875, -2.6907958984375, -2.596923828125, -2.5030517578125, -2.4091796875, -2.3153076171875, -2.221435546875, -2.1275634765625, -2.03369140625, -1.9398193359375, -1.845947265625, -1.7520751953125, -1.658203125, -1.5643310546875, -1.470458984375, -1.3765869140625, -1.28271484375, -1.1888427734375, -1.094970703125, -1.0010986328125, -0.9072265625, -0.8133544921875, -0.719482421875, -0.6256103515625, -0.53173828125, -0.4378662109375, -0.343994140625, -0.2501220703125, -0.15625, -0.0623779296875, 0.031494140625, 0.1253662109375, 0.21923828125, 0.3131103515625, 0.406982421875, 0.5008544921875, 0.5947265625, 0.6885986328125, 0.782470703125, 0.8763427734375, 0.97021484375, 1.0640869140625, 1.157958984375, 1.2518310546875, 1.345703125, 1.4395751953125, 1.533447265625, 1.6273193359375, 1.72119140625, 1.8150634765625, 1.908935546875, 2.0028076171875, 2.0966796875, 2.1905517578125, 2.284423828125, 2.3782958984375, 2.47216796875, 2.5660400390625, 2.659912109375, 2.7537841796875, 2.84765625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 2.0, 5.0, 3.0, 4.0, 9.0, 3.0, 10.0, 7.0, 14.0, 14.0, 16.0, 27.0, 21.0, 25.0, 45.0, 46.0, 59.0, 73.0, 68.0, 81.0, 69.0, 64.0, 57.0, 50.0, 40.0, 35.0, 29.0, 22.0, 11.0, 14.0, 13.0, 8.0, 10.0, 5.0, 8.0, 2.0, 5.0, 4.0, 5.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0014400482177734375, -0.0013910681009292603, -0.001342087984085083, -0.0012931078672409058, -0.0012441277503967285, -0.0011951476335525513, -0.001146167516708374, -0.0010971873998641968, -0.0010482072830200195, -0.0009992271661758423, -0.000950247049331665, -0.0009012669324874878, -0.0008522868156433105, -0.0008033066987991333, -0.0007543265819549561, -0.0007053464651107788, -0.0006563663482666016, -0.0006073862314224243, -0.0005584061145782471, -0.0005094259977340698, -0.0004604458808898926, -0.00041146576404571533, -0.0003624856472015381, -0.00031350553035736084, -0.0002645254135131836, -0.00021554529666900635, -0.0001665651798248291, -0.00011758506298065186, -6.860494613647461e-05, -1.9624829292297363e-05, 2.9355287551879883e-05, 7.833540439605713e-05, 0.00012731552124023438, 0.00017629563808441162, 0.00022527575492858887, 0.0002742558717727661, 0.00032323598861694336, 0.0003722161054611206, 0.00042119622230529785, 0.0004701763391494751, 0.0005191564559936523, 0.0005681365728378296, 0.0006171166896820068, 0.0006660968065261841, 0.0007150769233703613, 0.0007640570402145386, 0.0008130371570587158, 0.0008620172739028931, 0.0009109973907470703, 0.0009599775075912476, 0.0010089576244354248, 0.001057937741279602, 0.0011069178581237793, 0.0011558979749679565, 0.0012048780918121338, 0.001253858208656311, 0.0013028383255004883, 0.0013518184423446655, 0.0014007985591888428, 0.00144977867603302, 0.0014987587928771973, 0.0015477389097213745, 0.0015967190265655518, 0.001645699143409729, 0.0016946792602539062]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 4.0, 6.0, 1.0, 5.0, 8.0, 8.0, 5.0, 8.0, 11.0, 19.0, 26.0, 20.0, 25.0, 27.0, 52.0, 59.0, 74.0, 111.0, 137.0, 207.0, 307.0, 445.0, 854.0, 12815.0, 1018355.0, 12634.0, 802.0, 427.0, 312.0, 184.0, 127.0, 98.0, 67.0, 69.0, 51.0, 34.0, 34.0, 32.0, 14.0, 15.0, 16.0, 12.0, 5.0, 5.0, 8.0, 6.0, 3.0, 6.0, 1.0, 5.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.0302581787109375, -0.02938103675842285, -0.028503894805908203, -0.027626752853393555, -0.026749610900878906, -0.025872468948364258, -0.02499532699584961, -0.02411818504333496, -0.023241043090820312, -0.022363901138305664, -0.021486759185791016, -0.020609617233276367, -0.01973247528076172, -0.01885533332824707, -0.017978191375732422, -0.017101049423217773, -0.016223907470703125, -0.015346765518188477, -0.014469623565673828, -0.01359248161315918, -0.012715339660644531, -0.011838197708129883, -0.010961055755615234, -0.010083913803100586, -0.009206771850585938, -0.008329629898071289, -0.007452487945556641, -0.006575345993041992, -0.005698204040527344, -0.004821062088012695, -0.003943920135498047, -0.0030667781829833984, -0.00218963623046875, -0.0013124942779541016, -0.0004353523254394531, 0.0004417896270751953, 0.0013189315795898438, 0.002196073532104492, 0.0030732154846191406, 0.003950357437133789, 0.0048274993896484375, 0.005704641342163086, 0.006581783294677734, 0.007458925247192383, 0.008336067199707031, 0.00921320915222168, 0.010090351104736328, 0.010967493057250977, 0.011844635009765625, 0.012721776962280273, 0.013598918914794922, 0.01447606086730957, 0.015353202819824219, 0.016230344772338867, 0.017107486724853516, 0.017984628677368164, 0.018861770629882812, 0.01973891258239746, 0.02061605453491211, 0.021493196487426758, 0.022370338439941406, 0.023247480392456055, 0.024124622344970703, 0.02500176429748535, 0.02587890625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 9.0, 193.0, 711.0, 99.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017805881798267365, -0.00159098906442523, -0.0014013899490237236, -0.0012117908336222172, -0.0010221917182207108, -0.0008325926028192043, -0.0006429934874176979, -0.0004533943720161915, -0.00026379525661468506, -7.419614121317863e-05, 0.00011540297418832779, 0.0003050020895898342, 0.0004946012049913406, 0.0006842003203928471, 0.0008737994357943535, 0.00106339855119586, 0.0012529976665973663, 0.0014425967819988728, 0.0016321958974003792, 0.0018217950128018856, 0.002011394128203392, 0.0022009932436048985, 0.002390592359006405, 0.0025801914744079113, 0.0027697905898094177, 0.002959389705210924, 0.0031489888206124306, 0.003338587936013937, 0.0035281870514154434, 0.00371778616681695, 0.003907385282218456, 0.004096984397619963, 0.004286583513021469, 0.0044761826284229755, 0.004665781743824482, 0.004855380859225988, 0.005044979974627495, 0.005234579090029001, 0.005424178205430508, 0.005613777320832014, 0.0058033764362335205, 0.005992975551635027, 0.006182574667036533, 0.00637217378243804, 0.006561772897839546, 0.006751372013241053, 0.006940971128642559, 0.0071305702440440655, 0.007320169359445572, 0.007509768474847078, 0.007699367590248585, 0.007888967171311378, 0.008078565821051598, 0.008268164470791817, 0.00845776405185461, 0.008647363632917404, 0.008836962282657623, 0.009026560932397842, 0.009216160513460636, 0.00940576009452343, 0.009595358744263649, 0.009784957394003868, 0.009974556975066662, 0.010164156556129456, 0.010353755205869675]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 8.0, 3.0, 6.0, 7.0, 4.0, 6.0, 8.0, 17.0, 15.0, 18.0, 24.0, 14.0, 28.0, 27.0, 32.0, 31.0, 44.0, 38.0, 24.0, 43.0, 35.0, 40.0, 47.0, 46.0, 36.0, 43.0, 36.0, 41.0, 31.0, 31.0, 25.0, 30.0, 21.0, 30.0, 25.0, 21.0, 11.0, 13.0, 9.0, 7.0, 9.0, 7.0, 2.0, 3.0, 3.0, 2.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0007255077362060547, -0.000700872391462326, -0.0006762370467185974, -0.0006516017019748688, -0.0006269663572311401, -0.0006023310124874115, -0.0005776956677436829, -0.0005530603229999542, -0.0005284249782562256, -0.000503789633512497, -0.0004791542887687683, -0.00045451894402503967, -0.00042988359928131104, -0.0004052482545375824, -0.00038061290979385376, -0.0003559775650501251, -0.0003313422203063965, -0.00030670687556266785, -0.0002820715308189392, -0.00025743618607521057, -0.00023280084133148193, -0.0002081654965877533, -0.00018353015184402466, -0.00015889480710029602, -0.00013425946235656738, -0.00010962411761283875, -8.498877286911011e-05, -6.035342812538147e-05, -3.571808338165283e-05, -1.1082738637924194e-05, 1.3552606105804443e-05, 3.818795084953308e-05, 6.282329559326172e-05, 8.745864033699036e-05, 0.000112093985080719, 0.00013672932982444763, 0.00016136467456817627, 0.0001860000193119049, 0.00021063536405563354, 0.00023527070879936218, 0.0002599060535430908, 0.00028454139828681946, 0.0003091767430305481, 0.00033381208777427673, 0.00035844743251800537, 0.000383082777261734, 0.00040771812200546265, 0.0004323534667491913, 0.0004569888114929199, 0.00048162415623664856, 0.0005062595009803772, 0.0005308948457241058, 0.0005555301904678345, 0.0005801655352115631, 0.0006048008799552917, 0.0006294362246990204, 0.000654071569442749, 0.0006787069141864777, 0.0007033422589302063, 0.0007279776036739349, 0.0007526129484176636, 0.0007772482931613922, 0.0008018836379051208, 0.0008265189826488495, 0.0008511543273925781]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 5.0, 6.0, 6.0, 6.0, 8.0, 21.0, 13.0, 23.0, 20.0, 21.0, 18.0, 20.0, 37.0, 34.0, 38.0, 46.0, 41.0, 41.0, 39.0, 54.0, 44.0, 46.0, 41.0, 36.0, 40.0, 36.0, 37.0, 26.0, 17.0, 24.0, 20.0, 24.0, 20.0, 25.0, 16.0, 12.0, 7.0, 8.0, 7.0, 6.0, 7.0, 3.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-15.5703125, -15.0743408203125, -14.578369140625, -14.0823974609375, -13.58642578125, -13.0904541015625, -12.594482421875, -12.0985107421875, -11.6025390625, -11.1065673828125, -10.610595703125, -10.1146240234375, -9.61865234375, -9.1226806640625, -8.626708984375, -8.1307373046875, -7.634765625, -7.1387939453125, -6.642822265625, -6.1468505859375, -5.65087890625, -5.1549072265625, -4.658935546875, -4.1629638671875, -3.6669921875, -3.1710205078125, -2.675048828125, -2.1790771484375, -1.68310546875, -1.1871337890625, -0.691162109375, -0.1951904296875, 0.30078125, 0.7967529296875, 1.292724609375, 1.7886962890625, 2.28466796875, 2.7806396484375, 3.276611328125, 3.7725830078125, 4.2685546875, 4.7645263671875, 5.260498046875, 5.7564697265625, 6.25244140625, 6.7484130859375, 7.244384765625, 7.7403564453125, 8.236328125, 8.7322998046875, 9.228271484375, 9.7242431640625, 10.22021484375, 10.7161865234375, 11.212158203125, 11.7081298828125, 12.2041015625, 12.7000732421875, 13.196044921875, 13.6920166015625, 14.18798828125, 14.6839599609375, 15.179931640625, 15.6759033203125, 16.171875]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 0.0, 5.0, 14.0, 15.0, 12.0, 17.0, 28.0, 38.0, 58.0, 79.0, 109.0, 142.0, 213.0, 316.0, 484.0, 674.0, 1088.0, 1556.0, 2608.0, 5664.0, 24297.0, 327188.0, 624771.0, 42955.0, 7647.0, 3137.0, 1790.0, 1164.0, 780.0, 547.0, 364.0, 259.0, 147.0, 112.0, 79.0, 59.0, 43.0, 34.0, 13.0, 10.0, 10.0, 10.0, 7.0, 7.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-41.84375, -40.54150390625, -39.2392578125, -37.93701171875, -36.634765625, -35.33251953125, -34.0302734375, -32.72802734375, -31.42578125, -30.12353515625, -28.8212890625, -27.51904296875, -26.216796875, -24.91455078125, -23.6123046875, -22.31005859375, -21.0078125, -19.70556640625, -18.4033203125, -17.10107421875, -15.798828125, -14.49658203125, -13.1943359375, -11.89208984375, -10.58984375, -9.28759765625, -7.9853515625, -6.68310546875, -5.380859375, -4.07861328125, -2.7763671875, -1.47412109375, -0.171875, 1.13037109375, 2.4326171875, 3.73486328125, 5.037109375, 6.33935546875, 7.6416015625, 8.94384765625, 10.24609375, 11.54833984375, 12.8505859375, 14.15283203125, 15.455078125, 16.75732421875, 18.0595703125, 19.36181640625, 20.6640625, 21.96630859375, 23.2685546875, 24.57080078125, 25.873046875, 27.17529296875, 28.4775390625, 29.77978515625, 31.08203125, 32.38427734375, 33.6865234375, 34.98876953125, 36.291015625, 37.59326171875, 38.8955078125, 40.19775390625, 41.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 4.0, 2.0, 13.0, 5.0, 8.0, 18.0, 12.0, 25.0, 19.0, 32.0, 40.0, 48.0, 55.0, 57.0, 58.0, 107.0, 1624.0, 471.0, 76.0, 42.0, 56.0, 37.0, 34.0, 40.0, 37.0, 33.0, 24.0, 18.0, 12.0, 9.0, 15.0, 4.0, 2.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.15625, -50.41455078125, -48.6728515625, -46.93115234375, -45.189453125, -43.44775390625, -41.7060546875, -39.96435546875, -38.22265625, -36.48095703125, -34.7392578125, -32.99755859375, -31.255859375, -29.51416015625, -27.7724609375, -26.03076171875, -24.2890625, -22.54736328125, -20.8056640625, -19.06396484375, -17.322265625, -15.58056640625, -13.8388671875, -12.09716796875, -10.35546875, -8.61376953125, -6.8720703125, -5.13037109375, -3.388671875, -1.64697265625, 0.0947265625, 1.83642578125, 3.578125, 5.31982421875, 7.0615234375, 8.80322265625, 10.544921875, 12.28662109375, 14.0283203125, 15.77001953125, 17.51171875, 19.25341796875, 20.9951171875, 22.73681640625, 24.478515625, 26.22021484375, 27.9619140625, 29.70361328125, 31.4453125, 33.18701171875, 34.9287109375, 36.67041015625, 38.412109375, 40.15380859375, 41.8955078125, 43.63720703125, 45.37890625, 47.12060546875, 48.8623046875, 50.60400390625, 52.345703125, 54.08740234375, 55.8291015625, 57.57080078125, 59.3125]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 7.0, 5.0, 11.0, 9.0, 15.0, 14.0, 23.0, 26.0, 47.0, 69.0, 72.0, 111.0, 171.0, 310.0, 756.0, 5018.0, 3134496.0, 3042.0, 693.0, 279.0, 150.0, 101.0, 94.0, 39.0, 57.0, 27.0, 18.0, 18.0, 12.0, 5.0, 4.0, 7.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-193.875, -188.244140625, -182.61328125, -176.982421875, -171.3515625, -165.720703125, -160.08984375, -154.458984375, -148.828125, -143.197265625, -137.56640625, -131.935546875, -126.3046875, -120.673828125, -115.04296875, -109.412109375, -103.78125, -98.150390625, -92.51953125, -86.888671875, -81.2578125, -75.626953125, -69.99609375, -64.365234375, -58.734375, -53.103515625, -47.47265625, -41.841796875, -36.2109375, -30.580078125, -24.94921875, -19.318359375, -13.6875, -8.056640625, -2.42578125, 3.205078125, 8.8359375, 14.466796875, 20.09765625, 25.728515625, 31.359375, 36.990234375, 42.62109375, 48.251953125, 53.8828125, 59.513671875, 65.14453125, 70.775390625, 76.40625, 82.037109375, 87.66796875, 93.298828125, 98.9296875, 104.560546875, 110.19140625, 115.822265625, 121.453125, 127.083984375, 132.71484375, 138.345703125, 143.9765625, 149.607421875, 155.23828125, 160.869140625, 166.5]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 19.0, 267.0, 635.0, 84.0, 7.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-460.7056884765625, -450.5337219238281, -440.36175537109375, -430.1897888183594, -420.017822265625, -409.84588623046875, -399.67388916015625, -389.501953125, -379.3299865722656, -369.15802001953125, -358.9860534667969, -348.8140869140625, -338.6421203613281, -328.47015380859375, -318.2982177734375, -308.1262512207031, -297.95428466796875, -287.7823181152344, -277.6103515625, -267.4383850097656, -257.26641845703125, -247.09446716308594, -236.92250061035156, -226.75054931640625, -216.57855224609375, -206.40658569335938, -196.234619140625, -186.06265258789062, -175.8907012939453, -165.71873474121094, -155.54676818847656, -145.37481689453125, -135.20285034179688, -125.0308837890625, -114.85892486572266, -104.68695831298828, -94.51499938964844, -84.34303283691406, -74.17106628417969, -63.999107360839844, -53.82714080810547, -43.65517807006836, -33.48321533203125, -23.311248779296875, -13.139286041259766, -2.9673233032226562, 7.204643249511719, 17.376602172851562, 27.548568725585938, 37.72053146362305, 47.892494201660156, 58.06446075439453, 68.23641967773438, 78.40838623046875, 88.58035278320312, 98.75231170654297, 108.92427825927734, 119.09624481201172, 129.26820373535156, 139.44017028808594, 149.6121368408203, 159.78408813476562, 169.9560546875, 180.12802124023438, 190.29998779296875]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 8.0, 8.0, 12.0, 14.0, 7.0, 13.0, 18.0, 21.0, 28.0, 35.0, 28.0, 33.0, 38.0, 50.0, 50.0, 56.0, 35.0, 61.0, 57.0, 44.0, 41.0, 44.0, 49.0, 36.0, 32.0, 37.0, 23.0, 34.0, 14.0, 18.0, 9.0, 10.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 5.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-163.5412139892578, -158.53985595703125, -153.5384979248047, -148.53713989257812, -143.53578186035156, -138.534423828125, -133.53306579589844, -128.53170776367188, -123.53035736083984, -118.52899932861328, -113.52764129638672, -108.52628326416016, -103.52493286132812, -98.52357482910156, -93.522216796875, -88.52085876464844, -83.51950073242188, -78.51814270019531, -73.51678466796875, -68.51542663574219, -63.51407241821289, -58.51271438598633, -53.51136016845703, -48.51000213623047, -43.508644104003906, -38.507286071777344, -33.50592803955078, -28.504573822021484, -23.503215789794922, -18.50185775756836, -13.50050163269043, -8.4991455078125, -3.497802734375, 1.503554344177246, 6.504911422729492, 11.506268501281738, 16.507625579833984, 21.508983612060547, 26.510339736938477, 31.511695861816406, 36.51305389404297, 41.51441192626953, 46.515769958496094, 51.51712417602539, 56.51848220825195, 61.519840240478516, 66.52119445800781, 71.52255249023438, 76.52391052246094, 81.5252685546875, 86.52662658691406, 91.52798461914062, 96.52934265136719, 101.53070068359375, 106.53205108642578, 111.53340911865234, 116.5347671508789, 121.53612518310547, 126.53748321533203, 131.53883361816406, 136.54019165039062, 141.5415496826172, 146.54290771484375, 151.5442657470703, 156.54562377929688]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 8.0, 8.0, 8.0, 8.0, 16.0, 15.0, 29.0, 15.0, 26.0, 22.0, 32.0, 35.0, 23.0, 40.0, 39.0, 33.0, 42.0, 44.0, 47.0, 37.0, 38.0, 28.0, 33.0, 45.0, 33.0, 47.0, 34.0, 28.0, 30.0, 25.0, 24.0, 20.0, 14.0, 17.0, 15.0, 11.0, 6.0, 8.0, 9.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-15.9140625, -15.4053955078125, -14.896728515625, -14.3880615234375, -13.87939453125, -13.3707275390625, -12.862060546875, -12.3533935546875, -11.8447265625, -11.3360595703125, -10.827392578125, -10.3187255859375, -9.81005859375, -9.3013916015625, -8.792724609375, -8.2840576171875, -7.775390625, -7.2667236328125, -6.758056640625, -6.2493896484375, -5.74072265625, -5.2320556640625, -4.723388671875, -4.2147216796875, -3.7060546875, -3.1973876953125, -2.688720703125, -2.1800537109375, -1.67138671875, -1.1627197265625, -0.654052734375, -0.1453857421875, 0.36328125, 0.8719482421875, 1.380615234375, 1.8892822265625, 2.39794921875, 2.9066162109375, 3.415283203125, 3.9239501953125, 4.4326171875, 4.9412841796875, 5.449951171875, 5.9586181640625, 6.46728515625, 6.9759521484375, 7.484619140625, 7.9932861328125, 8.501953125, 9.0106201171875, 9.519287109375, 10.0279541015625, 10.53662109375, 11.0452880859375, 11.553955078125, 12.0626220703125, 12.5712890625, 13.0799560546875, 13.588623046875, 14.0972900390625, 14.60595703125, 15.1146240234375, 15.623291015625, 16.1319580078125, 16.640625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 3.0, 13.0, 14.0, 19.0, 26.0, 38.0, 49.0, 72.0, 96.0, 138.0, 214.0, 315.0, 481.0, 833.0, 1589.0, 3330.0, 8446.0, 28628.0, 151700.0, 1067252.0, 2209400.0, 610115.0, 81676.0, 18489.0, 5863.0, 2456.0, 1172.0, 653.0, 373.0, 265.0, 162.0, 130.0, 80.0, 61.0, 36.0, 40.0, 21.0, 12.0, 11.0, 6.0, 6.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-26.421875, -25.551025390625, -24.68017578125, -23.809326171875, -22.9384765625, -22.067626953125, -21.19677734375, -20.325927734375, -19.455078125, -18.584228515625, -17.71337890625, -16.842529296875, -15.9716796875, -15.100830078125, -14.22998046875, -13.359130859375, -12.48828125, -11.617431640625, -10.74658203125, -9.875732421875, -9.0048828125, -8.134033203125, -7.26318359375, -6.392333984375, -5.521484375, -4.650634765625, -3.77978515625, -2.908935546875, -2.0380859375, -1.167236328125, -0.29638671875, 0.574462890625, 1.4453125, 2.316162109375, 3.18701171875, 4.057861328125, 4.9287109375, 5.799560546875, 6.67041015625, 7.541259765625, 8.412109375, 9.282958984375, 10.15380859375, 11.024658203125, 11.8955078125, 12.766357421875, 13.63720703125, 14.508056640625, 15.37890625, 16.249755859375, 17.12060546875, 17.991455078125, 18.8623046875, 19.733154296875, 20.60400390625, 21.474853515625, 22.345703125, 23.216552734375, 24.08740234375, 24.958251953125, 25.8291015625, 26.699951171875, 27.57080078125, 28.441650390625, 29.3125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 5.0, 5.0, 5.0, 15.0, 24.0, 38.0, 49.0, 71.0, 113.0, 160.0, 232.0, 316.0, 454.0, 573.0, 581.0, 393.0, 297.0, 199.0, 166.0, 110.0, 82.0, 48.0, 39.0, 20.0, 24.0, 11.0, 9.0, 7.0, 9.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.5625, -34.48681640625, -33.4111328125, -32.33544921875, -31.259765625, -30.18408203125, -29.1083984375, -28.03271484375, -26.95703125, -25.88134765625, -24.8056640625, -23.72998046875, -22.654296875, -21.57861328125, -20.5029296875, -19.42724609375, -18.3515625, -17.27587890625, -16.2001953125, -15.12451171875, -14.048828125, -12.97314453125, -11.8974609375, -10.82177734375, -9.74609375, -8.67041015625, -7.5947265625, -6.51904296875, -5.443359375, -4.36767578125, -3.2919921875, -2.21630859375, -1.140625, -0.06494140625, 1.0107421875, 2.08642578125, 3.162109375, 4.23779296875, 5.3134765625, 6.38916015625, 7.46484375, 8.54052734375, 9.6162109375, 10.69189453125, 11.767578125, 12.84326171875, 13.9189453125, 14.99462890625, 16.0703125, 17.14599609375, 18.2216796875, 19.29736328125, 20.373046875, 21.44873046875, 22.5244140625, 23.60009765625, 24.67578125, 25.75146484375, 26.8271484375, 27.90283203125, 28.978515625, 30.05419921875, 31.1298828125, 32.20556640625, 33.28125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 3.0, 2.0, 5.0, 10.0, 13.0, 18.0, 27.0, 40.0, 62.0, 106.0, 201.0, 398.0, 978.0, 4169.0, 3835889.0, 347848.0, 2929.0, 854.0, 326.0, 178.0, 85.0, 47.0, 35.0, 22.0, 8.0, 6.0, 9.0, 5.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-128.125, -123.359375, -118.59375, -113.828125, -109.0625, -104.296875, -99.53125, -94.765625, -90.0, -85.234375, -80.46875, -75.703125, -70.9375, -66.171875, -61.40625, -56.640625, -51.875, -47.109375, -42.34375, -37.578125, -32.8125, -28.046875, -23.28125, -18.515625, -13.75, -8.984375, -4.21875, 0.546875, 5.3125, 10.078125, 14.84375, 19.609375, 24.375, 29.140625, 33.90625, 38.671875, 43.4375, 48.203125, 52.96875, 57.734375, 62.5, 67.265625, 72.03125, 76.796875, 81.5625, 86.328125, 91.09375, 95.859375, 100.625, 105.390625, 110.15625, 114.921875, 119.6875, 124.453125, 129.21875, 133.984375, 138.75, 143.515625, 148.28125, 153.046875, 157.8125, 162.578125, 167.34375, 172.109375, 176.875]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 87.0, 891.0, 37.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1413.0794677734375, -1386.62109375, -1360.16259765625, -1333.7042236328125, -1307.245849609375, -1280.787353515625, -1254.3289794921875, -1227.87060546875, -1201.412109375, -1174.9537353515625, -1148.4952392578125, -1122.036865234375, -1095.5784912109375, -1069.1199951171875, -1042.66162109375, -1016.2032470703125, -989.744873046875, -963.2864379882812, -936.8280639648438, -910.36962890625, -883.9111938476562, -857.4528198242188, -830.994384765625, -804.5360107421875, -778.0775146484375, -751.6190795898438, -725.1607055664062, -698.7022705078125, -672.2438354492188, -645.7854614257812, -619.3270263671875, -592.86865234375, -566.4102172851562, -539.9517822265625, -513.493408203125, -487.03497314453125, -460.5765686035156, -434.1181640625, -407.65972900390625, -381.2013244628906, -354.742919921875, -328.2845153808594, -301.8260803222656, -275.36767578125, -248.90927124023438, -222.4508514404297, -195.992431640625, -169.53402709960938, -143.07559204101562, -116.61717987060547, -90.15876770019531, -63.700347900390625, -37.24193572998047, -10.783523559570312, 15.674896240234375, 42.13330078125, 68.59172058105469, 95.05013275146484, 121.508544921875, 147.9669647216797, 174.42538452148438, 200.8837890625, 227.3422088623047, 253.8006134033203, 280.259033203125]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 6.0, 7.0, 6.0, 17.0, 13.0, 12.0, 16.0, 20.0, 30.0, 35.0, 32.0, 30.0, 31.0, 38.0, 37.0, 39.0, 37.0, 39.0, 36.0, 42.0, 44.0, 40.0, 32.0, 37.0, 30.0, 35.0, 22.0, 28.0, 20.0, 30.0, 22.0, 19.0, 17.0, 16.0, 20.0, 14.0, 13.0, 12.0, 7.0, 8.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.42303466796875, -110.6944808959961, -106.96592712402344, -103.23736572265625, -99.5088119506836, -95.78025817871094, -92.05170440673828, -88.32315063476562, -84.59458923339844, -80.86603546142578, -77.13748168945312, -73.40892028808594, -69.68036651611328, -65.95181274414062, -62.22325897216797, -58.49470138549805, -54.76614761352539, -51.037593841552734, -47.30903625488281, -43.580482482910156, -39.851924896240234, -36.12337112426758, -32.394813537597656, -28.666259765625, -24.93770408630371, -21.209148406982422, -17.480592727661133, -13.75203800201416, -10.023482322692871, -6.294927597045898, -2.5663719177246094, 1.1621837615966797, 4.890739440917969, 8.619295120239258, 12.347850799560547, 16.076404571533203, 19.804962158203125, 23.53351593017578, 27.26207160949707, 30.99062728881836, 34.71918487548828, 38.44773864746094, 42.17629623413086, 45.904850006103516, 49.63340759277344, 53.361961364746094, 57.09051513671875, 60.81907272338867, 64.54762268066406, 68.27617645263672, 72.00473022460938, 75.73329162597656, 79.46184539794922, 83.19039916992188, 86.91895294189453, 90.64750671386719, 94.37606811523438, 98.10462188720703, 101.83317565917969, 105.56173706054688, 109.29029083251953, 113.01884460449219, 116.74739837646484, 120.4759521484375, 124.20451354980469]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 5.0, 8.0, 14.0, 7.0, 7.0, 11.0, 30.0, 23.0, 27.0, 21.0, 45.0, 28.0, 28.0, 28.0, 43.0, 44.0, 59.0, 40.0, 39.0, 41.0, 46.0, 42.0, 38.0, 23.0, 29.0, 29.0, 31.0, 32.0, 21.0, 24.0, 18.0, 15.0, 29.0, 17.0, 8.0, 13.0, 11.0, 5.0, 6.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.390625, -10.9859619140625, -10.581298828125, -10.1766357421875, -9.77197265625, -9.3673095703125, -8.962646484375, -8.5579833984375, -8.1533203125, -7.7486572265625, -7.343994140625, -6.9393310546875, -6.53466796875, -6.1300048828125, -5.725341796875, -5.3206787109375, -4.916015625, -4.5113525390625, -4.106689453125, -3.7020263671875, -3.29736328125, -2.8927001953125, -2.488037109375, -2.0833740234375, -1.6787109375, -1.2740478515625, -0.869384765625, -0.4647216796875, -0.06005859375, 0.3446044921875, 0.749267578125, 1.1539306640625, 1.55859375, 1.9632568359375, 2.367919921875, 2.7725830078125, 3.17724609375, 3.5819091796875, 3.986572265625, 4.3912353515625, 4.7958984375, 5.2005615234375, 5.605224609375, 6.0098876953125, 6.41455078125, 6.8192138671875, 7.223876953125, 7.6285400390625, 8.033203125, 8.4378662109375, 8.842529296875, 9.2471923828125, 9.65185546875, 10.0565185546875, 10.461181640625, 10.8658447265625, 11.2705078125, 11.6751708984375, 12.079833984375, 12.4844970703125, 12.88916015625, 13.2938232421875, 13.698486328125, 14.1031494140625, 14.5078125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 4.0, 11.0, 20.0, 11.0, 25.0, 56.0, 86.0, 105.0, 171.0, 246.0, 385.0, 558.0, 894.0, 1438.0, 2172.0, 3452.0, 5470.0, 9003.0, 14737.0, 23900.0, 39401.0, 67572.0, 126483.0, 350944.0, 186614.0, 87302.0, 49615.0, 30105.0, 17798.0, 11208.0, 6854.0, 4377.0, 2744.0, 1697.0, 1081.0, 713.0, 474.0, 284.0, 169.0, 115.0, 99.0, 55.0, 34.0, 26.0, 19.0, 10.0, 7.0, 5.0, 3.0, 0.0, 1.0, 4.0], "bins": [-3.40234375, -3.307098388671875, -3.21185302734375, -3.116607666015625, -3.0213623046875, -2.926116943359375, -2.83087158203125, -2.735626220703125, -2.640380859375, -2.545135498046875, -2.44989013671875, -2.354644775390625, -2.2593994140625, -2.164154052734375, -2.06890869140625, -1.973663330078125, -1.87841796875, -1.783172607421875, -1.68792724609375, -1.592681884765625, -1.4974365234375, -1.402191162109375, -1.30694580078125, -1.211700439453125, -1.116455078125, -1.021209716796875, -0.92596435546875, -0.830718994140625, -0.7354736328125, -0.640228271484375, -0.54498291015625, -0.449737548828125, -0.3544921875, -0.259246826171875, -0.16400146484375, -0.068756103515625, 0.0264892578125, 0.121734619140625, 0.21697998046875, 0.312225341796875, 0.407470703125, 0.502716064453125, 0.59796142578125, 0.693206787109375, 0.7884521484375, 0.883697509765625, 0.97894287109375, 1.074188232421875, 1.16943359375, 1.264678955078125, 1.35992431640625, 1.455169677734375, 1.5504150390625, 1.645660400390625, 1.74090576171875, 1.836151123046875, 1.931396484375, 2.026641845703125, 2.12188720703125, 2.217132568359375, 2.3123779296875, 2.407623291015625, 2.50286865234375, 2.598114013671875, 2.693359375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 7.0, 9.0, 4.0, 8.0, 6.0, 9.0, 18.0, 9.0, 10.0, 19.0, 26.0, 18.0, 32.0, 23.0, 38.0, 40.0, 27.0, 40.0, 42.0, 37.0, 40.0, 1078.0, 39.0, 53.0, 50.0, 35.0, 40.0, 43.0, 26.0, 24.0, 20.0, 24.0, 18.0, 16.0, 12.0, 14.0, 16.0, 20.0, 10.0, 3.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 2.0], "bins": [-8.875, -8.62213134765625, -8.3692626953125, -8.11639404296875, -7.863525390625, -7.61065673828125, -7.3577880859375, -7.10491943359375, -6.85205078125, -6.59918212890625, -6.3463134765625, -6.09344482421875, -5.840576171875, -5.58770751953125, -5.3348388671875, -5.08197021484375, -4.8291015625, -4.57623291015625, -4.3233642578125, -4.07049560546875, -3.817626953125, -3.56475830078125, -3.3118896484375, -3.05902099609375, -2.80615234375, -2.55328369140625, -2.3004150390625, -2.04754638671875, -1.794677734375, -1.54180908203125, -1.2889404296875, -1.03607177734375, -0.783203125, -0.53033447265625, -0.2774658203125, -0.02459716796875, 0.228271484375, 0.48114013671875, 0.7340087890625, 0.98687744140625, 1.23974609375, 1.49261474609375, 1.7454833984375, 1.99835205078125, 2.251220703125, 2.50408935546875, 2.7569580078125, 3.00982666015625, 3.2626953125, 3.51556396484375, 3.7684326171875, 4.02130126953125, 4.274169921875, 4.52703857421875, 4.7799072265625, 5.03277587890625, 5.28564453125, 5.53851318359375, 5.7913818359375, 6.04425048828125, 6.297119140625, 6.54998779296875, 6.8028564453125, 7.05572509765625, 7.30859375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 2.0, 5.0, 15.0, 13.0, 19.0, 26.0, 47.0, 65.0, 108.0, 121.0, 193.0, 317.0, 464.0, 657.0, 946.0, 1408.0, 1981.0, 2755.0, 4083.0, 5839.0, 8490.0, 12427.0, 18688.0, 28709.0, 45805.0, 77390.0, 146513.0, 1364604.0, 156187.0, 80941.0, 47795.0, 29998.0, 19382.0, 12719.0, 8844.0, 5916.0, 4245.0, 2935.0, 2046.0, 1443.0, 920.0, 626.0, 468.0, 317.0, 194.0, 184.0, 89.0, 67.0, 50.0, 27.0, 21.0, 10.0, 9.0, 3.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.287109375, -2.209686279296875, -2.13226318359375, -2.054840087890625, -1.9774169921875, -1.899993896484375, -1.82257080078125, -1.745147705078125, -1.667724609375, -1.590301513671875, -1.51287841796875, -1.435455322265625, -1.3580322265625, -1.280609130859375, -1.20318603515625, -1.125762939453125, -1.04833984375, -0.970916748046875, -0.89349365234375, -0.816070556640625, -0.7386474609375, -0.661224365234375, -0.58380126953125, -0.506378173828125, -0.428955078125, -0.351531982421875, -0.27410888671875, -0.196685791015625, -0.1192626953125, -0.041839599609375, 0.03558349609375, 0.113006591796875, 0.1904296875, 0.267852783203125, 0.34527587890625, 0.422698974609375, 0.5001220703125, 0.577545166015625, 0.65496826171875, 0.732391357421875, 0.809814453125, 0.887237548828125, 0.96466064453125, 1.042083740234375, 1.1195068359375, 1.196929931640625, 1.27435302734375, 1.351776123046875, 1.42919921875, 1.506622314453125, 1.58404541015625, 1.661468505859375, 1.7388916015625, 1.816314697265625, 1.89373779296875, 1.971160888671875, 2.048583984375, 2.126007080078125, 2.20343017578125, 2.280853271484375, 2.3582763671875, 2.435699462890625, 2.51312255859375, 2.590545654296875, 2.66796875]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 3.0, 2.0, 9.0, 2.0, 7.0, 10.0, 11.0, 9.0, 11.0, 13.0, 31.0, 21.0, 23.0, 42.0, 40.0, 51.0, 40.0, 51.0, 74.0, 55.0, 51.0, 73.0, 54.0, 49.0, 46.0, 29.0, 28.0, 18.0, 31.0, 17.0, 21.0, 16.0, 14.0, 12.0, 6.0, 7.0, 9.0, 4.0, 5.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0011615753173828125, -0.001124158501625061, -0.0010867416858673096, -0.001049324870109558, -0.0010119080543518066, -0.0009744912385940552, -0.0009370744228363037, -0.0008996576070785522, -0.0008622407913208008, -0.0008248239755630493, -0.0007874071598052979, -0.0007499903440475464, -0.0007125735282897949, -0.0006751567125320435, -0.000637739896774292, -0.0006003230810165405, -0.0005629062652587891, -0.0005254894495010376, -0.00048807263374328613, -0.00045065581798553467, -0.0004132390022277832, -0.00037582218647003174, -0.0003384053707122803, -0.0003009885549545288, -0.00026357173919677734, -0.00022615492343902588, -0.00018873810768127441, -0.00015132129192352295, -0.00011390447616577148, -7.648766040802002e-05, -3.9070844650268555e-05, -1.6540288925170898e-06, 3.5762786865234375e-05, 7.317960262298584e-05, 0.0001105964183807373, 0.00014801323413848877, 0.00018543004989624023, 0.0002228468656539917, 0.00026026368141174316, 0.00029768049716949463, 0.0003350973129272461, 0.00037251412868499756, 0.000409930944442749, 0.0004473477602005005, 0.00048476457595825195, 0.0005221813917160034, 0.0005595982074737549, 0.0005970150232315063, 0.0006344318389892578, 0.0006718486547470093, 0.0007092654705047607, 0.0007466822862625122, 0.0007840991020202637, 0.0008215159177780151, 0.0008589327335357666, 0.0008963495492935181, 0.0009337663650512695, 0.000971183180809021, 0.0010085999965667725, 0.001046016812324524, 0.0010834336280822754, 0.0011208504438400269, 0.0011582672595977783, 0.0011956840753555298, 0.0012331008911132812]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 2.0, 6.0, 7.0, 7.0, 15.0, 15.0, 23.0, 24.0, 25.0, 28.0, 53.0, 84.0, 120.0, 143.0, 260.0, 419.0, 762.0, 3069.0, 1038408.0, 3067.0, 773.0, 424.0, 246.0, 153.0, 105.0, 91.0, 48.0, 49.0, 35.0, 27.0, 16.0, 18.0, 9.0, 7.0, 3.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.042510986328125, -0.04124164581298828, -0.03997230529785156, -0.038702964782714844, -0.037433624267578125, -0.036164283752441406, -0.03489494323730469, -0.03362560272216797, -0.03235626220703125, -0.03108692169189453, -0.029817581176757812, -0.028548240661621094, -0.027278900146484375, -0.026009559631347656, -0.024740219116210938, -0.02347087860107422, -0.0222015380859375, -0.02093219757080078, -0.019662857055664062, -0.018393516540527344, -0.017124176025390625, -0.015854835510253906, -0.014585494995117188, -0.013316154479980469, -0.01204681396484375, -0.010777473449707031, -0.009508132934570312, -0.008238792419433594, -0.006969451904296875, -0.005700111389160156, -0.0044307708740234375, -0.0031614303588867188, -0.00189208984375, -0.0006227493286132812, 0.0006465911865234375, 0.0019159317016601562, 0.003185272216796875, 0.004454612731933594, 0.0057239532470703125, 0.006993293762207031, 0.00826263427734375, 0.009531974792480469, 0.010801315307617188, 0.012070655822753906, 0.013339996337890625, 0.014609336853027344, 0.015878677368164062, 0.01714801788330078, 0.0184173583984375, 0.01968669891357422, 0.020956039428710938, 0.022225379943847656, 0.023494720458984375, 0.024764060974121094, 0.026033401489257812, 0.02730274200439453, 0.02857208251953125, 0.02984142303466797, 0.031110763549804688, 0.032380104064941406, 0.033649444580078125, 0.034918785095214844, 0.03618812561035156, 0.03745746612548828, 0.038726806640625]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 87.0, 751.0, 170.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.008135008625686169, -0.007964108139276505, -0.00779320765286684, -0.007622307166457176, -0.007451406680047512, -0.007280506659299135, -0.007109606172889471, -0.006938705686479807, -0.006767805200070143, -0.006596904713660479, -0.0064260042272508144, -0.00625510374084115, -0.0060842037200927734, -0.005913303233683109, -0.005742402747273445, -0.005571502260863781, -0.005400601774454117, -0.005229701288044453, -0.0050588008016347885, -0.004887900315225124, -0.00471699982881546, -0.004546099808067083, -0.004375199321657419, -0.004204298835247755, -0.004033398348838091, -0.0038624978624284267, -0.0036915973760187626, -0.003520697122439742, -0.003349796636030078, -0.0031788961496204138, -0.0030079958960413933, -0.002837095409631729, -0.0026661946903914213, -0.002495294203981757, -0.0023243939504027367, -0.0021534934639930725, -0.0019825929775834084, -0.0018116924911737442, -0.0016407921211794019, -0.0014698917511850595, -0.0012989912647753954, -0.0011280907783657312, -0.0009571904083713889, -0.0007862899801693857, -0.0006153895519673824, -0.0004444891237653792, -0.00027358869556337595, -0.00010268832556903362, 6.821216084063053e-05, 0.00023911258904263377, 0.000410013017244637, 0.0005809134454466403, 0.0007518138736486435, 0.0009227143018506467, 0.00109361473005265, 0.0012645151000469923, 0.0014354155864566565, 0.0016063160728663206, 0.001777216442860663, 0.0019481168128550053, 0.0021190172992646694, 0.0022899177856743336, 0.0024608182720839977, 0.0026317185256630182, 0.0028026190120726824]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 7.0, 5.0, 3.0, 4.0, 10.0, 5.0, 13.0, 15.0, 14.0, 13.0, 14.0, 23.0, 29.0, 33.0, 28.0, 37.0, 34.0, 41.0, 34.0, 26.0, 40.0, 39.0, 30.0, 50.0, 48.0, 48.0, 30.0, 38.0, 39.0, 35.0, 39.0, 27.0, 29.0, 15.0, 13.0, 25.0, 14.0, 14.0, 12.0, 2.0, 7.0, 4.0, 6.0, 5.0, 4.0, 5.0, 3.0, 3.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005670785903930664, -0.0005472302436828613, -0.0005273818969726562, -0.0005075335502624512, -0.0004876852035522461, -0.000467836856842041, -0.00044798851013183594, -0.00042814016342163086, -0.0004082918167114258, -0.0003884434700012207, -0.0003685951232910156, -0.00034874677658081055, -0.00032889842987060547, -0.0003090500831604004, -0.0002892017364501953, -0.00026935338973999023, -0.00024950504302978516, -0.00022965669631958008, -0.000209808349609375, -0.00018996000289916992, -0.00017011165618896484, -0.00015026330947875977, -0.0001304149627685547, -0.00011056661605834961, -9.071826934814453e-05, -7.086992263793945e-05, -5.1021575927734375e-05, -3.11732292175293e-05, -1.1324882507324219e-05, 8.52346420288086e-06, 2.8371810913085938e-05, 4.8220157623291016e-05, 6.80685043334961e-05, 8.791685104370117e-05, 0.00010776519775390625, 0.00012761354446411133, 0.0001474618911743164, 0.00016731023788452148, 0.00018715858459472656, 0.00020700693130493164, 0.00022685527801513672, 0.0002467036247253418, 0.0002665519714355469, 0.00028640031814575195, 0.00030624866485595703, 0.0003260970115661621, 0.0003459453582763672, 0.00036579370498657227, 0.00038564205169677734, 0.0004054903984069824, 0.0004253387451171875, 0.0004451870918273926, 0.00046503543853759766, 0.00048488378524780273, 0.0005047321319580078, 0.0005245804786682129, 0.000544428825378418, 0.000564277172088623, 0.0005841255187988281, 0.0006039738655090332, 0.0006238222122192383, 0.0006436705589294434, 0.0006635189056396484, 0.0006833672523498535, 0.0007032155990600586]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 1.0, 5.0, 8.0, 14.0, 7.0, 7.0, 11.0, 30.0, 23.0, 27.0, 21.0, 45.0, 28.0, 28.0, 28.0, 43.0, 44.0, 59.0, 40.0, 39.0, 41.0, 46.0, 42.0, 38.0, 23.0, 29.0, 29.0, 31.0, 32.0, 21.0, 24.0, 18.0, 15.0, 29.0, 17.0, 8.0, 13.0, 11.0, 5.0, 6.0, 3.0, 5.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.390625, -10.9859619140625, -10.581298828125, -10.1766357421875, -9.77197265625, -9.3673095703125, -8.962646484375, -8.5579833984375, -8.1533203125, -7.7486572265625, -7.343994140625, -6.9393310546875, -6.53466796875, -6.1300048828125, -5.725341796875, -5.3206787109375, -4.916015625, -4.5113525390625, -4.106689453125, -3.7020263671875, -3.29736328125, -2.8927001953125, -2.488037109375, -2.0833740234375, -1.6787109375, -1.2740478515625, -0.869384765625, -0.4647216796875, -0.06005859375, 0.3446044921875, 0.749267578125, 1.1539306640625, 1.55859375, 1.9632568359375, 2.367919921875, 2.7725830078125, 3.17724609375, 3.5819091796875, 3.986572265625, 4.3912353515625, 4.7958984375, 5.2005615234375, 5.605224609375, 6.0098876953125, 6.41455078125, 6.8192138671875, 7.223876953125, 7.6285400390625, 8.033203125, 8.4378662109375, 8.842529296875, 9.2471923828125, 9.65185546875, 10.0565185546875, 10.461181640625, 10.8658447265625, 11.2705078125, 11.6751708984375, 12.079833984375, 12.4844970703125, 12.88916015625, 13.2938232421875, 13.698486328125, 14.1031494140625, 14.5078125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 2.0, 3.0, 3.0, 6.0, 2.0, 8.0, 8.0, 7.0, 16.0, 20.0, 20.0, 48.0, 47.0, 81.0, 103.0, 141.0, 191.0, 374.0, 513.0, 829.0, 1568.0, 2957.0, 7042.0, 20606.0, 84329.0, 596278.0, 265816.0, 44538.0, 12708.0, 4935.0, 2167.0, 1177.0, 677.0, 439.0, 262.0, 171.0, 118.0, 95.0, 70.0, 47.0, 36.0, 26.0, 21.0, 16.0, 12.0, 9.0, 8.0, 6.0, 2.0, 7.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.421875, -22.6083984375, -21.794921875, -20.9814453125, -20.16796875, -19.3544921875, -18.541015625, -17.7275390625, -16.9140625, -16.1005859375, -15.287109375, -14.4736328125, -13.66015625, -12.8466796875, -12.033203125, -11.2197265625, -10.40625, -9.5927734375, -8.779296875, -7.9658203125, -7.15234375, -6.3388671875, -5.525390625, -4.7119140625, -3.8984375, -3.0849609375, -2.271484375, -1.4580078125, -0.64453125, 0.1689453125, 0.982421875, 1.7958984375, 2.609375, 3.4228515625, 4.236328125, 5.0498046875, 5.86328125, 6.6767578125, 7.490234375, 8.3037109375, 9.1171875, 9.9306640625, 10.744140625, 11.5576171875, 12.37109375, 13.1845703125, 13.998046875, 14.8115234375, 15.625, 16.4384765625, 17.251953125, 18.0654296875, 18.87890625, 19.6923828125, 20.505859375, 21.3193359375, 22.1328125, 22.9462890625, 23.759765625, 24.5732421875, 25.38671875, 26.2001953125, 27.013671875, 27.8271484375, 28.640625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 5.0, 9.0, 2.0, 4.0, 8.0, 8.0, 18.0, 8.0, 20.0, 11.0, 31.0, 25.0, 36.0, 33.0, 37.0, 52.0, 53.0, 61.0, 120.0, 390.0, 1558.0, 118.0, 74.0, 65.0, 55.0, 47.0, 37.0, 23.0, 30.0, 27.0, 18.0, 11.0, 14.0, 5.0, 6.0, 9.0, 8.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-34.21875, -33.0419921875, -31.865234375, -30.6884765625, -29.51171875, -28.3349609375, -27.158203125, -25.9814453125, -24.8046875, -23.6279296875, -22.451171875, -21.2744140625, -20.09765625, -18.9208984375, -17.744140625, -16.5673828125, -15.390625, -14.2138671875, -13.037109375, -11.8603515625, -10.68359375, -9.5068359375, -8.330078125, -7.1533203125, -5.9765625, -4.7998046875, -3.623046875, -2.4462890625, -1.26953125, -0.0927734375, 1.083984375, 2.2607421875, 3.4375, 4.6142578125, 5.791015625, 6.9677734375, 8.14453125, 9.3212890625, 10.498046875, 11.6748046875, 12.8515625, 14.0283203125, 15.205078125, 16.3818359375, 17.55859375, 18.7353515625, 19.912109375, 21.0888671875, 22.265625, 23.4423828125, 24.619140625, 25.7958984375, 26.97265625, 28.1494140625, 29.326171875, 30.5029296875, 31.6796875, 32.8564453125, 34.033203125, 35.2099609375, 36.38671875, 37.5634765625, 38.740234375, 39.9169921875, 41.09375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 2.0, 3.0, 6.0, 3.0, 8.0, 6.0, 4.0, 7.0, 15.0, 11.0, 21.0, 29.0, 44.0, 45.0, 68.0, 105.0, 190.0, 358.0, 774.0, 2994.0, 3121328.0, 17403.0, 1087.0, 485.0, 234.0, 140.0, 81.0, 58.0, 50.0, 32.0, 24.0, 16.0, 11.0, 15.0, 10.0, 8.0, 8.0, 4.0, 7.0, 4.0, 0.0, 4.0, 4.0, 1.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-115.75, -112.208984375, -108.66796875, -105.126953125, -101.5859375, -98.044921875, -94.50390625, -90.962890625, -87.421875, -83.880859375, -80.33984375, -76.798828125, -73.2578125, -69.716796875, -66.17578125, -62.634765625, -59.09375, -55.552734375, -52.01171875, -48.470703125, -44.9296875, -41.388671875, -37.84765625, -34.306640625, -30.765625, -27.224609375, -23.68359375, -20.142578125, -16.6015625, -13.060546875, -9.51953125, -5.978515625, -2.4375, 1.103515625, 4.64453125, 8.185546875, 11.7265625, 15.267578125, 18.80859375, 22.349609375, 25.890625, 29.431640625, 32.97265625, 36.513671875, 40.0546875, 43.595703125, 47.13671875, 50.677734375, 54.21875, 57.759765625, 61.30078125, 64.841796875, 68.3828125, 71.923828125, 75.46484375, 79.005859375, 82.546875, 86.087890625, 89.62890625, 93.169921875, 96.7109375, 100.251953125, 103.79296875, 107.333984375, 110.875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 97.0, 908.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-594.84130859375, -581.424072265625, -568.0068359375, -554.589599609375, -541.17236328125, -527.755126953125, -514.337890625, -500.9206848144531, -487.50347900390625, -474.08624267578125, -460.66900634765625, -447.25177001953125, -433.8345642089844, -420.4173278808594, -407.0000915527344, -393.5828552246094, -380.1656188964844, -366.7483825683594, -353.3311462402344, -339.9139404296875, -326.4967041015625, -313.0794677734375, -299.6622314453125, -286.2449951171875, -272.8277587890625, -259.4105224609375, -245.99330139160156, -232.57606506347656, -219.15884399414062, -205.74160766601562, -192.32437133789062, -178.90713500976562, -165.48989868164062, -152.07266235351562, -138.6554412841797, -125.23820495605469, -111.82097625732422, -98.40374755859375, -84.98651123046875, -71.56928253173828, -58.15205383300781, -44.734825134277344, -31.31759262084961, -17.900360107421875, -4.483131408691406, 8.934097290039062, 22.351333618164062, 35.76856231689453, 49.185791015625, 62.60301971435547, 76.02024841308594, 89.43748474121094, 102.8547134399414, 116.27194213867188, 129.68917846679688, 143.10641479492188, 156.5236358642578, 169.9408721923828, 183.35809326171875, 196.77532958984375, 210.19256591796875, 223.6097869873047, 237.0270233154297, 250.44424438476562, 263.8614807128906]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 8.0, 14.0, 9.0, 12.0, 7.0, 16.0, 13.0, 22.0, 24.0, 30.0, 25.0, 38.0, 42.0, 36.0, 27.0, 64.0, 46.0, 39.0, 46.0, 29.0, 42.0, 35.0, 34.0, 41.0, 34.0, 33.0, 28.0, 39.0, 22.0, 17.0, 18.0, 18.0, 13.0, 15.0, 13.0, 13.0, 6.0, 4.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-86.37127685546875, -83.74574279785156, -81.12020111083984, -78.49466705322266, -75.86913299560547, -73.24359893798828, -70.61805725097656, -67.99252319335938, -65.36698913574219, -62.741451263427734, -60.11591720581055, -57.490379333496094, -54.864845275878906, -52.23930740356445, -49.61376953125, -46.98823547363281, -44.36269760131836, -41.737159729003906, -39.11162567138672, -36.486087799072266, -33.86055374145508, -31.235015869140625, -28.609479904174805, -25.983943939208984, -23.358407974243164, -20.732872009277344, -18.107336044311523, -15.481799125671387, -12.856263160705566, -10.230727195739746, -7.605190277099609, -4.979654312133789, -2.3541183471679688, 0.27141785621643066, 2.89695405960083, 5.522490501403809, 8.148026466369629, 10.77356243133545, 13.399099349975586, 16.024635314941406, 18.650171279907227, 21.275707244873047, 23.901243209838867, 26.526779174804688, 29.15231704711914, 31.777851104736328, 34.40338897705078, 37.02892303466797, 39.65446090698242, 42.279998779296875, 44.90553283691406, 47.531070709228516, 50.1566047668457, 52.782142639160156, 55.407676696777344, 58.0332145690918, 60.65875244140625, 63.2842903137207, 65.90982818603516, 68.53536224365234, 71.16089630126953, 73.78643035888672, 76.41197204589844, 79.03750610351562, 81.66304016113281]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 5.0, 3.0, 6.0, 6.0, 3.0, 11.0, 12.0, 11.0, 16.0, 21.0, 20.0, 25.0, 25.0, 40.0, 30.0, 38.0, 29.0, 41.0, 43.0, 44.0, 39.0, 51.0, 36.0, 47.0, 38.0, 39.0, 35.0, 31.0, 34.0, 34.0, 31.0, 17.0, 22.0, 18.0, 15.0, 8.0, 10.0, 14.0, 11.0, 15.0, 8.0, 7.0, 5.0, 4.0, 4.0, 3.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.2421875, -13.7657470703125, -13.289306640625, -12.8128662109375, -12.33642578125, -11.8599853515625, -11.383544921875, -10.9071044921875, -10.4306640625, -9.9542236328125, -9.477783203125, -9.0013427734375, -8.52490234375, -8.0484619140625, -7.572021484375, -7.0955810546875, -6.619140625, -6.1427001953125, -5.666259765625, -5.1898193359375, -4.71337890625, -4.2369384765625, -3.760498046875, -3.2840576171875, -2.8076171875, -2.3311767578125, -1.854736328125, -1.3782958984375, -0.90185546875, -0.4254150390625, 0.051025390625, 0.5274658203125, 1.00390625, 1.4803466796875, 1.956787109375, 2.4332275390625, 2.90966796875, 3.3861083984375, 3.862548828125, 4.3389892578125, 4.8154296875, 5.2918701171875, 5.768310546875, 6.2447509765625, 6.72119140625, 7.1976318359375, 7.674072265625, 8.1505126953125, 8.626953125, 9.1033935546875, 9.579833984375, 10.0562744140625, 10.53271484375, 11.0091552734375, 11.485595703125, 11.9620361328125, 12.4384765625, 12.9149169921875, 13.391357421875, 13.8677978515625, 14.34423828125, 14.8206787109375, 15.297119140625, 15.7735595703125, 16.25]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 6.0, 2.0, 11.0, 6.0, 17.0, 18.0, 22.0, 27.0, 40.0, 46.0, 46.0, 47.0, 62.0, 81.0, 114.0, 155.0, 235.0, 363.0, 543.0, 998.0, 2738.0, 78344.0, 4076951.0, 28385.0, 2340.0, 955.0, 487.0, 325.0, 207.0, 154.0, 113.0, 87.0, 82.0, 57.0, 37.0, 35.0, 24.0, 31.0, 26.0, 18.0, 15.0, 7.0, 9.0, 5.0, 5.0, 3.0, 4.0, 1.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-123.4375, -119.74609375, -116.0546875, -112.36328125, -108.671875, -104.98046875, -101.2890625, -97.59765625, -93.90625, -90.21484375, -86.5234375, -82.83203125, -79.140625, -75.44921875, -71.7578125, -68.06640625, -64.375, -60.68359375, -56.9921875, -53.30078125, -49.609375, -45.91796875, -42.2265625, -38.53515625, -34.84375, -31.15234375, -27.4609375, -23.76953125, -20.078125, -16.38671875, -12.6953125, -9.00390625, -5.3125, -1.62109375, 2.0703125, 5.76171875, 9.453125, 13.14453125, 16.8359375, 20.52734375, 24.21875, 27.91015625, 31.6015625, 35.29296875, 38.984375, 42.67578125, 46.3671875, 50.05859375, 53.75, 57.44140625, 61.1328125, 64.82421875, 68.515625, 72.20703125, 75.8984375, 79.58984375, 83.28125, 86.97265625, 90.6640625, 94.35546875, 98.046875, 101.73828125, 105.4296875, 109.12109375, 112.8125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 14.0, 4.0, 11.0, 15.0, 18.0, 28.0, 44.0, 93.0, 145.0, 277.0, 494.0, 791.0, 722.0, 619.0, 344.0, 188.0, 93.0, 54.0, 38.0, 28.0, 15.0, 12.0, 5.0, 8.0, 4.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-34.84375, -33.824462890625, -32.80517578125, -31.785888671875, -30.7666015625, -29.747314453125, -28.72802734375, -27.708740234375, -26.689453125, -25.670166015625, -24.65087890625, -23.631591796875, -22.6123046875, -21.593017578125, -20.57373046875, -19.554443359375, -18.53515625, -17.515869140625, -16.49658203125, -15.477294921875, -14.4580078125, -13.438720703125, -12.41943359375, -11.400146484375, -10.380859375, -9.361572265625, -8.34228515625, -7.322998046875, -6.3037109375, -5.284423828125, -4.26513671875, -3.245849609375, -2.2265625, -1.207275390625, -0.18798828125, 0.831298828125, 1.8505859375, 2.869873046875, 3.88916015625, 4.908447265625, 5.927734375, 6.947021484375, 7.96630859375, 8.985595703125, 10.0048828125, 11.024169921875, 12.04345703125, 13.062744140625, 14.08203125, 15.101318359375, 16.12060546875, 17.139892578125, 18.1591796875, 19.178466796875, 20.19775390625, 21.217041015625, 22.236328125, 23.255615234375, 24.27490234375, 25.294189453125, 26.3134765625, 27.332763671875, 28.35205078125, 29.371337890625, 30.390625]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 3.0, 7.0, 6.0, 6.0, 7.0, 23.0, 33.0, 73.0, 168.0, 416.0, 1365.0, 5998.0, 122518.0, 3970776.0, 85828.0, 5117.0, 1245.0, 373.0, 149.0, 79.0, 35.0, 23.0, 5.0, 9.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.1875, -50.287109375, -48.38671875, -46.486328125, -44.5859375, -42.685546875, -40.78515625, -38.884765625, -36.984375, -35.083984375, -33.18359375, -31.283203125, -29.3828125, -27.482421875, -25.58203125, -23.681640625, -21.78125, -19.880859375, -17.98046875, -16.080078125, -14.1796875, -12.279296875, -10.37890625, -8.478515625, -6.578125, -4.677734375, -2.77734375, -0.876953125, 1.0234375, 2.923828125, 4.82421875, 6.724609375, 8.625, 10.525390625, 12.42578125, 14.326171875, 16.2265625, 18.126953125, 20.02734375, 21.927734375, 23.828125, 25.728515625, 27.62890625, 29.529296875, 31.4296875, 33.330078125, 35.23046875, 37.130859375, 39.03125, 40.931640625, 42.83203125, 44.732421875, 46.6328125, 48.533203125, 50.43359375, 52.333984375, 54.234375, 56.134765625, 58.03515625, 59.935546875, 61.8359375, 63.736328125, 65.63671875, 67.537109375, 69.4375]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 4.0, 1.0, 2.0, 4.0, 11.0, 15.0, 12.0, 30.0, 52.0, 98.0, 140.0, 136.0, 174.0, 118.0, 90.0, 59.0, 32.0, 23.0, 8.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.14165496826172, -111.93714141845703, -105.73263549804688, -99.52812194824219, -93.32361602783203, -87.11910247802734, -80.91459655761719, -74.7100830078125, -68.50556945800781, -62.30105972290039, -56.09654998779297, -49.89203643798828, -43.687530517578125, -37.48301696777344, -31.278507232666016, -25.073997497558594, -18.869491577148438, -12.664981842041016, -6.460471153259277, -0.25596046447753906, 5.948549270629883, 12.153059005737305, 18.35757064819336, 24.56208038330078, 30.766590118408203, 36.971099853515625, 43.17560958862305, 49.38011932373047, 55.584632873535156, 61.78913879394531, 67.99365234375, 74.19816589355469, 80.40266418457031, 86.607177734375, 92.81168365478516, 99.01619720458984, 105.220703125, 111.42521667480469, 117.62973022460938, 123.83423614501953, 130.0387420654297, 136.24325561523438, 142.44776916503906, 148.6522674560547, 154.85678100585938, 161.06129455566406, 167.26580810546875, 173.47030639648438, 179.67483520507812, 185.8793487548828, 192.0838623046875, 198.28836059570312, 204.4928741455078, 210.6973876953125, 216.9019012451172, 223.10641479492188, 229.3109130859375, 235.5154266357422, 241.71994018554688, 247.9244384765625, 254.1289520263672, 260.3334655761719, 266.5379638671875, 272.74249267578125, 278.9469909667969]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 7.0, 11.0, 7.0, 7.0, 11.0, 18.0, 23.0, 20.0, 18.0, 18.0, 30.0, 29.0, 28.0, 36.0, 53.0, 35.0, 43.0, 29.0, 34.0, 54.0, 47.0, 38.0, 44.0, 42.0, 30.0, 34.0, 37.0, 29.0, 26.0, 26.0, 20.0, 16.0, 24.0, 12.0, 15.0, 11.0, 8.0, 7.0, 6.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-74.46701049804688, -72.03323364257812, -69.5994644165039, -67.16568756103516, -64.73191833496094, -62.29814147949219, -59.8643684387207, -57.43059539794922, -54.996822357177734, -52.56304931640625, -50.129276275634766, -47.69550323486328, -45.26172637939453, -42.82795715332031, -40.39418029785156, -37.96040725708008, -35.526634216308594, -33.09286117553711, -30.659088134765625, -28.225313186645508, -25.791540145874023, -23.35776710510254, -20.923992156982422, -18.490219116210938, -16.056446075439453, -13.622673034667969, -11.188899040222168, -8.755125045776367, -6.321352005004883, -3.8875789642333984, -1.4538049697875977, 0.9799690246582031, 3.4137420654296875, 5.84751558303833, 8.281289100646973, 10.715063095092773, 13.148836135864258, 15.582609176635742, 18.01638412475586, 20.450157165527344, 22.883930206298828, 25.317703247070312, 27.751476287841797, 30.185251235961914, 32.61902618408203, 35.05279541015625, 37.486572265625, 39.920345306396484, 42.35411834716797, 44.78789138793945, 47.22166442871094, 49.65543746948242, 52.089210510253906, 54.522987365722656, 56.95676040649414, 59.390533447265625, 61.82430648803711, 64.2580795288086, 66.69185638427734, 69.12562561035156, 71.55940246582031, 73.99317169189453, 76.42694854736328, 78.8607177734375, 81.29449462890625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 5.0, 7.0, 6.0, 7.0, 13.0, 21.0, 10.0, 21.0, 22.0, 27.0, 37.0, 27.0, 26.0, 27.0, 43.0, 40.0, 51.0, 45.0, 40.0, 40.0, 44.0, 47.0, 44.0, 45.0, 41.0, 31.0, 31.0, 31.0, 24.0, 31.0, 22.0, 19.0, 11.0, 14.0, 8.0, 9.0, 6.0, 6.0, 7.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.75, -105.884765625, -102.01953125, -98.154296875, -94.2890625, -90.423828125, -86.55859375, -82.693359375, -78.828125, -74.962890625, -71.09765625, -67.232421875, -63.3671875, -59.501953125, -55.63671875, -51.771484375, -47.90625, -44.041015625, -40.17578125, -36.310546875, -32.4453125, -28.580078125, -24.71484375, -20.849609375, -16.984375, -13.119140625, -9.25390625, -5.388671875, -1.5234375, 2.341796875, 6.20703125, 10.072265625, 13.9375, 17.802734375, 21.66796875, 25.533203125, 29.3984375, 33.263671875, 37.12890625, 40.994140625, 44.859375, 48.724609375, 52.58984375, 56.455078125, 60.3203125, 64.185546875, 68.05078125, 71.916015625, 75.78125, 79.646484375, 83.51171875, 87.376953125, 91.2421875, 95.107421875, 98.97265625, 102.837890625, 106.703125, 110.568359375, 114.43359375, 118.298828125, 122.1640625, 126.029296875, 129.89453125, 133.759765625, 137.625]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 4.0, 2.0, 6.0, 3.0, 15.0, 17.0, 35.0, 32.0, 66.0, 92.0, 127.0, 203.0, 294.0, 466.0, 671.0, 980.0, 1550.0, 2391.0, 3659.0, 5815.0, 9282.0, 14637.0, 23675.0, 39263.0, 67856.0, 131128.0, 335987.0, 193083.0, 88745.0, 49338.0, 29691.0, 18183.0, 11234.0, 7176.0, 4450.0, 2925.0, 1837.0, 1239.0, 788.0, 513.0, 393.0, 222.0, 159.0, 108.0, 72.0, 53.0, 35.0, 19.0, 17.0, 14.0, 6.0, 3.0, 4.0, 1.0, 4.0], "bins": [-29.625, -28.795654296875, -27.96630859375, -27.136962890625, -26.3076171875, -25.478271484375, -24.64892578125, -23.819580078125, -22.990234375, -22.160888671875, -21.33154296875, -20.502197265625, -19.6728515625, -18.843505859375, -18.01416015625, -17.184814453125, -16.35546875, -15.526123046875, -14.69677734375, -13.867431640625, -13.0380859375, -12.208740234375, -11.37939453125, -10.550048828125, -9.720703125, -8.891357421875, -8.06201171875, -7.232666015625, -6.4033203125, -5.573974609375, -4.74462890625, -3.915283203125, -3.0859375, -2.256591796875, -1.42724609375, -0.597900390625, 0.2314453125, 1.060791015625, 1.89013671875, 2.719482421875, 3.548828125, 4.378173828125, 5.20751953125, 6.036865234375, 6.8662109375, 7.695556640625, 8.52490234375, 9.354248046875, 10.18359375, 11.012939453125, 11.84228515625, 12.671630859375, 13.5009765625, 14.330322265625, 15.15966796875, 15.989013671875, 16.818359375, 17.647705078125, 18.47705078125, 19.306396484375, 20.1357421875, 20.965087890625, 21.79443359375, 22.623779296875, 23.453125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [6.0, 1.0, 0.0, 2.0, 3.0, 6.0, 4.0, 5.0, 9.0, 5.0, 6.0, 10.0, 15.0, 8.0, 19.0, 30.0, 20.0, 19.0, 26.0, 31.0, 23.0, 30.0, 46.0, 28.0, 35.0, 30.0, 44.0, 37.0, 1062.0, 46.0, 34.0, 34.0, 36.0, 47.0, 20.0, 31.0, 25.0, 36.0, 19.0, 18.0, 21.0, 14.0, 10.0, 22.0, 15.0, 10.0, 6.0, 6.0, 9.0, 4.0, 9.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-59.84375, -57.76123046875, -55.6787109375, -53.59619140625, -51.513671875, -49.43115234375, -47.3486328125, -45.26611328125, -43.18359375, -41.10107421875, -39.0185546875, -36.93603515625, -34.853515625, -32.77099609375, -30.6884765625, -28.60595703125, -26.5234375, -24.44091796875, -22.3583984375, -20.27587890625, -18.193359375, -16.11083984375, -14.0283203125, -11.94580078125, -9.86328125, -7.78076171875, -5.6982421875, -3.61572265625, -1.533203125, 0.54931640625, 2.6318359375, 4.71435546875, 6.796875, 8.87939453125, 10.9619140625, 13.04443359375, 15.126953125, 17.20947265625, 19.2919921875, 21.37451171875, 23.45703125, 25.53955078125, 27.6220703125, 29.70458984375, 31.787109375, 33.86962890625, 35.9521484375, 38.03466796875, 40.1171875, 42.19970703125, 44.2822265625, 46.36474609375, 48.447265625, 50.52978515625, 52.6123046875, 54.69482421875, 56.77734375, 58.85986328125, 60.9423828125, 63.02490234375, 65.107421875, 67.18994140625, 69.2724609375, 71.35498046875, 73.4375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 10.0, 7.0, 6.0, 16.0, 21.0, 37.0, 43.0, 67.0, 118.0, 118.0, 216.0, 324.0, 431.0, 618.0, 828.0, 1266.0, 1682.0, 2478.0, 3545.0, 5064.0, 7246.0, 10395.0, 15251.0, 22262.0, 34136.0, 52261.0, 85464.0, 156801.0, 1338605.0, 135629.0, 76824.0, 47779.0, 30791.0, 20627.0, 14008.0, 9681.0, 6656.0, 4776.0, 3262.0, 2326.0, 1686.0, 1097.0, 800.0, 591.0, 388.0, 246.0, 218.0, 146.0, 94.0, 56.0, 57.0, 40.0, 18.0, 17.0, 2.0, 7.0, 6.0, 1.0], "bins": [-22.296875, -21.648681640625, -21.00048828125, -20.352294921875, -19.7041015625, -19.055908203125, -18.40771484375, -17.759521484375, -17.111328125, -16.463134765625, -15.81494140625, -15.166748046875, -14.5185546875, -13.870361328125, -13.22216796875, -12.573974609375, -11.92578125, -11.277587890625, -10.62939453125, -9.981201171875, -9.3330078125, -8.684814453125, -8.03662109375, -7.388427734375, -6.740234375, -6.092041015625, -5.44384765625, -4.795654296875, -4.1474609375, -3.499267578125, -2.85107421875, -2.202880859375, -1.5546875, -0.906494140625, -0.25830078125, 0.389892578125, 1.0380859375, 1.686279296875, 2.33447265625, 2.982666015625, 3.630859375, 4.279052734375, 4.92724609375, 5.575439453125, 6.2236328125, 6.871826171875, 7.52001953125, 8.168212890625, 8.81640625, 9.464599609375, 10.11279296875, 10.760986328125, 11.4091796875, 12.057373046875, 12.70556640625, 13.353759765625, 14.001953125, 14.650146484375, 15.29833984375, 15.946533203125, 16.5947265625, 17.242919921875, 17.89111328125, 18.539306640625, 19.1875]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 6.0, 6.0, 8.0, 5.0, 8.0, 7.0, 7.0, 11.0, 21.0, 22.0, 28.0, 36.0, 53.0, 35.0, 64.0, 63.0, 72.0, 80.0, 94.0, 70.0, 59.0, 45.0, 34.0, 24.0, 27.0, 25.0, 10.0, 15.0, 9.0, 12.0, 4.0, 9.0, 9.0, 3.0, 6.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.015777587890625, -0.015307784080505371, -0.014837980270385742, -0.014368176460266113, -0.013898372650146484, -0.013428568840026855, -0.012958765029907227, -0.012488961219787598, -0.012019157409667969, -0.01154935359954834, -0.011079549789428711, -0.010609745979309082, -0.010139942169189453, -0.009670138359069824, -0.009200334548950195, -0.008730530738830566, -0.008260726928710938, -0.007790923118591309, -0.00732111930847168, -0.006851315498352051, -0.006381511688232422, -0.005911707878112793, -0.005441904067993164, -0.004972100257873535, -0.004502296447753906, -0.004032492637634277, -0.0035626888275146484, -0.0030928850173950195, -0.0026230812072753906, -0.0021532773971557617, -0.0016834735870361328, -0.001213669776916504, -0.000743865966796875, -0.0002740621566772461, 0.0001957416534423828, 0.0006655454635620117, 0.0011353492736816406, 0.0016051530838012695, 0.0020749568939208984, 0.0025447607040405273, 0.0030145645141601562, 0.003484368324279785, 0.003954172134399414, 0.004423975944519043, 0.004893779754638672, 0.005363583564758301, 0.00583338737487793, 0.006303191184997559, 0.0067729949951171875, 0.007242798805236816, 0.007712602615356445, 0.008182406425476074, 0.008652210235595703, 0.009122014045715332, 0.009591817855834961, 0.01006162166595459, 0.010531425476074219, 0.011001229286193848, 0.011471033096313477, 0.011940836906433105, 0.012410640716552734, 0.012880444526672363, 0.013350248336791992, 0.013820052146911621, 0.01428985595703125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 4.0, 8.0, 13.0, 10.0, 18.0, 21.0, 25.0, 33.0, 42.0, 66.0, 78.0, 102.0, 163.0, 251.0, 453.0, 984.0, 3486.0, 20073.0, 214883.0, 726643.0, 68885.0, 8641.0, 1965.0, 636.0, 337.0, 204.0, 127.0, 90.0, 67.0, 67.0, 46.0, 35.0, 27.0, 18.0, 14.0, 10.0, 8.0, 8.0, 8.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.1826171875, -0.1772899627685547, -0.17196273803710938, -0.16663551330566406, -0.16130828857421875, -0.15598106384277344, -0.15065383911132812, -0.1453266143798828, -0.1399993896484375, -0.1346721649169922, -0.12934494018554688, -0.12401771545410156, -0.11869049072265625, -0.11336326599121094, -0.10803604125976562, -0.10270881652832031, -0.097381591796875, -0.09205436706542969, -0.08672714233398438, -0.08139991760253906, -0.07607269287109375, -0.07074546813964844, -0.06541824340820312, -0.06009101867675781, -0.0547637939453125, -0.04943656921386719, -0.044109344482421875, -0.03878211975097656, -0.03345489501953125, -0.028127670288085938, -0.022800445556640625, -0.017473220825195312, -0.01214599609375, -0.0068187713623046875, -0.001491546630859375, 0.0038356781005859375, 0.00916290283203125, 0.014490127563476562, 0.019817352294921875, 0.025144577026367188, 0.0304718017578125, 0.03579902648925781, 0.041126251220703125, 0.04645347595214844, 0.05178070068359375, 0.05710792541503906, 0.062435150146484375, 0.06776237487792969, 0.073089599609375, 0.07841682434082031, 0.08374404907226562, 0.08907127380371094, 0.09439849853515625, 0.09972572326660156, 0.10505294799804688, 0.11038017272949219, 0.1157073974609375, 0.12103462219238281, 0.12636184692382812, 0.13168907165527344, 0.13701629638671875, 0.14234352111816406, 0.14767074584960938, 0.1529979705810547, 0.1583251953125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 7.0, 25.0, 55.0, 107.0, 186.0, 238.0, 170.0, 126.0, 49.0, 24.0, 9.0, 2.0, 9.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.04745020344853401, -0.046473149210214615, -0.04549609497189522, -0.04451904445886612, -0.04354199022054672, -0.042564935982227325, -0.04158788174390793, -0.04061082750558853, -0.03963377699255943, -0.038656722754240036, -0.03767966851592064, -0.03670261800289154, -0.035725563764572144, -0.03474850952625275, -0.03377145528793335, -0.03279440104961395, -0.031817346811294556, -0.03084029257297516, -0.02986324019730091, -0.028886185958981514, -0.027909133583307266, -0.02693207934498787, -0.025955025106668472, -0.024977972730994225, -0.024000920355319977, -0.02302386611700058, -0.022046813741326332, -0.021069759503006935, -0.020092707127332687, -0.01911565288901329, -0.018138598650693893, -0.017161546275019646, -0.016184493899345398, -0.015207440592348576, -0.014230387285351753, -0.013253333047032356, -0.012276280671358109, -0.011299226433038712, -0.01032217312604189, -0.009345119819045067, -0.008368067443370819, -0.007391014136373997, -0.006413960829377174, -0.005436907056719065, -0.004459853749722242, -0.00348280044272542, -0.0025057466700673103, -0.001528693363070488, -0.0005516400560736656, 0.00042541336733847857, 0.0014024667907506227, 0.0023795203305780888, 0.003356573637574911, 0.0043336269445717335, 0.005310680717229843, 0.0062877340242266655, 0.007264787331223488, 0.00824184063822031, 0.009218893945217133, 0.01019594818353653, 0.011173000559210777, 0.012150054797530174, 0.013127108104526997, 0.014104161411523819, 0.015081214718520641]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 0.0, 5.0, 4.0, 10.0, 4.0, 9.0, 10.0, 17.0, 10.0, 20.0, 19.0, 25.0, 19.0, 26.0, 33.0, 30.0, 32.0, 32.0, 41.0, 43.0, 37.0, 29.0, 44.0, 39.0, 44.0, 49.0, 32.0, 39.0, 37.0, 39.0, 36.0, 24.0, 28.0, 29.0, 16.0, 15.0, 15.0, 15.0, 11.0, 7.0, 5.0, 9.0, 0.0, 7.0, 4.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.007133781909942627, -0.0069072311744093895, -0.006680680438876152, -0.006454129703342915, -0.006227578967809677, -0.00600102823227644, -0.005774477496743202, -0.005547926761209965, -0.005321376025676727, -0.00509482529014349, -0.004868274554610252, -0.004641723819077015, -0.0044151730835437775, -0.00418862234801054, -0.0039620716124773026, -0.003735520876944065, -0.0035089701414108276, -0.00328241940587759, -0.0030558686703443527, -0.0028293179348111153, -0.002602767199277878, -0.0023762164637446404, -0.002149665728211403, -0.0019231149926781654, -0.001696564257144928, -0.0014700135216116905, -0.001243462786078453, -0.0010169120505452156, -0.0007903613150119781, -0.0005638105794787407, -0.00033725984394550323, -0.00011070910841226578, 0.00011584162712097168, 0.00034239236265420914, 0.0005689430981874466, 0.000795493833720684, 0.0010220445692539215, 0.001248595304787159, 0.0014751460403203964, 0.0017016967758536339, 0.0019282475113868713, 0.002154798246920109, 0.0023813489824533463, 0.0026078997179865837, 0.002834450453519821, 0.0030610011890530586, 0.003287551924586296, 0.0035141026601195335, 0.003740653395652771, 0.0039672041311860085, 0.004193754866719246, 0.004420305602252483, 0.004646856337785721, 0.004873407073318958, 0.005099957808852196, 0.005326508544385433, 0.005553059279918671, 0.005779610015451908, 0.006006160750985146, 0.006232711486518383, 0.0064592622220516205, 0.006685812957584858, 0.006912363693118095, 0.007138914428651333, 0.00736546516418457]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 3.0, 5.0, 4.0, 7.0, 6.0, 7.0, 13.0, 20.0, 11.0, 21.0, 22.0, 27.0, 37.0, 27.0, 26.0, 27.0, 45.0, 39.0, 50.0, 45.0, 40.0, 40.0, 44.0, 46.0, 46.0, 44.0, 41.0, 31.0, 31.0, 31.0, 24.0, 30.0, 23.0, 19.0, 11.0, 14.0, 8.0, 9.0, 6.0, 6.0, 8.0, 3.0, 4.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.75, -105.884765625, -102.01953125, -98.154296875, -94.2890625, -90.423828125, -86.55859375, -82.693359375, -78.828125, -74.962890625, -71.09765625, -67.232421875, -63.3671875, -59.501953125, -55.63671875, -51.771484375, -47.90625, -44.041015625, -40.17578125, -36.310546875, -32.4453125, -28.580078125, -24.71484375, -20.849609375, -16.984375, -13.119140625, -9.25390625, -5.388671875, -1.5234375, 2.341796875, 6.20703125, 10.072265625, 13.9375, 17.802734375, 21.66796875, 25.533203125, 29.3984375, 33.263671875, 37.12890625, 40.994140625, 44.859375, 48.724609375, 52.58984375, 56.455078125, 60.3203125, 64.185546875, 68.05078125, 71.916015625, 75.78125, 79.646484375, 83.51171875, 87.376953125, 91.2421875, 95.107421875, 98.97265625, 102.837890625, 106.703125, 110.568359375, 114.43359375, 118.298828125, 122.1640625, 126.029296875, 129.89453125, 133.759765625, 137.625]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 0.0, 4.0, 3.0, 6.0, 9.0, 12.0, 7.0, 12.0, 22.0, 32.0, 35.0, 60.0, 79.0, 121.0, 172.0, 232.0, 413.0, 675.0, 1125.0, 2183.0, 4241.0, 9612.0, 29252.0, 137225.0, 604133.0, 198386.0, 38332.0, 11515.0, 4876.0, 2388.0, 1342.0, 768.0, 420.0, 268.0, 173.0, 131.0, 82.0, 60.0, 47.0, 23.0, 22.0, 20.0, 11.0, 8.0, 6.0, 4.0, 7.0, 4.0, 2.0, 1.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-30.21875, -29.162109375, -28.10546875, -27.048828125, -25.9921875, -24.935546875, -23.87890625, -22.822265625, -21.765625, -20.708984375, -19.65234375, -18.595703125, -17.5390625, -16.482421875, -15.42578125, -14.369140625, -13.3125, -12.255859375, -11.19921875, -10.142578125, -9.0859375, -8.029296875, -6.97265625, -5.916015625, -4.859375, -3.802734375, -2.74609375, -1.689453125, -0.6328125, 0.423828125, 1.48046875, 2.537109375, 3.59375, 4.650390625, 5.70703125, 6.763671875, 7.8203125, 8.876953125, 9.93359375, 10.990234375, 12.046875, 13.103515625, 14.16015625, 15.216796875, 16.2734375, 17.330078125, 18.38671875, 19.443359375, 20.5, 21.556640625, 22.61328125, 23.669921875, 24.7265625, 25.783203125, 26.83984375, 27.896484375, 28.953125, 30.009765625, 31.06640625, 32.123046875, 33.1796875, 34.236328125, 35.29296875, 36.349609375, 37.40625]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 5.0, 6.0, 7.0, 15.0, 12.0, 17.0, 31.0, 48.0, 74.0, 72.0, 80.0, 82.0, 2144.0, 94.0, 77.0, 88.0, 61.0, 44.0, 28.0, 25.0, 20.0, 8.0, 7.0, 3.0, 4.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-402.25, -391.82421875, -381.3984375, -370.97265625, -360.546875, -350.12109375, -339.6953125, -329.26953125, -318.84375, -308.41796875, -297.9921875, -287.56640625, -277.140625, -266.71484375, -256.2890625, -245.86328125, -235.4375, -225.01171875, -214.5859375, -204.16015625, -193.734375, -183.30859375, -172.8828125, -162.45703125, -152.03125, -141.60546875, -131.1796875, -120.75390625, -110.328125, -99.90234375, -89.4765625, -79.05078125, -68.625, -58.19921875, -47.7734375, -37.34765625, -26.921875, -16.49609375, -6.0703125, 4.35546875, 14.78125, 25.20703125, 35.6328125, 46.05859375, 56.484375, 66.91015625, 77.3359375, 87.76171875, 98.1875, 108.61328125, 119.0390625, 129.46484375, 139.890625, 150.31640625, 160.7421875, 171.16796875, 181.59375, 192.01953125, 202.4453125, 212.87109375, 223.296875, 233.72265625, 244.1484375, 254.57421875, 265.0]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 3.0, 2.0, 10.0, 8.0, 19.0, 43.0, 71.0, 189.0, 358.0, 981.0, 3507.0, 210121.0, 2921668.0, 6584.0, 1261.0, 463.0, 217.0, 103.0, 46.0, 19.0, 8.0, 6.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-124.9375, -121.1669921875, -117.396484375, -113.6259765625, -109.85546875, -106.0849609375, -102.314453125, -98.5439453125, -94.7734375, -91.0029296875, -87.232421875, -83.4619140625, -79.69140625, -75.9208984375, -72.150390625, -68.3798828125, -64.609375, -60.8388671875, -57.068359375, -53.2978515625, -49.52734375, -45.7568359375, -41.986328125, -38.2158203125, -34.4453125, -30.6748046875, -26.904296875, -23.1337890625, -19.36328125, -15.5927734375, -11.822265625, -8.0517578125, -4.28125, -0.5107421875, 3.259765625, 7.0302734375, 10.80078125, 14.5712890625, 18.341796875, 22.1123046875, 25.8828125, 29.6533203125, 33.423828125, 37.1943359375, 40.96484375, 44.7353515625, 48.505859375, 52.2763671875, 56.046875, 59.8173828125, 63.587890625, 67.3583984375, 71.12890625, 74.8994140625, 78.669921875, 82.4404296875, 86.2109375, 89.9814453125, 93.751953125, 97.5224609375, 101.29296875, 105.0634765625, 108.833984375, 112.6044921875, 116.375]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 6.0, 1.0, 3.0, 3.0, 5.0, 9.0, 16.0, 17.0, 28.0, 61.0, 97.0, 150.0, 164.0, 150.0, 118.0, 70.0, 36.0, 33.0, 14.0, 7.0, 2.0, 5.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-292.106201171875, -282.26287841796875, -272.4195251464844, -262.5762023925781, -252.7328643798828, -242.8895263671875, -233.04620361328125, -223.20286560058594, -213.35952758789062, -203.5161895751953, -193.6728515625, -183.82952880859375, -173.98619079589844, -164.14285278320312, -154.29953002929688, -144.45619201660156, -134.61285400390625, -124.76951599121094, -114.92618560791016, -105.08285522460938, -95.23951721191406, -85.39617919921875, -75.55284881591797, -65.70951843261719, -55.866180419921875, -46.02284622192383, -36.17951202392578, -26.336177825927734, -16.492843627929688, -6.649509429931641, 3.1938247680664062, 13.037155151367188, 22.880523681640625, 32.72385787963867, 42.56719207763672, 52.410526275634766, 62.25386047363281, 72.09719848632812, 81.9405288696289, 91.78385925292969, 101.627197265625, 111.47053527832031, 121.3138656616211, 131.15719604492188, 141.0005340576172, 150.8438720703125, 160.68719482421875, 170.53053283691406, 180.37387084960938, 190.2172088623047, 200.060546875, 209.90386962890625, 219.74720764160156, 229.59054565429688, 239.43386840820312, 249.27720642089844, 259.12054443359375, 268.9638671875, 278.8072204589844, 288.6505432128906, 298.493896484375, 308.33721923828125, 318.1805419921875, 328.02386474609375, 337.8672180175781]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 4.0, 3.0, 10.0, 2.0, 6.0, 8.0, 10.0, 14.0, 12.0, 18.0, 18.0, 24.0, 23.0, 27.0, 35.0, 29.0, 31.0, 36.0, 43.0, 43.0, 52.0, 48.0, 59.0, 42.0, 34.0, 34.0, 35.0, 44.0, 34.0, 46.0, 29.0, 16.0, 25.0, 18.0, 18.0, 13.0, 14.0, 9.0, 10.0, 8.0, 3.0, 6.0, 1.0, 5.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-249.61895751953125, -241.98770141601562, -234.3564453125, -226.72518920898438, -219.09393310546875, -211.46267700195312, -203.8314208984375, -196.20016479492188, -188.56890869140625, -180.93765258789062, -173.306396484375, -165.67514038085938, -158.04388427734375, -150.41262817382812, -142.7813720703125, -135.15011596679688, -127.51886749267578, -119.88761138916016, -112.25635528564453, -104.6250991821289, -96.99384307861328, -89.36259460449219, -81.73133850097656, -74.10008239746094, -66.46882629394531, -58.83757019042969, -51.20631408691406, -43.57505798339844, -35.94380187988281, -28.312549591064453, -20.681293487548828, -13.050037384033203, -5.4187774658203125, 2.2124781608581543, 9.843733787536621, 17.47498893737793, 25.106245040893555, 32.73749923706055, 40.36875534057617, 48.0000114440918, 55.63126754760742, 63.26252365112305, 70.8937759399414, 78.52503204345703, 86.15628814697266, 93.78754425048828, 101.4188003540039, 109.05005645751953, 116.68131256103516, 124.31256866455078, 131.94381713867188, 139.5750732421875, 147.20632934570312, 154.83758544921875, 162.46884155273438, 170.10009765625, 177.73135375976562, 185.36260986328125, 192.99386596679688, 200.6251220703125, 208.25637817382812, 215.88763427734375, 223.51889038085938, 231.150146484375, 238.78140258789062]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 4.0, 7.0, 15.0, 17.0, 26.0, 30.0, 43.0, 59.0, 67.0, 80.0, 115.0, 151.0, 218.0, 264.0, 376.0, 463.0, 628.0, 844.0, 1040953.0, 1179.0, 731.0, 552.0, 431.0, 318.0, 225.0, 177.0, 136.0, 107.0, 68.0, 69.0, 50.0, 46.0, 22.0, 15.0, 19.0, 10.0, 9.0, 6.0, 5.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0], "bins": [-93.15234375, -90.47386932373047, -87.79540252685547, -85.11692810058594, -82.4384536743164, -79.7599868774414, -77.08151245117188, -74.40304565429688, -71.72457122802734, -69.04609680175781, -66.36763000488281, -63.68915557861328, -61.010684967041016, -58.33221435546875, -55.65373992919922, -52.97526931762695, -50.29679489135742, -47.618324279785156, -44.939849853515625, -42.26137924194336, -39.582908630371094, -36.90443420410156, -34.2259635925293, -31.54749298095703, -28.869020462036133, -26.190547943115234, -23.51207733154297, -20.83360481262207, -18.155132293701172, -15.476661682128906, -12.798189163208008, -10.119718551635742, -7.441246032714844, -4.762774467468262, -2.0843024253845215, 0.5941696166992188, 3.272641181945801, 5.951112747192383, 8.629585266113281, 11.308055877685547, 13.986528396606445, 16.665000915527344, 19.34347152709961, 22.021944046020508, 24.700416564941406, 27.378887176513672, 30.05735969543457, 32.73583221435547, 35.414302825927734, 38.0927734375, 40.77124786376953, 43.4497184753418, 46.12818908691406, 48.806663513183594, 51.48513412475586, 54.163604736328125, 56.842079162597656, 59.52054977416992, 62.19902420043945, 64.87749481201172, 67.55596923828125, 70.23443603515625, 72.91291046142578, 75.59138488769531, 78.26985168457031]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 8.0, 9.0, 5.0, 8.0, 5.0, 6.0, 8.0, 13.0, 16.0, 29.0, 50.0, 217.0, 51462004.0, 565.0, 69.0, 33.0, 14.0, 15.0, 15.0, 4.0, 6.0, 2.0, 3.0, 3.0, 3.0, 2.0, 1.0, 4.0, 7.0, 6.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-13196.8876953125, -12642.009765625, -12087.1318359375, -11532.25390625, -10977.3759765625, -10422.498046875, -9867.619140625, -9312.7421875, -8757.86328125, -8202.9853515625, -7648.107421875, -7093.2294921875, -6538.3515625, -5983.4736328125, -5428.59521484375, -4873.71728515625, -4318.83984375, -3763.9619140625, -3209.083984375, -2654.205810546875, -2099.327880859375, -1544.449951171875, -989.57177734375, -434.69384765625, 120.18408203125, 675.0620727539062, 1229.9400634765625, 1784.818115234375, 2339.696044921875, 2894.573974609375, 3449.4521484375, 4004.330078125, 4559.20703125, 5114.0849609375, 5668.962890625, 6223.8408203125, 6778.71875, 7333.5966796875, 7888.47509765625, 8443.353515625, 8998.23046875, 9553.1083984375, 10107.986328125, 10662.8642578125, 11217.7421875, 11772.6201171875, 12327.498046875, 12882.376953125, 13437.2548828125, 13992.1328125, 14547.0107421875, 15101.888671875, 15656.7666015625, 16211.64453125, 16766.5234375, 17321.400390625, 17876.279296875, 18431.158203125, 18986.03515625, 19540.9140625, 20095.791015625, 20650.669921875, 21205.546875, 21760.42578125, 22315.302734375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [6.0, 3.0, 8.0, 8.0, 13.0, 30.0, 29.0, 59.0, 58.0, 88.0, 127.0, 205.0, 342.0, 424.0, 682.0, 857.0, 1289.0, 1831.0, 2462.0, 3555.0, 5149.0, 7138.0, 10285.0, 14801.0, 21743.0, 32214.0, 47944.0, 73816.0, 116028.0, 189196.0, 351694.0, 2882895.0, 1677038.0, 334749.0, 182824.0, 112954.0, 71309.0, 46946.0, 31206.0, 20926.0, 14769.0, 10045.0, 6961.0, 4861.0, 3530.0, 2541.0, 1711.0, 1218.0, 898.0, 609.0, 405.0, 299.0, 227.0, 140.0, 105.0, 63.0, 63.0, 24.0, 23.0, 12.0, 6.0, 4.0, 6.0, 5.0], "bins": [-11.2890625, -10.9359130859375, -10.582763671875, -10.2296142578125, -9.87646484375, -9.5233154296875, -9.170166015625, -8.8170166015625, -8.4638671875, -8.1107177734375, -7.757568359375, -7.4044189453125, -7.05126953125, -6.6981201171875, -6.344970703125, -5.9918212890625, -5.638671875, -5.2855224609375, -4.932373046875, -4.5792236328125, -4.22607421875, -3.8729248046875, -3.519775390625, -3.1666259765625, -2.8134765625, -2.4603271484375, -2.107177734375, -1.7540283203125, -1.40087890625, -1.0477294921875, -0.694580078125, -0.3414306640625, 0.01171875, 0.3648681640625, 0.718017578125, 1.0711669921875, 1.42431640625, 1.7774658203125, 2.130615234375, 2.4837646484375, 2.8369140625, 3.1900634765625, 3.543212890625, 3.8963623046875, 4.24951171875, 4.6026611328125, 4.955810546875, 5.3089599609375, 5.662109375, 6.0152587890625, 6.368408203125, 6.7215576171875, 7.07470703125, 7.4278564453125, 7.781005859375, 8.1341552734375, 8.4873046875, 8.8404541015625, 9.193603515625, 9.5467529296875, 9.89990234375, 10.2530517578125, 10.606201171875, 10.9593505859375, 11.3125]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 3.0, 2.0, 2.0, 3.0, 6.0, 5.0, 8.0, 10.0, 14.0, 11.0, 8.0, 17.0, 19.0, 23.0, 21.0, 23.0, 29.0, 30.0, 33.0, 31.0, 37.0, 32.0, 44.0, 79.0, 179.0, 620.0, 209.0, 96.0, 58.0, 34.0, 26.0, 29.0, 35.0, 22.0, 35.0, 31.0, 20.0, 24.0, 18.0, 14.0, 15.0, 20.0, 6.0, 7.0, 7.0, 7.0, 4.0, 3.0, 3.0, 7.0, 6.0, 4.0, 1.0, 4.0, 0.0, 1.0, 1.0], "bins": [-25.453125, -24.671875, -23.890625, -23.109375, -22.328125, -21.546875, -20.765625, -19.984375, -19.203125, -18.421875, -17.640625, -16.859375, -16.078125, -15.296875, -14.515625, -13.734375, -12.953125, -12.171875, -11.390625, -10.609375, -9.828125, -9.046875, -8.265625, -7.484375, -6.703125, -5.921875, -5.140625, -4.359375, -3.578125, -2.796875, -2.015625, -1.234375, -0.453125, 0.328125, 1.109375, 1.890625, 2.671875, 3.453125, 4.234375, 5.015625, 5.796875, 6.578125, 7.359375, 8.140625, 8.921875, 9.703125, 10.484375, 11.265625, 12.046875, 12.828125, 13.609375, 14.390625, 15.171875, 15.953125, 16.734375, 17.515625, 18.296875, 19.078125, 19.859375, 20.640625, 21.421875, 22.203125, 22.984375, 23.765625, 24.546875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 4.0, 4.0, 7.0, 19.0, 22.0, 43.0, 49.0, 83.0, 95.0, 179.0, 212.0, 284.0, 416.0, 734.0, 1070.0, 1451.0, 2121.0, 3115.0, 4568.0, 6866.0, 10240.0, 15757.0, 24900.0, 39688.0, 64843.0, 109542.0, 193243.0, 392753.0, 3352404.0, 1319182.0, 325692.0, 167629.0, 96294.0, 57675.0, 35590.0, 21706.0, 14380.0, 9278.0, 6100.0, 4262.0, 2867.0, 1919.0, 1268.0, 852.0, 632.0, 474.0, 330.0, 181.0, 137.0, 99.0, 63.0, 44.0, 27.0, 13.0, 17.0, 8.0, 13.0, 2.0, 4.0], "bins": [-13.4921875, -13.0941162109375, -12.696044921875, -12.2979736328125, -11.89990234375, -11.5018310546875, -11.103759765625, -10.7056884765625, -10.3076171875, -9.9095458984375, -9.511474609375, -9.1134033203125, -8.71533203125, -8.3172607421875, -7.919189453125, -7.5211181640625, -7.123046875, -6.7249755859375, -6.326904296875, -5.9288330078125, -5.53076171875, -5.1326904296875, -4.734619140625, -4.3365478515625, -3.9384765625, -3.5404052734375, -3.142333984375, -2.7442626953125, -2.34619140625, -1.9481201171875, -1.550048828125, -1.1519775390625, -0.75390625, -0.3558349609375, 0.042236328125, 0.4403076171875, 0.83837890625, 1.2364501953125, 1.634521484375, 2.0325927734375, 2.4306640625, 2.8287353515625, 3.226806640625, 3.6248779296875, 4.02294921875, 4.4210205078125, 4.819091796875, 5.2171630859375, 5.615234375, 6.0133056640625, 6.411376953125, 6.8094482421875, 7.20751953125, 7.6055908203125, 8.003662109375, 8.4017333984375, 8.7998046875, 9.1978759765625, 9.595947265625, 9.9940185546875, 10.39208984375, 10.7901611328125, 11.188232421875, 11.5863037109375, 11.984375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 5.0, 11.0, 9.0, 9.0, 4.0, 7.0, 15.0, 17.0, 22.0, 18.0, 22.0, 19.0, 40.0, 29.0, 33.0, 42.0, 36.0, 44.0, 56.0, 77.0, 147.0, 425.0, 377.0, 144.0, 62.0, 39.0, 38.0, 34.0, 34.0, 33.0, 22.0, 25.0, 20.0, 15.0, 15.0, 12.0, 14.0, 13.0, 10.0, 9.0, 14.0, 3.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0], "bins": [-19.953125, -19.365234375, -18.77734375, -18.189453125, -17.6015625, -17.013671875, -16.42578125, -15.837890625, -15.25, -14.662109375, -14.07421875, -13.486328125, -12.8984375, -12.310546875, -11.72265625, -11.134765625, -10.546875, -9.958984375, -9.37109375, -8.783203125, -8.1953125, -7.607421875, -7.01953125, -6.431640625, -5.84375, -5.255859375, -4.66796875, -4.080078125, -3.4921875, -2.904296875, -2.31640625, -1.728515625, -1.140625, -0.552734375, 0.03515625, 0.623046875, 1.2109375, 1.798828125, 2.38671875, 2.974609375, 3.5625, 4.150390625, 4.73828125, 5.326171875, 5.9140625, 6.501953125, 7.08984375, 7.677734375, 8.265625, 8.853515625, 9.44140625, 10.029296875, 10.6171875, 11.205078125, 11.79296875, 12.380859375, 12.96875, 13.556640625, 14.14453125, 14.732421875, 15.3203125, 15.908203125, 16.49609375, 17.083984375, 17.671875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 3.0, 0.0, 0.0, 4.0, 11.0, 6.0, 3.0, 19.0, 14.0, 14.0, 41.0, 41.0, 55.0, 66.0, 98.0, 151.0, 186.0, 186.0, 375.0, 483.0, 672.0, 953.0, 1461.0, 2149.0, 3764.0, 7132.0, 15934.0, 43600.0, 260966.0, 5845277.0, 65527.0, 20857.0, 9086.0, 4406.0, 2701.0, 1540.0, 1036.0, 730.0, 442.0, 385.0, 280.0, 197.0, 122.0, 101.0, 103.0, 100.0, 39.0, 38.0, 42.0, 9.0, 15.0, 9.0, 6.0, 0.0, 6.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-43.375, -41.9365234375, -40.498046875, -39.0595703125, -37.62109375, -36.1826171875, -34.744140625, -33.3056640625, -31.8671875, -30.4287109375, -28.990234375, -27.5517578125, -26.11328125, -24.6748046875, -23.236328125, -21.7978515625, -20.359375, -18.9208984375, -17.482421875, -16.0439453125, -14.60546875, -13.1669921875, -11.728515625, -10.2900390625, -8.8515625, -7.4130859375, -5.974609375, -4.5361328125, -3.09765625, -1.6591796875, -0.220703125, 1.2177734375, 2.65625, 4.0947265625, 5.533203125, 6.9716796875, 8.41015625, 9.8486328125, 11.287109375, 12.7255859375, 14.1640625, 15.6025390625, 17.041015625, 18.4794921875, 19.91796875, 21.3564453125, 22.794921875, 24.2333984375, 25.671875, 27.1103515625, 28.548828125, 29.9873046875, 31.42578125, 32.8642578125, 34.302734375, 35.7412109375, 37.1796875, 38.6181640625, 40.056640625, 41.4951171875, 42.93359375, 44.3720703125, 45.810546875, 47.2490234375, 48.6875]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 5.0, 2.0, 2.0, 12.0, 7.0, 7.0, 6.0, 8.0, 21.0, 14.0, 15.0, 13.0, 18.0, 31.0, 32.0, 41.0, 35.0, 44.0, 48.0, 76.0, 133.0, 211.0, 515.0, 187.0, 106.0, 71.0, 59.0, 57.0, 37.0, 38.0, 32.0, 24.0, 22.0, 25.0, 18.0, 13.0, 8.0, 12.0, 9.0, 7.0, 6.0, 5.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3203125, -13.8343505859375, -13.348388671875, -12.8624267578125, -12.37646484375, -11.8905029296875, -11.404541015625, -10.9185791015625, -10.4326171875, -9.9466552734375, -9.460693359375, -8.9747314453125, -8.48876953125, -8.0028076171875, -7.516845703125, -7.0308837890625, -6.544921875, -6.0589599609375, -5.572998046875, -5.0870361328125, -4.60107421875, -4.1151123046875, -3.629150390625, -3.1431884765625, -2.6572265625, -2.1712646484375, -1.685302734375, -1.1993408203125, -0.71337890625, -0.2274169921875, 0.258544921875, 0.7445068359375, 1.23046875, 1.7164306640625, 2.202392578125, 2.6883544921875, 3.17431640625, 3.6602783203125, 4.146240234375, 4.6322021484375, 5.1181640625, 5.6041259765625, 6.090087890625, 6.5760498046875, 7.06201171875, 7.5479736328125, 8.033935546875, 8.5198974609375, 9.005859375, 9.4918212890625, 9.977783203125, 10.4637451171875, 10.94970703125, 11.4356689453125, 11.921630859375, 12.4075927734375, 12.8935546875, 13.3795166015625, 13.865478515625, 14.3514404296875, 14.83740234375, 15.3233642578125, 15.809326171875, 16.2952880859375, 16.78125]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 9.0, 22.0, 59.0, 176.0, 521.0, 132.0, 47.0, 19.0, 8.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-127.0884017944336, -124.15847778320312, -121.22855377197266, -118.29862976074219, -115.36871337890625, -112.43878936767578, -109.50886535644531, -106.57894134521484, -103.64901733398438, -100.7190933227539, -97.78916931152344, -94.8592529296875, -91.92932891845703, -88.99940490722656, -86.0694808959961, -83.13955688476562, -80.20964050292969, -77.27971649169922, -74.34979248046875, -71.41987609863281, -68.48995208740234, -65.56002807617188, -62.630104064941406, -59.70018005371094, -56.77025604248047, -53.84033203125, -50.9104118347168, -47.98048782348633, -45.05056381225586, -42.120643615722656, -39.19071960449219, -36.26079559326172, -33.330867767333984, -30.40094566345215, -27.47102165222168, -24.541099548339844, -21.611175537109375, -18.68125343322754, -15.751331329345703, -12.821407318115234, -9.891485214233398, -6.961562156677246, -4.031639575958252, -1.1017169952392578, 1.8282060623168945, 4.758129119873047, 7.688051223754883, 10.617975234985352, 13.547897338867188, 16.477819442749023, 19.407743453979492, 22.337665557861328, 25.267589569091797, 28.197511672973633, 31.12743377685547, 34.05735778808594, 36.987281799316406, 39.917205810546875, 42.84712600708008, 45.77705001831055, 48.706974029541016, 51.63689422607422, 54.56681823730469, 57.496742248535156, 60.42666244506836]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 9.0, 2.0, 3.0, 9.0, 13.0, 13.0, 16.0, 21.0, 18.0, 18.0, 29.0, 26.0, 22.0, 33.0, 45.0, 36.0, 44.0, 40.0, 45.0, 56.0, 44.0, 51.0, 43.0, 48.0, 38.0, 44.0, 44.0, 26.0, 23.0, 29.0, 16.0, 22.0, 24.0, 20.0, 11.0, 10.0, 5.0, 4.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.486909866333008, -21.770431518554688, -21.053953170776367, -20.337474822998047, -19.620994567871094, -18.904516220092773, -18.188037872314453, -17.471559524536133, -16.755081176757812, -16.038602828979492, -15.322123527526855, -14.605645179748535, -13.889165878295898, -13.172687530517578, -12.456209182739258, -11.739730834960938, -11.023250579833984, -10.306772232055664, -9.590292930603027, -8.873814582824707, -8.15733528137207, -7.44085693359375, -6.72437858581543, -6.007899761199951, -5.291420936584473, -4.574942111968994, -3.8584635257720947, -3.1419849395751953, -2.425506114959717, -1.7090272903442383, -0.992548942565918, -0.27607011795043945, 0.44040870666503906, 1.156887412071228, 1.873366117477417, 2.5898447036743164, 3.306323528289795, 4.022802352905273, 4.739280700683594, 5.455759525299072, 6.172238349914551, 6.888717174530029, 7.605195999145508, 8.321674346923828, 9.038152694702148, 9.754631996154785, 10.471110343933105, 11.187589645385742, 11.904067993164062, 12.620546340942383, 13.33702564239502, 14.05350399017334, 14.769983291625977, 15.486461639404297, 16.202939987182617, 16.919418334960938, 17.63589859008789, 18.35237693786621, 19.06885528564453, 19.785335540771484, 20.501813888549805, 21.218292236328125, 21.934770584106445, 22.651248931884766, 23.367727279663086]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 2.0, 7.0, 4.0, 9.0, 7.0, 9.0, 8.0, 15.0, 23.0, 20.0, 29.0, 41.0, 55.0, 74.0, 109.0, 155.0, 217.0, 307.0, 417.0, 638.0, 924.0, 1335.0, 2180.0, 3731.0, 7542.0, 20139.0, 4024544.0, 96241.0, 18237.0, 7451.0, 3755.0, 2132.0, 1282.0, 821.0, 534.0, 405.0, 246.0, 168.0, 123.0, 100.0, 66.0, 56.0, 36.0, 21.0, 15.0, 15.0, 8.0, 7.0, 8.0, 9.0, 9.0, 5.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04608154296875, -0.04463624954223633, -0.043190956115722656, -0.041745662689208984, -0.04030036926269531, -0.03885507583618164, -0.03740978240966797, -0.0359644889831543, -0.034519195556640625, -0.03307390213012695, -0.03162860870361328, -0.03018331527709961, -0.028738021850585938, -0.027292728424072266, -0.025847434997558594, -0.024402141571044922, -0.02295684814453125, -0.021511554718017578, -0.020066261291503906, -0.018620967864990234, -0.017175674438476562, -0.01573038101196289, -0.014285087585449219, -0.012839794158935547, -0.011394500732421875, -0.009949207305908203, -0.008503913879394531, -0.007058620452880859, -0.0056133270263671875, -0.004168033599853516, -0.0027227401733398438, -0.0012774467468261719, 0.0001678466796875, 0.0016131401062011719, 0.0030584335327148438, 0.004503726959228516, 0.0059490203857421875, 0.007394313812255859, 0.008839607238769531, 0.010284900665283203, 0.011730194091796875, 0.013175487518310547, 0.014620780944824219, 0.01606607437133789, 0.017511367797851562, 0.018956661224365234, 0.020401954650878906, 0.021847248077392578, 0.02329254150390625, 0.024737834930419922, 0.026183128356933594, 0.027628421783447266, 0.029073715209960938, 0.03051900863647461, 0.03196430206298828, 0.03340959548950195, 0.034854888916015625, 0.0363001823425293, 0.03774547576904297, 0.03919076919555664, 0.04063606262207031, 0.042081356048583984, 0.043526649475097656, 0.04497194290161133, 0.046417236328125]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 3.0, 6.0, 12.0, 9.0, 11.0, 12.0, 15.0, 13.0, 780.0, 18.0, 24.0, 14.0, 10.0, 7.0, 9.0, 5.0, 6.0, 9.0, 5.0, 2.0, 5.0, 2.0, 2.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0032958984375, -0.003184765577316284, -0.0030736327171325684, -0.0029624998569488525, -0.0028513669967651367, -0.002740234136581421, -0.002629101276397705, -0.0025179684162139893, -0.0024068355560302734, -0.0022957026958465576, -0.002184569835662842, -0.002073436975479126, -0.00196230411529541, -0.0018511712551116943, -0.0017400383949279785, -0.0016289055347442627, -0.0015177726745605469, -0.001406639814376831, -0.0012955069541931152, -0.0011843740940093994, -0.0010732412338256836, -0.0009621083736419678, -0.000850975513458252, -0.0007398426532745361, -0.0006287097930908203, -0.0005175769329071045, -0.00040644407272338867, -0.00029531121253967285, -0.00018417835235595703, -7.304549217224121e-05, 3.808736801147461e-05, 0.00014922022819519043, 0.00026035308837890625, 0.00037148594856262207, 0.0004826188087463379, 0.0005937516689300537, 0.0007048845291137695, 0.0008160173892974854, 0.0009271502494812012, 0.001038283109664917, 0.0011494159698486328, 0.0012605488300323486, 0.0013716816902160645, 0.0014828145503997803, 0.001593947410583496, 0.001705080270767212, 0.0018162131309509277, 0.0019273459911346436, 0.0020384788513183594, 0.002149611711502075, 0.002260744571685791, 0.002371877431869507, 0.0024830102920532227, 0.0025941431522369385, 0.0027052760124206543, 0.00281640887260437, 0.002927541732788086, 0.0030386745929718018, 0.0031498074531555176, 0.0032609403133392334, 0.0033720731735229492, 0.003483206033706665, 0.003594338893890381, 0.0037054717540740967, 0.0038166046142578125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 6.0, 9.0, 8.0, 15.0, 9.0, 21.0, 34.0, 36.0, 40.0, 63.0, 98.0, 128.0, 173.0, 237.0, 355.0, 540.0, 858.0, 1514.0, 3024.0, 7545.0, 31259.0, 699889.0, 3397520.0, 35638.0, 7961.0, 3105.0, 1562.0, 884.0, 503.0, 348.0, 237.0, 172.0, 139.0, 86.0, 61.0, 60.0, 40.0, 22.0, 18.0, 25.0, 10.0, 11.0, 4.0, 4.0, 5.0, 3.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0], "bins": [-0.0640869140625, -0.06214714050292969, -0.060207366943359375, -0.05826759338378906, -0.05632781982421875, -0.05438804626464844, -0.052448272705078125, -0.05050849914550781, -0.0485687255859375, -0.04662895202636719, -0.044689178466796875, -0.04274940490722656, -0.04080963134765625, -0.03886985778808594, -0.036930084228515625, -0.03499031066894531, -0.033050537109375, -0.031110763549804688, -0.029170989990234375, -0.027231216430664062, -0.02529144287109375, -0.023351669311523438, -0.021411895751953125, -0.019472122192382812, -0.0175323486328125, -0.015592575073242188, -0.013652801513671875, -0.011713027954101562, -0.00977325439453125, -0.007833480834960938, -0.005893707275390625, -0.0039539337158203125, -0.00201416015625, -7.43865966796875e-05, 0.001865386962890625, 0.0038051605224609375, 0.00574493408203125, 0.0076847076416015625, 0.009624481201171875, 0.011564254760742188, 0.0135040283203125, 0.015443801879882812, 0.017383575439453125, 0.019323348999023438, 0.02126312255859375, 0.023202896118164062, 0.025142669677734375, 0.027082443237304688, 0.029022216796875, 0.030961990356445312, 0.032901763916015625, 0.03484153747558594, 0.03678131103515625, 0.03872108459472656, 0.040660858154296875, 0.04260063171386719, 0.0445404052734375, 0.04648017883300781, 0.048419952392578125, 0.05035972595214844, 0.05229949951171875, 0.05423927307128906, 0.056179046630859375, 0.05811882019042969, 0.06005859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 5.0, 4.0, 8.0, 10.0, 14.0, 15.0, 6.0, 18.0, 18.0, 24.0, 18.0, 29.0, 22.0, 41.0, 46.0, 43.0, 76.0, 99.0, 197.0, 685.0, 1964.0, 208.0, 102.0, 87.0, 54.0, 53.0, 34.0, 29.0, 34.0, 26.0, 17.0, 18.0, 14.0, 13.0, 8.0, 11.0, 6.0, 9.0, 5.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.006591796875, -0.006392478942871094, -0.0061931610107421875, -0.005993843078613281, -0.005794525146484375, -0.005595207214355469, -0.0053958892822265625, -0.005196571350097656, -0.00499725341796875, -0.004797935485839844, -0.0045986175537109375, -0.004399299621582031, -0.004199981689453125, -0.004000663757324219, -0.0038013458251953125, -0.0036020278930664062, -0.0034027099609375, -0.0032033920288085938, -0.0030040740966796875, -0.0028047561645507812, -0.002605438232421875, -0.0024061203002929688, -0.0022068023681640625, -0.0020074844360351562, -0.00180816650390625, -0.0016088485717773438, -0.0014095306396484375, -0.0012102127075195312, -0.001010894775390625, -0.0008115768432617188, -0.0006122589111328125, -0.00041294097900390625, -0.000213623046875, -1.430511474609375e-05, 0.0001850128173828125, 0.00038433074951171875, 0.000583648681640625, 0.0007829666137695312, 0.0009822845458984375, 0.0011816024780273438, 0.00138092041015625, 0.0015802383422851562, 0.0017795562744140625, 0.0019788742065429688, 0.002178192138671875, 0.0023775100708007812, 0.0025768280029296875, 0.0027761459350585938, 0.0029754638671875, 0.0031747817993164062, 0.0033740997314453125, 0.0035734176635742188, 0.003772735595703125, 0.003972053527832031, 0.0041713714599609375, 0.004370689392089844, 0.00457000732421875, 0.004769325256347656, 0.0049686431884765625, 0.005167961120605469, 0.005367279052734375, 0.005566596984863281, 0.0057659149169921875, 0.005965232849121094, 0.00616455078125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 29.0, 146.0, 716.0, 88.0, 16.0, 6.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.37479522824287415, -0.3679015636444092, -0.3610078990459442, -0.35411423444747925, -0.3472205400466919, -0.34032687544822693, -0.33343321084976196, -0.326539546251297, -0.31964588165283203, -0.31275221705436707, -0.3058585524559021, -0.29896485805511475, -0.2920711934566498, -0.2851775288581848, -0.27828386425971985, -0.2713901996612549, -0.26449650526046753, -0.25760284066200256, -0.2507091760635376, -0.24381549656391144, -0.23692183196544647, -0.2300281524658203, -0.22313448786735535, -0.21624082326889038, -0.20934715867042542, -0.20245349407196045, -0.1955598145723343, -0.18866614997386932, -0.18177248537540436, -0.1748788058757782, -0.16798514127731323, -0.16109147667884827, -0.1541977971792221, -0.14730413258075714, -0.14041045308113098, -0.13351678848266602, -0.12662312388420105, -0.11972945183515549, -0.11283577978610992, -0.10594211518764496, -0.0990484431385994, -0.09215477108955383, -0.08526110649108887, -0.0783674344420433, -0.07147376239299774, -0.06458009779453278, -0.05768642574548721, -0.05079275742173195, -0.043899089097976685, -0.03700542077422142, -0.030111750587821007, -0.023218080401420593, -0.01632441207766533, -0.009430743753910065, -0.002537071704864502, 0.004356596618890762, 0.011250264942646027, 0.01814393326640129, 0.025037603452801704, 0.03193127363920212, 0.03882494196295738, 0.045718610286712646, 0.05261228233575821, 0.059505950659513474, 0.06639961898326874]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 6.0, 7.0, 10.0, 12.0, 13.0, 11.0, 21.0, 20.0, 25.0, 33.0, 31.0, 40.0, 50.0, 53.0, 60.0, 52.0, 58.0, 60.0, 43.0, 73.0, 49.0, 41.0, 41.0, 37.0, 31.0, 25.0, 25.0, 26.0, 14.0, 8.0, 8.0, 6.0, 3.0, 8.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02286916971206665, -0.022004876285791397, -0.021140580996870995, -0.020276285707950592, -0.01941199228167534, -0.018547698855400085, -0.017683403566479683, -0.01681910827755928, -0.015954814851284027, -0.0150905204936862, -0.014226226136088371, -0.013361931778490543, -0.012497637420892715, -0.011633343063294888, -0.01076904870569706, -0.009904754348099232, -0.009040459990501404, -0.008176165632903576, -0.007311871275305748, -0.00644757691770792, -0.005583282560110092, -0.004718988202512264, -0.0038546938449144363, -0.0029903994873166084, -0.0021261051297187805, -0.0012618107721209526, -0.0003975164145231247, 0.0004667779430747032, 0.0013310723006725311, 0.002195366658270359, 0.003059661015868187, 0.003923955373466015, 0.004788249731063843, 0.005652544088661671, 0.006516838446259499, 0.0073811328038573265, 0.008245427161455154, 0.009109721519052982, 0.00997401587665081, 0.010838310234248638, 0.011702604591846466, 0.012566898949444294, 0.013431193307042122, 0.01429548766463995, 0.015159782022237778, 0.01602407544851303, 0.016888370737433434, 0.017752666026353836, 0.01861695945262909, 0.019481252878904343, 0.020345548167824745, 0.021209843456745148, 0.0220741368830204, 0.022938430309295654, 0.023802725598216057, 0.02466702088713646, 0.025531314313411713, 0.026395607739686966, 0.02725990302860737, 0.02812419831752777, 0.028988491743803024, 0.029852785170078278, 0.03071708045899868, 0.03158137574791908, 0.032445669174194336]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 4.0, 4.0, 6.0, 9.0, 10.0, 19.0, 25.0, 25.0, 38.0, 60.0, 96.0, 82.0, 150.0, 212.0, 267.0, 371.0, 501.0, 718.0, 1104.0, 1586.0, 2277.0, 3767.0, 6124.0, 11795.0, 27518.0, 891881.0, 58857.0, 17838.0, 8689.0, 4908.0, 3126.0, 2055.0, 1302.0, 868.0, 660.0, 427.0, 306.0, 215.0, 142.0, 172.0, 88.0, 69.0, 38.0, 45.0, 30.0, 16.0, 18.0, 13.0, 11.0, 3.0, 7.0, 5.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.043243408203125, -0.04192399978637695, -0.040604591369628906, -0.03928518295288086, -0.03796577453613281, -0.036646366119384766, -0.03532695770263672, -0.03400754928588867, -0.032688140869140625, -0.03136873245239258, -0.03004932403564453, -0.028729915618896484, -0.027410507202148438, -0.02609109878540039, -0.024771690368652344, -0.023452281951904297, -0.02213287353515625, -0.020813465118408203, -0.019494056701660156, -0.01817464828491211, -0.016855239868164062, -0.015535831451416016, -0.014216423034667969, -0.012897014617919922, -0.011577606201171875, -0.010258197784423828, -0.008938789367675781, -0.007619380950927734, -0.0062999725341796875, -0.004980564117431641, -0.0036611557006835938, -0.002341747283935547, -0.0010223388671875, 0.0002970695495605469, 0.0016164779663085938, 0.0029358863830566406, 0.0042552947998046875, 0.005574703216552734, 0.006894111633300781, 0.008213520050048828, 0.009532928466796875, 0.010852336883544922, 0.012171745300292969, 0.013491153717041016, 0.014810562133789062, 0.01612997055053711, 0.017449378967285156, 0.018768787384033203, 0.02008819580078125, 0.021407604217529297, 0.022727012634277344, 0.02404642105102539, 0.025365829467773438, 0.026685237884521484, 0.02800464630126953, 0.029324054718017578, 0.030643463134765625, 0.03196287155151367, 0.03328227996826172, 0.034601688385009766, 0.03592109680175781, 0.03724050521850586, 0.038559913635253906, 0.03987932205200195, 0.04119873046875]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 5.0, 3.0, 3.0, 1.0, 3.0, 7.0, 10.0, 9.0, 13.0, 9.0, 19.0, 22.0, 773.0, 15.0, 24.0, 11.0, 10.0, 10.0, 7.0, 5.0, 7.0, 5.0, 8.0, 3.0, 4.0, 2.0, 1.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00324249267578125, -0.003132760524749756, -0.0030230283737182617, -0.0029132962226867676, -0.0028035640716552734, -0.0026938319206237793, -0.002584099769592285, -0.002474367618560791, -0.002364635467529297, -0.0022549033164978027, -0.0021451711654663086, -0.0020354390144348145, -0.0019257068634033203, -0.0018159747123718262, -0.001706242561340332, -0.0015965104103088379, -0.0014867782592773438, -0.0013770461082458496, -0.0012673139572143555, -0.0011575818061828613, -0.0010478496551513672, -0.000938117504119873, -0.0008283853530883789, -0.0007186532020568848, -0.0006089210510253906, -0.0004991888999938965, -0.00038945674896240234, -0.0002797245979309082, -0.00016999244689941406, -6.026029586791992e-05, 4.947185516357422e-05, 0.00015920400619506836, 0.0002689361572265625, 0.00037866830825805664, 0.0004884004592895508, 0.0005981326103210449, 0.0007078647613525391, 0.0008175969123840332, 0.0009273290634155273, 0.0010370612144470215, 0.0011467933654785156, 0.0012565255165100098, 0.001366257667541504, 0.001475989818572998, 0.0015857219696044922, 0.0016954541206359863, 0.0018051862716674805, 0.0019149184226989746, 0.0020246505737304688, 0.002134382724761963, 0.002244114875793457, 0.002353847026824951, 0.0024635791778564453, 0.0025733113288879395, 0.0026830434799194336, 0.0027927756309509277, 0.002902507781982422, 0.003012239933013916, 0.00312197208404541, 0.0032317042350769043, 0.0033414363861083984, 0.0034511685371398926, 0.0035609006881713867, 0.003670632839202881, 0.003780364990234375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 7.0, 3.0, 7.0, 8.0, 12.0, 11.0, 16.0, 25.0, 40.0, 58.0, 76.0, 116.0, 150.0, 230.0, 287.0, 453.0, 699.0, 1255.0, 2174.0, 4365.0, 11202.0, 58569.0, 883416.0, 63550.0, 11518.0, 4624.0, 2150.0, 1226.0, 786.0, 465.0, 308.0, 230.0, 171.0, 103.0, 62.0, 54.0, 41.0, 25.0, 19.0, 16.0, 14.0, 7.0, 7.0, 6.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.06536865234375, -0.0632944107055664, -0.06122016906738281, -0.05914592742919922, -0.057071685791015625, -0.05499744415283203, -0.05292320251464844, -0.050848960876464844, -0.04877471923828125, -0.046700477600097656, -0.04462623596191406, -0.04255199432373047, -0.040477752685546875, -0.03840351104736328, -0.03632926940917969, -0.034255027770996094, -0.0321807861328125, -0.030106544494628906, -0.028032302856445312, -0.02595806121826172, -0.023883819580078125, -0.02180957794189453, -0.019735336303710938, -0.017661094665527344, -0.01558685302734375, -0.013512611389160156, -0.011438369750976562, -0.009364128112792969, -0.007289886474609375, -0.005215644836425781, -0.0031414031982421875, -0.0010671615600585938, 0.001007080078125, 0.0030813217163085938, 0.0051555633544921875, 0.007229804992675781, 0.009304046630859375, 0.011378288269042969, 0.013452529907226562, 0.015526771545410156, 0.01760101318359375, 0.019675254821777344, 0.021749496459960938, 0.02382373809814453, 0.025897979736328125, 0.02797222137451172, 0.030046463012695312, 0.032120704650878906, 0.0341949462890625, 0.036269187927246094, 0.03834342956542969, 0.04041767120361328, 0.042491912841796875, 0.04456615447998047, 0.04664039611816406, 0.048714637756347656, 0.05078887939453125, 0.052863121032714844, 0.05493736267089844, 0.05701160430908203, 0.059085845947265625, 0.06116008758544922, 0.06323432922363281, 0.0653085708618164, 0.0673828125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 4.0, 4.0, 6.0, 6.0, 10.0, 16.0, 20.0, 10.0, 16.0, 22.0, 27.0, 24.0, 18.0, 31.0, 33.0, 47.0, 37.0, 40.0, 44.0, 53.0, 41.0, 66.0, 44.0, 39.0, 40.0, 35.0, 37.0, 32.0, 31.0, 24.0, 24.0, 15.0, 13.0, 16.0, 14.0, 11.0, 14.0, 12.0, 10.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.01322174072265625, -0.012802481651306152, -0.012383222579956055, -0.011963963508605957, -0.01154470443725586, -0.011125445365905762, -0.010706186294555664, -0.010286927223205566, -0.009867668151855469, -0.009448409080505371, -0.009029150009155273, -0.008609890937805176, -0.008190631866455078, -0.0077713727951049805, -0.007352113723754883, -0.006932854652404785, -0.0065135955810546875, -0.00609433650970459, -0.005675077438354492, -0.0052558183670043945, -0.004836559295654297, -0.004417300224304199, -0.0039980411529541016, -0.003578782081604004, -0.0031595230102539062, -0.0027402639389038086, -0.002321004867553711, -0.0019017457962036133, -0.0014824867248535156, -0.001063227653503418, -0.0006439685821533203, -0.00022470951080322266, 0.000194549560546875, 0.0006138086318969727, 0.0010330677032470703, 0.001452326774597168, 0.0018715858459472656, 0.0022908449172973633, 0.002710103988647461, 0.0031293630599975586, 0.0035486221313476562, 0.003967881202697754, 0.0043871402740478516, 0.004806399345397949, 0.005225658416748047, 0.0056449174880981445, 0.006064176559448242, 0.00648343563079834, 0.0069026947021484375, 0.007321953773498535, 0.007741212844848633, 0.00816047191619873, 0.008579730987548828, 0.008998990058898926, 0.009418249130249023, 0.009837508201599121, 0.010256767272949219, 0.010676026344299316, 0.011095285415649414, 0.011514544486999512, 0.01193380355834961, 0.012353062629699707, 0.012772321701049805, 0.013191580772399902, 0.01361083984375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 6.0, 7.0, 14.0, 15.0, 22.0, 21.0, 34.0, 70.0, 208.0, 837.0, 27596.0, 1016569.0, 2511.0, 362.0, 113.0, 49.0, 41.0, 18.0, 8.0, 8.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.033843994140625, -0.0328829288482666, -0.0319218635559082, -0.030960798263549805, -0.029999732971191406, -0.029038667678833008, -0.02807760238647461, -0.02711653709411621, -0.026155471801757812, -0.025194406509399414, -0.024233341217041016, -0.023272275924682617, -0.02231121063232422, -0.02135014533996582, -0.020389080047607422, -0.019428014755249023, -0.018466949462890625, -0.017505884170532227, -0.016544818878173828, -0.01558375358581543, -0.014622688293457031, -0.013661623001098633, -0.012700557708740234, -0.011739492416381836, -0.010778427124023438, -0.009817361831665039, -0.00885629653930664, -0.007895231246948242, -0.006934165954589844, -0.005973100662231445, -0.005012035369873047, -0.0040509700775146484, -0.00308990478515625, -0.0021288394927978516, -0.0011677742004394531, -0.0002067089080810547, 0.0007543563842773438, 0.0017154216766357422, 0.0026764869689941406, 0.003637552261352539, 0.0045986175537109375, 0.005559682846069336, 0.006520748138427734, 0.007481813430786133, 0.008442878723144531, 0.00940394401550293, 0.010365009307861328, 0.011326074600219727, 0.012287139892578125, 0.013248205184936523, 0.014209270477294922, 0.01517033576965332, 0.01613140106201172, 0.017092466354370117, 0.018053531646728516, 0.019014596939086914, 0.019975662231445312, 0.02093672752380371, 0.02189779281616211, 0.022858858108520508, 0.023819923400878906, 0.024780988693237305, 0.025742053985595703, 0.0267031192779541, 0.0276641845703125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 7.0, 14.0, 17.0, 24.0, 30.0, 64.0, 90.0, 117.0, 161.0, 115.0, 102.0, 86.0, 65.0, 32.0, 20.0, 14.0, 15.0, 5.0, 7.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.2695789337158203e-05, -1.2322328984737396e-05, -1.194886863231659e-05, -1.1575408279895782e-05, -1.1201947927474976e-05, -1.0828487575054169e-05, -1.0455027222633362e-05, -1.0081566870212555e-05, -9.708106517791748e-06, -9.334646165370941e-06, -8.961185812950134e-06, -8.587725460529327e-06, -8.21426510810852e-06, -7.840804755687714e-06, -7.467344403266907e-06, -7.0938840508461e-06, -6.720423698425293e-06, -6.346963346004486e-06, -5.973502993583679e-06, -5.600042641162872e-06, -5.2265822887420654e-06, -4.8531219363212585e-06, -4.479661583900452e-06, -4.106201231479645e-06, -3.732740879058838e-06, -3.359280526638031e-06, -2.985820174217224e-06, -2.6123598217964172e-06, -2.2388994693756104e-06, -1.8654391169548035e-06, -1.4919787645339966e-06, -1.1185184121131897e-06, -7.450580596923828e-07, -3.7159770727157593e-07, 1.862645149230957e-09, 3.7532299757003784e-07, 7.487833499908447e-07, 1.1222437024116516e-06, 1.4957040548324585e-06, 1.8691644072532654e-06, 2.2426247596740723e-06, 2.616085112094879e-06, 2.989545464515686e-06, 3.363005816936493e-06, 3.7364661693573e-06, 4.109926521778107e-06, 4.4833868741989136e-06, 4.8568472266197205e-06, 5.230307579040527e-06, 5.603767931461334e-06, 5.977228283882141e-06, 6.350688636302948e-06, 6.724148988723755e-06, 7.097609341144562e-06, 7.471069693565369e-06, 7.844530045986176e-06, 8.217990398406982e-06, 8.59145075082779e-06, 8.964911103248596e-06, 9.338371455669403e-06, 9.71183180809021e-06, 1.0085292160511017e-05, 1.0458752512931824e-05, 1.083221286535263e-05, 1.1205673217773438e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 0.0, 2.0, 6.0, 5.0, 9.0, 10.0, 20.0, 24.0, 41.0, 58.0, 85.0, 184.0, 292.0, 616.0, 1419.0, 4269.0, 20811.0, 952963.0, 56431.0, 7201.0, 2234.0, 903.0, 387.0, 251.0, 119.0, 56.0, 39.0, 32.0, 19.0, 18.0, 15.0, 9.0, 6.0, 4.0, 6.0, 4.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0222015380859375, -0.021500825881958008, -0.020800113677978516, -0.020099401473999023, -0.01939868927001953, -0.01869797706604004, -0.017997264862060547, -0.017296552658081055, -0.016595840454101562, -0.01589512825012207, -0.015194416046142578, -0.014493703842163086, -0.013792991638183594, -0.013092279434204102, -0.01239156723022461, -0.011690855026245117, -0.010990142822265625, -0.010289430618286133, -0.00958871841430664, -0.008888006210327148, -0.008187294006347656, -0.007486581802368164, -0.006785869598388672, -0.00608515739440918, -0.0053844451904296875, -0.004683732986450195, -0.003983020782470703, -0.003282308578491211, -0.0025815963745117188, -0.0018808841705322266, -0.0011801719665527344, -0.0004794597625732422, 0.00022125244140625, 0.0009219646453857422, 0.0016226768493652344, 0.0023233890533447266, 0.0030241012573242188, 0.003724813461303711, 0.004425525665283203, 0.005126237869262695, 0.0058269500732421875, 0.00652766227722168, 0.007228374481201172, 0.007929086685180664, 0.008629798889160156, 0.009330511093139648, 0.01003122329711914, 0.010731935501098633, 0.011432647705078125, 0.012133359909057617, 0.01283407211303711, 0.013534784317016602, 0.014235496520996094, 0.014936208724975586, 0.015636920928955078, 0.01633763313293457, 0.017038345336914062, 0.017739057540893555, 0.018439769744873047, 0.01914048194885254, 0.01984119415283203, 0.020541906356811523, 0.021242618560791016, 0.021943330764770508, 0.02264404296875]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 7.0, 6.0, 2.0, 5.0, 5.0, 6.0, 9.0, 14.0, 5.0, 27.0, 43.0, 53.0, 101.0, 191.0, 226.0, 110.0, 66.0, 44.0, 19.0, 17.0, 10.0, 5.0, 6.0, 3.0, 5.0, 5.0, 4.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.005062103271484375, -0.004882514476776123, -0.004702925682067871, -0.004523336887359619, -0.004343748092651367, -0.004164159297943115, -0.003984570503234863, -0.0038049817085266113, -0.0036253929138183594, -0.0034458041191101074, -0.0032662153244018555, -0.0030866265296936035, -0.0029070377349853516, -0.0027274489402770996, -0.0025478601455688477, -0.0023682713508605957, -0.0021886825561523438, -0.002009093761444092, -0.0018295049667358398, -0.0016499161720275879, -0.001470327377319336, -0.001290738582611084, -0.001111149787902832, -0.0009315609931945801, -0.0007519721984863281, -0.0005723834037780762, -0.0003927946090698242, -0.00021320581436157227, -3.361701965332031e-05, 0.00014597177505493164, 0.0003255605697631836, 0.0005051493644714355, 0.0006847381591796875, 0.0008643269538879395, 0.0010439157485961914, 0.0012235045433044434, 0.0014030933380126953, 0.0015826821327209473, 0.0017622709274291992, 0.0019418597221374512, 0.002121448516845703, 0.002301037311553955, 0.002480626106262207, 0.002660214900970459, 0.002839803695678711, 0.003019392490386963, 0.003198981285095215, 0.003378570079803467, 0.0035581588745117188, 0.0037377476692199707, 0.003917336463928223, 0.004096925258636475, 0.0042765140533447266, 0.0044561028480529785, 0.0046356916427612305, 0.004815280437469482, 0.004994869232177734, 0.005174458026885986, 0.005354046821594238, 0.00553363561630249, 0.005713224411010742, 0.005892813205718994, 0.006072402000427246, 0.006251990795135498, 0.00643157958984375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 7.0, 7.0, 17.0, 57.0, 613.0, 227.0, 20.0, 21.0, 9.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5319970846176147, -0.5064923763275146, -0.48098769783973694, -0.45548301935195923, -0.42997831106185913, -0.4044736325740814, -0.3789689540863037, -0.3534642457962036, -0.3279595673084259, -0.3024548888206482, -0.2769501805305481, -0.2514455020427704, -0.22594080865383148, -0.20043611526489258, -0.17493143677711487, -0.14942674338817596, -0.12392204999923706, -0.09841735661029816, -0.07291267067193985, -0.04740798473358154, -0.02190329134464264, 0.0036014020442962646, 0.029106080532073975, 0.05461077392101288, 0.08011546730995178, 0.10562016069889069, 0.1311248540878296, 0.1566295325756073, 0.1821342259645462, 0.2076389193534851, 0.23314359784126282, 0.2586482763290405, 0.2841529846191406, 0.30965766310691833, 0.33516237139701843, 0.36066704988479614, 0.38617175817489624, 0.41167643666267395, 0.43718111515045166, 0.46268582344055176, 0.48819050192832947, 0.5136951804161072, 0.5391998887062073, 0.5647045373916626, 0.5902092456817627, 0.6157139539718628, 0.6412186622619629, 0.6667233109474182, 0.6922280192375183, 0.7177327275276184, 0.7432373762130737, 0.7687420845031738, 0.7942467927932739, 0.819751501083374, 0.8452561497688293, 0.8707608580589294, 0.8962655067443848, 0.9217702150344849, 0.9472748637199402, 0.9727795720100403, 0.9982842803001404, 1.0237889289855957, 1.0492936372756958, 1.074798345565796, 1.100303053855896]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 5.0, 1.0, 1.0, 9.0, 7.0, 5.0, 12.0, 16.0, 28.0, 30.0, 58.0, 56.0, 90.0, 110.0, 132.0, 109.0, 94.0, 54.0, 37.0, 35.0, 17.0, 19.0, 6.0, 6.0, 5.0, 3.0, 6.0, 3.0, 3.0, 5.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.22098016738891602, -0.21454277634620667, -0.2081054002046585, -0.20166802406311035, -0.195230633020401, -0.18879324197769165, -0.1823558658361435, -0.17591848969459534, -0.169481098651886, -0.16304370760917664, -0.15660633146762848, -0.15016895532608032, -0.14373156428337097, -0.13729417324066162, -0.13085679709911346, -0.12441941350698471, -0.11798202991485596, -0.1115446463227272, -0.10510726273059845, -0.0986698791384697, -0.09223249554634094, -0.08579511195421219, -0.07935772836208344, -0.07292034476995468, -0.06648296117782593, -0.060045577585697174, -0.05360819399356842, -0.04717081040143967, -0.04073342680931091, -0.03429604321718216, -0.027858659625053406, -0.021421276032924652, -0.014983892440795898, -0.008546508848667145, -0.002109125256538391, 0.0043282583355903625, 0.010765641927719116, 0.01720302551984787, 0.023640409111976624, 0.030077792704105377, 0.03651517629623413, 0.042952559888362885, 0.04938994348049164, 0.05582732707262039, 0.062264710664749146, 0.0687020942568779, 0.07513947784900665, 0.0815768614411354, 0.08801424503326416, 0.09445162862539291, 0.10088901221752167, 0.10732639580965042, 0.11376377940177917, 0.12020116299390793, 0.12663854658603668, 0.13307592272758484, 0.1395133137702942, 0.14595070481300354, 0.1523880809545517, 0.15882545709609985, 0.1652628481388092, 0.17170023918151855, 0.1781376153230667, 0.18457499146461487, 0.19101238250732422]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 9.0, 5.0, 8.0, 7.0, 10.0, 8.0, 19.0, 17.0, 17.0, 35.0, 83.0, 305.0, 5383.0, 4151057.0, 36106.0, 878.0, 113.0, 55.0, 35.0, 22.0, 20.0, 11.0, 24.0, 7.0, 5.0, 5.0, 7.0, 4.0, 3.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-5.45703125, -5.29034423828125, -5.1236572265625, -4.95697021484375, -4.790283203125, -4.62359619140625, -4.4569091796875, -4.29022216796875, -4.12353515625, -3.95684814453125, -3.7901611328125, -3.62347412109375, -3.456787109375, -3.29010009765625, -3.1234130859375, -2.95672607421875, -2.7900390625, -2.62335205078125, -2.4566650390625, -2.28997802734375, -2.123291015625, -1.95660400390625, -1.7899169921875, -1.62322998046875, -1.45654296875, -1.28985595703125, -1.1231689453125, -0.95648193359375, -0.789794921875, -0.62310791015625, -0.4564208984375, -0.28973388671875, -0.123046875, 0.04364013671875, 0.2103271484375, 0.37701416015625, 0.543701171875, 0.71038818359375, 0.8770751953125, 1.04376220703125, 1.21044921875, 1.37713623046875, 1.5438232421875, 1.71051025390625, 1.877197265625, 2.04388427734375, 2.2105712890625, 2.37725830078125, 2.5439453125, 2.71063232421875, 2.8773193359375, 3.04400634765625, 3.210693359375, 3.37738037109375, 3.5440673828125, 3.71075439453125, 3.87744140625, 4.04412841796875, 4.2108154296875, 4.37750244140625, 4.544189453125, 4.71087646484375, 4.8775634765625, 5.04425048828125, 5.2109375]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 0.0, 4.0, 7.0, 12.0, 11.0, 10.0, 11.0, 13.0, 105.0, 698.0, 15.0, 20.0, 11.0, 9.0, 10.0, 5.0, 10.0, 5.0, 8.0, 6.0, 2.0, 4.0, 2.0, 2.0, 4.0, 6.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003204345703125, -0.0030953586101531982, -0.0029863715171813965, -0.0028773844242095947, -0.002768397331237793, -0.002659410238265991, -0.0025504231452941895, -0.0024414360523223877, -0.002332448959350586, -0.002223461866378784, -0.0021144747734069824, -0.0020054876804351807, -0.001896500587463379, -0.0017875134944915771, -0.0016785264015197754, -0.0015695393085479736, -0.0014605522155761719, -0.0013515651226043701, -0.0012425780296325684, -0.0011335909366607666, -0.0010246038436889648, -0.0009156167507171631, -0.0008066296577453613, -0.0006976425647735596, -0.0005886554718017578, -0.00047966837882995605, -0.0003706812858581543, -0.00026169419288635254, -0.00015270709991455078, -4.3720006942749023e-05, 6.526708602905273e-05, 0.0001742541790008545, 0.00028324127197265625, 0.000392228364944458, 0.0005012154579162598, 0.0006102025508880615, 0.0007191896438598633, 0.000828176736831665, 0.0009371638298034668, 0.0010461509227752686, 0.0011551380157470703, 0.001264125108718872, 0.0013731122016906738, 0.0014820992946624756, 0.0015910863876342773, 0.001700073480606079, 0.0018090605735778809, 0.0019180476665496826, 0.0020270347595214844, 0.002136021852493286, 0.002245008945465088, 0.0023539960384368896, 0.0024629831314086914, 0.002571970224380493, 0.002680957317352295, 0.0027899444103240967, 0.0028989315032958984, 0.0030079185962677, 0.003116905689239502, 0.0032258927822113037, 0.0033348798751831055, 0.0034438669681549072, 0.003552854061126709, 0.0036618411540985107, 0.0037708282470703125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 1.0, 4.0, 4.0, 7.0, 6.0, 8.0, 9.0, 16.0, 14.0, 29.0, 36.0, 30.0, 31.0, 48.0, 62.0, 67.0, 78.0, 97.0, 145.0, 366.0, 5935.0, 4175749.0, 10304.0, 401.0, 146.0, 145.0, 123.0, 96.0, 71.0, 60.0, 38.0, 37.0, 26.0, 27.0, 20.0, 11.0, 13.0, 9.0, 3.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.22265625, -1.1882705688476562, -1.1538848876953125, -1.1194992065429688, -1.085113525390625, -1.0507278442382812, -1.0163421630859375, -0.9819564819335938, -0.94757080078125, -0.9131851196289062, -0.8787994384765625, -0.8444137573242188, -0.810028076171875, -0.7756423950195312, -0.7412567138671875, -0.7068710327148438, -0.6724853515625, -0.6380996704101562, -0.6037139892578125, -0.5693283081054688, -0.534942626953125, -0.5005569458007812, -0.4661712646484375, -0.43178558349609375, -0.39739990234375, -0.36301422119140625, -0.3286285400390625, -0.29424285888671875, -0.259857177734375, -0.22547149658203125, -0.1910858154296875, -0.15670013427734375, -0.122314453125, -0.08792877197265625, -0.0535430908203125, -0.01915740966796875, 0.015228271484375, 0.04961395263671875, 0.0839996337890625, 0.11838531494140625, 0.15277099609375, 0.18715667724609375, 0.2215423583984375, 0.25592803955078125, 0.290313720703125, 0.32469940185546875, 0.3590850830078125, 0.39347076416015625, 0.4278564453125, 0.46224212646484375, 0.4966278076171875, 0.5310134887695312, 0.565399169921875, 0.5997848510742188, 0.6341705322265625, 0.6685562133789062, 0.70294189453125, 0.7373275756835938, 0.7717132568359375, 0.8060989379882812, 0.840484619140625, 0.8748703002929688, 0.9092559814453125, 0.9436416625976562, 0.97802734375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 4.0, 5.0, 6.0, 6.0, 11.0, 7.0, 19.0, 16.0, 27.0, 27.0, 33.0, 42.0, 42.0, 69.0, 65.0, 95.0, 95.0, 157.0, 209.0, 334.0, 1386.0, 352.0, 208.0, 153.0, 148.0, 136.0, 94.0, 72.0, 58.0, 35.0, 45.0, 25.0, 26.0, 19.0, 13.0, 9.0, 9.0, 5.0, 9.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.009490966796875, -0.009223520755767822, -0.008956074714660645, -0.008688628673553467, -0.008421182632446289, -0.008153736591339111, -0.007886290550231934, -0.007618844509124756, -0.007351398468017578, -0.0070839524269104, -0.006816506385803223, -0.006549060344696045, -0.006281614303588867, -0.0060141682624816895, -0.005746722221374512, -0.005479276180267334, -0.005211830139160156, -0.0049443840980529785, -0.004676938056945801, -0.004409492015838623, -0.004142045974731445, -0.0038745999336242676, -0.00360715389251709, -0.003339707851409912, -0.0030722618103027344, -0.0028048157691955566, -0.002537369728088379, -0.002269923686981201, -0.0020024776458740234, -0.0017350316047668457, -0.001467585563659668, -0.0012001395225524902, -0.0009326934814453125, -0.0006652474403381348, -0.00039780139923095703, -0.0001303553581237793, 0.00013709068298339844, 0.00040453672409057617, 0.0006719827651977539, 0.0009394288063049316, 0.0012068748474121094, 0.0014743208885192871, 0.0017417669296264648, 0.0020092129707336426, 0.0022766590118408203, 0.002544105052947998, 0.0028115510940551758, 0.0030789971351623535, 0.0033464431762695312, 0.003613889217376709, 0.0038813352584838867, 0.0041487812995910645, 0.004416227340698242, 0.00468367338180542, 0.004951119422912598, 0.005218565464019775, 0.005486011505126953, 0.005753457546234131, 0.006020903587341309, 0.006288349628448486, 0.006555795669555664, 0.006823241710662842, 0.0070906877517700195, 0.007358133792877197, 0.007625579833984375]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 12.0, 903.0, 95.0, 6.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18508395552635193, -0.13553155958652496, -0.085979163646698, -0.03642676770687103, 0.013125628232955933, 0.0626780241727829, 0.11223042011260986, 0.16178283095359802, 0.2113352119922638, 0.26088762283325195, 0.3104400038719177, 0.3599923849105835, 0.40954479575157166, 0.4590972065925598, 0.5086495876312256, 0.5582020282745361, 0.6077543497085571, 0.6573067307472229, 0.7068591117858887, 0.7564115524291992, 0.805963933467865, 0.8555163145065308, 0.9050687551498413, 0.9546211361885071, 1.0041735172271729, 1.0537259578704834, 1.1032782793045044, 1.152830719947815, 1.202383041381836, 1.2519354820251465, 1.301487922668457, 1.3510403633117676, 1.4005928039550781, 1.4501452445983887, 1.4996975660324097, 1.5492500066757202, 1.5988023281097412, 1.6483547687530518, 1.6979072093963623, 1.7474596500396729, 1.7970119714736938, 1.8465644121170044, 1.8961167335510254, 1.945669174194336, 1.9952216148376465, 2.044774055480957, 2.0943262577056885, 2.143878698348999, 2.1934311389923096, 2.24298357963562, 2.2925360202789307, 2.342088222503662, 2.3916406631469727, 2.441193103790283, 2.4907455444335938, 2.5402979850769043, 2.589850425720215, 2.6394028663635254, 2.688955307006836, 2.7385075092315674, 2.788059949874878, 2.8376123905181885, 2.887164831161499, 2.9367172718048096, 2.986269474029541]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 5.0, 7.0, 6.0, 17.0, 30.0, 53.0, 66.0, 82.0, 107.0, 120.0, 111.0, 106.0, 73.0, 89.0, 46.0, 32.0, 37.0, 12.0, 8.0, 5.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06322473287582397, -0.058313410729169846, -0.05340208858251572, -0.04849076271057129, -0.04357944056391716, -0.03866811841726303, -0.033756792545318604, -0.028845470398664474, -0.023934148252010345, -0.019022826105356216, -0.014111502096056938, -0.009200179018080235, -0.004288855940103531, 0.0006224662065505981, 0.005533790215849876, 0.010445114225149155, 0.015356436371803284, 0.020267758518457413, 0.02517908252775669, 0.03009040653705597, 0.0350017286837101, 0.03991305083036423, 0.044824376702308655, 0.049735698848962784, 0.05464702099561691, 0.05955834314227104, 0.06446966528892517, 0.0693809911608696, 0.07429231703281403, 0.07920363545417786, 0.08411496132612228, 0.08902628719806671, 0.09393760561943054, 0.09884893149137497, 0.1037602499127388, 0.10867157578468323, 0.11358289420604706, 0.11849422007799149, 0.12340554594993591, 0.12831686437129974, 0.13322818279266357, 0.1381395012140274, 0.14305083453655243, 0.14796215295791626, 0.1528734713792801, 0.15778478980064392, 0.16269612312316895, 0.16760744154453278, 0.1725187748670578, 0.17743009328842163, 0.18234142661094666, 0.18725274503231049, 0.19216406345367432, 0.19707539677619934, 0.20198671519756317, 0.206898033618927, 0.21180936694145203, 0.21672068536281586, 0.22163201868534088, 0.2265433371067047, 0.23145465552806854, 0.23636597394943237, 0.2412773072719574, 0.24618862569332123, 0.25109994411468506]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 7.0, 8.0, 8.0, 7.0, 19.0, 38.0, 59.0, 73.0, 120.0, 205.0, 311.0, 523.0, 849.0, 1385.0, 2221.0, 4175.0, 8198.0, 19674.0, 208105.0, 760547.0, 22494.0, 8832.0, 4467.0, 2443.0, 1455.0, 875.0, 541.0, 326.0, 230.0, 126.0, 87.0, 47.0, 30.0, 27.0, 14.0, 10.0, 10.0, 4.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09979248046875, -0.09694671630859375, -0.0941009521484375, -0.09125518798828125, -0.088409423828125, -0.08556365966796875, -0.0827178955078125, -0.07987213134765625, -0.0770263671875, -0.07418060302734375, -0.0713348388671875, -0.06848907470703125, -0.065643310546875, -0.06279754638671875, -0.0599517822265625, -0.05710601806640625, -0.05426025390625, -0.05141448974609375, -0.0485687255859375, -0.04572296142578125, -0.042877197265625, -0.04003143310546875, -0.0371856689453125, -0.03433990478515625, -0.031494140625, -0.02864837646484375, -0.0258026123046875, -0.02295684814453125, -0.020111083984375, -0.01726531982421875, -0.0144195556640625, -0.01157379150390625, -0.00872802734375, -0.00588226318359375, -0.0030364990234375, -0.00019073486328125, 0.002655029296875, 0.00550079345703125, 0.0083465576171875, 0.01119232177734375, 0.0140380859375, 0.01688385009765625, 0.0197296142578125, 0.02257537841796875, 0.025421142578125, 0.02826690673828125, 0.0311126708984375, 0.03395843505859375, 0.03680419921875, 0.03964996337890625, 0.0424957275390625, 0.04534149169921875, 0.048187255859375, 0.05103302001953125, 0.0538787841796875, 0.05672454833984375, 0.0595703125, 0.06241607666015625, 0.0652618408203125, 0.06810760498046875, 0.070953369140625, 0.07379913330078125, 0.0766448974609375, 0.07949066162109375, 0.08233642578125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 3.0, 4.0, 3.0, 0.0, 1.0, 3.0, 2.0, 7.0, 5.0, 5.0, 6.0, 13.0, 22.0, 18.0, 261.0, 518.0, 44.0, 17.0, 17.0, 15.0, 9.0, 7.0, 12.0, 4.0, 3.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00262451171875, -0.002489149570465088, -0.0023537874221801758, -0.0022184252738952637, -0.0020830631256103516, -0.0019477009773254395, -0.0018123388290405273, -0.0016769766807556152, -0.0015416145324707031, -0.001406252384185791, -0.001270890235900879, -0.0011355280876159668, -0.0010001659393310547, -0.0008648037910461426, -0.0007294416427612305, -0.0005940794944763184, -0.00045871734619140625, -0.00032335519790649414, -0.00018799304962158203, -5.263090133666992e-05, 8.273124694824219e-05, 0.0002180933952331543, 0.0003534555435180664, 0.0004888176918029785, 0.0006241798400878906, 0.0007595419883728027, 0.0008949041366577148, 0.001030266284942627, 0.001165628433227539, 0.0013009905815124512, 0.0014363527297973633, 0.0015717148780822754, 0.0017070770263671875, 0.0018424391746520996, 0.0019778013229370117, 0.002113163471221924, 0.002248525619506836, 0.002383887767791748, 0.00251924991607666, 0.0026546120643615723, 0.0027899742126464844, 0.0029253363609313965, 0.0030606985092163086, 0.0031960606575012207, 0.003331422805786133, 0.003466784954071045, 0.003602147102355957, 0.003737509250640869, 0.0038728713989257812, 0.004008233547210693, 0.0041435956954956055, 0.004278957843780518, 0.00441431999206543, 0.004549682140350342, 0.004685044288635254, 0.004820406436920166, 0.004955768585205078, 0.00509113073348999, 0.005226492881774902, 0.0053618550300598145, 0.0054972171783447266, 0.005632579326629639, 0.005767941474914551, 0.005903303623199463, 0.006038665771484375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 5.0, 8.0, 3.0, 6.0, 6.0, 13.0, 17.0, 7.0, 14.0, 15.0, 22.0, 24.0, 26.0, 23.0, 23.0, 37.0, 40.0, 48.0, 138.0, 678.0, 6885.0, 948294.0, 88679.0, 2769.0, 340.0, 102.0, 45.0, 40.0, 29.0, 45.0, 23.0, 23.0, 27.0, 22.0, 11.0, 16.0, 17.0, 6.0, 4.0, 8.0, 5.0, 4.0, 5.0, 5.0, 3.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.172119140625, -0.166534423828125, -0.16094970703125, -0.155364990234375, -0.1497802734375, -0.144195556640625, -0.13861083984375, -0.133026123046875, -0.12744140625, -0.121856689453125, -0.11627197265625, -0.110687255859375, -0.1051025390625, -0.099517822265625, -0.09393310546875, -0.088348388671875, -0.082763671875, -0.077178955078125, -0.07159423828125, -0.066009521484375, -0.0604248046875, -0.054840087890625, -0.04925537109375, -0.043670654296875, -0.0380859375, -0.032501220703125, -0.02691650390625, -0.021331787109375, -0.0157470703125, -0.010162353515625, -0.00457763671875, 0.001007080078125, 0.006591796875, 0.012176513671875, 0.01776123046875, 0.023345947265625, 0.0289306640625, 0.034515380859375, 0.04010009765625, 0.045684814453125, 0.05126953125, 0.056854248046875, 0.06243896484375, 0.068023681640625, 0.0736083984375, 0.079193115234375, 0.08477783203125, 0.090362548828125, 0.095947265625, 0.101531982421875, 0.10711669921875, 0.112701416015625, 0.1182861328125, 0.123870849609375, 0.12945556640625, 0.135040283203125, 0.140625, 0.146209716796875, 0.15179443359375, 0.157379150390625, 0.1629638671875, 0.168548583984375, 0.17413330078125, 0.179718017578125, 0.185302734375]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 3.0, 6.0, 7.0, 2.0, 9.0, 11.0, 21.0, 13.0, 10.0, 13.0, 20.0, 23.0, 29.0, 29.0, 18.0, 29.0, 37.0, 33.0, 36.0, 56.0, 54.0, 33.0, 39.0, 51.0, 43.0, 47.0, 34.0, 24.0, 30.0, 38.0, 32.0, 21.0, 22.0, 24.0, 20.0, 11.0, 16.0, 9.0, 12.0, 8.0, 2.0, 3.0, 5.0, 9.0, 7.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0084381103515625, -0.00816357135772705, -0.007889032363891602, -0.007614493370056152, -0.007339954376220703, -0.007065415382385254, -0.006790876388549805, -0.0065163373947143555, -0.006241798400878906, -0.005967259407043457, -0.005692720413208008, -0.005418181419372559, -0.005143642425537109, -0.00486910343170166, -0.004594564437866211, -0.004320025444030762, -0.0040454864501953125, -0.0037709474563598633, -0.003496408462524414, -0.003221869468688965, -0.0029473304748535156, -0.0026727914810180664, -0.002398252487182617, -0.002123713493347168, -0.0018491744995117188, -0.0015746355056762695, -0.0013000965118408203, -0.001025557518005371, -0.0007510185241699219, -0.00047647953033447266, -0.00020194053649902344, 7.259845733642578e-05, 0.000347137451171875, 0.0006216764450073242, 0.0008962154388427734, 0.0011707544326782227, 0.0014452934265136719, 0.001719832420349121, 0.0019943714141845703, 0.0022689104080200195, 0.0025434494018554688, 0.002817988395690918, 0.003092527389526367, 0.0033670663833618164, 0.0036416053771972656, 0.003916144371032715, 0.004190683364868164, 0.004465222358703613, 0.0047397613525390625, 0.005014300346374512, 0.005288839340209961, 0.00556337833404541, 0.005837917327880859, 0.006112456321716309, 0.006386995315551758, 0.006661534309387207, 0.006936073303222656, 0.0072106122970581055, 0.007485151290893555, 0.007759690284729004, 0.008034229278564453, 0.008308768272399902, 0.008583307266235352, 0.0088578462600708, 0.00913238525390625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 4.0, 4.0, 4.0, 9.0, 10.0, 12.0, 14.0, 21.0, 72.0, 195.0, 3720.0, 1042250.0, 1972.0, 145.0, 41.0, 25.0, 17.0, 17.0, 9.0, 3.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2000732421875, -0.1918811798095703, -0.18368911743164062, -0.17549705505371094, -0.16730499267578125, -0.15911293029785156, -0.15092086791992188, -0.1427288055419922, -0.1345367431640625, -0.1263446807861328, -0.11815261840820312, -0.10996055603027344, -0.10176849365234375, -0.09357643127441406, -0.08538436889648438, -0.07719230651855469, -0.069000244140625, -0.06080818176269531, -0.052616119384765625, -0.04442405700683594, -0.03623199462890625, -0.028039932250976562, -0.019847869873046875, -0.011655807495117188, -0.0034637451171875, 0.0047283172607421875, 0.012920379638671875, 0.021112442016601562, 0.02930450439453125, 0.03749656677246094, 0.045688629150390625, 0.05388069152832031, 0.06207275390625, 0.07026481628417969, 0.07845687866210938, 0.08664894104003906, 0.09484100341796875, 0.10303306579589844, 0.11122512817382812, 0.11941719055175781, 0.1276092529296875, 0.1358013153076172, 0.14399337768554688, 0.15218544006347656, 0.16037750244140625, 0.16856956481933594, 0.17676162719726562, 0.1849536895751953, 0.193145751953125, 0.2013378143310547, 0.20952987670898438, 0.21772193908691406, 0.22591400146484375, 0.23410606384277344, 0.24229812622070312, 0.2504901885986328, 0.2586822509765625, 0.2668743133544922, 0.2750663757324219, 0.28325843811035156, 0.29145050048828125, 0.29964256286621094, 0.3078346252441406, 0.3160266876220703, 0.32421875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 2.0, 1.0, 8.0, 7.0, 5.0, 6.0, 13.0, 3.0, 19.0, 70.0, 223.0, 488.0, 95.0, 22.0, 8.0, 8.0, 5.0, 3.0, 1.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000301361083984375, -0.0002925582230091095, -0.000283755362033844, -0.0002749525010585785, -0.000266149640083313, -0.0002573467791080475, -0.000248543918132782, -0.00023974105715751648, -0.00023093819618225098, -0.00022213533520698547, -0.00021333247423171997, -0.00020452961325645447, -0.00019572675228118896, -0.00018692389130592346, -0.00017812103033065796, -0.00016931816935539246, -0.00016051530838012695, -0.00015171244740486145, -0.00014290958642959595, -0.00013410672545433044, -0.00012530386447906494, -0.00011650100350379944, -0.00010769814252853394, -9.889528155326843e-05, -9.009242057800293e-05, -8.128955960273743e-05, -7.248669862747192e-05, -6.368383765220642e-05, -5.488097667694092e-05, -4.6078115701675415e-05, -3.727525472640991e-05, -2.847239375114441e-05, -1.9669532775878906e-05, -1.0866671800613403e-05, -2.0638108253479004e-06, 6.7390501499176025e-06, 1.5541911125183105e-05, 2.434477210044861e-05, 3.314763307571411e-05, 4.1950494050979614e-05, 5.075335502624512e-05, 5.955621600151062e-05, 6.835907697677612e-05, 7.716193795204163e-05, 8.596479892730713e-05, 9.476765990257263e-05, 0.00010357052087783813, 0.00011237338185310364, 0.00012117624282836914, 0.00012997910380363464, 0.00013878196477890015, 0.00014758482575416565, 0.00015638768672943115, 0.00016519054770469666, 0.00017399340867996216, 0.00018279626965522766, 0.00019159913063049316, 0.00020040199160575867, 0.00020920485258102417, 0.00021800771355628967, 0.00022681057453155518, 0.00023561343550682068, 0.0002444162964820862, 0.0002532191574573517, 0.0002620220184326172]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 7.0, 8.0, 10.0, 12.0, 13.0, 18.0, 37.0, 72.0, 158.0, 421.0, 1991.0, 44031.0, 996333.0, 4420.0, 626.0, 176.0, 82.0, 43.0, 33.0, 18.0, 14.0, 8.0, 7.0, 4.0, 1.0, 4.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.306396484375, -0.2981548309326172, -0.2899131774902344, -0.28167152404785156, -0.27342987060546875, -0.26518821716308594, -0.2569465637207031, -0.2487049102783203, -0.2404632568359375, -0.2322216033935547, -0.22397994995117188, -0.21573829650878906, -0.20749664306640625, -0.19925498962402344, -0.19101333618164062, -0.1827716827392578, -0.174530029296875, -0.1662883758544922, -0.15804672241210938, -0.14980506896972656, -0.14156341552734375, -0.13332176208496094, -0.12508010864257812, -0.11683845520019531, -0.1085968017578125, -0.10035514831542969, -0.09211349487304688, -0.08387184143066406, -0.07563018798828125, -0.06738853454589844, -0.059146881103515625, -0.05090522766113281, -0.04266357421875, -0.03442192077636719, -0.026180267333984375, -0.017938613891601562, -0.00969696044921875, -0.0014553070068359375, 0.006786346435546875, 0.015027999877929688, 0.0232696533203125, 0.03151130676269531, 0.039752960205078125, 0.04799461364746094, 0.05623626708984375, 0.06447792053222656, 0.07271957397460938, 0.08096122741699219, 0.089202880859375, 0.09744453430175781, 0.10568618774414062, 0.11392784118652344, 0.12216949462890625, 0.13041114807128906, 0.13865280151367188, 0.1468944549560547, 0.1551361083984375, 0.1633777618408203, 0.17161941528320312, 0.17986106872558594, 0.18810272216796875, 0.19634437561035156, 0.20458602905273438, 0.2128276824951172, 0.2210693359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 1.0, 2.0, 3.0, 2.0, 5.0, 8.0, 15.0, 17.0, 23.0, 32.0, 112.0, 598.0, 67.0, 37.0, 24.0, 17.0, 8.0, 6.0, 8.0, 8.0, 4.0, 1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.10369873046875, -0.1011195182800293, -0.0985403060913086, -0.09596109390258789, -0.09338188171386719, -0.09080266952514648, -0.08822345733642578, -0.08564424514770508, -0.08306503295898438, -0.08048582077026367, -0.07790660858154297, -0.07532739639282227, -0.07274818420410156, -0.07016897201538086, -0.06758975982666016, -0.06501054763793945, -0.06243133544921875, -0.05985212326049805, -0.057272911071777344, -0.05469369888305664, -0.05211448669433594, -0.049535274505615234, -0.04695606231689453, -0.04437685012817383, -0.041797637939453125, -0.03921842575073242, -0.03663921356201172, -0.034060001373291016, -0.03148078918457031, -0.02890157699584961, -0.026322364807128906, -0.023743152618408203, -0.0211639404296875, -0.018584728240966797, -0.016005516052246094, -0.01342630386352539, -0.010847091674804688, -0.008267879486083984, -0.005688667297363281, -0.003109455108642578, -0.000530242919921875, 0.002048969268798828, 0.004628181457519531, 0.007207393646240234, 0.009786605834960938, 0.01236581802368164, 0.014945030212402344, 0.017524242401123047, 0.02010345458984375, 0.022682666778564453, 0.025261878967285156, 0.02784109115600586, 0.030420303344726562, 0.032999515533447266, 0.03557872772216797, 0.03815793991088867, 0.040737152099609375, 0.04331636428833008, 0.04589557647705078, 0.048474788665771484, 0.05105400085449219, 0.05363321304321289, 0.056212425231933594, 0.0587916374206543, 0.061370849609375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 7.0, 21.0, 572.0, 390.0, 11.0, 8.0, 5.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.33193016052246094, -0.2947441041469574, -0.25755804777145386, -0.22037196159362793, -0.1831859052181244, -0.14599984884262085, -0.10881377756595612, -0.07162770628929138, -0.03444164991378784, 0.002744413912296295, 0.03993047773838043, 0.07711654156446457, 0.1143026053905487, 0.15148866176605225, 0.18867473304271698, 0.2258608043193817, 0.26304686069488525, 0.3002329170703888, 0.33741897344589233, 0.37460505962371826, 0.4117911159992218, 0.44897717237472534, 0.48616325855255127, 0.5233492851257324, 0.5605353713035583, 0.5977214574813843, 0.6349074840545654, 0.6720935702323914, 0.7092796564102173, 0.7464656829833984, 0.7836517691612244, 0.8208378553390503, 0.8580238819122314, 0.8952099680900574, 0.9323959946632385, 0.9695820808410645, 1.0067681074142456, 1.0439541339874268, 1.0811402797698975, 1.1183263063430786, 1.1555123329162598, 1.192698359489441, 1.2298845052719116, 1.2670705318450928, 1.304256558418274, 1.341442584991455, 1.3786287307739258, 1.415814757347107, 1.4530009031295776, 1.4901869297027588, 1.5273730754852295, 1.5645591020584106, 1.6017451286315918, 1.6389312744140625, 1.6761173009872437, 1.7133033275604248, 1.7504894733428955, 1.7876754999160767, 1.8248616456985474, 1.8620476722717285, 1.8992336988449097, 1.9364197254180908, 1.9736058712005615, 2.0107920169830322, 2.047977924346924]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 1.0, 2.0, 8.0, 4.0, 6.0, 17.0, 23.0, 21.0, 44.0, 40.0, 60.0, 87.0, 88.0, 110.0, 109.0, 106.0, 73.0, 66.0, 48.0, 29.0, 18.0, 16.0, 8.0, 6.0, 4.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14507275819778442, -0.14050769805908203, -0.13594263792037964, -0.13137759268283844, -0.12681253254413605, -0.12224747240543365, -0.11768241226673126, -0.11311735212802887, -0.10855229943990707, -0.10398723930120468, -0.09942218661308289, -0.0948571264743805, -0.0902920663356781, -0.0857270136475563, -0.08116195350885391, -0.07659690082073212, -0.07203184068202972, -0.06746678054332733, -0.06290172785520554, -0.05833666771650314, -0.05377161130309105, -0.049206554889678955, -0.04464149475097656, -0.04007643833756447, -0.035511381924152374, -0.03094632551074028, -0.026381267234683037, -0.021816208958625793, -0.0172511525452137, -0.012686096131801605, -0.008121037855744362, -0.0035559795796871185, 0.0010090768337249756, 0.005574134178459644, 0.010139191523194313, 0.014704248867928982, 0.01926930621266365, 0.023834362626075745, 0.028399420902132988, 0.03296447917819023, 0.037529535591602325, 0.04209459200501442, 0.046659648418426514, 0.051224708557128906, 0.055789764970541, 0.060354821383953094, 0.06491988152265549, 0.06948493421077728, 0.07404999434947968, 0.07861505448818207, 0.08318010717630386, 0.08774516731500626, 0.09231022000312805, 0.09687528014183044, 0.10144034028053284, 0.10600540041923523, 0.11057045310735703, 0.11513551324605942, 0.11970056593418121, 0.1242656260728836, 0.128830686211586, 0.1333957314491272, 0.1379607915878296, 0.14252585172653198, 0.14709091186523438]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 8.0, 2.0, 4.0, 2.0, 4.0, 0.0, 4.0, 2.0, 6.0, 2.0, 4.0, 10.0, 10.0, 4.0, 4.0, 22.0, 12.0, 12.0, 28.0, 16.0, 30.0, 20.0, 1165.0, 4192649.0, 46.0, 24.0, 28.0, 22.0, 18.0, 14.0, 12.0, 12.0, 14.0, 10.0, 12.0, 6.0, 8.0, 8.0, 6.0, 4.0, 2.0, 6.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0], "bins": [-3.58984375, -3.47845458984375, -3.3670654296875, -3.25567626953125, -3.144287109375, -3.03289794921875, -2.9215087890625, -2.81011962890625, -2.69873046875, -2.58734130859375, -2.4759521484375, -2.36456298828125, -2.253173828125, -2.14178466796875, -2.0303955078125, -1.91900634765625, -1.8076171875, -1.69622802734375, -1.5848388671875, -1.47344970703125, -1.362060546875, -1.25067138671875, -1.1392822265625, -1.02789306640625, -0.91650390625, -0.80511474609375, -0.6937255859375, -0.58233642578125, -0.470947265625, -0.35955810546875, -0.2481689453125, -0.13677978515625, -0.025390625, 0.08599853515625, 0.1973876953125, 0.30877685546875, 0.420166015625, 0.53155517578125, 0.6429443359375, 0.75433349609375, 0.86572265625, 0.97711181640625, 1.0885009765625, 1.19989013671875, 1.311279296875, 1.42266845703125, 1.5340576171875, 1.64544677734375, 1.7568359375, 1.86822509765625, 1.9796142578125, 2.09100341796875, 2.202392578125, 2.31378173828125, 2.4251708984375, 2.53656005859375, 2.64794921875, 2.75933837890625, 2.8707275390625, 2.98211669921875, 3.093505859375, 3.20489501953125, 3.3162841796875, 3.42767333984375, 3.5390625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 1.0, 3.0, 4.0, 6.0, 5.0, 12.0, 9.0, 11.0, 10.0, 65.0, 270.0, 358.0, 121.0, 26.0, 14.0, 11.0, 14.0, 8.0, 5.0, 7.0, 12.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026531219482421875, -0.002556413412094116, -0.002459704875946045, -0.0023629963397979736, -0.0022662878036499023, -0.002169579267501831, -0.0020728707313537598, -0.0019761621952056885, -0.0018794536590576172, -0.001782745122909546, -0.0016860365867614746, -0.0015893280506134033, -0.001492619514465332, -0.0013959109783172607, -0.0012992024421691895, -0.0012024939060211182, -0.0011057853698730469, -0.0010090768337249756, -0.0009123682975769043, -0.000815659761428833, -0.0007189512252807617, -0.0006222426891326904, -0.0005255341529846191, -0.00042882561683654785, -0.00033211708068847656, -0.00023540854454040527, -0.00013870000839233398, -4.1991472244262695e-05, 5.4717063903808594e-05, 0.00015142560005187988, 0.00024813413619995117, 0.00034484267234802246, 0.00044155120849609375, 0.000538259744644165, 0.0006349682807922363, 0.0007316768169403076, 0.0008283853530883789, 0.0009250938892364502, 0.0010218024253845215, 0.0011185109615325928, 0.001215219497680664, 0.0013119280338287354, 0.0014086365699768066, 0.001505345106124878, 0.0016020536422729492, 0.0016987621784210205, 0.0017954707145690918, 0.001892179250717163, 0.0019888877868652344, 0.0020855963230133057, 0.002182304859161377, 0.0022790133953094482, 0.0023757219314575195, 0.002472430467605591, 0.002569139003753662, 0.0026658475399017334, 0.0027625560760498047, 0.002859264612197876, 0.0029559731483459473, 0.0030526816844940186, 0.00314939022064209, 0.003246098756790161, 0.0033428072929382324, 0.0034395158290863037, 0.003536224365234375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 5.0, 7.0, 11.0, 13.0, 18.0, 46.0, 42.0, 96.0, 177.0, 570.0, 4191451.0, 1300.0, 229.0, 113.0, 76.0, 36.0, 27.0, 20.0, 16.0, 9.0, 5.0, 1.0, 4.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.6044921875, -1.5660247802734375, -1.527557373046875, -1.4890899658203125, -1.45062255859375, -1.4121551513671875, -1.373687744140625, -1.3352203369140625, -1.2967529296875, -1.2582855224609375, -1.219818115234375, -1.1813507080078125, -1.14288330078125, -1.1044158935546875, -1.065948486328125, -1.0274810791015625, -0.989013671875, -0.9505462646484375, -0.912078857421875, -0.8736114501953125, -0.83514404296875, -0.7966766357421875, -0.758209228515625, -0.7197418212890625, -0.6812744140625, -0.6428070068359375, -0.604339599609375, -0.5658721923828125, -0.52740478515625, -0.4889373779296875, -0.450469970703125, -0.4120025634765625, -0.37353515625, -0.3350677490234375, -0.296600341796875, -0.2581329345703125, -0.21966552734375, -0.1811981201171875, -0.142730712890625, -0.1042633056640625, -0.0657958984375, -0.0273284912109375, 0.011138916015625, 0.0496063232421875, 0.08807373046875, 0.1265411376953125, 0.165008544921875, 0.2034759521484375, 0.241943359375, 0.2804107666015625, 0.318878173828125, 0.3573455810546875, 0.39581298828125, 0.4342803955078125, 0.472747802734375, 0.5112152099609375, 0.5496826171875, 0.5881500244140625, 0.626617431640625, 0.6650848388671875, 0.70355224609375, 0.7420196533203125, 0.780487060546875, 0.8189544677734375, 0.857421875]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 5.0, 21.0, 35.0, 58.0, 175.0, 724.0, 2379.0, 421.0, 142.0, 63.0, 24.0, 11.0, 6.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.007232666015625, -0.0067288875579833984, -0.006225109100341797, -0.005721330642700195, -0.005217552185058594, -0.004713773727416992, -0.004209995269775391, -0.003706216812133789, -0.0032024383544921875, -0.002698659896850586, -0.0021948814392089844, -0.0016911029815673828, -0.0011873245239257812, -0.0006835460662841797, -0.00017976760864257812, 0.00032401084899902344, 0.000827789306640625, 0.0013315677642822266, 0.0018353462219238281, 0.0023391246795654297, 0.0028429031372070312, 0.003346681594848633, 0.0038504600524902344, 0.004354238510131836, 0.0048580169677734375, 0.005361795425415039, 0.005865573883056641, 0.006369352340698242, 0.006873130798339844, 0.007376909255981445, 0.007880687713623047, 0.008384466171264648, 0.00888824462890625, 0.009392023086547852, 0.009895801544189453, 0.010399580001831055, 0.010903358459472656, 0.011407136917114258, 0.01191091537475586, 0.012414693832397461, 0.012918472290039062, 0.013422250747680664, 0.013926029205322266, 0.014429807662963867, 0.014933586120605469, 0.01543736457824707, 0.015941143035888672, 0.016444921493530273, 0.016948699951171875, 0.017452478408813477, 0.017956256866455078, 0.01846003532409668, 0.01896381378173828, 0.019467592239379883, 0.019971370697021484, 0.020475149154663086, 0.020978927612304688, 0.02148270606994629, 0.02198648452758789, 0.022490262985229492, 0.022994041442871094, 0.023497819900512695, 0.024001598358154297, 0.0245053768157959, 0.0250091552734375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 1007.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.9065403938293457, -3.822207450866699, -3.7378745079040527, -3.6535415649414062, -3.5692083835601807, -3.484875440597534, -3.4005424976348877, -3.316209554672241, -3.2318763732910156, -3.147543430328369, -3.0632104873657227, -2.978877544403076, -2.8945443630218506, -2.810211420059204, -2.7258784770965576, -2.641545534133911, -2.5572125911712646, -2.472879648208618, -2.3885467052459717, -2.304213523864746, -2.2198805809020996, -2.135547637939453, -2.0512146949768066, -1.9668817520141602, -1.8825486898422241, -1.7982157468795776, -1.7138826847076416, -1.6295497417449951, -1.5452167987823486, -1.4608837366104126, -1.3765507936477661, -1.29221773147583, -1.2078847885131836, -1.123551845550537, -1.039218783378601, -0.9548858404159546, -0.8705528378486633, -0.7862198352813721, -0.7018868923187256, -0.6175538897514343, -0.5332208871841431, -0.4488878846168518, -0.36455491185188293, -0.28022193908691406, -0.1958889365196228, -0.11155593395233154, -0.02722299098968506, 0.0571100115776062, 0.14144301414489746, 0.22577600181102753, 0.3101089894771576, 0.39444196224212646, 0.4787749648094177, 0.563107967376709, 0.6474409103393555, 0.7317739129066467, 0.816106915473938, 0.9004399180412292, 0.9847729206085205, 1.069105863571167, 1.1534388065338135, 1.2377718687057495, 1.322104811668396, 1.406437873840332, 1.4907708168029785]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 5.0, 7.0, 33.0, 67.0, 150.0, 258.0, 254.0, 130.0, 83.0, 22.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10984247922897339, -0.10001415014266968, -0.09018582105636597, -0.08035749197006226, -0.07052916288375854, -0.06070083752274513, -0.05087251216173172, -0.04104418307542801, -0.031215853989124298, -0.021387524902820587, -0.011559197679162025, -0.0017308704555034637, 0.008097458630800247, 0.017925787717103958, 0.02775411307811737, 0.03758244216442108, 0.04741077125072479, 0.0572391003370285, 0.06706742942333221, 0.07689575850963593, 0.08672408759593964, 0.09655241668224335, 0.10638073831796646, 0.11620906740427017, 0.1260373890399933, 0.135865718126297, 0.1456940472126007, 0.15552237629890442, 0.16535070538520813, 0.17517903447151184, 0.18500736355781555, 0.19483569264411926, 0.20466402173042297, 0.21449235081672668, 0.2243206799030304, 0.2341490089893341, 0.24397733807563782, 0.25380566716194153, 0.26363399624824524, 0.27346232533454895, 0.28329065442085266, 0.29311898350715637, 0.3029473125934601, 0.3127756416797638, 0.3226039707660675, 0.3324322998523712, 0.3422606289386749, 0.35208895802497864, 0.36191725730895996, 0.37174558639526367, 0.3815739154815674, 0.3914022445678711, 0.4012305736541748, 0.4110589027404785, 0.4208872318267822, 0.43071556091308594, 0.44054388999938965, 0.45037221908569336, 0.46020054817199707, 0.4700288772583008, 0.4798572063446045, 0.4896855354309082, 0.4995138645172119, 0.5093421936035156, 0.5191705226898193]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 4.0, 5.0, 5.0, 9.0, 5.0, 12.0, 13.0, 13.0, 21.0, 22.0, 38.0, 41.0, 43.0, 64.0, 65.0, 101.0, 733272.0, 314337.0, 135.0, 67.0, 51.0, 39.0, 40.0, 35.0, 31.0, 23.0, 13.0, 7.0, 12.0, 9.0, 5.0, 2.0, 2.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.57958984375, -0.563018798828125, -0.54644775390625, -0.529876708984375, -0.5133056640625, -0.496734619140625, -0.48016357421875, -0.463592529296875, -0.447021484375, -0.430450439453125, -0.41387939453125, -0.397308349609375, -0.3807373046875, -0.364166259765625, -0.34759521484375, -0.331024169921875, -0.314453125, -0.297882080078125, -0.28131103515625, -0.264739990234375, -0.2481689453125, -0.231597900390625, -0.21502685546875, -0.198455810546875, -0.181884765625, -0.165313720703125, -0.14874267578125, -0.132171630859375, -0.1156005859375, -0.099029541015625, -0.08245849609375, -0.065887451171875, -0.04931640625, -0.032745361328125, -0.01617431640625, 0.000396728515625, 0.0169677734375, 0.033538818359375, 0.05010986328125, 0.066680908203125, 0.083251953125, 0.099822998046875, 0.11639404296875, 0.132965087890625, 0.1495361328125, 0.166107177734375, 0.18267822265625, 0.199249267578125, 0.2158203125, 0.232391357421875, 0.24896240234375, 0.265533447265625, 0.2821044921875, 0.298675537109375, 0.31524658203125, 0.331817626953125, 0.348388671875, 0.364959716796875, 0.38153076171875, 0.398101806640625, 0.4146728515625, 0.431243896484375, 0.44781494140625, 0.464385986328125, 0.48095703125]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 13.0, 93.0, 337.0, 399.0, 152.0, 20.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004711151123046875, -0.004057705402374268, -0.00340425968170166, -0.0027508139610290527, -0.0020973682403564453, -0.0014439225196838379, -0.0007904767990112305, -0.00013703107833862305, 0.0005164146423339844, 0.0011698603630065918, 0.0018233060836791992, 0.0024767518043518066, 0.003130197525024414, 0.0037836432456970215, 0.004437088966369629, 0.005090534687042236, 0.005743980407714844, 0.006397426128387451, 0.007050871849060059, 0.007704317569732666, 0.008357763290405273, 0.00901120901107788, 0.009664654731750488, 0.010318100452423096, 0.010971546173095703, 0.01162499189376831, 0.012278437614440918, 0.012931883335113525, 0.013585329055786133, 0.01423877477645874, 0.014892220497131348, 0.015545666217803955, 0.016199111938476562, 0.01685255765914917, 0.017506003379821777, 0.018159449100494385, 0.018812894821166992, 0.0194663405418396, 0.020119786262512207, 0.020773231983184814, 0.021426677703857422, 0.02208012342453003, 0.022733569145202637, 0.023387014865875244, 0.02404046058654785, 0.02469390630722046, 0.025347352027893066, 0.026000797748565674, 0.02665424346923828, 0.02730768918991089, 0.027961134910583496, 0.028614580631256104, 0.02926802635192871, 0.02992147207260132, 0.030574917793273926, 0.031228363513946533, 0.03188180923461914, 0.03253525495529175, 0.033188700675964355, 0.03384214639663696, 0.03449559211730957, 0.03514903783798218, 0.035802483558654785, 0.03645592927932739, 0.037109375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 5.0, 5.0, 6.0, 5.0, 5.0, 6.0, 15.0, 15.0, 18.0, 20.0, 33.0, 45.0, 70.0, 111.0, 188.0, 419.0, 1019.0, 3313.0, 15866.0, 148859.0, 781412.0, 81985.0, 10857.0, 2615.0, 834.0, 334.0, 172.0, 107.0, 52.0, 46.0, 30.0, 23.0, 13.0, 13.0, 8.0, 9.0, 4.0, 4.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.132080078125, -0.12800216674804688, -0.12392425537109375, -0.11984634399414062, -0.1157684326171875, -0.11169052124023438, -0.10761260986328125, -0.10353469848632812, -0.099456787109375, -0.09537887573242188, -0.09130096435546875, -0.08722305297851562, -0.0831451416015625, -0.07906723022460938, -0.07498931884765625, -0.07091140747070312, -0.06683349609375, -0.06275558471679688, -0.05867767333984375, -0.054599761962890625, -0.0505218505859375, -0.046443939208984375, -0.04236602783203125, -0.038288116455078125, -0.034210205078125, -0.030132293701171875, -0.02605438232421875, -0.021976470947265625, -0.0178985595703125, -0.013820648193359375, -0.00974273681640625, -0.005664825439453125, -0.0015869140625, 0.002490997314453125, 0.00656890869140625, 0.010646820068359375, 0.0147247314453125, 0.018802642822265625, 0.02288055419921875, 0.026958465576171875, 0.031036376953125, 0.035114288330078125, 0.03919219970703125, 0.043270111083984375, 0.0473480224609375, 0.051425933837890625, 0.05550384521484375, 0.059581756591796875, 0.06365966796875, 0.06773757934570312, 0.07181549072265625, 0.07589340209960938, 0.0799713134765625, 0.08404922485351562, 0.08812713623046875, 0.09220504760742188, 0.096282958984375, 0.10036087036132812, 0.10443878173828125, 0.10851669311523438, 0.1125946044921875, 0.11667251586914062, 0.12075042724609375, 0.12482833862304688, 0.12890625]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 5.0, 3.0, 3.0, 7.0, 7.0, 6.0, 12.0, 17.0, 12.0, 19.0, 26.0, 36.0, 36.0, 44.0, 46.0, 56.0, 57.0, 56.0, 62.0, 66.0, 75.0, 58.0, 49.0, 42.0, 35.0, 27.0, 29.0, 25.0, 21.0, 21.0, 7.0, 9.0, 8.0, 5.0, 1.0, 7.0, 5.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0318603515625, -0.03075122833251953, -0.029642105102539062, -0.028532981872558594, -0.027423858642578125, -0.026314735412597656, -0.025205612182617188, -0.02409648895263672, -0.02298736572265625, -0.02187824249267578, -0.020769119262695312, -0.019659996032714844, -0.018550872802734375, -0.017441749572753906, -0.016332626342773438, -0.015223503112792969, -0.0141143798828125, -0.013005256652832031, -0.011896133422851562, -0.010787010192871094, -0.009677886962890625, -0.008568763732910156, -0.0074596405029296875, -0.006350517272949219, -0.00524139404296875, -0.004132270812988281, -0.0030231475830078125, -0.0019140243530273438, -0.000804901123046875, 0.00030422210693359375, 0.0014133453369140625, 0.0025224685668945312, 0.003631591796875, 0.004740715026855469, 0.0058498382568359375, 0.006958961486816406, 0.008068084716796875, 0.009177207946777344, 0.010286331176757812, 0.011395454406738281, 0.01250457763671875, 0.013613700866699219, 0.014722824096679688, 0.015831947326660156, 0.016941070556640625, 0.018050193786621094, 0.019159317016601562, 0.02026844024658203, 0.0213775634765625, 0.02248668670654297, 0.023595809936523438, 0.024704933166503906, 0.025814056396484375, 0.026923179626464844, 0.028032302856445312, 0.02914142608642578, 0.03025054931640625, 0.03135967254638672, 0.03246879577636719, 0.033577919006347656, 0.034687042236328125, 0.035796165466308594, 0.03690528869628906, 0.03801441192626953, 0.03912353515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 4.0, 10.0, 12.0, 17.0, 27.0, 35.0, 60.0, 118.0, 294.0, 844.0, 4709.0, 712970.0, 324071.0, 4074.0, 769.0, 235.0, 107.0, 66.0, 38.0, 25.0, 15.0, 7.0, 10.0, 4.0, 4.0, 4.0, 1.0, 6.0, 1.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39599609375, -0.38232421875, -0.36865234375, -0.35498046875, -0.34130859375, -0.32763671875, -0.31396484375, -0.30029296875, -0.28662109375, -0.27294921875, -0.25927734375, -0.24560546875, -0.23193359375, -0.21826171875, -0.20458984375, -0.19091796875, -0.17724609375, -0.16357421875, -0.14990234375, -0.13623046875, -0.12255859375, -0.10888671875, -0.09521484375, -0.08154296875, -0.06787109375, -0.05419921875, -0.04052734375, -0.02685546875, -0.01318359375, 0.00048828125, 0.01416015625, 0.02783203125, 0.04150390625, 0.05517578125, 0.06884765625, 0.08251953125, 0.09619140625, 0.10986328125, 0.12353515625, 0.13720703125, 0.15087890625, 0.16455078125, 0.17822265625, 0.19189453125, 0.20556640625, 0.21923828125, 0.23291015625, 0.24658203125, 0.26025390625, 0.27392578125, 0.28759765625, 0.30126953125, 0.31494140625, 0.32861328125, 0.34228515625, 0.35595703125, 0.36962890625, 0.38330078125, 0.39697265625, 0.41064453125, 0.42431640625, 0.43798828125, 0.45166015625, 0.46533203125, 0.47900390625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 16.0, 41.0, 161.0, 412.0, 245.0, 69.0, 17.0, 7.0, 5.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.657838821411133e-05, -6.471201777458191e-05, -6.284564733505249e-05, -6.097927689552307e-05, -5.911290645599365e-05, -5.7246536016464233e-05, -5.5380165576934814e-05, -5.3513795137405396e-05, -5.1647424697875977e-05, -4.978105425834656e-05, -4.791468381881714e-05, -4.604831337928772e-05, -4.41819429397583e-05, -4.231557250022888e-05, -4.044920206069946e-05, -3.8582831621170044e-05, -3.6716461181640625e-05, -3.4850090742111206e-05, -3.298372030258179e-05, -3.111734986305237e-05, -2.925097942352295e-05, -2.738460898399353e-05, -2.551823854446411e-05, -2.3651868104934692e-05, -2.1785497665405273e-05, -1.9919127225875854e-05, -1.8052756786346436e-05, -1.6186386346817017e-05, -1.4320015907287598e-05, -1.2453645467758179e-05, -1.058727502822876e-05, -8.72090458869934e-06, -6.854534149169922e-06, -4.988163709640503e-06, -3.121793270111084e-06, -1.255422830581665e-06, 6.109476089477539e-07, 2.477318048477173e-06, 4.343688488006592e-06, 6.210058927536011e-06, 8.07642936706543e-06, 9.942799806594849e-06, 1.1809170246124268e-05, 1.3675540685653687e-05, 1.5541911125183105e-05, 1.7408281564712524e-05, 1.9274652004241943e-05, 2.1141022443771362e-05, 2.300739288330078e-05, 2.48737633228302e-05, 2.674013376235962e-05, 2.8606504201889038e-05, 3.0472874641418457e-05, 3.2339245080947876e-05, 3.4205615520477295e-05, 3.6071985960006714e-05, 3.793835639953613e-05, 3.980472683906555e-05, 4.167109727859497e-05, 4.353746771812439e-05, 4.540383815765381e-05, 4.727020859718323e-05, 4.9136579036712646e-05, 5.1002949476242065e-05, 5.2869319915771484e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 5.0, 6.0, 6.0, 8.0, 8.0, 14.0, 25.0, 36.0, 108.0, 273.0, 1514.0, 362982.0, 681655.0, 1455.0, 259.0, 96.0, 29.0, 23.0, 18.0, 7.0, 9.0, 7.0, 3.0, 2.0, 1.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.734375, -1.67657470703125, -1.6187744140625, -1.56097412109375, -1.503173828125, -1.44537353515625, -1.3875732421875, -1.32977294921875, -1.27197265625, -1.21417236328125, -1.1563720703125, -1.09857177734375, -1.040771484375, -0.98297119140625, -0.9251708984375, -0.86737060546875, -0.8095703125, -0.75177001953125, -0.6939697265625, -0.63616943359375, -0.578369140625, -0.52056884765625, -0.4627685546875, -0.40496826171875, -0.34716796875, -0.28936767578125, -0.2315673828125, -0.17376708984375, -0.115966796875, -0.05816650390625, -0.0003662109375, 0.05743408203125, 0.115234375, 0.17303466796875, 0.2308349609375, 0.28863525390625, 0.346435546875, 0.40423583984375, 0.4620361328125, 0.51983642578125, 0.57763671875, 0.63543701171875, 0.6932373046875, 0.75103759765625, 0.808837890625, 0.86663818359375, 0.9244384765625, 0.98223876953125, 1.0400390625, 1.09783935546875, 1.1556396484375, 1.21343994140625, 1.271240234375, 1.32904052734375, 1.3868408203125, 1.44464111328125, 1.50244140625, 1.56024169921875, 1.6180419921875, 1.67584228515625, 1.733642578125, 1.79144287109375, 1.8492431640625, 1.90704345703125, 1.96484375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 5.0, 3.0, 5.0, 8.0, 43.0, 414.0, 435.0, 39.0, 18.0, 9.0, 6.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.66748046875, -0.6516036987304688, -0.6357269287109375, -0.6198501586914062, -0.603973388671875, -0.5880966186523438, -0.5722198486328125, -0.5563430786132812, -0.54046630859375, -0.5245895385742188, -0.5087127685546875, -0.49283599853515625, -0.476959228515625, -0.46108245849609375, -0.4452056884765625, -0.42932891845703125, -0.4134521484375, -0.39757537841796875, -0.3816986083984375, -0.36582183837890625, -0.349945068359375, -0.33406829833984375, -0.3181915283203125, -0.30231475830078125, -0.28643798828125, -0.27056121826171875, -0.2546844482421875, -0.23880767822265625, -0.222930908203125, -0.20705413818359375, -0.1911773681640625, -0.17530059814453125, -0.159423828125, -0.14354705810546875, -0.1276702880859375, -0.11179351806640625, -0.095916748046875, -0.08003997802734375, -0.0641632080078125, -0.04828643798828125, -0.03240966796875, -0.01653289794921875, -0.0006561279296875, 0.01522064208984375, 0.031097412109375, 0.04697418212890625, 0.0628509521484375, 0.07872772216796875, 0.0946044921875, 0.11048126220703125, 0.1263580322265625, 0.14223480224609375, 0.158111572265625, 0.17398834228515625, 0.1898651123046875, 0.20574188232421875, 0.22161865234375, 0.23749542236328125, 0.2533721923828125, 0.26924896240234375, 0.285125732421875, 0.30100250244140625, 0.3168792724609375, 0.33275604248046875, 0.3486328125]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 266.0, 728.0, 15.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.218753814697266, -9.009576797485352, -8.800399780273438, -8.59122371673584, -8.382046699523926, -8.172869682312012, -7.963692665100098, -7.754515647888184, -7.545339107513428, -7.336162090301514, -7.126985549926758, -6.917808532714844, -6.70863151550293, -6.499454975128174, -6.29027795791626, -6.081101417541504, -5.87192440032959, -5.662747383117676, -5.45357084274292, -5.244393825531006, -5.03521728515625, -4.826040267944336, -4.616863250732422, -4.407686233520508, -4.198509693145752, -3.989332914352417, -3.780156135559082, -3.570979118347168, -3.361802339553833, -3.152625560760498, -2.943448543548584, -2.734271764755249, -2.525094985961914, -2.315918207168579, -2.106741428375244, -1.89756441116333, -1.6883876323699951, -1.4792108535766602, -1.2700339555740356, -1.0608570575714111, -0.8516802787780762, -0.6425034403800964, -0.4333266019821167, -0.22414976358413696, -0.014972925186157227, 0.19420385360717773, 0.40338075160980225, 0.6125576496124268, 0.8217344284057617, 1.0309112071990967, 1.2400881052017212, 1.4492650032043457, 1.6584417819976807, 1.8676185607910156, 2.0767955780029297, 2.2859723567962646, 2.4951491355895996, 2.7043259143829346, 2.9135026931762695, 3.1226797103881836, 3.3318564891815186, 3.5410332679748535, 3.7502102851867676, 3.9593870639801025, 4.1685638427734375]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [2.0, 11.0, 19.0, 46.0, 96.0, 170.0, 175.0, 194.0, 150.0, 91.0, 40.0, 20.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21443456411361694, -0.16775739192962646, -0.12108021229505539, -0.07440303266048431, -0.027725860476493835, 0.018951311707496643, 0.06562849879264832, 0.1123056709766388, 0.15898284316062927, 0.20566001534461975, 0.25233718752861023, 0.2990143895149231, 0.3456915616989136, 0.39236873388290405, 0.43904590606689453, 0.485723078250885, 0.5324002504348755, 0.579077422618866, 0.6257545948028564, 0.6724317669868469, 0.7191089391708374, 0.7657861113548279, 0.8124632835388184, 0.8591405153274536, 0.9058176279067993, 0.9524948000907898, 0.9991719722747803, 1.0458492040634155, 1.0925263166427612, 1.1392035484313965, 1.1858806610107422, 1.2325578927993774, 1.2792350053787231, 1.3259122371673584, 1.372589349746704, 1.4192665815353394, 1.465943694114685, 1.5126209259033203, 1.559298038482666, 1.6059752702713013, 1.652652382850647, 1.6993296146392822, 1.746006727218628, 1.7926839590072632, 1.8393610715866089, 1.8860383033752441, 1.9327154159545898, 1.979392647743225, 2.0260698795318604, 2.072746992111206, 2.119424343109131, 2.1661014556884766, 2.2127785682678223, 2.259455680847168, 2.3061330318450928, 2.3528101444244385, 2.399487257003784, 2.44616436958313, 2.4928417205810547, 2.5395188331604004, 2.586195945739746, 2.632873058319092, 2.6795504093170166, 2.7262275218963623, 2.772904634475708]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 8.0, 12.0, 25.0, 61.0, 114.0, 219.0, 692.0, 21295.0, 4170898.0, 671.0, 135.0, 44.0, 30.0, 18.0, 16.0, 13.0, 6.0, 12.0, 4.0, 4.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.275390625, -1.2444229125976562, -1.2134552001953125, -1.1824874877929688, -1.151519775390625, -1.1205520629882812, -1.0895843505859375, -1.0586166381835938, -1.02764892578125, -0.9966812133789062, -0.9657135009765625, -0.9347457885742188, -0.903778076171875, -0.8728103637695312, -0.8418426513671875, -0.8108749389648438, -0.7799072265625, -0.7489395141601562, -0.7179718017578125, -0.6870040893554688, -0.656036376953125, -0.6250686645507812, -0.5941009521484375, -0.5631332397460938, -0.53216552734375, -0.5011978149414062, -0.4702301025390625, -0.43926239013671875, -0.408294677734375, -0.37732696533203125, -0.3463592529296875, -0.31539154052734375, -0.284423828125, -0.25345611572265625, -0.2224884033203125, -0.19152069091796875, -0.160552978515625, -0.12958526611328125, -0.0986175537109375, -0.06764984130859375, -0.03668212890625, -0.00571441650390625, 0.0252532958984375, 0.05622100830078125, 0.087188720703125, 0.11815643310546875, 0.1491241455078125, 0.18009185791015625, 0.2110595703125, 0.24202728271484375, 0.2729949951171875, 0.30396270751953125, 0.334930419921875, 0.36589813232421875, 0.3968658447265625, 0.42783355712890625, 0.45880126953125, 0.48976898193359375, 0.5207366943359375, 0.5517044067382812, 0.582672119140625, 0.6136398315429688, 0.6446075439453125, 0.6755752563476562, 0.70654296875]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 12.0, 27.0, 92.0, 181.0, 243.0, 219.0, 150.0, 59.0, 19.0, 5.0, 7.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006366729736328125, -0.005647838115692139, -0.004928946495056152, -0.004210054874420166, -0.0034911632537841797, -0.0027722716331481934, -0.002053380012512207, -0.0013344883918762207, -0.0006155967712402344, 0.00010329484939575195, 0.0008221864700317383, 0.0015410780906677246, 0.002259969711303711, 0.0029788613319396973, 0.0036977529525756836, 0.00441664457321167, 0.005135536193847656, 0.005854427814483643, 0.006573319435119629, 0.007292211055755615, 0.008011102676391602, 0.008729994297027588, 0.009448885917663574, 0.01016777753829956, 0.010886669158935547, 0.011605560779571533, 0.01232445240020752, 0.013043344020843506, 0.013762235641479492, 0.014481127262115479, 0.015200018882751465, 0.01591891050338745, 0.016637802124023438, 0.017356693744659424, 0.01807558536529541, 0.018794476985931396, 0.019513368606567383, 0.02023226022720337, 0.020951151847839355, 0.021670043468475342, 0.022388935089111328, 0.023107826709747314, 0.0238267183303833, 0.024545609951019287, 0.025264501571655273, 0.02598339319229126, 0.026702284812927246, 0.027421176433563232, 0.02814006805419922, 0.028858959674835205, 0.02957785129547119, 0.030296742916107178, 0.031015634536743164, 0.03173452615737915, 0.03245341777801514, 0.03317230939865112, 0.03389120101928711, 0.034610092639923096, 0.03532898426055908, 0.03604787588119507, 0.036766767501831055, 0.03748565912246704, 0.03820455074310303, 0.038923442363739014, 0.039642333984375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 16.0, 38.0, 93.0, 196.0, 396.0, 5271.0, 4187249.0, 640.0, 210.0, 98.0, 44.0, 14.0, 6.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.44140625, -4.336151123046875, -4.23089599609375, -4.125640869140625, -4.0203857421875, -3.915130615234375, -3.80987548828125, -3.704620361328125, -3.599365234375, -3.494110107421875, -3.38885498046875, -3.283599853515625, -3.1783447265625, -3.073089599609375, -2.96783447265625, -2.862579345703125, -2.75732421875, -2.652069091796875, -2.54681396484375, -2.441558837890625, -2.3363037109375, -2.231048583984375, -2.12579345703125, -2.020538330078125, -1.915283203125, -1.810028076171875, -1.70477294921875, -1.599517822265625, -1.4942626953125, -1.389007568359375, -1.28375244140625, -1.178497314453125, -1.0732421875, -0.967987060546875, -0.86273193359375, -0.757476806640625, -0.6522216796875, -0.546966552734375, -0.44171142578125, -0.336456298828125, -0.231201171875, -0.125946044921875, -0.02069091796875, 0.084564208984375, 0.1898193359375, 0.295074462890625, 0.40032958984375, 0.505584716796875, 0.61083984375, 0.716094970703125, 0.82135009765625, 0.926605224609375, 1.0318603515625, 1.137115478515625, 1.24237060546875, 1.347625732421875, 1.452880859375, 1.558135986328125, 1.66339111328125, 1.768646240234375, 1.8739013671875, 1.979156494140625, 2.08441162109375, 2.189666748046875, 2.294921875]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 10.0, 33.0, 175.0, 3500.0, 281.0, 55.0, 21.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.329833984375, -0.3234386444091797, -0.3170433044433594, -0.31064796447753906, -0.30425262451171875, -0.29785728454589844, -0.2914619445800781, -0.2850666046142578, -0.2786712646484375, -0.2722759246826172, -0.2658805847167969, -0.25948524475097656, -0.25308990478515625, -0.24669456481933594, -0.24029922485351562, -0.2339038848876953, -0.227508544921875, -0.2211132049560547, -0.21471786499023438, -0.20832252502441406, -0.20192718505859375, -0.19553184509277344, -0.18913650512695312, -0.1827411651611328, -0.1763458251953125, -0.1699504852294922, -0.16355514526367188, -0.15715980529785156, -0.15076446533203125, -0.14436912536621094, -0.13797378540039062, -0.1315784454345703, -0.12518310546875, -0.11878776550292969, -0.11239242553710938, -0.10599708557128906, -0.09960174560546875, -0.09320640563964844, -0.08681106567382812, -0.08041572570800781, -0.0740203857421875, -0.06762504577636719, -0.061229705810546875, -0.05483436584472656, -0.04843902587890625, -0.04204368591308594, -0.035648345947265625, -0.029253005981445312, -0.022857666015625, -0.016462326049804688, -0.010066986083984375, -0.0036716461181640625, 0.00272369384765625, 0.009119033813476562, 0.015514373779296875, 0.021909713745117188, 0.0283050537109375, 0.03470039367675781, 0.041095733642578125, 0.04749107360839844, 0.05388641357421875, 0.06028175354003906, 0.06667709350585938, 0.07307243347167969, 0.0794677734375]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 15.0, 484.0, 492.0, 16.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.230857849121094, -6.075089454650879, -5.919321537017822, -5.763553142547607, -5.607785224914551, -5.452016830444336, -5.296248435974121, -5.1404805183410645, -4.98471212387085, -4.828943729400635, -4.673175811767578, -4.517407417297363, -4.361639499664307, -4.205871105194092, -4.050103187561035, -3.8943347930908203, -3.7385666370391846, -3.582798480987549, -3.427030324935913, -3.2712621688842773, -3.1154937744140625, -2.9597256183624268, -2.803957462310791, -2.648189067840576, -2.4924211502075195, -2.336652994155884, -2.180884838104248, -2.025116443634033, -1.8693482875823975, -1.7135801315307617, -1.557811975479126, -1.4020437002182007, -1.2462756633758545, -1.0905075073242188, -0.9347392320632935, -0.7789710760116577, -0.6232028603553772, -0.4674346446990967, -0.31166648864746094, -0.15589821338653564, -0.00013005733489990234, 0.15563814342021942, 0.31140634417533875, 0.4671745300292969, 0.6229427456855774, 0.7787109613418579, 0.9344791173934937, 1.090247392654419, 1.2460155487060547, 1.4017837047576904, 1.5575519800186157, 1.7133201360702515, 1.8690884113311768, 2.0248565673828125, 2.1806247234344482, 2.336392879486084, 2.492161273956299, 2.6479294300079346, 2.8036975860595703, 2.959465980529785, 3.115234136581421, 3.2710022926330566, 3.4267704486846924, 3.582538604736328, 3.738306760787964]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 5.0, 8.0, 12.0, 37.0, 46.0, 85.0, 111.0, 131.0, 131.0, 141.0, 96.0, 79.0, 58.0, 34.0, 13.0, 7.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5178771615028381, -0.5001544952392578, -0.4824318289756775, -0.4647091329097748, -0.44698646664619446, -0.42926380038261414, -0.4115411043167114, -0.3938184380531311, -0.3760957717895508, -0.35837310552597046, -0.34065043926239014, -0.3229277431964874, -0.3052050769329071, -0.2874824106693268, -0.2697597146034241, -0.25203704833984375, -0.23431438207626343, -0.2165917158126831, -0.1988690346479416, -0.18114635348320007, -0.16342368721961975, -0.14570102095603943, -0.1279783397912979, -0.110255666077137, -0.09253299236297607, -0.07481031864881516, -0.057087644934654236, -0.03936497122049332, -0.021642297506332397, -0.003919623792171478, 0.013803049921989441, 0.03152572363615036, 0.049248456954956055, 0.06697113066911697, 0.0846938043832779, 0.10241647809743881, 0.12013915181159973, 0.13786181807518005, 0.15558449923992157, 0.17330718040466309, 0.1910298466682434, 0.20875251293182373, 0.22647519409656525, 0.24419787526130676, 0.2619205415248871, 0.2796432077884674, 0.2973659038543701, 0.31508857011795044, 0.33281123638153076, 0.3505339026451111, 0.3682565689086914, 0.3859792649745941, 0.40370193123817444, 0.42142459750175476, 0.43914729356765747, 0.4568699598312378, 0.4745926260948181, 0.49231529235839844, 0.5100379586219788, 0.5277606248855591, 0.5454833507537842, 0.5632060170173645, 0.5809286832809448, 0.5986513495445251, 0.6163740158081055]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 8.0, 6.0, 6.0, 10.0, 9.0, 16.0, 23.0, 23.0, 32.0, 63.0, 101.0, 148.0, 271.0, 680.0, 2331.0, 17434.0, 741059.0, 273256.0, 10044.0, 1794.0, 551.0, 264.0, 136.0, 81.0, 59.0, 37.0, 26.0, 19.0, 20.0, 12.0, 5.0, 7.0, 9.0, 5.0, 2.0, 1.0, 2.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.55029296875, -0.5330352783203125, -0.515777587890625, -0.4985198974609375, -0.48126220703125, -0.4640045166015625, -0.446746826171875, -0.4294891357421875, -0.4122314453125, -0.3949737548828125, -0.377716064453125, -0.3604583740234375, -0.34320068359375, -0.3259429931640625, -0.308685302734375, -0.2914276123046875, -0.274169921875, -0.2569122314453125, -0.239654541015625, -0.2223968505859375, -0.20513916015625, -0.1878814697265625, -0.170623779296875, -0.1533660888671875, -0.1361083984375, -0.1188507080078125, -0.101593017578125, -0.0843353271484375, -0.06707763671875, -0.0498199462890625, -0.032562255859375, -0.0153045654296875, 0.001953125, 0.0192108154296875, 0.036468505859375, 0.0537261962890625, 0.07098388671875, 0.0882415771484375, 0.105499267578125, 0.1227569580078125, 0.1400146484375, 0.1572723388671875, 0.174530029296875, 0.1917877197265625, 0.20904541015625, 0.2263031005859375, 0.243560791015625, 0.2608184814453125, 0.278076171875, 0.2953338623046875, 0.312591552734375, 0.3298492431640625, 0.34710693359375, 0.3643646240234375, 0.381622314453125, 0.3988800048828125, 0.4161376953125, 0.4333953857421875, 0.450653076171875, 0.4679107666015625, 0.48516845703125, 0.5024261474609375, 0.519683837890625, 0.5369415283203125, 0.55419921875]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 11.0, 11.0, 28.0, 24.0, 40.0, 61.0, 94.0, 113.0, 129.0, 105.0, 100.0, 90.0, 60.0, 44.0, 40.0, 29.0, 12.0, 4.0, 0.0, 3.0, 4.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03485107421875, -0.03368806838989258, -0.032525062561035156, -0.031362056732177734, -0.030199050903320312, -0.02903604507446289, -0.02787303924560547, -0.026710033416748047, -0.025547027587890625, -0.024384021759033203, -0.02322101593017578, -0.02205801010131836, -0.020895004272460938, -0.019731998443603516, -0.018568992614746094, -0.017405986785888672, -0.01624298095703125, -0.015079975128173828, -0.013916969299316406, -0.012753963470458984, -0.011590957641601562, -0.01042795181274414, -0.009264945983886719, -0.008101940155029297, -0.006938934326171875, -0.005775928497314453, -0.004612922668457031, -0.0034499168395996094, -0.0022869110107421875, -0.0011239051818847656, 3.910064697265625e-05, 0.0012021064758300781, 0.0023651123046875, 0.003528118133544922, 0.004691123962402344, 0.005854129791259766, 0.0070171356201171875, 0.00818014144897461, 0.009343147277832031, 0.010506153106689453, 0.011669158935546875, 0.012832164764404297, 0.013995170593261719, 0.01515817642211914, 0.016321182250976562, 0.017484188079833984, 0.018647193908691406, 0.019810199737548828, 0.02097320556640625, 0.022136211395263672, 0.023299217224121094, 0.024462223052978516, 0.025625228881835938, 0.02678823471069336, 0.02795124053955078, 0.029114246368408203, 0.030277252197265625, 0.03144025802612305, 0.03260326385498047, 0.03376626968383789, 0.03492927551269531, 0.036092281341552734, 0.037255287170410156, 0.03841829299926758, 0.039581298828125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 0.0, 0.0, 0.0, 1.0, 7.0, 3.0, 2.0, 9.0, 9.0, 13.0, 14.0, 13.0, 21.0, 45.0, 45.0, 61.0, 109.0, 158.0, 304.0, 615.0, 1484.0, 5785.0, 55555.0, 834541.0, 136358.0, 9722.0, 2002.0, 749.0, 340.0, 199.0, 118.0, 69.0, 49.0, 56.0, 18.0, 25.0, 28.0, 9.0, 2.0, 5.0, 2.0, 4.0, 6.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.275390625, -0.26720428466796875, -0.2590179443359375, -0.25083160400390625, -0.242645263671875, -0.23445892333984375, -0.2262725830078125, -0.21808624267578125, -0.20989990234375, -0.20171356201171875, -0.1935272216796875, -0.18534088134765625, -0.177154541015625, -0.16896820068359375, -0.1607818603515625, -0.15259552001953125, -0.1444091796875, -0.13622283935546875, -0.1280364990234375, -0.11985015869140625, -0.111663818359375, -0.10347747802734375, -0.0952911376953125, -0.08710479736328125, -0.07891845703125, -0.07073211669921875, -0.0625457763671875, -0.05435943603515625, -0.046173095703125, -0.03798675537109375, -0.0298004150390625, -0.02161407470703125, -0.013427734375, -0.00524139404296875, 0.0029449462890625, 0.01113128662109375, 0.019317626953125, 0.02750396728515625, 0.0356903076171875, 0.04387664794921875, 0.05206298828125, 0.06024932861328125, 0.0684356689453125, 0.07662200927734375, 0.084808349609375, 0.09299468994140625, 0.1011810302734375, 0.10936737060546875, 0.1175537109375, 0.12574005126953125, 0.1339263916015625, 0.14211273193359375, 0.150299072265625, 0.15848541259765625, 0.1666717529296875, 0.17485809326171875, 0.18304443359375, 0.19123077392578125, 0.1994171142578125, 0.20760345458984375, 0.215789794921875, 0.22397613525390625, 0.2321624755859375, 0.24034881591796875, 0.24853515625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 3.0, 5.0, 8.0, 8.0, 9.0, 14.0, 12.0, 25.0, 22.0, 32.0, 38.0, 25.0, 51.0, 61.0, 55.0, 46.0, 45.0, 41.0, 55.0, 64.0, 49.0, 43.0, 48.0, 34.0, 40.0, 25.0, 30.0, 21.0, 19.0, 12.0, 23.0, 10.0, 5.0, 4.0, 5.0, 4.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.09014892578125, -0.0874776840209961, -0.08480644226074219, -0.08213520050048828, -0.07946395874023438, -0.07679271697998047, -0.07412147521972656, -0.07145023345947266, -0.06877899169921875, -0.06610774993896484, -0.06343650817871094, -0.06076526641845703, -0.058094024658203125, -0.05542278289794922, -0.05275154113769531, -0.050080299377441406, -0.0474090576171875, -0.044737815856933594, -0.04206657409667969, -0.03939533233642578, -0.036724090576171875, -0.03405284881591797, -0.03138160705566406, -0.028710365295410156, -0.02603912353515625, -0.023367881774902344, -0.020696640014648438, -0.01802539825439453, -0.015354156494140625, -0.012682914733886719, -0.010011672973632812, -0.007340431213378906, -0.004669189453125, -0.0019979476928710938, 0.0006732940673828125, 0.0033445358276367188, 0.006015777587890625, 0.008687019348144531, 0.011358261108398438, 0.014029502868652344, 0.01670074462890625, 0.019371986389160156, 0.022043228149414062, 0.02471446990966797, 0.027385711669921875, 0.03005695343017578, 0.03272819519042969, 0.035399436950683594, 0.0380706787109375, 0.040741920471191406, 0.04341316223144531, 0.04608440399169922, 0.048755645751953125, 0.05142688751220703, 0.05409812927246094, 0.056769371032714844, 0.05944061279296875, 0.062111854553222656, 0.06478309631347656, 0.06745433807373047, 0.07012557983398438, 0.07279682159423828, 0.07546806335449219, 0.0781393051147461, 0.080810546875]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 4.0, 2.0, 4.0, 4.0, 3.0, 6.0, 11.0, 9.0, 18.0, 13.0, 29.0, 44.0, 78.0, 138.0, 249.0, 491.0, 1144.0, 3573.0, 18404.0, 575708.0, 428326.0, 15058.0, 3065.0, 1084.0, 465.0, 280.0, 129.0, 75.0, 44.0, 33.0, 16.0, 17.0, 13.0, 6.0, 7.0, 4.0, 5.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18701171875, -0.18195152282714844, -0.17689132690429688, -0.1718311309814453, -0.16677093505859375, -0.1617107391357422, -0.15665054321289062, -0.15159034729003906, -0.1465301513671875, -0.14146995544433594, -0.13640975952148438, -0.1313495635986328, -0.12628936767578125, -0.12122917175292969, -0.11616897583007812, -0.11110877990722656, -0.106048583984375, -0.10098838806152344, -0.09592819213867188, -0.09086799621582031, -0.08580780029296875, -0.08074760437011719, -0.07568740844726562, -0.07062721252441406, -0.0655670166015625, -0.06050682067871094, -0.055446624755859375, -0.05038642883300781, -0.04532623291015625, -0.04026603698730469, -0.035205841064453125, -0.030145645141601562, -0.02508544921875, -0.020025253295898438, -0.014965057373046875, -0.009904861450195312, -0.00484466552734375, 0.0002155303955078125, 0.005275726318359375, 0.010335922241210938, 0.0153961181640625, 0.020456314086914062, 0.025516510009765625, 0.030576705932617188, 0.03563690185546875, 0.04069709777832031, 0.045757293701171875, 0.05081748962402344, 0.055877685546875, 0.06093788146972656, 0.06599807739257812, 0.07105827331542969, 0.07611846923828125, 0.08117866516113281, 0.08623886108398438, 0.09129905700683594, 0.0963592529296875, 0.10141944885253906, 0.10647964477539062, 0.11153984069824219, 0.11660003662109375, 0.12166023254394531, 0.12672042846679688, 0.13178062438964844, 0.1368408203125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 5.0, 4.0, 7.0, 6.0, 9.0, 30.0, 26.0, 25.0, 20.0, 36.0, 52.0, 59.0, 80.0, 91.0, 85.0, 91.0, 79.0, 63.0, 47.0, 39.0, 40.0, 22.0, 18.0, 16.0, 10.0, 13.0, 10.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.953975677490234e-06, -9.62521880865097e-06, -9.296461939811707e-06, -8.967705070972443e-06, -8.638948202133179e-06, -8.310191333293915e-06, -7.981434464454651e-06, -7.652677595615387e-06, -7.323920726776123e-06, -6.995163857936859e-06, -6.666406989097595e-06, -6.337650120258331e-06, -6.008893251419067e-06, -5.6801363825798035e-06, -5.3513795137405396e-06, -5.022622644901276e-06, -4.693865776062012e-06, -4.365108907222748e-06, -4.036352038383484e-06, -3.70759516954422e-06, -3.378838300704956e-06, -3.050081431865692e-06, -2.7213245630264282e-06, -2.3925676941871643e-06, -2.0638108253479004e-06, -1.7350539565086365e-06, -1.4062970876693726e-06, -1.0775402188301086e-06, -7.487833499908447e-07, -4.200264811515808e-07, -9.12696123123169e-08, 2.3748725652694702e-07, 5.662441253662109e-07, 8.950009942054749e-07, 1.2237578630447388e-06, 1.5525147318840027e-06, 1.8812716007232666e-06, 2.2100284695625305e-06, 2.5387853384017944e-06, 2.8675422072410583e-06, 3.1962990760803223e-06, 3.525055944919586e-06, 3.85381281375885e-06, 4.182569682598114e-06, 4.511326551437378e-06, 4.840083420276642e-06, 5.168840289115906e-06, 5.49759715795517e-06, 5.826354026794434e-06, 6.1551108956336975e-06, 6.4838677644729614e-06, 6.812624633312225e-06, 7.141381502151489e-06, 7.470138370990753e-06, 7.798895239830017e-06, 8.127652108669281e-06, 8.456408977508545e-06, 8.785165846347809e-06, 9.113922715187073e-06, 9.442679584026337e-06, 9.7714364528656e-06, 1.0100193321704865e-05, 1.0428950190544128e-05, 1.0757707059383392e-05, 1.1086463928222656e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 8.0, 9.0, 11.0, 26.0, 23.0, 27.0, 79.0, 102.0, 316.0, 791.0, 3860.0, 390129.0, 647294.0, 4455.0, 849.0, 284.0, 126.0, 59.0, 38.0, 22.0, 20.0, 11.0, 6.0, 6.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.38134765625, -0.37076568603515625, -0.3601837158203125, -0.34960174560546875, -0.339019775390625, -0.32843780517578125, -0.3178558349609375, -0.30727386474609375, -0.29669189453125, -0.28610992431640625, -0.2755279541015625, -0.26494598388671875, -0.254364013671875, -0.24378204345703125, -0.2332000732421875, -0.22261810302734375, -0.2120361328125, -0.20145416259765625, -0.1908721923828125, -0.18029022216796875, -0.169708251953125, -0.15912628173828125, -0.1485443115234375, -0.13796234130859375, -0.12738037109375, -0.11679840087890625, -0.1062164306640625, -0.09563446044921875, -0.085052490234375, -0.07447052001953125, -0.0638885498046875, -0.05330657958984375, -0.042724609375, -0.03214263916015625, -0.0215606689453125, -0.01097869873046875, -0.000396728515625, 0.01018524169921875, 0.0207672119140625, 0.03134918212890625, 0.04193115234375, 0.05251312255859375, 0.0630950927734375, 0.07367706298828125, 0.084259033203125, 0.09484100341796875, 0.1054229736328125, 0.11600494384765625, 0.1265869140625, 0.13716888427734375, 0.1477508544921875, 0.15833282470703125, 0.168914794921875, 0.17949676513671875, 0.1900787353515625, 0.20066070556640625, 0.21124267578125, 0.22182464599609375, 0.2324066162109375, 0.24298858642578125, 0.253570556640625, 0.26415252685546875, 0.2747344970703125, 0.28531646728515625, 0.2958984375]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 2.0, 8.0, 12.0, 8.0, 15.0, 15.0, 26.0, 37.0, 43.0, 65.0, 92.0, 118.0, 99.0, 100.0, 92.0, 78.0, 48.0, 44.0, 26.0, 19.0, 15.0, 9.0, 4.0, 9.0, 5.0, 4.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08978271484375, -0.08675289154052734, -0.08372306823730469, -0.08069324493408203, -0.07766342163085938, -0.07463359832763672, -0.07160377502441406, -0.0685739517211914, -0.06554412841796875, -0.0625143051147461, -0.05948448181152344, -0.05645465850830078, -0.053424835205078125, -0.05039501190185547, -0.04736518859863281, -0.044335365295410156, -0.0413055419921875, -0.038275718688964844, -0.03524589538574219, -0.03221607208251953, -0.029186248779296875, -0.02615642547607422, -0.023126602172851562, -0.020096778869628906, -0.01706695556640625, -0.014037132263183594, -0.011007308959960938, -0.007977485656738281, -0.004947662353515625, -0.0019178390502929688, 0.0011119842529296875, 0.004141807556152344, 0.007171630859375, 0.010201454162597656, 0.013231277465820312, 0.01626110076904297, 0.019290924072265625, 0.02232074737548828, 0.025350570678710938, 0.028380393981933594, 0.03141021728515625, 0.034440040588378906, 0.03746986389160156, 0.04049968719482422, 0.043529510498046875, 0.04655933380126953, 0.04958915710449219, 0.052618980407714844, 0.0556488037109375, 0.058678627014160156, 0.06170845031738281, 0.06473827362060547, 0.06776809692382812, 0.07079792022705078, 0.07382774353027344, 0.0768575668334961, 0.07988739013671875, 0.0829172134399414, 0.08594703674316406, 0.08897686004638672, 0.09200668334960938, 0.09503650665283203, 0.09806632995605469, 0.10109615325927734, 0.1041259765625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 13.0, 200.0, 694.0, 82.0, 15.0, 0.0, 5.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-6.193597316741943, -6.070174217224121, -5.946751594543457, -5.823328495025635, -5.699905872344971, -5.576482772827148, -5.453060150146484, -5.329637050628662, -5.20621395111084, -5.082790851593018, -4.9593682289123535, -4.835945129394531, -4.712522506713867, -4.589099407196045, -4.465676784515381, -4.342253684997559, -4.2188310623168945, -4.095407962799072, -3.971985340118408, -3.848562479019165, -3.725139617919922, -3.6017165184020996, -3.4782936573028564, -3.3548707962036133, -3.23144793510437, -3.108025074005127, -2.984602212905884, -2.8611793518066406, -2.7377562522888184, -2.6143336296081543, -2.490910530090332, -2.367487668991089, -2.244065046310425, -2.1206421852111816, -1.9972193241119385, -1.8737963438034058, -1.7503734827041626, -1.6269506216049194, -1.5035276412963867, -1.3801047801971436, -1.2566819190979004, -1.1332590579986572, -1.009836196899414, -0.8864132165908813, -0.7629903554916382, -0.639567494392395, -0.5161445736885071, -0.39272165298461914, -0.269298791885376, -0.14587590098381042, -0.022453010082244873, 0.10096988081932068, 0.22439277172088623, 0.3478156328201294, 0.47123855352401733, 0.5946614742279053, 0.7180843353271484, 0.8415071964263916, 0.9649301171302795, 1.0883530378341675, 1.2117758989334106, 1.3351987600326538, 1.4586217403411865, 1.5820446014404297, 1.7054674625396729]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 4.0, 7.0, 6.0, 6.0, 8.0, 12.0, 22.0, 23.0, 27.0, 49.0, 47.0, 47.0, 67.0, 74.0, 74.0, 71.0, 69.0, 67.0, 57.0, 37.0, 55.0, 32.0, 34.0, 23.0, 27.0, 21.0, 18.0, 10.0, 7.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8834232687950134, -0.8562690615653992, -0.8291148543357849, -0.8019606471061707, -0.7748064398765564, -0.7476522326469421, -0.7204980254173279, -0.6933438181877136, -0.6661896109580994, -0.6390354037284851, -0.6118811964988708, -0.5847269892692566, -0.5575727820396423, -0.5304185748100281, -0.5032643675804138, -0.47611016035079956, -0.4489559531211853, -0.42180174589157104, -0.3946475386619568, -0.36749333143234253, -0.34033912420272827, -0.313184916973114, -0.28603070974349976, -0.2588765025138855, -0.23172229528427124, -0.20456808805465698, -0.17741388082504272, -0.15025967359542847, -0.12310546636581421, -0.09595125913619995, -0.0687970519065857, -0.041642844676971436, -0.014488637447357178, 0.01266556978225708, 0.03981977701187134, 0.0669739842414856, 0.09412819147109985, 0.12128239870071411, 0.14843660593032837, 0.17559081315994263, 0.20274502038955688, 0.22989922761917114, 0.2570534348487854, 0.28420764207839966, 0.3113618493080139, 0.3385160565376282, 0.36567026376724243, 0.3928244709968567, 0.41997867822647095, 0.4471328854560852, 0.47428709268569946, 0.5014412999153137, 0.528595507144928, 0.5557497143745422, 0.5829039216041565, 0.6100581288337708, 0.637212336063385, 0.6643665432929993, 0.6915207505226135, 0.7186749577522278, 0.745829164981842, 0.7729833722114563, 0.8001375794410706, 0.8272917866706848, 0.8544459939002991]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 6.0, 6.0, 11.0, 11.0, 14.0, 21.0, 43.0, 55.0, 82.0, 143.0, 228.0, 607.0, 2037.0, 18551.0, 4040482.0, 127022.0, 4159.0, 564.0, 138.0, 46.0, 20.0, 5.0, 12.0, 3.0, 7.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.75537109375, -0.7322921752929688, -0.7092132568359375, -0.6861343383789062, -0.663055419921875, -0.6399765014648438, -0.6168975830078125, -0.5938186645507812, -0.57073974609375, -0.5476608276367188, -0.5245819091796875, -0.5015029907226562, -0.478424072265625, -0.45534515380859375, -0.4322662353515625, -0.40918731689453125, -0.3861083984375, -0.36302947998046875, -0.3399505615234375, -0.31687164306640625, -0.293792724609375, -0.27071380615234375, -0.2476348876953125, -0.22455596923828125, -0.20147705078125, -0.17839813232421875, -0.1553192138671875, -0.13224029541015625, -0.109161376953125, -0.08608245849609375, -0.0630035400390625, -0.03992462158203125, -0.016845703125, 0.00623321533203125, 0.0293121337890625, 0.05239105224609375, 0.075469970703125, 0.09854888916015625, 0.1216278076171875, 0.14470672607421875, 0.16778564453125, 0.19086456298828125, 0.2139434814453125, 0.23702239990234375, 0.260101318359375, 0.28318023681640625, 0.3062591552734375, 0.32933807373046875, 0.3524169921875, 0.37549591064453125, 0.3985748291015625, 0.42165374755859375, 0.444732666015625, 0.46781158447265625, 0.4908905029296875, 0.5139694213867188, 0.53704833984375, 0.5601272583007812, 0.5832061767578125, 0.6062850952148438, 0.629364013671875, 0.6524429321289062, 0.6755218505859375, 0.6986007690429688, 0.7216796875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 5.0, 6.0, 7.0, 11.0, 14.0, 23.0, 31.0, 35.0, 42.0, 61.0, 59.0, 73.0, 67.0, 91.0, 77.0, 86.0, 62.0, 56.0, 45.0, 40.0, 32.0, 23.0, 18.0, 11.0, 10.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.031829833984375, -0.030960559844970703, -0.030091285705566406, -0.02922201156616211, -0.028352737426757812, -0.027483463287353516, -0.02661418914794922, -0.025744915008544922, -0.024875640869140625, -0.024006366729736328, -0.02313709259033203, -0.022267818450927734, -0.021398544311523438, -0.02052927017211914, -0.019659996032714844, -0.018790721893310547, -0.01792144775390625, -0.017052173614501953, -0.016182899475097656, -0.01531362533569336, -0.014444351196289062, -0.013575077056884766, -0.012705802917480469, -0.011836528778076172, -0.010967254638671875, -0.010097980499267578, -0.009228706359863281, -0.008359432220458984, -0.0074901580810546875, -0.006620883941650391, -0.005751609802246094, -0.004882335662841797, -0.0040130615234375, -0.003143787384033203, -0.0022745132446289062, -0.0014052391052246094, -0.0005359649658203125, 0.0003333091735839844, 0.0012025833129882812, 0.002071857452392578, 0.002941131591796875, 0.003810405731201172, 0.004679679870605469, 0.005548954010009766, 0.0064182281494140625, 0.007287502288818359, 0.008156776428222656, 0.009026050567626953, 0.00989532470703125, 0.010764598846435547, 0.011633872985839844, 0.01250314712524414, 0.013372421264648438, 0.014241695404052734, 0.015110969543457031, 0.015980243682861328, 0.016849517822265625, 0.017718791961669922, 0.01858806610107422, 0.019457340240478516, 0.020326614379882812, 0.02119588851928711, 0.022065162658691406, 0.022934436798095703, 0.0238037109375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 2.0, 14.0, 28.0, 68.0, 255.0, 1755.0, 4189751.0, 2141.0, 187.0, 46.0, 19.0, 10.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.421875, -5.31024169921875, -5.1986083984375, -5.08697509765625, -4.975341796875, -4.86370849609375, -4.7520751953125, -4.64044189453125, -4.52880859375, -4.41717529296875, -4.3055419921875, -4.19390869140625, -4.082275390625, -3.97064208984375, -3.8590087890625, -3.74737548828125, -3.6357421875, -3.52410888671875, -3.4124755859375, -3.30084228515625, -3.189208984375, -3.07757568359375, -2.9659423828125, -2.85430908203125, -2.74267578125, -2.63104248046875, -2.5194091796875, -2.40777587890625, -2.296142578125, -2.18450927734375, -2.0728759765625, -1.96124267578125, -1.849609375, -1.73797607421875, -1.6263427734375, -1.51470947265625, -1.403076171875, -1.29144287109375, -1.1798095703125, -1.06817626953125, -0.95654296875, -0.84490966796875, -0.7332763671875, -0.62164306640625, -0.510009765625, -0.39837646484375, -0.2867431640625, -0.17510986328125, -0.0634765625, 0.04815673828125, 0.1597900390625, 0.27142333984375, 0.383056640625, 0.49468994140625, 0.6063232421875, 0.71795654296875, 0.82958984375, 0.94122314453125, 1.0528564453125, 1.16448974609375, 1.276123046875, 1.38775634765625, 1.4993896484375, 1.61102294921875, 1.72265625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 6.0, 20.0, 82.0, 988.0, 2804.0, 136.0, 24.0, 8.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46826171875, -0.4589195251464844, -0.44957733154296875, -0.4402351379394531, -0.4308929443359375, -0.4215507507324219, -0.41220855712890625, -0.4028663635253906, -0.393524169921875, -0.3841819763183594, -0.37483978271484375, -0.3654975891113281, -0.3561553955078125, -0.3468132019042969, -0.33747100830078125, -0.3281288146972656, -0.31878662109375, -0.3094444274902344, -0.30010223388671875, -0.2907600402832031, -0.2814178466796875, -0.2720756530761719, -0.26273345947265625, -0.2533912658691406, -0.244049072265625, -0.23470687866210938, -0.22536468505859375, -0.21602249145507812, -0.2066802978515625, -0.19733810424804688, -0.18799591064453125, -0.17865371704101562, -0.1693115234375, -0.15996932983398438, -0.15062713623046875, -0.14128494262695312, -0.1319427490234375, -0.12260055541992188, -0.11325836181640625, -0.10391616821289062, -0.094573974609375, -0.08523178100585938, -0.07588958740234375, -0.06654739379882812, -0.0572052001953125, -0.047863006591796875, -0.03852081298828125, -0.029178619384765625, -0.01983642578125, -0.010494232177734375, -0.00115203857421875, 0.008190155029296875, 0.0175323486328125, 0.026874542236328125, 0.03621673583984375, 0.045558929443359375, 0.054901123046875, 0.06424331665039062, 0.07358551025390625, 0.08292770385742188, 0.0922698974609375, 0.10161209106445312, 0.11095428466796875, 0.12029647827148438, 0.129638671875]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 9.0, 24.0, 823.0, 151.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.602726459503174, -2.4565622806549072, -2.3103981018066406, -2.164233922958374, -2.0180697441101074, -1.8719054460525513, -1.7257411479949951, -1.5795769691467285, -1.433412790298462, -1.2872486114501953, -1.1410844326019287, -0.9949201345443726, -0.848755955696106, -0.7025917768478394, -0.556427538394928, -0.4102632999420166, -0.26409912109375, -0.11793491244316101, 0.02822929620742798, 0.17439350485801697, 0.32055771350860596, 0.46672189235687256, 0.6128861308097839, 0.7590503692626953, 0.9052145481109619, 1.0513787269592285, 1.1975429058074951, 1.3437072038650513, 1.4898713827133179, 1.6360355615615845, 1.7821998596191406, 1.9283640384674072, 2.0745277404785156, 2.2206919193267822, 2.366856098175049, 2.5130202770233154, 2.659184455871582, 2.8053488731384277, 2.9515130519866943, 3.097677230834961, 3.2438414096832275, 3.390005588531494, 3.5361697673797607, 3.6823339462280273, 3.828498363494873, 3.9746623039245605, 4.120826721191406, 4.266990661621094, 4.4131550788879395, 4.559319496154785, 4.705483436584473, 4.851647853851318, 4.997811794281006, 5.143976211547852, 5.290140151977539, 5.436304569244385, 5.5824689865112305, 5.728633403778076, 5.874797344207764, 6.020961761474609, 6.167125701904297, 6.313290119171143, 6.45945405960083, 6.605618476867676, 6.751782417297363]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 3.0, 13.0, 19.0, 23.0, 37.0, 43.0, 79.0, 66.0, 103.0, 93.0, 96.0, 90.0, 88.0, 74.0, 67.0, 29.0, 30.0, 20.0, 15.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.895254373550415, -0.8700814247131348, -0.8449084758758545, -0.819735586643219, -0.7945626378059387, -0.7693896889686584, -0.744216799736023, -0.7190438508987427, -0.6938709020614624, -0.6686979532241821, -0.6435250043869019, -0.6183521151542664, -0.5931791663169861, -0.5680062174797058, -0.5428333282470703, -0.51766037940979, -0.49248743057250977, -0.4673144817352295, -0.4421415627002716, -0.4169686436653137, -0.39179569482803345, -0.3666227459907532, -0.3414498269557953, -0.3162769079208374, -0.29110395908355713, -0.26593101024627686, -0.24075809121131897, -0.2155851572751999, -0.1904122233390808, -0.16523928940296173, -0.14006635546684265, -0.11489342153072357, -0.08972054719924927, -0.06454761326313019, -0.03937467932701111, -0.014201745390892029, 0.01097118854522705, 0.03614412248134613, 0.06131705641746521, 0.08648999035358429, 0.11166292428970337, 0.13683585822582245, 0.16200879216194153, 0.1871817260980606, 0.2123546600341797, 0.23752759397029877, 0.26270052790641785, 0.28787344694137573, 0.313046395778656, 0.3382193446159363, 0.36339226365089417, 0.38856518268585205, 0.4137381315231323, 0.4389110803604126, 0.4640839993953705, 0.48925691843032837, 0.5144298672676086, 0.5396028161048889, 0.5647757053375244, 0.5899486541748047, 0.615121603012085, 0.6402945518493652, 0.6654675006866455, 0.690640389919281, 0.7158133387565613]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 5.0, 6.0, 7.0, 18.0, 22.0, 23.0, 49.0, 88.0, 145.0, 264.0, 450.0, 1036.0, 4035.0, 32557.0, 770616.0, 222425.0, 13014.0, 2227.0, 749.0, 336.0, 159.0, 117.0, 64.0, 44.0, 25.0, 16.0, 10.0, 14.0, 9.0, 3.0, 2.0, 2.0, 0.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.525390625, -0.5098495483398438, -0.4943084716796875, -0.47876739501953125, -0.463226318359375, -0.44768524169921875, -0.4321441650390625, -0.41660308837890625, -0.40106201171875, -0.38552093505859375, -0.3699798583984375, -0.35443878173828125, -0.338897705078125, -0.32335662841796875, -0.3078155517578125, -0.29227447509765625, -0.2767333984375, -0.26119232177734375, -0.2456512451171875, -0.23011016845703125, -0.214569091796875, -0.19902801513671875, -0.1834869384765625, -0.16794586181640625, -0.15240478515625, -0.13686370849609375, -0.1213226318359375, -0.10578155517578125, -0.090240478515625, -0.07469940185546875, -0.0591583251953125, -0.04361724853515625, -0.028076171875, -0.01253509521484375, 0.0030059814453125, 0.01854705810546875, 0.034088134765625, 0.04962921142578125, 0.0651702880859375, 0.08071136474609375, 0.09625244140625, 0.11179351806640625, 0.1273345947265625, 0.14287567138671875, 0.158416748046875, 0.17395782470703125, 0.1894989013671875, 0.20503997802734375, 0.2205810546875, 0.23612213134765625, 0.2516632080078125, 0.26720428466796875, 0.282745361328125, 0.29828643798828125, 0.3138275146484375, 0.32936859130859375, 0.34490966796875, 0.36045074462890625, 0.3759918212890625, 0.39153289794921875, 0.407073974609375, 0.42261505126953125, 0.4381561279296875, 0.45369720458984375, 0.46923828125]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 11.0, 9.0, 20.0, 29.0, 48.0, 54.0, 69.0, 74.0, 92.0, 107.0, 116.0, 80.0, 73.0, 75.0, 55.0, 40.0, 17.0, 12.0, 8.0, 8.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06683349609375, -0.06501054763793945, -0.0631875991821289, -0.06136465072631836, -0.05954170227050781, -0.057718753814697266, -0.05589580535888672, -0.05407285690307617, -0.052249908447265625, -0.05042695999145508, -0.04860401153564453, -0.046781063079833984, -0.04495811462402344, -0.04313516616821289, -0.041312217712402344, -0.0394892692565918, -0.03766632080078125, -0.0358433723449707, -0.034020423889160156, -0.03219747543334961, -0.030374526977539062, -0.028551578521728516, -0.02672863006591797, -0.024905681610107422, -0.023082733154296875, -0.021259784698486328, -0.01943683624267578, -0.017613887786865234, -0.015790939331054688, -0.01396799087524414, -0.012145042419433594, -0.010322093963623047, -0.0084991455078125, -0.006676197052001953, -0.004853248596191406, -0.0030303001403808594, -0.0012073516845703125, 0.0006155967712402344, 0.0024385452270507812, 0.004261493682861328, 0.006084442138671875, 0.007907390594482422, 0.009730339050292969, 0.011553287506103516, 0.013376235961914062, 0.01519918441772461, 0.017022132873535156, 0.018845081329345703, 0.02066802978515625, 0.022490978240966797, 0.024313926696777344, 0.02613687515258789, 0.027959823608398438, 0.029782772064208984, 0.03160572052001953, 0.03342866897583008, 0.035251617431640625, 0.03707456588745117, 0.03889751434326172, 0.040720462799072266, 0.04254341125488281, 0.04436635971069336, 0.046189308166503906, 0.04801225662231445, 0.049835205078125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 4.0, 4.0, 7.0, 11.0, 12.0, 16.0, 21.0, 32.0, 49.0, 66.0, 108.0, 183.0, 362.0, 914.0, 2851.0, 14932.0, 218539.0, 755561.0, 46290.0, 5799.0, 1480.0, 562.0, 307.0, 172.0, 97.0, 63.0, 33.0, 24.0, 20.0, 6.0, 9.0, 9.0, 6.0, 1.0, 0.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.272216796875, -0.262908935546875, -0.25360107421875, -0.244293212890625, -0.2349853515625, -0.225677490234375, -0.21636962890625, -0.207061767578125, -0.19775390625, -0.188446044921875, -0.17913818359375, -0.169830322265625, -0.1605224609375, -0.151214599609375, -0.14190673828125, -0.132598876953125, -0.123291015625, -0.113983154296875, -0.10467529296875, -0.095367431640625, -0.0860595703125, -0.076751708984375, -0.06744384765625, -0.058135986328125, -0.048828125, -0.039520263671875, -0.03021240234375, -0.020904541015625, -0.0115966796875, -0.002288818359375, 0.00701904296875, 0.016326904296875, 0.025634765625, 0.034942626953125, 0.04425048828125, 0.053558349609375, 0.0628662109375, 0.072174072265625, 0.08148193359375, 0.090789794921875, 0.10009765625, 0.109405517578125, 0.11871337890625, 0.128021240234375, 0.1373291015625, 0.146636962890625, 0.15594482421875, 0.165252685546875, 0.174560546875, 0.183868408203125, 0.19317626953125, 0.202484130859375, 0.2117919921875, 0.221099853515625, 0.23040771484375, 0.239715576171875, 0.2490234375, 0.258331298828125, 0.26763916015625, 0.276947021484375, 0.2862548828125, 0.295562744140625, 0.30487060546875, 0.314178466796875, 0.323486328125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 7.0, 7.0, 7.0, 11.0, 11.0, 11.0, 24.0, 18.0, 28.0, 39.0, 43.0, 69.0, 55.0, 83.0, 51.0, 57.0, 73.0, 49.0, 57.0, 50.0, 48.0, 51.0, 31.0, 42.0, 15.0, 12.0, 14.0, 9.0, 8.0, 3.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.14697265625, -0.14201736450195312, -0.13706207275390625, -0.13210678100585938, -0.1271514892578125, -0.12219619750976562, -0.11724090576171875, -0.11228561401367188, -0.107330322265625, -0.10237503051757812, -0.09741973876953125, -0.09246444702148438, -0.0875091552734375, -0.08255386352539062, -0.07759857177734375, -0.07264328002929688, -0.06768798828125, -0.06273269653320312, -0.05777740478515625, -0.052822113037109375, -0.0478668212890625, -0.042911529541015625, -0.03795623779296875, -0.033000946044921875, -0.028045654296875, -0.023090362548828125, -0.01813507080078125, -0.013179779052734375, -0.0082244873046875, -0.003269195556640625, 0.00168609619140625, 0.006641387939453125, 0.0115966796875, 0.016551971435546875, 0.02150726318359375, 0.026462554931640625, 0.0314178466796875, 0.036373138427734375, 0.04132843017578125, 0.046283721923828125, 0.051239013671875, 0.056194305419921875, 0.06114959716796875, 0.06610488891601562, 0.0710601806640625, 0.07601547241210938, 0.08097076416015625, 0.08592605590820312, 0.09088134765625, 0.09583663940429688, 0.10079193115234375, 0.10574722290039062, 0.1107025146484375, 0.11565780639648438, 0.12061309814453125, 0.12556838989257812, 0.130523681640625, 0.13547897338867188, 0.14043426513671875, 0.14538955688476562, 0.1503448486328125, 0.15530014038085938, 0.16025543212890625, 0.16521072387695312, 0.170166015625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 7.0, 18.0, 29.0, 38.0, 57.0, 107.0, 164.0, 265.0, 546.0, 1455.0, 4444.0, 20916.0, 257700.0, 689687.0, 60316.0, 8577.0, 2397.0, 885.0, 404.0, 208.0, 99.0, 79.0, 44.0, 33.0, 13.0, 11.0, 8.0, 5.0, 6.0, 9.0, 2.0, 4.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08416748046875, -0.08147335052490234, -0.07877922058105469, -0.07608509063720703, -0.07339096069335938, -0.07069683074951172, -0.06800270080566406, -0.0653085708618164, -0.06261444091796875, -0.059920310974121094, -0.05722618103027344, -0.05453205108642578, -0.051837921142578125, -0.04914379119873047, -0.04644966125488281, -0.043755531311035156, -0.0410614013671875, -0.038367271423339844, -0.03567314147949219, -0.03297901153564453, -0.030284881591796875, -0.02759075164794922, -0.024896621704101562, -0.022202491760253906, -0.01950836181640625, -0.016814231872558594, -0.014120101928710938, -0.011425971984863281, -0.008731842041015625, -0.006037712097167969, -0.0033435821533203125, -0.0006494522094726562, 0.002044677734375, 0.004738807678222656, 0.0074329376220703125, 0.010127067565917969, 0.012821197509765625, 0.015515327453613281, 0.018209457397460938, 0.020903587341308594, 0.02359771728515625, 0.026291847229003906, 0.028985977172851562, 0.03168010711669922, 0.034374237060546875, 0.03706836700439453, 0.03976249694824219, 0.042456626892089844, 0.0451507568359375, 0.047844886779785156, 0.05053901672363281, 0.05323314666748047, 0.055927276611328125, 0.05862140655517578, 0.06131553649902344, 0.0640096664428711, 0.06670379638671875, 0.0693979263305664, 0.07209205627441406, 0.07478618621826172, 0.07748031616210938, 0.08017444610595703, 0.08286857604980469, 0.08556270599365234, 0.0882568359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 4.0, 8.0, 13.0, 23.0, 22.0, 43.0, 50.0, 91.0, 109.0, 101.0, 111.0, 113.0, 104.0, 54.0, 56.0, 32.0, 16.0, 19.0, 11.0, 6.0, 8.0, 5.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.463859558105469e-06, -8.000992238521576e-06, -7.538124918937683e-06, -7.07525759935379e-06, -6.6123902797698975e-06, -6.149522960186005e-06, -5.686655640602112e-06, -5.223788321018219e-06, -4.760921001434326e-06, -4.298053681850433e-06, -3.8351863622665405e-06, -3.3723190426826477e-06, -2.909451723098755e-06, -2.446584403514862e-06, -1.9837170839309692e-06, -1.5208497643470764e-06, -1.0579824447631836e-06, -5.951151251792908e-07, -1.3224780559539795e-07, 3.3061951398849487e-07, 7.934868335723877e-07, 1.2563541531562805e-06, 1.7192214727401733e-06, 2.182088792324066e-06, 2.644956111907959e-06, 3.107823431491852e-06, 3.5706907510757446e-06, 4.0335580706596375e-06, 4.49642539024353e-06, 4.959292709827423e-06, 5.422160029411316e-06, 5.885027348995209e-06, 6.3478946685791016e-06, 6.810761988162994e-06, 7.273629307746887e-06, 7.73649662733078e-06, 8.199363946914673e-06, 8.662231266498566e-06, 9.125098586082458e-06, 9.587965905666351e-06, 1.0050833225250244e-05, 1.0513700544834137e-05, 1.097656786441803e-05, 1.1439435184001923e-05, 1.1902302503585815e-05, 1.2365169823169708e-05, 1.2828037142753601e-05, 1.3290904462337494e-05, 1.3753771781921387e-05, 1.421663910150528e-05, 1.4679506421089172e-05, 1.5142373740673065e-05, 1.5605241060256958e-05, 1.606810837984085e-05, 1.6530975699424744e-05, 1.6993843019008636e-05, 1.745671033859253e-05, 1.7919577658176422e-05, 1.8382444977760315e-05, 1.8845312297344208e-05, 1.93081796169281e-05, 1.9771046936511993e-05, 2.0233914256095886e-05, 2.069678157567978e-05, 2.1159648895263672e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 5.0, 5.0, 9.0, 6.0, 12.0, 17.0, 21.0, 34.0, 55.0, 76.0, 135.0, 189.0, 416.0, 932.0, 3484.0, 41509.0, 914711.0, 79908.0, 4895.0, 1098.0, 420.0, 223.0, 136.0, 90.0, 64.0, 25.0, 21.0, 13.0, 15.0, 8.0, 12.0, 4.0, 3.0, 2.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.138427734375, -0.1343059539794922, -0.13018417358398438, -0.12606239318847656, -0.12194061279296875, -0.11781883239746094, -0.11369705200195312, -0.10957527160644531, -0.1054534912109375, -0.10133171081542969, -0.09720993041992188, -0.09308815002441406, -0.08896636962890625, -0.08484458923339844, -0.08072280883789062, -0.07660102844238281, -0.072479248046875, -0.06835746765136719, -0.06423568725585938, -0.06011390686035156, -0.05599212646484375, -0.05187034606933594, -0.047748565673828125, -0.04362678527832031, -0.0395050048828125, -0.03538322448730469, -0.031261444091796875, -0.027139663696289062, -0.02301788330078125, -0.018896102905273438, -0.014774322509765625, -0.010652542114257812, -0.00653076171875, -0.0024089813232421875, 0.001712799072265625, 0.0058345794677734375, 0.00995635986328125, 0.014078140258789062, 0.018199920654296875, 0.022321701049804688, 0.0264434814453125, 0.030565261840820312, 0.034687042236328125, 0.03880882263183594, 0.04293060302734375, 0.04705238342285156, 0.051174163818359375, 0.05529594421386719, 0.059417724609375, 0.06353950500488281, 0.06766128540039062, 0.07178306579589844, 0.07590484619140625, 0.08002662658691406, 0.08414840698242188, 0.08827018737792969, 0.0923919677734375, 0.09651374816894531, 0.10063552856445312, 0.10475730895996094, 0.10887908935546875, 0.11300086975097656, 0.11712265014648438, 0.12124443054199219, 0.1253662109375]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 4.0, 9.0, 7.0, 14.0, 16.0, 23.0, 36.0, 51.0, 50.0, 56.0, 83.0, 107.0, 85.0, 92.0, 95.0, 66.0, 48.0, 38.0, 33.0, 25.0, 7.0, 11.0, 9.0, 9.0, 5.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05865478515625, -0.05679130554199219, -0.054927825927734375, -0.05306434631347656, -0.05120086669921875, -0.04933738708496094, -0.047473907470703125, -0.04561042785644531, -0.0437469482421875, -0.04188346862792969, -0.040019989013671875, -0.03815650939941406, -0.03629302978515625, -0.03442955017089844, -0.032566070556640625, -0.030702590942382812, -0.028839111328125, -0.026975631713867188, -0.025112152099609375, -0.023248672485351562, -0.02138519287109375, -0.019521713256835938, -0.017658233642578125, -0.015794754028320312, -0.0139312744140625, -0.012067794799804688, -0.010204315185546875, -0.008340835571289062, -0.00647735595703125, -0.0046138763427734375, -0.002750396728515625, -0.0008869171142578125, 0.0009765625, 0.0028400421142578125, 0.004703521728515625, 0.0065670013427734375, 0.00843048095703125, 0.010293960571289062, 0.012157440185546875, 0.014020919799804688, 0.0158843994140625, 0.017747879028320312, 0.019611358642578125, 0.021474838256835938, 0.02333831787109375, 0.025201797485351562, 0.027065277099609375, 0.028928756713867188, 0.030792236328125, 0.03265571594238281, 0.034519195556640625, 0.03638267517089844, 0.03824615478515625, 0.04010963439941406, 0.041973114013671875, 0.04383659362792969, 0.0457000732421875, 0.04756355285644531, 0.049427032470703125, 0.05129051208496094, 0.05315399169921875, 0.05501747131347656, 0.056880950927734375, 0.05874443054199219, 0.06060791015625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 19.0, 144.0, 461.0, 299.0, 57.0, 10.0, 7.0, 5.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8198766708374023, -1.7395495176315308, -1.6592223644256592, -1.5788952112197876, -1.498568058013916, -1.418241024017334, -1.3379138708114624, -1.2575867176055908, -1.1772595643997192, -1.0969324111938477, -1.016605257987976, -0.9362781643867493, -0.8559510111808777, -0.7756238579750061, -0.6952967643737793, -0.6149696111679077, -0.5346424579620361, -0.45431530475616455, -0.37398818135261536, -0.29366105794906616, -0.21333390474319458, -0.133006751537323, -0.052679628133773804, 0.02764749526977539, 0.10797464847564697, 0.18830178678035736, 0.26862892508506775, 0.34895604848861694, 0.4292832016944885, 0.5096103549003601, 0.5899374485015869, 0.6702646017074585, 0.7505917549133301, 0.8309189081192017, 0.9112460613250732, 0.9915731549263, 1.0719003677368164, 1.1522274017333984, 1.23255455493927, 1.3128817081451416, 1.3932088613510132, 1.4735360145568848, 1.5538631677627563, 1.634190320968628, 1.71451735496521, 1.794844627380371, 1.8751716613769531, 1.9554988145828247, 2.0358259677886963, 2.1161530017852783, 2.1964802742004395, 2.2768073081970215, 2.3571345806121826, 2.4374616146087646, 2.517788887023926, 2.598115921020508, 2.67844295501709, 2.758769989013672, 2.839097261428833, 2.919424295425415, 2.999751567840576, 3.080078601837158, 3.1604058742523193, 3.2407329082489014, 3.3210601806640625]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 5.0, 12.0, 10.0, 11.0, 17.0, 20.0, 15.0, 25.0, 36.0, 32.0, 40.0, 39.0, 45.0, 57.0, 51.0, 55.0, 61.0, 50.0, 48.0, 46.0, 55.0, 47.0, 37.0, 28.0, 30.0, 37.0, 23.0, 14.0, 8.0, 13.0, 7.0, 10.0, 4.0, 2.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.929733395576477, -0.9043305516242981, -0.8789277076721191, -0.853524923324585, -0.828122079372406, -0.802719235420227, -0.7773164510726929, -0.7519136071205139, -0.726510763168335, -0.701107919216156, -0.675705075263977, -0.6503022909164429, -0.6248994469642639, -0.599496603012085, -0.5740938186645508, -0.5486909747123718, -0.5232881307601929, -0.4978852868080139, -0.47248247265815735, -0.4470796585083008, -0.4216768145561218, -0.39627397060394287, -0.3708711564540863, -0.34546834230422974, -0.3200654983520508, -0.2946626543998718, -0.26925984025001526, -0.2438570111989975, -0.21845418214797974, -0.19305135309696198, -0.1676485240459442, -0.14224569499492645, -0.11684286594390869, -0.09144003689289093, -0.06603720784187317, -0.04063437879085541, -0.015231549739837646, 0.010171279311180115, 0.035574108362197876, 0.06097693741321564, 0.0863797664642334, 0.11178259551525116, 0.13718542456626892, 0.16258825361728668, 0.18799108266830444, 0.2133939117193222, 0.23879674077033997, 0.26419955492019653, 0.2896023988723755, 0.31500524282455444, 0.340408056974411, 0.3658108711242676, 0.39121371507644653, 0.4166165590286255, 0.44201937317848206, 0.4674221873283386, 0.4928250312805176, 0.5182278752326965, 0.5436307191848755, 0.5690335035324097, 0.5944363474845886, 0.6198391914367676, 0.6452419757843018, 0.6706448197364807, 0.6960476636886597]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 2.0, 4.0, 6.0, 5.0, 11.0, 17.0, 19.0, 45.0, 73.0, 154.0, 297.0, 938.0, 3872.0, 68626.0, 4096433.0, 21314.0, 1886.0, 391.0, 107.0, 40.0, 23.0, 11.0, 4.0, 3.0, 5.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.48583984375, -0.4630889892578125, -0.440338134765625, -0.4175872802734375, -0.39483642578125, -0.3720855712890625, -0.349334716796875, -0.3265838623046875, -0.3038330078125, -0.2810821533203125, -0.258331298828125, -0.2355804443359375, -0.21282958984375, -0.1900787353515625, -0.167327880859375, -0.1445770263671875, -0.121826171875, -0.0990753173828125, -0.076324462890625, -0.0535736083984375, -0.03082275390625, -0.0080718994140625, 0.014678955078125, 0.0374298095703125, 0.0601806640625, 0.0829315185546875, 0.105682373046875, 0.1284332275390625, 0.15118408203125, 0.1739349365234375, 0.196685791015625, 0.2194366455078125, 0.2421875, 0.2649383544921875, 0.287689208984375, 0.3104400634765625, 0.33319091796875, 0.3559417724609375, 0.378692626953125, 0.4014434814453125, 0.4241943359375, 0.4469451904296875, 0.469696044921875, 0.4924468994140625, 0.51519775390625, 0.5379486083984375, 0.560699462890625, 0.5834503173828125, 0.606201171875, 0.6289520263671875, 0.651702880859375, 0.6744537353515625, 0.69720458984375, 0.7199554443359375, 0.742706298828125, 0.7654571533203125, 0.7882080078125, 0.8109588623046875, 0.833709716796875, 0.8564605712890625, 0.87921142578125, 0.9019622802734375, 0.924713134765625, 0.9474639892578125, 0.97021484375]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 8.0, 7.0, 12.0, 23.0, 34.0, 35.0, 66.0, 63.0, 67.0, 81.0, 103.0, 83.0, 98.0, 76.0, 71.0, 44.0, 39.0, 40.0, 19.0, 11.0, 8.0, 7.0, 2.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06475830078125, -0.06309700012207031, -0.061435699462890625, -0.05977439880371094, -0.05811309814453125, -0.05645179748535156, -0.054790496826171875, -0.05312919616699219, -0.0514678955078125, -0.04980659484863281, -0.048145294189453125, -0.04648399353027344, -0.04482269287109375, -0.04316139221191406, -0.041500091552734375, -0.03983879089355469, -0.038177490234375, -0.03651618957519531, -0.034854888916015625, -0.03319358825683594, -0.03153228759765625, -0.029870986938476562, -0.028209686279296875, -0.026548385620117188, -0.0248870849609375, -0.023225784301757812, -0.021564483642578125, -0.019903182983398438, -0.01824188232421875, -0.016580581665039062, -0.014919281005859375, -0.013257980346679688, -0.0115966796875, -0.009935379028320312, -0.008274078369140625, -0.0066127777099609375, -0.00495147705078125, -0.0032901763916015625, -0.001628875732421875, 3.24249267578125e-05, 0.0016937255859375, 0.0033550262451171875, 0.005016326904296875, 0.0066776275634765625, 0.00833892822265625, 0.010000228881835938, 0.011661529541015625, 0.013322830200195312, 0.014984130859375, 0.016645431518554688, 0.018306732177734375, 0.019968032836914062, 0.02162933349609375, 0.023290634155273438, 0.024951934814453125, 0.026613235473632812, 0.0282745361328125, 0.029935836791992188, 0.031597137451171875, 0.03325843811035156, 0.03491973876953125, 0.03658103942871094, 0.038242340087890625, 0.03990364074707031, 0.04156494140625]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 9.0, 19.0, 26.0, 78.0, 167.0, 1024.0, 4191848.0, 717.0, 186.0, 91.0, 64.0, 32.0, 12.0, 10.0, 3.0, 5.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.716796875, -1.605682373046875, -1.49456787109375, -1.383453369140625, -1.2723388671875, -1.161224365234375, -1.05010986328125, -0.938995361328125, -0.827880859375, -0.716766357421875, -0.60565185546875, -0.494537353515625, -0.3834228515625, -0.272308349609375, -0.16119384765625, -0.050079345703125, 0.06103515625, 0.172149658203125, 0.28326416015625, 0.394378662109375, 0.5054931640625, 0.616607666015625, 0.72772216796875, 0.838836669921875, 0.949951171875, 1.061065673828125, 1.17218017578125, 1.283294677734375, 1.3944091796875, 1.505523681640625, 1.61663818359375, 1.727752685546875, 1.8388671875, 1.949981689453125, 2.06109619140625, 2.172210693359375, 2.2833251953125, 2.394439697265625, 2.50555419921875, 2.616668701171875, 2.727783203125, 2.838897705078125, 2.95001220703125, 3.061126708984375, 3.1722412109375, 3.283355712890625, 3.39447021484375, 3.505584716796875, 3.61669921875, 3.727813720703125, 3.83892822265625, 3.950042724609375, 4.0611572265625, 4.172271728515625, 4.28338623046875, 4.394500732421875, 4.505615234375, 4.616729736328125, 4.72784423828125, 4.838958740234375, 4.9500732421875, 5.061187744140625, 5.17230224609375, 5.283416748046875, 5.39453125]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 13.0, 242.0, 3727.0, 91.0, 13.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.207763671875, -0.19328689575195312, -0.17881011962890625, -0.16433334350585938, -0.1498565673828125, -0.13537979125976562, -0.12090301513671875, -0.10642623901367188, -0.091949462890625, -0.07747268676757812, -0.06299591064453125, -0.048519134521484375, -0.0340423583984375, -0.019565582275390625, -0.00508880615234375, 0.009387969970703125, 0.02386474609375, 0.038341522216796875, 0.05281829833984375, 0.06729507446289062, 0.0817718505859375, 0.09624862670898438, 0.11072540283203125, 0.12520217895507812, 0.139678955078125, 0.15415573120117188, 0.16863250732421875, 0.18310928344726562, 0.1975860595703125, 0.21206283569335938, 0.22653961181640625, 0.24101638793945312, 0.2554931640625, 0.2699699401855469, 0.28444671630859375, 0.2989234924316406, 0.3134002685546875, 0.3278770446777344, 0.34235382080078125, 0.3568305969238281, 0.371307373046875, 0.3857841491699219, 0.40026092529296875, 0.4147377014160156, 0.4292144775390625, 0.4436912536621094, 0.45816802978515625, 0.4726448059082031, 0.48712158203125, 0.5015983581542969, 0.5160751342773438, 0.5305519104003906, 0.5450286865234375, 0.5595054626464844, 0.5739822387695312, 0.5884590148925781, 0.602935791015625, 0.6174125671386719, 0.6318893432617188, 0.6463661193847656, 0.6608428955078125, 0.6753196716308594, 0.6897964477539062, 0.7042732238769531, 0.71875]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 19.0, 990.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.337606430053711, -11.087301254272461, -10.836997032165527, -10.586692810058594, -10.336387634277344, -10.086082458496094, -9.83577823638916, -9.585474014282227, -9.335168838500977, -9.084863662719727, -8.834559440612793, -8.58425521850586, -8.33395004272461, -8.08364486694336, -7.833340644836426, -7.583035945892334, -7.332731246948242, -7.08242654800415, -6.832121849060059, -6.581817150115967, -6.331512451171875, -6.081207752227783, -5.830903053283691, -5.5805983543396, -5.330293655395508, -5.079988956451416, -4.829684257507324, -4.579379558563232, -4.329074859619141, -4.078770160675049, -3.828465461730957, -3.5781607627868652, -3.3278555870056152, -3.0775508880615234, -2.8272461891174316, -2.57694149017334, -2.326636791229248, -2.0763320922851562, -1.8260273933410645, -1.5757226943969727, -1.3254179954528809, -1.075113296508789, -0.8248085975646973, -0.5745038986206055, -0.32419919967651367, -0.07389450073242188, 0.17641019821166992, 0.4267148971557617, 0.6770195960998535, 0.9273242950439453, 1.177628993988037, 1.427933692932129, 1.6782383918762207, 1.9285430908203125, 2.1788477897644043, 2.429152488708496, 2.679457187652588, 2.9297618865966797, 3.1800665855407715, 3.4303712844848633, 3.680675983428955, 3.930980682373047, 4.181285381317139, 4.4315900802612305, 4.681894779205322]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 10.0, 19.0, 32.0, 72.0, 133.0, 190.0, 186.0, 173.0, 107.0, 45.0, 17.0, 15.0, 8.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2306691408157349, -1.1987781524658203, -1.1668870449066162, -1.1349960565567017, -1.1031049489974976, -1.071213960647583, -1.039322853088379, -1.0074318647384644, -0.975540816783905, -0.9436497688293457, -0.9117587208747864, -0.879867672920227, -0.8479766845703125, -0.8160855770111084, -0.7841945886611938, -0.7523035407066345, -0.7204124927520752, -0.6885214447975159, -0.6566303968429565, -0.6247393488883972, -0.5928483009338379, -0.5609573125839233, -0.529066264629364, -0.4971752166748047, -0.46528416872024536, -0.43339312076568604, -0.4015020728111267, -0.36961105465888977, -0.33772000670433044, -0.3058289587497711, -0.2739379405975342, -0.24204689264297485, -0.21015572547912598, -0.17826467752456665, -0.14637364447116852, -0.11448260396718979, -0.08259156346321106, -0.05070051550865173, -0.0188094824552536, 0.013081550598144531, 0.04497259855270386, 0.07686363905668259, 0.10875467956066132, 0.14064571261405945, 0.17253676056861877, 0.2044278085231781, 0.23631884157657623, 0.26820987462997437, 0.3001009225845337, 0.331991970539093, 0.36388301849365234, 0.3957740366458893, 0.4276650846004486, 0.45955613255500793, 0.4914471507072449, 0.5233381986618042, 0.5552292466163635, 0.5871202945709229, 0.6190113425254822, 0.6509023904800415, 0.682793378829956, 0.7146844863891602, 0.7465754747390747, 0.778466522693634, 0.8103575706481934]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 0.0, 4.0, 0.0, 7.0, 4.0, 6.0, 5.0, 20.0, 15.0, 12.0, 21.0, 29.0, 42.0, 69.0, 67.0, 136.0, 230.0, 407.0, 831.0, 2238.0, 7645.0, 40504.0, 401394.0, 526977.0, 53715.0, 9516.0, 2623.0, 983.0, 406.0, 208.0, 142.0, 89.0, 65.0, 40.0, 25.0, 29.0, 11.0, 13.0, 12.0, 6.0, 5.0, 2.0, 4.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2310791015625, -0.22339439392089844, -0.21570968627929688, -0.2080249786376953, -0.20034027099609375, -0.1926555633544922, -0.18497085571289062, -0.17728614807128906, -0.1696014404296875, -0.16191673278808594, -0.15423202514648438, -0.1465473175048828, -0.13886260986328125, -0.1311779022216797, -0.12349319458007812, -0.11580848693847656, -0.108123779296875, -0.10043907165527344, -0.09275436401367188, -0.08506965637207031, -0.07738494873046875, -0.06970024108886719, -0.062015533447265625, -0.05433082580566406, -0.0466461181640625, -0.03896141052246094, -0.031276702880859375, -0.023591995239257812, -0.01590728759765625, -0.008222579956054688, -0.000537872314453125, 0.0071468353271484375, 0.01483154296875, 0.022516250610351562, 0.030200958251953125, 0.03788566589355469, 0.04557037353515625, 0.05325508117675781, 0.060939788818359375, 0.06862449645996094, 0.0763092041015625, 0.08399391174316406, 0.09167861938476562, 0.09936332702636719, 0.10704803466796875, 0.11473274230957031, 0.12241744995117188, 0.13010215759277344, 0.137786865234375, 0.14547157287597656, 0.15315628051757812, 0.1608409881591797, 0.16852569580078125, 0.1762104034423828, 0.18389511108398438, 0.19157981872558594, 0.1992645263671875, 0.20694923400878906, 0.21463394165039062, 0.2223186492919922, 0.23000335693359375, 0.2376880645751953, 0.24537277221679688, 0.25305747985839844, 0.2607421875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 4.0, 11.0, 11.0, 18.0, 31.0, 27.0, 46.0, 67.0, 71.0, 80.0, 89.0, 99.0, 74.0, 77.0, 91.0, 55.0, 46.0, 43.0, 18.0, 13.0, 13.0, 7.0, 5.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.053314208984375, -0.05176544189453125, -0.0502166748046875, -0.04866790771484375, -0.047119140625, -0.04557037353515625, -0.0440216064453125, -0.04247283935546875, -0.040924072265625, -0.03937530517578125, -0.0378265380859375, -0.03627777099609375, -0.03472900390625, -0.03318023681640625, -0.0316314697265625, -0.03008270263671875, -0.028533935546875, -0.02698516845703125, -0.0254364013671875, -0.02388763427734375, -0.0223388671875, -0.02079010009765625, -0.0192413330078125, -0.01769256591796875, -0.016143798828125, -0.01459503173828125, -0.0130462646484375, -0.01149749755859375, -0.00994873046875, -0.00839996337890625, -0.0068511962890625, -0.00530242919921875, -0.003753662109375, -0.00220489501953125, -0.0006561279296875, 0.00089263916015625, 0.00244140625, 0.00399017333984375, 0.0055389404296875, 0.00708770751953125, 0.008636474609375, 0.01018524169921875, 0.0117340087890625, 0.01328277587890625, 0.01483154296875, 0.01638031005859375, 0.0179290771484375, 0.01947784423828125, 0.021026611328125, 0.02257537841796875, 0.0241241455078125, 0.02567291259765625, 0.0272216796875, 0.02877044677734375, 0.0303192138671875, 0.03186798095703125, 0.033416748046875, 0.03496551513671875, 0.0365142822265625, 0.03806304931640625, 0.03961181640625, 0.04116058349609375, 0.0427093505859375, 0.04425811767578125, 0.045806884765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 4.0, 4.0, 2.0, 12.0, 9.0, 19.0, 26.0, 40.0, 46.0, 69.0, 98.0, 168.0, 349.0, 705.0, 1722.0, 6268.0, 45383.0, 694434.0, 274536.0, 18655.0, 3639.0, 1196.0, 491.0, 254.0, 154.0, 90.0, 55.0, 40.0, 23.0, 19.0, 17.0, 6.0, 3.0, 8.0, 4.0, 4.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3095703125, -0.3011589050292969, -0.29274749755859375, -0.2843360900878906, -0.2759246826171875, -0.2675132751464844, -0.25910186767578125, -0.2506904602050781, -0.242279052734375, -0.23386764526367188, -0.22545623779296875, -0.21704483032226562, -0.2086334228515625, -0.20022201538085938, -0.19181060791015625, -0.18339920043945312, -0.17498779296875, -0.16657638549804688, -0.15816497802734375, -0.14975357055664062, -0.1413421630859375, -0.13293075561523438, -0.12451934814453125, -0.11610794067382812, -0.107696533203125, -0.09928512573242188, -0.09087371826171875, -0.08246231079101562, -0.0740509033203125, -0.06563949584960938, -0.05722808837890625, -0.048816680908203125, -0.0404052734375, -0.031993865966796875, -0.02358245849609375, -0.015171051025390625, -0.0067596435546875, 0.001651763916015625, 0.01006317138671875, 0.018474578857421875, 0.026885986328125, 0.035297393798828125, 0.04370880126953125, 0.052120208740234375, 0.0605316162109375, 0.06894302368164062, 0.07735443115234375, 0.08576583862304688, 0.09417724609375, 0.10258865356445312, 0.11100006103515625, 0.11941146850585938, 0.1278228759765625, 0.13623428344726562, 0.14464569091796875, 0.15305709838867188, 0.161468505859375, 0.16987991333007812, 0.17829132080078125, 0.18670272827148438, 0.1951141357421875, 0.20352554321289062, 0.21193695068359375, 0.22034835815429688, 0.228759765625]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 0.0, 4.0, 7.0, 2.0, 8.0, 11.0, 15.0, 14.0, 19.0, 22.0, 34.0, 24.0, 44.0, 38.0, 51.0, 53.0, 61.0, 69.0, 66.0, 65.0, 63.0, 44.0, 53.0, 47.0, 41.0, 39.0, 24.0, 24.0, 16.0, 13.0, 10.0, 7.0, 2.0, 7.0, 5.0, 1.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18798828125, -0.18285369873046875, -0.1777191162109375, -0.17258453369140625, -0.167449951171875, -0.16231536865234375, -0.1571807861328125, -0.15204620361328125, -0.14691162109375, -0.14177703857421875, -0.1366424560546875, -0.13150787353515625, -0.126373291015625, -0.12123870849609375, -0.1161041259765625, -0.11096954345703125, -0.1058349609375, -0.10070037841796875, -0.0955657958984375, -0.09043121337890625, -0.085296630859375, -0.08016204833984375, -0.0750274658203125, -0.06989288330078125, -0.06475830078125, -0.05962371826171875, -0.0544891357421875, -0.04935455322265625, -0.044219970703125, -0.03908538818359375, -0.0339508056640625, -0.02881622314453125, -0.023681640625, -0.01854705810546875, -0.0134124755859375, -0.00827789306640625, -0.003143310546875, 0.00199127197265625, 0.0071258544921875, 0.01226043701171875, 0.01739501953125, 0.02252960205078125, 0.0276641845703125, 0.03279876708984375, 0.037933349609375, 0.04306793212890625, 0.0482025146484375, 0.05333709716796875, 0.0584716796875, 0.06360626220703125, 0.0687408447265625, 0.07387542724609375, 0.079010009765625, 0.08414459228515625, 0.0892791748046875, 0.09441375732421875, 0.09954833984375, 0.10468292236328125, 0.1098175048828125, 0.11495208740234375, 0.120086669921875, 0.12522125244140625, 0.1303558349609375, 0.13549041748046875, 0.140625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 8.0, 12.0, 14.0, 37.0, 83.0, 209.0, 616.0, 2170.0, 19794.0, 896211.0, 122781.0, 4987.0, 1072.0, 335.0, 120.0, 54.0, 19.0, 11.0, 12.0, 6.0, 3.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0892333984375, -0.08470916748046875, -0.0801849365234375, -0.07566070556640625, -0.071136474609375, -0.06661224365234375, -0.0620880126953125, -0.05756378173828125, -0.05303955078125, -0.04851531982421875, -0.0439910888671875, -0.03946685791015625, -0.034942626953125, -0.03041839599609375, -0.0258941650390625, -0.02136993408203125, -0.016845703125, -0.01232147216796875, -0.0077972412109375, -0.00327301025390625, 0.001251220703125, 0.00577545166015625, 0.0102996826171875, 0.01482391357421875, 0.01934814453125, 0.02387237548828125, 0.0283966064453125, 0.03292083740234375, 0.037445068359375, 0.04196929931640625, 0.0464935302734375, 0.05101776123046875, 0.0555419921875, 0.06006622314453125, 0.0645904541015625, 0.06911468505859375, 0.073638916015625, 0.07816314697265625, 0.0826873779296875, 0.08721160888671875, 0.09173583984375, 0.09626007080078125, 0.1007843017578125, 0.10530853271484375, 0.109832763671875, 0.11435699462890625, 0.1188812255859375, 0.12340545654296875, 0.1279296875, 0.13245391845703125, 0.1369781494140625, 0.14150238037109375, 0.146026611328125, 0.15055084228515625, 0.1550750732421875, 0.15959930419921875, 0.16412353515625, 0.16864776611328125, 0.1731719970703125, 0.17769622802734375, 0.182220458984375, 0.18674468994140625, 0.1912689208984375, 0.19579315185546875, 0.2003173828125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 7.0, 5.0, 10.0, 16.0, 17.0, 40.0, 84.0, 100.0, 131.0, 170.0, 148.0, 112.0, 67.0, 42.0, 25.0, 14.0, 11.0, 9.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.294778823852539e-05, -2.23526731133461e-05, -2.175755798816681e-05, -2.116244286298752e-05, -2.0567327737808228e-05, -1.9972212612628937e-05, -1.9377097487449646e-05, -1.8781982362270355e-05, -1.8186867237091064e-05, -1.7591752111911774e-05, -1.6996636986732483e-05, -1.6401521861553192e-05, -1.58064067363739e-05, -1.521129161119461e-05, -1.461617648601532e-05, -1.4021061360836029e-05, -1.3425946235656738e-05, -1.2830831110477448e-05, -1.2235715985298157e-05, -1.1640600860118866e-05, -1.1045485734939575e-05, -1.0450370609760284e-05, -9.855255484580994e-06, -9.260140359401703e-06, -8.665025234222412e-06, -8.069910109043121e-06, -7.4747949838638306e-06, -6.87967985868454e-06, -6.284564733505249e-06, -5.689449608325958e-06, -5.0943344831466675e-06, -4.499219357967377e-06, -3.904104232788086e-06, -3.308989107608795e-06, -2.7138739824295044e-06, -2.1187588572502136e-06, -1.5236437320709229e-06, -9.285286068916321e-07, -3.334134817123413e-07, 2.6170164346694946e-07, 8.568167686462402e-07, 1.451931893825531e-06, 2.0470470190048218e-06, 2.6421621441841125e-06, 3.2372772693634033e-06, 3.832392394542694e-06, 4.427507519721985e-06, 5.022622644901276e-06, 5.617737770080566e-06, 6.212852895259857e-06, 6.807968020439148e-06, 7.403083145618439e-06, 7.99819827079773e-06, 8.59331339597702e-06, 9.188428521156311e-06, 9.783543646335602e-06, 1.0378658771514893e-05, 1.0973773896694183e-05, 1.1568889021873474e-05, 1.2164004147052765e-05, 1.2759119272232056e-05, 1.3354234397411346e-05, 1.3949349522590637e-05, 1.4544464647769928e-05, 1.5139579772949219e-05]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 1.0, 7.0, 11.0, 14.0, 22.0, 31.0, 41.0, 69.0, 150.0, 279.0, 673.0, 2170.0, 15702.0, 728531.0, 290262.0, 7991.0, 1534.0, 534.0, 223.0, 126.0, 75.0, 36.0, 26.0, 17.0, 11.0, 11.0, 3.0, 3.0, 5.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1414794921875, -0.1377429962158203, -0.13400650024414062, -0.13027000427246094, -0.12653350830078125, -0.12279701232910156, -0.11906051635742188, -0.11532402038574219, -0.1115875244140625, -0.10785102844238281, -0.10411453247070312, -0.10037803649902344, -0.09664154052734375, -0.09290504455566406, -0.08916854858398438, -0.08543205261230469, -0.081695556640625, -0.07795906066894531, -0.07422256469726562, -0.07048606872558594, -0.06674957275390625, -0.06301307678222656, -0.059276580810546875, -0.05554008483886719, -0.0518035888671875, -0.04806709289550781, -0.044330596923828125, -0.04059410095214844, -0.03685760498046875, -0.03312110900878906, -0.029384613037109375, -0.025648117065429688, -0.02191162109375, -0.018175125122070312, -0.014438629150390625, -0.010702133178710938, -0.00696563720703125, -0.0032291412353515625, 0.000507354736328125, 0.0042438507080078125, 0.0079803466796875, 0.011716842651367188, 0.015453338623046875, 0.019189834594726562, 0.02292633056640625, 0.026662826538085938, 0.030399322509765625, 0.03413581848144531, 0.037872314453125, 0.04160881042480469, 0.045345306396484375, 0.04908180236816406, 0.05281829833984375, 0.05655479431152344, 0.060291290283203125, 0.06402778625488281, 0.0677642822265625, 0.07150077819824219, 0.07523727416992188, 0.07897377014160156, 0.08271026611328125, 0.08644676208496094, 0.09018325805664062, 0.09391975402832031, 0.09765625]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 3.0, 8.0, 11.0, 12.0, 17.0, 34.0, 47.0, 78.0, 96.0, 128.0, 113.0, 142.0, 106.0, 72.0, 49.0, 43.0, 17.0, 11.0, 9.0, 8.0, 3.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08221435546875, -0.07968330383300781, -0.07715225219726562, -0.07462120056152344, -0.07209014892578125, -0.06955909729003906, -0.06702804565429688, -0.06449699401855469, -0.0619659423828125, -0.05943489074707031, -0.056903839111328125, -0.05437278747558594, -0.05184173583984375, -0.04931068420410156, -0.046779632568359375, -0.04424858093261719, -0.041717529296875, -0.03918647766113281, -0.036655426025390625, -0.03412437438964844, -0.03159332275390625, -0.029062271118164062, -0.026531219482421875, -0.024000167846679688, -0.0214691162109375, -0.018938064575195312, -0.016407012939453125, -0.013875961303710938, -0.01134490966796875, -0.008813858032226562, -0.006282806396484375, -0.0037517547607421875, -0.001220703125, 0.0013103485107421875, 0.003841400146484375, 0.0063724517822265625, 0.00890350341796875, 0.011434555053710938, 0.013965606689453125, 0.016496658325195312, 0.0190277099609375, 0.021558761596679688, 0.024089813232421875, 0.026620864868164062, 0.02915191650390625, 0.03168296813964844, 0.034214019775390625, 0.03674507141113281, 0.039276123046875, 0.04180717468261719, 0.044338226318359375, 0.04686927795410156, 0.04940032958984375, 0.05193138122558594, 0.054462432861328125, 0.05699348449707031, 0.0595245361328125, 0.06205558776855469, 0.06458663940429688, 0.06711769104003906, 0.06964874267578125, 0.07217979431152344, 0.07471084594726562, 0.07724189758300781, 0.07977294921875]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 5.0, 20.0, 78.0, 316.0, 405.0, 133.0, 32.0, 11.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.2983202934265137, -3.2270288467407227, -3.1557374000549316, -3.0844459533691406, -3.0131545066833496, -2.9418630599975586, -2.8705716133117676, -2.7992801666259766, -2.7279887199401855, -2.6566972732543945, -2.5854058265686035, -2.5141143798828125, -2.4428229331970215, -2.3715314865112305, -2.3002400398254395, -2.2289485931396484, -2.1576571464538574, -2.0863656997680664, -2.0150742530822754, -1.9437828063964844, -1.8724913597106934, -1.8011999130249023, -1.7299084663391113, -1.6586170196533203, -1.5873253345489502, -1.5160338878631592, -1.4447424411773682, -1.3734509944915771, -1.3021595478057861, -1.2308681011199951, -1.159576654434204, -1.088285207748413, -1.0169938802719116, -0.9457024335861206, -0.8744109869003296, -0.8031195402145386, -0.7318280935287476, -0.6605366468429565, -0.5892451405525208, -0.5179536938667297, -0.4466622471809387, -0.3753708004951477, -0.3040793538093567, -0.2327878773212433, -0.16149643063545227, -0.09020498394966125, -0.01891350746154785, 0.052377939224243164, 0.12366938591003418, 0.1949608325958252, 0.2662522792816162, 0.3375437557697296, 0.40883520245552063, 0.48012664914131165, 0.551418125629425, 0.6227095723152161, 0.6940010190010071, 0.7652924656867981, 0.8365839123725891, 0.9078754186630249, 0.9791668653488159, 1.050458312034607, 1.121749758720398, 1.193041205406189, 1.26433265209198]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 9.0, 7.0, 18.0, 8.0, 18.0, 28.0, 26.0, 30.0, 42.0, 32.0, 50.0, 54.0, 41.0, 56.0, 62.0, 48.0, 49.0, 53.0, 44.0, 52.0, 41.0, 36.0, 34.0, 18.0, 27.0, 17.0, 23.0, 16.0, 13.0, 7.0, 9.0, 7.0, 4.0, 5.0, 5.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7578319311141968, -0.7336319088935852, -0.7094318866729736, -0.6852318048477173, -0.6610317826271057, -0.6368317604064941, -0.6126317381858826, -0.588431715965271, -0.5642316341400146, -0.5400316119194031, -0.5158315896987915, -0.49163153767585754, -0.4674314856529236, -0.443231463432312, -0.41903144121170044, -0.3948313891887665, -0.3706313669681549, -0.34643134474754333, -0.3222312927246094, -0.2980312705039978, -0.27383121848106384, -0.24963119626045227, -0.2254311591386795, -0.20123112201690674, -0.17703108489513397, -0.1528310477733612, -0.12863101065158844, -0.10443098098039627, -0.0802309438586235, -0.05603090673685074, -0.03183087706565857, -0.007630839943885803, 0.016569197177886963, 0.04076923429965973, 0.0649692714214325, 0.08916930109262466, 0.11336933821439743, 0.1375693678855896, 0.16176940500736237, 0.18596944212913513, 0.2101694792509079, 0.23436951637268066, 0.25856953859329224, 0.2827695906162262, 0.30696961283683777, 0.33116966485977173, 0.3553696870803833, 0.3795697093009949, 0.40376976132392883, 0.4279697835445404, 0.45216983556747437, 0.47636985778808594, 0.5005698800086975, 0.5247699618339539, 0.5489699840545654, 0.573170006275177, 0.5973700284957886, 0.6215700507164001, 0.6457700729370117, 0.6699701547622681, 0.6941701769828796, 0.7183701992034912, 0.7425702214241028, 0.7667702436447144, 0.7909703254699707]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 7.0, 12.0, 11.0, 21.0, 17.0, 42.0, 57.0, 102.0, 178.0, 386.0, 802.0, 2168.0, 7307.0, 45422.0, 3790447.0, 325829.0, 16049.0, 3505.0, 1109.0, 376.0, 189.0, 81.0, 66.0, 28.0, 21.0, 15.0, 13.0, 2.0, 4.0, 4.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.30419921875, -0.2919197082519531, -0.27964019775390625, -0.2673606872558594, -0.2550811767578125, -0.24280166625976562, -0.23052215576171875, -0.21824264526367188, -0.205963134765625, -0.19368362426757812, -0.18140411376953125, -0.16912460327148438, -0.1568450927734375, -0.14456558227539062, -0.13228607177734375, -0.12000656127929688, -0.10772705078125, -0.09544754028320312, -0.08316802978515625, -0.07088851928710938, -0.0586090087890625, -0.046329498291015625, -0.03404998779296875, -0.021770477294921875, -0.009490966796875, 0.002788543701171875, 0.01506805419921875, 0.027347564697265625, 0.0396270751953125, 0.051906585693359375, 0.06418609619140625, 0.07646560668945312, 0.0887451171875, 0.10102462768554688, 0.11330413818359375, 0.12558364868164062, 0.1378631591796875, 0.15014266967773438, 0.16242218017578125, 0.17470169067382812, 0.186981201171875, 0.19926071166992188, 0.21154022216796875, 0.22381973266601562, 0.2360992431640625, 0.24837875366210938, 0.26065826416015625, 0.2729377746582031, 0.28521728515625, 0.2974967956542969, 0.30977630615234375, 0.3220558166503906, 0.3343353271484375, 0.3466148376464844, 0.35889434814453125, 0.3711738586425781, 0.383453369140625, 0.3957328796386719, 0.40801239013671875, 0.4202919006347656, 0.4325714111328125, 0.4448509216308594, 0.45713043212890625, 0.4694099426269531, 0.481689453125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 2.0, 9.0, 11.0, 18.0, 21.0, 28.0, 32.0, 55.0, 41.0, 64.0, 83.0, 89.0, 82.0, 96.0, 77.0, 68.0, 46.0, 44.0, 42.0, 28.0, 24.0, 21.0, 8.0, 8.0, 2.0, 0.0, 1.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.044097900390625, -0.042702674865722656, -0.04130744934082031, -0.03991222381591797, -0.038516998291015625, -0.03712177276611328, -0.03572654724121094, -0.034331321716308594, -0.03293609619140625, -0.031540870666503906, -0.030145645141601562, -0.02875041961669922, -0.027355194091796875, -0.02595996856689453, -0.024564743041992188, -0.023169517517089844, -0.0217742919921875, -0.020379066467285156, -0.018983840942382812, -0.01758861541748047, -0.016193389892578125, -0.014798164367675781, -0.013402938842773438, -0.012007713317871094, -0.01061248779296875, -0.009217262268066406, -0.007822036743164062, -0.006426811218261719, -0.005031585693359375, -0.0036363601684570312, -0.0022411346435546875, -0.0008459091186523438, 0.00054931640625, 0.0019445419311523438, 0.0033397674560546875, 0.004734992980957031, 0.006130218505859375, 0.007525444030761719, 0.008920669555664062, 0.010315895080566406, 0.01171112060546875, 0.013106346130371094, 0.014501571655273438, 0.01589679718017578, 0.017292022705078125, 0.01868724822998047, 0.020082473754882812, 0.021477699279785156, 0.0228729248046875, 0.024268150329589844, 0.025663375854492188, 0.02705860137939453, 0.028453826904296875, 0.02984905242919922, 0.031244277954101562, 0.032639503479003906, 0.03403472900390625, 0.035429954528808594, 0.03682518005371094, 0.03822040557861328, 0.039615631103515625, 0.04101085662841797, 0.04240608215332031, 0.043801307678222656, 0.045196533203125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 5.0, 4.0, 3.0, 4.0, 6.0, 13.0, 12.0, 17.0, 28.0, 53.0, 96.0, 112.0, 214.0, 394.0, 1071.0, 3853.0, 34434.0, 4087200.0, 58713.0, 5710.0, 1356.0, 482.0, 204.0, 115.0, 59.0, 35.0, 20.0, 24.0, 14.0, 16.0, 3.0, 2.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.5087890625, -0.4931640625, -0.4775390625, -0.4619140625, -0.4462890625, -0.4306640625, -0.4150390625, -0.3994140625, -0.3837890625, -0.3681640625, -0.3525390625, -0.3369140625, -0.3212890625, -0.3056640625, -0.2900390625, -0.2744140625, -0.2587890625, -0.2431640625, -0.2275390625, -0.2119140625, -0.1962890625, -0.1806640625, -0.1650390625, -0.1494140625, -0.1337890625, -0.1181640625, -0.1025390625, -0.0869140625, -0.0712890625, -0.0556640625, -0.0400390625, -0.0244140625, -0.0087890625, 0.0068359375, 0.0224609375, 0.0380859375, 0.0537109375, 0.0693359375, 0.0849609375, 0.1005859375, 0.1162109375, 0.1318359375, 0.1474609375, 0.1630859375, 0.1787109375, 0.1943359375, 0.2099609375, 0.2255859375, 0.2412109375, 0.2568359375, 0.2724609375, 0.2880859375, 0.3037109375, 0.3193359375, 0.3349609375, 0.3505859375, 0.3662109375, 0.3818359375, 0.3974609375, 0.4130859375, 0.4287109375, 0.4443359375, 0.4599609375, 0.4755859375, 0.4912109375]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 9.0, 16.0, 29.0, 55.0, 153.0, 564.0, 2186.0, 692.0, 165.0, 82.0, 43.0, 22.0, 12.0, 10.0, 9.0, 7.0, 2.0, 5.0, 3.0, 0.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.18896484375, -0.1839313507080078, -0.17889785766601562, -0.17386436462402344, -0.16883087158203125, -0.16379737854003906, -0.15876388549804688, -0.1537303924560547, -0.1486968994140625, -0.1436634063720703, -0.13862991333007812, -0.13359642028808594, -0.12856292724609375, -0.12352943420410156, -0.11849594116210938, -0.11346244812011719, -0.108428955078125, -0.10339546203613281, -0.09836196899414062, -0.09332847595214844, -0.08829498291015625, -0.08326148986816406, -0.07822799682617188, -0.07319450378417969, -0.0681610107421875, -0.06312751770019531, -0.058094024658203125, -0.05306053161621094, -0.04802703857421875, -0.04299354553222656, -0.037960052490234375, -0.03292655944824219, -0.02789306640625, -0.022859573364257812, -0.017826080322265625, -0.012792587280273438, -0.00775909423828125, -0.0027256011962890625, 0.002307891845703125, 0.0073413848876953125, 0.0123748779296875, 0.017408370971679688, 0.022441864013671875, 0.027475357055664062, 0.03250885009765625, 0.03754234313964844, 0.042575836181640625, 0.04760932922363281, 0.052642822265625, 0.05767631530761719, 0.06270980834960938, 0.06774330139160156, 0.07277679443359375, 0.07781028747558594, 0.08284378051757812, 0.08787727355957031, 0.0929107666015625, 0.09794425964355469, 0.10297775268554688, 0.10801124572753906, 0.11304473876953125, 0.11807823181152344, 0.12311172485351562, 0.1281452178955078, 0.1331787109375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 15.0, 777.0, 220.0, 6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5291391611099243, -0.3442678451538086, -0.15939649939537048, 0.025474846363067627, 0.21034616231918335, 0.3952174782752991, 0.5800888538360596, 0.7649601697921753, 0.949831485748291, 1.1347028017044067, 1.3195741176605225, 1.5044455528259277, 1.689316749572754, 1.8741881847381592, 2.0590596199035645, 2.2439308166503906, 2.428802013397217, 2.613673448562622, 2.7985446453094482, 2.9834160804748535, 3.1682872772216797, 3.353158712387085, 3.5380301475524902, 3.7229013442993164, 3.9077727794647217, 4.092644214630127, 4.277515411376953, 4.462386608123779, 4.647258281707764, 4.83212947845459, 5.017000675201416, 5.201871871948242, 5.386743068695068, 5.5716142654418945, 5.756485939025879, 5.941357135772705, 6.126228332519531, 6.311099529266357, 6.495971202850342, 6.680842399597168, 6.865713596343994, 7.05058479309082, 7.235456466674805, 7.420327663421631, 7.605198860168457, 7.790070056915283, 7.974941730499268, 8.159812927246094, 8.344684600830078, 8.529556274414062, 8.71442699432373, 8.899298667907715, 9.0841703414917, 9.269041061401367, 9.453912734985352, 9.638784408569336, 9.823655128479004, 10.008526802062988, 10.193397521972656, 10.37826919555664, 10.563140869140625, 10.748011589050293, 10.932883262634277, 11.117753982543945, 11.30262565612793]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 15.0, 13.0, 18.0, 24.0, 27.0, 16.0, 37.0, 53.0, 47.0, 53.0, 69.0, 58.0, 68.0, 65.0, 73.0, 57.0, 52.0, 46.0, 41.0, 47.0, 27.0, 20.0, 20.0, 14.0, 8.0, 11.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3802456855773926, -0.3659658133983612, -0.35168594121932983, -0.33740609884262085, -0.3231262266635895, -0.3088463544845581, -0.29456648230552673, -0.28028661012649536, -0.266006737947464, -0.2517268657684326, -0.23744700849056244, -0.22316713631153107, -0.2088872641324997, -0.19460740685462952, -0.18032753467559814, -0.16604766249656677, -0.1517678052186966, -0.13748793303966522, -0.12320806831121445, -0.10892820358276367, -0.0946483314037323, -0.08036846667528152, -0.06608860194683075, -0.05180872976779938, -0.0375288650393486, -0.02324899658560753, -0.008969129994511604, 0.00531073659658432, 0.019590605050325394, 0.03387047350406647, 0.04815033823251724, 0.062430210411548615, 0.07671007513999939, 0.09098993986845016, 0.10526981204748154, 0.11954967677593231, 0.13382954895496368, 0.14810940623283386, 0.16238927841186523, 0.1766691505908966, 0.19094902276992798, 0.20522889494895935, 0.21950875222682953, 0.2337886244058609, 0.24806849658489227, 0.26234835386276245, 0.2766282260417938, 0.2909080982208252, 0.3051879405975342, 0.31946781277656555, 0.3337476849555969, 0.3480275273323059, 0.3623073995113373, 0.37658727169036865, 0.3908671438694, 0.4051470160484314, 0.41942688822746277, 0.43370676040649414, 0.4479866325855255, 0.4622665047645569, 0.47654634714126587, 0.49082621932029724, 0.5051060914993286, 0.5193859338760376, 0.5336658358573914]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 4.0, 7.0, 3.0, 9.0, 7.0, 14.0, 28.0, 26.0, 34.0, 39.0, 49.0, 62.0, 93.0, 142.0, 234.0, 424.0, 795.0, 2238.0, 8111.0, 50287.0, 473172.0, 453094.0, 47658.0, 7843.0, 2169.0, 896.0, 423.0, 215.0, 126.0, 86.0, 64.0, 56.0, 33.0, 26.0, 20.0, 18.0, 19.0, 7.0, 6.0, 7.0, 6.0, 5.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.2330322265625, -0.22637176513671875, -0.2197113037109375, -0.21305084228515625, -0.206390380859375, -0.19972991943359375, -0.1930694580078125, -0.18640899658203125, -0.17974853515625, -0.17308807373046875, -0.1664276123046875, -0.15976715087890625, -0.153106689453125, -0.14644622802734375, -0.1397857666015625, -0.13312530517578125, -0.12646484375, -0.11980438232421875, -0.1131439208984375, -0.10648345947265625, -0.099822998046875, -0.09316253662109375, -0.0865020751953125, -0.07984161376953125, -0.07318115234375, -0.06652069091796875, -0.0598602294921875, -0.05319976806640625, -0.046539306640625, -0.03987884521484375, -0.0332183837890625, -0.02655792236328125, -0.0198974609375, -0.01323699951171875, -0.0065765380859375, 8.392333984375e-05, 0.006744384765625, 0.01340484619140625, 0.0200653076171875, 0.02672576904296875, 0.03338623046875, 0.04004669189453125, 0.0467071533203125, 0.05336761474609375, 0.060028076171875, 0.06668853759765625, 0.0733489990234375, 0.08000946044921875, 0.086669921875, 0.09333038330078125, 0.0999908447265625, 0.10665130615234375, 0.113311767578125, 0.11997222900390625, 0.1266326904296875, 0.13329315185546875, 0.13995361328125, 0.14661407470703125, 0.1532745361328125, 0.15993499755859375, 0.166595458984375, 0.17325592041015625, 0.1799163818359375, 0.18657684326171875, 0.1932373046875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 7.0, 9.0, 18.0, 28.0, 31.0, 76.0, 79.0, 85.0, 123.0, 118.0, 127.0, 82.0, 80.0, 55.0, 44.0, 17.0, 8.0, 6.0, 6.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.053131103515625, -0.051320552825927734, -0.04951000213623047, -0.0476994514465332, -0.04588890075683594, -0.04407835006713867, -0.042267799377441406, -0.04045724868774414, -0.038646697998046875, -0.03683614730834961, -0.035025596618652344, -0.03321504592895508, -0.03140449523925781, -0.029593944549560547, -0.02778339385986328, -0.025972843170166016, -0.02416229248046875, -0.022351741790771484, -0.02054119110107422, -0.018730640411376953, -0.016920089721679688, -0.015109539031982422, -0.013298988342285156, -0.01148843765258789, -0.009677886962890625, -0.00786733627319336, -0.006056785583496094, -0.004246234893798828, -0.0024356842041015625, -0.0006251335144042969, 0.0011854171752929688, 0.0029959678649902344, 0.0048065185546875, 0.006617069244384766, 0.008427619934082031, 0.010238170623779297, 0.012048721313476562, 0.013859272003173828, 0.015669822692871094, 0.01748037338256836, 0.019290924072265625, 0.02110147476196289, 0.022912025451660156, 0.024722576141357422, 0.026533126831054688, 0.028343677520751953, 0.03015422821044922, 0.031964778900146484, 0.03377532958984375, 0.035585880279541016, 0.03739643096923828, 0.03920698165893555, 0.04101753234863281, 0.04282808303833008, 0.044638633728027344, 0.04644918441772461, 0.048259735107421875, 0.05007028579711914, 0.051880836486816406, 0.05369138717651367, 0.05550193786621094, 0.0573124885559082, 0.05912303924560547, 0.060933589935302734, 0.062744140625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 4.0, 9.0, 5.0, 8.0, 11.0, 12.0, 16.0, 29.0, 29.0, 57.0, 93.0, 107.0, 183.0, 256.0, 496.0, 769.0, 1677.0, 3887.0, 10270.0, 29402.0, 94666.0, 277863.0, 378316.0, 168899.0, 53085.0, 17034.0, 6114.0, 2444.0, 1129.0, 649.0, 352.0, 233.0, 140.0, 91.0, 67.0, 39.0, 30.0, 23.0, 18.0, 12.0, 9.0, 8.0, 4.0, 3.0, 7.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07708740234375, -0.0745391845703125, -0.071990966796875, -0.0694427490234375, -0.06689453125, -0.0643463134765625, -0.061798095703125, -0.0592498779296875, -0.05670166015625, -0.0541534423828125, -0.051605224609375, -0.0490570068359375, -0.0465087890625, -0.0439605712890625, -0.041412353515625, -0.0388641357421875, -0.03631591796875, -0.0337677001953125, -0.031219482421875, -0.0286712646484375, -0.026123046875, -0.0235748291015625, -0.021026611328125, -0.0184783935546875, -0.01593017578125, -0.0133819580078125, -0.010833740234375, -0.0082855224609375, -0.0057373046875, -0.0031890869140625, -0.000640869140625, 0.0019073486328125, 0.00445556640625, 0.0070037841796875, 0.009552001953125, 0.0121002197265625, 0.0146484375, 0.0171966552734375, 0.019744873046875, 0.0222930908203125, 0.02484130859375, 0.0273895263671875, 0.029937744140625, 0.0324859619140625, 0.0350341796875, 0.0375823974609375, 0.040130615234375, 0.0426788330078125, 0.04522705078125, 0.0477752685546875, 0.050323486328125, 0.0528717041015625, 0.055419921875, 0.0579681396484375, 0.060516357421875, 0.0630645751953125, 0.06561279296875, 0.0681610107421875, 0.070709228515625, 0.0732574462890625, 0.0758056640625, 0.0783538818359375, 0.080902099609375, 0.0834503173828125, 0.08599853515625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 11.0, 11.0, 12.0, 14.0, 6.0, 25.0, 25.0, 33.0, 33.0, 20.0, 30.0, 28.0, 45.0, 36.0, 46.0, 44.0, 41.0, 40.0, 28.0, 49.0, 42.0, 34.0, 32.0, 30.0, 44.0, 36.0, 28.0, 28.0, 25.0, 26.0, 10.0, 13.0, 14.0, 9.0, 8.0, 12.0, 6.0, 7.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.09332275390625, -0.0903768539428711, -0.08743095397949219, -0.08448505401611328, -0.08153915405273438, -0.07859325408935547, -0.07564735412597656, -0.07270145416259766, -0.06975555419921875, -0.06680965423583984, -0.06386375427246094, -0.06091785430908203, -0.057971954345703125, -0.05502605438232422, -0.05208015441894531, -0.049134254455566406, -0.0461883544921875, -0.043242454528808594, -0.04029655456542969, -0.03735065460205078, -0.034404754638671875, -0.03145885467529297, -0.028512954711914062, -0.025567054748535156, -0.02262115478515625, -0.019675254821777344, -0.016729354858398438, -0.013783454895019531, -0.010837554931640625, -0.007891654968261719, -0.0049457550048828125, -0.0019998550415039062, 0.000946044921875, 0.0038919448852539062, 0.0068378448486328125, 0.009783744812011719, 0.012729644775390625, 0.01567554473876953, 0.018621444702148438, 0.021567344665527344, 0.02451324462890625, 0.027459144592285156, 0.030405044555664062, 0.03335094451904297, 0.036296844482421875, 0.03924274444580078, 0.04218864440917969, 0.045134544372558594, 0.0480804443359375, 0.051026344299316406, 0.05397224426269531, 0.05691814422607422, 0.059864044189453125, 0.06280994415283203, 0.06575584411621094, 0.06870174407958984, 0.07164764404296875, 0.07459354400634766, 0.07753944396972656, 0.08048534393310547, 0.08343124389648438, 0.08637714385986328, 0.08932304382324219, 0.0922689437866211, 0.09521484375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 1.0, 2.0, 6.0, 10.0, 13.0, 16.0, 22.0, 28.0, 36.0, 73.0, 82.0, 141.0, 264.0, 493.0, 956.0, 2293.0, 6828.0, 34812.0, 309018.0, 578800.0, 94499.0, 13578.0, 3734.0, 1346.0, 659.0, 327.0, 203.0, 123.0, 60.0, 30.0, 31.0, 19.0, 10.0, 8.0, 12.0, 10.0, 3.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.044921875, -0.04338502883911133, -0.041848182678222656, -0.040311336517333984, -0.03877449035644531, -0.03723764419555664, -0.03570079803466797, -0.0341639518737793, -0.032627105712890625, -0.031090259552001953, -0.02955341339111328, -0.02801656723022461, -0.026479721069335938, -0.024942874908447266, -0.023406028747558594, -0.021869182586669922, -0.02033233642578125, -0.018795490264892578, -0.017258644104003906, -0.015721797943115234, -0.014184951782226562, -0.01264810562133789, -0.011111259460449219, -0.009574413299560547, -0.008037567138671875, -0.006500720977783203, -0.004963874816894531, -0.0034270286560058594, -0.0018901824951171875, -0.0003533363342285156, 0.0011835098266601562, 0.002720355987548828, 0.0042572021484375, 0.005794048309326172, 0.007330894470214844, 0.008867740631103516, 0.010404586791992188, 0.01194143295288086, 0.013478279113769531, 0.015015125274658203, 0.016551971435546875, 0.018088817596435547, 0.01962566375732422, 0.02116250991821289, 0.022699356079101562, 0.024236202239990234, 0.025773048400878906, 0.027309894561767578, 0.02884674072265625, 0.030383586883544922, 0.031920433044433594, 0.033457279205322266, 0.03499412536621094, 0.03653097152709961, 0.03806781768798828, 0.03960466384887695, 0.041141510009765625, 0.0426783561706543, 0.04421520233154297, 0.04575204849243164, 0.04728889465332031, 0.048825740814208984, 0.050362586975097656, 0.05189943313598633, 0.053436279296875]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 18.0, 16.0, 13.0, 22.0, 35.0, 38.0, 56.0, 57.0, 58.0, 58.0, 52.0, 79.0, 64.0, 59.0, 51.0, 48.0, 66.0, 44.0, 27.0, 27.0, 21.0, 26.0, 9.0, 13.0, 12.0, 9.0, 3.0, 7.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.344650268554688e-06, -8.106231689453125e-06, -7.867813110351562e-06, -7.62939453125e-06, -7.3909759521484375e-06, -7.152557373046875e-06, -6.9141387939453125e-06, -6.67572021484375e-06, -6.4373016357421875e-06, -6.198883056640625e-06, -5.9604644775390625e-06, -5.7220458984375e-06, -5.4836273193359375e-06, -5.245208740234375e-06, -5.0067901611328125e-06, -4.76837158203125e-06, -4.5299530029296875e-06, -4.291534423828125e-06, -4.0531158447265625e-06, -3.814697265625e-06, -3.5762786865234375e-06, -3.337860107421875e-06, -3.0994415283203125e-06, -2.86102294921875e-06, -2.6226043701171875e-06, -2.384185791015625e-06, -2.1457672119140625e-06, -1.9073486328125e-06, -1.6689300537109375e-06, -1.430511474609375e-06, -1.1920928955078125e-06, -9.5367431640625e-07, -7.152557373046875e-07, -4.76837158203125e-07, -2.384185791015625e-07, 0.0, 2.384185791015625e-07, 4.76837158203125e-07, 7.152557373046875e-07, 9.5367431640625e-07, 1.1920928955078125e-06, 1.430511474609375e-06, 1.6689300537109375e-06, 1.9073486328125e-06, 2.1457672119140625e-06, 2.384185791015625e-06, 2.6226043701171875e-06, 2.86102294921875e-06, 3.0994415283203125e-06, 3.337860107421875e-06, 3.5762786865234375e-06, 3.814697265625e-06, 4.0531158447265625e-06, 4.291534423828125e-06, 4.5299530029296875e-06, 4.76837158203125e-06, 5.0067901611328125e-06, 5.245208740234375e-06, 5.4836273193359375e-06, 5.7220458984375e-06, 5.9604644775390625e-06, 6.198883056640625e-06, 6.4373016357421875e-06, 6.67572021484375e-06, 6.9141387939453125e-06]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 4.0, 6.0, 7.0, 12.0, 24.0, 25.0, 64.0, 93.0, 155.0, 390.0, 1129.0, 6029.0, 149837.0, 845781.0, 40515.0, 3072.0, 752.0, 311.0, 141.0, 79.0, 51.0, 27.0, 12.0, 9.0, 12.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0882568359375, -0.08552742004394531, -0.08279800415039062, -0.08006858825683594, -0.07733917236328125, -0.07460975646972656, -0.07188034057617188, -0.06915092468261719, -0.0664215087890625, -0.06369209289550781, -0.060962677001953125, -0.05823326110839844, -0.05550384521484375, -0.05277442932128906, -0.050045013427734375, -0.04731559753417969, -0.044586181640625, -0.04185676574707031, -0.039127349853515625, -0.03639793395996094, -0.03366851806640625, -0.030939102172851562, -0.028209686279296875, -0.025480270385742188, -0.0227508544921875, -0.020021438598632812, -0.017292022705078125, -0.014562606811523438, -0.01183319091796875, -0.009103775024414062, -0.006374359130859375, -0.0036449432373046875, -0.00091552734375, 0.0018138885498046875, 0.004543304443359375, 0.0072727203369140625, 0.01000213623046875, 0.012731552124023438, 0.015460968017578125, 0.018190383911132812, 0.0209197998046875, 0.023649215698242188, 0.026378631591796875, 0.029108047485351562, 0.03183746337890625, 0.03456687927246094, 0.037296295166015625, 0.04002571105957031, 0.042755126953125, 0.04548454284667969, 0.048213958740234375, 0.05094337463378906, 0.05367279052734375, 0.05640220642089844, 0.059131622314453125, 0.06186103820800781, 0.0645904541015625, 0.06731986999511719, 0.07004928588867188, 0.07277870178222656, 0.07550811767578125, 0.07823753356933594, 0.08096694946289062, 0.08369636535644531, 0.08642578125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 3.0, 8.0, 4.0, 8.0, 4.0, 15.0, 14.0, 21.0, 41.0, 47.0, 73.0, 77.0, 100.0, 89.0, 94.0, 90.0, 72.0, 59.0, 54.0, 34.0, 33.0, 26.0, 15.0, 6.0, 9.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.06671142578125, -0.0649576187133789, -0.06320381164550781, -0.06145000457763672, -0.059696197509765625, -0.05794239044189453, -0.05618858337402344, -0.054434776306152344, -0.05268096923828125, -0.050927162170410156, -0.04917335510253906, -0.04741954803466797, -0.045665740966796875, -0.04391193389892578, -0.04215812683105469, -0.040404319763183594, -0.0386505126953125, -0.036896705627441406, -0.03514289855957031, -0.03338909149169922, -0.031635284423828125, -0.02988147735595703, -0.028127670288085938, -0.026373863220214844, -0.02462005615234375, -0.022866249084472656, -0.021112442016601562, -0.01935863494873047, -0.017604827880859375, -0.01585102081298828, -0.014097213745117188, -0.012343406677246094, -0.010589599609375, -0.008835792541503906, -0.0070819854736328125, -0.005328178405761719, -0.003574371337890625, -0.0018205642700195312, -6.67572021484375e-05, 0.0016870498657226562, 0.00344085693359375, 0.005194664001464844, 0.0069484710693359375, 0.008702278137207031, 0.010456085205078125, 0.012209892272949219, 0.013963699340820312, 0.015717506408691406, 0.0174713134765625, 0.019225120544433594, 0.020978927612304688, 0.02273273468017578, 0.024486541748046875, 0.02624034881591797, 0.027994155883789062, 0.029747962951660156, 0.03150177001953125, 0.033255577087402344, 0.03500938415527344, 0.03676319122314453, 0.038516998291015625, 0.04027080535888672, 0.04202461242675781, 0.043778419494628906, 0.0455322265625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 6.0, 4.0, 7.0, 16.0, 19.0, 45.0, 116.0, 173.0, 239.0, 212.0, 103.0, 36.0, 17.0, 7.0, 7.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.6135438680648804, -0.5823544263839722, -0.5511650443077087, -0.5199756026268005, -0.4887861907482147, -0.4575967788696289, -0.4264073669910431, -0.3952179551124573, -0.3640285134315491, -0.33283910155296326, -0.30164968967437744, -0.27046024799346924, -0.23927083611488342, -0.2080814242362976, -0.1768920123577118, -0.14570258557796478, -0.11451318860054016, -0.08332376927137375, -0.052134353667497635, -0.02094493806362152, 0.010244481265544891, 0.041433900594711304, 0.07262331247329712, 0.10381273925304413, 0.13500215113162994, 0.16619156301021576, 0.19738098978996277, 0.22857040166854858, 0.2597598135471344, 0.2909492254257202, 0.3221386671066284, 0.35332807898521423, 0.38451749086380005, 0.41570690274238586, 0.4468963146209717, 0.4780857563018799, 0.5092751383781433, 0.5404645800590515, 0.5716539621353149, 0.6028434038162231, 0.6340328454971313, 0.6652222871780396, 0.696411669254303, 0.7276011109352112, 0.7587904930114746, 0.7899799346923828, 0.821169376373291, 0.8523587584495544, 0.8835481405258179, 0.9147375822067261, 0.9459269642829895, 0.9771164059638977, 1.0083057880401611, 1.0394952297210693, 1.0706846714019775, 1.1018741130828857, 1.133063554763794, 1.1642529964447021, 1.1954424381256104, 1.226631760597229, 1.2578212022781372, 1.2890106439590454, 1.3202000856399536, 1.3513895273208618, 1.3825788497924805]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 9.0, 11.0, 17.0, 12.0, 18.0, 19.0, 20.0, 13.0, 32.0, 38.0, 24.0, 42.0, 36.0, 41.0, 38.0, 58.0, 50.0, 46.0, 61.0, 49.0, 41.0, 49.0, 30.0, 30.0, 29.0, 26.0, 26.0, 27.0, 30.0, 11.0, 10.0, 9.0, 8.0, 10.0, 7.0, 4.0, 7.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0], "bins": [-0.699662983417511, -0.6814414262771606, -0.6632199287414551, -0.6449983716011047, -0.6267768144607544, -0.6085553169250488, -0.5903337597846985, -0.5721122026443481, -0.5538907051086426, -0.5356691479682922, -0.5174476504325867, -0.49922609329223633, -0.481004536151886, -0.46278300881385803, -0.4445614814758301, -0.42633992433547974, -0.4081183671951294, -0.38989683985710144, -0.3716752827167511, -0.35345375537872314, -0.3352321982383728, -0.31701067090034485, -0.2987891435623169, -0.28056758642196655, -0.2623460590839386, -0.24412451684474945, -0.2259029746055603, -0.20768144726753235, -0.1894599050283432, -0.17123836278915405, -0.1530168354511261, -0.13479529321193695, -0.11657381057739258, -0.09835226833820343, -0.08013073354959488, -0.06190919503569603, -0.04368765652179718, -0.025466114282608032, -0.007244579493999481, 0.01097695529460907, 0.029198497533798218, 0.04742003604769707, 0.06564157456159592, 0.08386310935020447, 0.10208465158939362, 0.12030619382858276, 0.13852772116661072, 0.15674926340579987, 0.174970805644989, 0.19319234788417816, 0.2114138901233673, 0.22963541746139526, 0.2478569597005844, 0.26607850193977356, 0.2843000292778015, 0.30252158641815186, 0.3207431137561798, 0.33896464109420776, 0.3571861982345581, 0.37540772557258606, 0.393629252910614, 0.41185081005096436, 0.4300723373889923, 0.44829386472702026, 0.4665154218673706]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 9.0, 6.0, 12.0, 27.0, 57.0, 121.0, 336.0, 1337.0, 11563.0, 3693197.0, 480890.0, 5794.0, 701.0, 158.0, 57.0, 21.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1258544921875, -0.11527442932128906, -0.10469436645507812, -0.09411430358886719, -0.08353424072265625, -0.07295417785644531, -0.062374114990234375, -0.05179405212402344, -0.0412139892578125, -0.030633926391601562, -0.020053863525390625, -0.009473800659179688, 0.00110626220703125, 0.011686325073242188, 0.022266387939453125, 0.03284645080566406, 0.043426513671875, 0.05400657653808594, 0.06458663940429688, 0.07516670227050781, 0.08574676513671875, 0.09632682800292969, 0.10690689086914062, 0.11748695373535156, 0.1280670166015625, 0.13864707946777344, 0.14922714233398438, 0.1598072052001953, 0.17038726806640625, 0.1809673309326172, 0.19154739379882812, 0.20212745666503906, 0.21270751953125, 0.22328758239746094, 0.23386764526367188, 0.2444477081298828, 0.25502777099609375, 0.2656078338623047, 0.2761878967285156, 0.28676795959472656, 0.2973480224609375, 0.30792808532714844, 0.3185081481933594, 0.3290882110595703, 0.33966827392578125, 0.3502483367919922, 0.3608283996582031, 0.37140846252441406, 0.381988525390625, 0.39256858825683594, 0.4031486511230469, 0.4137287139892578, 0.42430877685546875, 0.4348888397216797, 0.4454689025878906, 0.45604896545410156, 0.4666290283203125, 0.47720909118652344, 0.4877891540527344, 0.4983692169189453, 0.5089492797851562, 0.5195293426513672, 0.5301094055175781, 0.5406894683837891, 0.55126953125]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 7.0, 4.0, 11.0, 21.0, 20.0, 41.0, 52.0, 65.0, 85.0, 97.0, 101.0, 97.0, 92.0, 93.0, 64.0, 51.0, 32.0, 32.0, 12.0, 5.0, 9.0, 3.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04998779296875, -0.04837369918823242, -0.046759605407714844, -0.045145511627197266, -0.04353141784667969, -0.04191732406616211, -0.04030323028564453, -0.03868913650512695, -0.037075042724609375, -0.0354609489440918, -0.03384685516357422, -0.03223276138305664, -0.030618667602539062, -0.029004573822021484, -0.027390480041503906, -0.025776386260986328, -0.02416229248046875, -0.022548198699951172, -0.020934104919433594, -0.019320011138916016, -0.017705917358398438, -0.01609182357788086, -0.014477729797363281, -0.012863636016845703, -0.011249542236328125, -0.009635448455810547, -0.008021354675292969, -0.006407260894775391, -0.0047931671142578125, -0.0031790733337402344, -0.0015649795532226562, 4.9114227294921875e-05, 0.0016632080078125, 0.003277301788330078, 0.004891395568847656, 0.006505489349365234, 0.008119583129882812, 0.00973367691040039, 0.011347770690917969, 0.012961864471435547, 0.014575958251953125, 0.016190052032470703, 0.01780414581298828, 0.01941823959350586, 0.021032333374023438, 0.022646427154541016, 0.024260520935058594, 0.025874614715576172, 0.02748870849609375, 0.029102802276611328, 0.030716896057128906, 0.032330989837646484, 0.03394508361816406, 0.03555917739868164, 0.03717327117919922, 0.0387873649597168, 0.040401458740234375, 0.04201555252075195, 0.04362964630126953, 0.04524374008178711, 0.04685783386230469, 0.048471927642822266, 0.050086021423339844, 0.05170011520385742, 0.053314208984375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 5.0, 4.0, 11.0, 20.0, 25.0, 38.0, 59.0, 124.0, 184.0, 355.0, 882.0, 4083.0, 60956.0, 4023928.0, 96570.0, 4971.0, 1069.0, 425.0, 240.0, 119.0, 81.0, 57.0, 27.0, 21.0, 14.0, 8.0, 3.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.252197265625, -0.24489784240722656, -0.23759841918945312, -0.2302989959716797, -0.22299957275390625, -0.2157001495361328, -0.20840072631835938, -0.20110130310058594, -0.1938018798828125, -0.18650245666503906, -0.17920303344726562, -0.1719036102294922, -0.16460418701171875, -0.1573047637939453, -0.15000534057617188, -0.14270591735839844, -0.135406494140625, -0.12810707092285156, -0.12080764770507812, -0.11350822448730469, -0.10620880126953125, -0.09890937805175781, -0.09160995483398438, -0.08431053161621094, -0.0770111083984375, -0.06971168518066406, -0.062412261962890625, -0.05511283874511719, -0.04781341552734375, -0.04051399230957031, -0.033214569091796875, -0.025915145874023438, -0.01861572265625, -0.011316299438476562, -0.004016876220703125, 0.0032825469970703125, 0.01058197021484375, 0.017881393432617188, 0.025180816650390625, 0.03248023986816406, 0.0397796630859375, 0.04707908630371094, 0.054378509521484375, 0.06167793273925781, 0.06897735595703125, 0.07627677917480469, 0.08357620239257812, 0.09087562561035156, 0.098175048828125, 0.10547447204589844, 0.11277389526367188, 0.12007331848144531, 0.12737274169921875, 0.1346721649169922, 0.14197158813476562, 0.14927101135253906, 0.1565704345703125, 0.16386985778808594, 0.17116928100585938, 0.1784687042236328, 0.18576812744140625, 0.1930675506591797, 0.20036697387695312, 0.20766639709472656, 0.2149658203125]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 2.0, 8.0, 18.0, 38.0, 52.0, 169.0, 518.0, 1950.0, 877.0, 245.0, 84.0, 45.0, 27.0, 10.0, 17.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06488037109375, -0.06244373321533203, -0.06000709533691406, -0.057570457458496094, -0.055133819580078125, -0.052697181701660156, -0.05026054382324219, -0.04782390594482422, -0.04538726806640625, -0.04295063018798828, -0.04051399230957031, -0.038077354431152344, -0.035640716552734375, -0.033204078674316406, -0.030767440795898438, -0.02833080291748047, -0.0258941650390625, -0.02345752716064453, -0.021020889282226562, -0.018584251403808594, -0.016147613525390625, -0.013710975646972656, -0.011274337768554688, -0.008837699890136719, -0.00640106201171875, -0.003964424133300781, -0.0015277862548828125, 0.0009088516235351562, 0.003345489501953125, 0.005782127380371094, 0.008218765258789062, 0.010655403137207031, 0.013092041015625, 0.015528678894042969, 0.017965316772460938, 0.020401954650878906, 0.022838592529296875, 0.025275230407714844, 0.027711868286132812, 0.03014850616455078, 0.03258514404296875, 0.03502178192138672, 0.03745841979980469, 0.039895057678222656, 0.042331695556640625, 0.044768333435058594, 0.04720497131347656, 0.04964160919189453, 0.0520782470703125, 0.05451488494873047, 0.05695152282714844, 0.059388160705566406, 0.061824798583984375, 0.06426143646240234, 0.06669807434082031, 0.06913471221923828, 0.07157135009765625, 0.07400798797607422, 0.07644462585449219, 0.07888126373291016, 0.08131790161132812, 0.0837545394897461, 0.08619117736816406, 0.08862781524658203, 0.091064453125]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 3.0, 10.0, 165.0, 654.0, 162.0, 11.0, 1.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.2986419200897217, -1.259749412536621, -1.22085702419281, -1.1819645166397095, -1.1430721282958984, -1.1041796207427979, -1.0652871131896973, -1.0263947248458862, -0.9875022172927856, -0.9486097693443298, -0.909717321395874, -0.8708248138427734, -0.8319323658943176, -0.7930399179458618, -0.754147469997406, -0.7152550220489502, -0.6763625741004944, -0.6374701261520386, -0.5985776782035828, -0.559685230255127, -0.5207927227020264, -0.48190027475357056, -0.44300782680511475, -0.40411534905433655, -0.36522290110588074, -0.3263304531574249, -0.28743797540664673, -0.24854552745819092, -0.2096530646085739, -0.1707606017589569, -0.1318681538105011, -0.0929756760597229, -0.05408322811126709, -0.015190768986940384, 0.023701690137386322, 0.06259414553642273, 0.10148660838603973, 0.14037907123565674, 0.17927151918411255, 0.21816399693489075, 0.25705644488334656, 0.29594889283180237, 0.33484137058258057, 0.3737338185310364, 0.4126262664794922, 0.4515187442302704, 0.4904111921787262, 0.5293036699295044, 0.5681961178779602, 0.607088565826416, 0.6459810137748718, 0.6848734617233276, 0.7237659692764282, 0.762658417224884, 0.8015508651733398, 0.8404433727264404, 0.8793357610702515, 0.9182282090187073, 0.9571206569671631, 0.9960131645202637, 1.0349055528640747, 1.0737980604171753, 1.1126904487609863, 1.151582956314087, 1.1904754638671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 7.0, 8.0, 8.0, 14.0, 25.0, 26.0, 40.0, 72.0, 70.0, 69.0, 102.0, 71.0, 84.0, 74.0, 78.0, 72.0, 54.0, 42.0, 31.0, 17.0, 14.0, 12.0, 7.0, 6.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2951192855834961, -0.28560593724250793, -0.2760925590991974, -0.26657921075820923, -0.2570658326148987, -0.24755248427391052, -0.23803912103176117, -0.22852575778961182, -0.21901240944862366, -0.2094990462064743, -0.19998568296432495, -0.1904723346233368, -0.18095897138118744, -0.17144560813903809, -0.16193224489688873, -0.15241888165473938, -0.14290551841259003, -0.13339215517044067, -0.12387879937887192, -0.11436543613672256, -0.10485208034515381, -0.09533871710300446, -0.0858253538608551, -0.07631199806928635, -0.066798634827137, -0.05728527531027794, -0.047771915793418884, -0.03825855255126953, -0.028745193034410477, -0.019231833517551422, -0.009718470275402069, -0.000205114483833313, 0.00930824875831604, 0.018821608275175095, 0.0283349696546793, 0.0378483310341835, 0.04736169055104256, 0.05687505006790161, 0.06638841331005096, 0.07590176910161972, 0.08541513234376907, 0.09492849558591843, 0.10444185137748718, 0.11395521461963654, 0.12346857786178589, 0.13298192620277405, 0.1424953043460846, 0.15200865268707275, 0.1615220159292221, 0.17103537917137146, 0.1805487424135208, 0.19006210565567017, 0.19957545399665833, 0.20908881723880768, 0.21860218048095703, 0.2281155288219452, 0.23762890696525574, 0.2471422702074051, 0.25665563344955444, 0.2661689817905426, 0.27568235993385315, 0.2851957082748413, 0.29470908641815186, 0.30422243475914, 0.3137357831001282]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 1.0, 5.0, 9.0, 13.0, 19.0, 21.0, 30.0, 26.0, 34.0, 45.0, 69.0, 108.0, 168.0, 282.0, 496.0, 1046.0, 2479.0, 7388.0, 32194.0, 198582.0, 581992.0, 182151.0, 29702.0, 6982.0, 2366.0, 988.0, 495.0, 284.0, 163.0, 115.0, 82.0, 54.0, 35.0, 26.0, 22.0, 19.0, 21.0, 5.0, 5.0, 7.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.14306640625, -0.1385211944580078, -0.13397598266601562, -0.12943077087402344, -0.12488555908203125, -0.12034034729003906, -0.11579513549804688, -0.11124992370605469, -0.1067047119140625, -0.10215950012207031, -0.09761428833007812, -0.09306907653808594, -0.08852386474609375, -0.08397865295410156, -0.07943344116210938, -0.07488822937011719, -0.070343017578125, -0.06579780578613281, -0.061252593994140625, -0.05670738220214844, -0.05216217041015625, -0.04761695861816406, -0.043071746826171875, -0.03852653503417969, -0.0339813232421875, -0.029436111450195312, -0.024890899658203125, -0.020345687866210938, -0.01580047607421875, -0.011255264282226562, -0.006710052490234375, -0.0021648406982421875, 0.00238037109375, 0.0069255828857421875, 0.011470794677734375, 0.016016006469726562, 0.02056121826171875, 0.025106430053710938, 0.029651641845703125, 0.03419685363769531, 0.0387420654296875, 0.04328727722167969, 0.047832489013671875, 0.05237770080566406, 0.05692291259765625, 0.06146812438964844, 0.06601333618164062, 0.07055854797363281, 0.075103759765625, 0.07964897155761719, 0.08419418334960938, 0.08873939514160156, 0.09328460693359375, 0.09782981872558594, 0.10237503051757812, 0.10692024230957031, 0.1114654541015625, 0.11601066589355469, 0.12055587768554688, 0.12510108947753906, 0.12964630126953125, 0.13419151306152344, 0.13873672485351562, 0.1432819366455078, 0.1478271484375]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 4.0, 13.0, 11.0, 23.0, 18.0, 34.0, 42.0, 57.0, 67.0, 82.0, 81.0, 102.0, 92.0, 88.0, 66.0, 52.0, 50.0, 33.0, 30.0, 20.0, 11.0, 7.0, 3.0, 5.0, 3.0, 2.0, 2.0, 0.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.036163330078125, -0.03475379943847656, -0.033344268798828125, -0.03193473815917969, -0.03052520751953125, -0.029115676879882812, -0.027706146240234375, -0.026296615600585938, -0.0248870849609375, -0.023477554321289062, -0.022068023681640625, -0.020658493041992188, -0.01924896240234375, -0.017839431762695312, -0.016429901123046875, -0.015020370483398438, -0.01361083984375, -0.012201309204101562, -0.010791778564453125, -0.009382247924804688, -0.00797271728515625, -0.0065631866455078125, -0.005153656005859375, -0.0037441253662109375, -0.0023345947265625, -0.0009250640869140625, 0.000484466552734375, 0.0018939971923828125, 0.00330352783203125, 0.0047130584716796875, 0.006122589111328125, 0.0075321197509765625, 0.008941650390625, 0.010351181030273438, 0.011760711669921875, 0.013170242309570312, 0.01457977294921875, 0.015989303588867188, 0.017398834228515625, 0.018808364868164062, 0.0202178955078125, 0.021627426147460938, 0.023036956787109375, 0.024446487426757812, 0.02585601806640625, 0.027265548706054688, 0.028675079345703125, 0.030084609985351562, 0.031494140625, 0.03290367126464844, 0.034313201904296875, 0.03572273254394531, 0.03713226318359375, 0.03854179382324219, 0.039951324462890625, 0.04136085510253906, 0.0427703857421875, 0.04417991638183594, 0.045589447021484375, 0.04699897766113281, 0.04840850830078125, 0.04981803894042969, 0.051227569580078125, 0.05263710021972656, 0.054046630859375]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 5.0, 2.0, 5.0, 5.0, 9.0, 17.0, 14.0, 25.0, 33.0, 50.0, 43.0, 65.0, 108.0, 171.0, 239.0, 341.0, 580.0, 1064.0, 1981.0, 4376.0, 10682.0, 28865.0, 84318.0, 238118.0, 367984.0, 200130.0, 68874.0, 23466.0, 8933.0, 3735.0, 1778.0, 913.0, 505.0, 335.0, 251.0, 161.0, 117.0, 68.0, 52.0, 31.0, 32.0, 24.0, 20.0, 7.0, 11.0, 3.0, 12.0, 3.0, 5.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.07061767578125, -0.06843852996826172, -0.06625938415527344, -0.06408023834228516, -0.061901092529296875, -0.059721946716308594, -0.05754280090332031, -0.05536365509033203, -0.05318450927734375, -0.05100536346435547, -0.04882621765136719, -0.046647071838378906, -0.044467926025390625, -0.042288780212402344, -0.04010963439941406, -0.03793048858642578, -0.0357513427734375, -0.03357219696044922, -0.03139305114746094, -0.029213905334472656, -0.027034759521484375, -0.024855613708496094, -0.022676467895507812, -0.02049732208251953, -0.01831817626953125, -0.01613903045654297, -0.013959884643554688, -0.011780738830566406, -0.009601593017578125, -0.007422447204589844, -0.0052433013916015625, -0.0030641555786132812, -0.000885009765625, 0.0012941360473632812, 0.0034732818603515625, 0.005652427673339844, 0.007831573486328125, 0.010010719299316406, 0.012189865112304688, 0.014369010925292969, 0.01654815673828125, 0.01872730255126953, 0.020906448364257812, 0.023085594177246094, 0.025264739990234375, 0.027443885803222656, 0.029623031616210938, 0.03180217742919922, 0.0339813232421875, 0.03616046905517578, 0.03833961486816406, 0.040518760681152344, 0.042697906494140625, 0.044877052307128906, 0.04705619812011719, 0.04923534393310547, 0.05141448974609375, 0.05359363555908203, 0.05577278137207031, 0.057951927185058594, 0.060131072998046875, 0.062310218811035156, 0.06448936462402344, 0.06666851043701172, 0.06884765625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 3.0, 7.0, 2.0, 3.0, 19.0, 14.0, 12.0, 15.0, 12.0, 23.0, 14.0, 16.0, 22.0, 22.0, 30.0, 34.0, 24.0, 33.0, 41.0, 37.0, 53.0, 39.0, 34.0, 42.0, 37.0, 37.0, 33.0, 35.0, 34.0, 44.0, 26.0, 33.0, 21.0, 25.0, 21.0, 13.0, 21.0, 14.0, 12.0, 6.0, 10.0, 4.0, 3.0, 8.0, 2.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0906982421875, -0.08792877197265625, -0.0851593017578125, -0.08238983154296875, -0.079620361328125, -0.07685089111328125, -0.0740814208984375, -0.07131195068359375, -0.06854248046875, -0.06577301025390625, -0.0630035400390625, -0.06023406982421875, -0.057464599609375, -0.05469512939453125, -0.0519256591796875, -0.04915618896484375, -0.04638671875, -0.04361724853515625, -0.0408477783203125, -0.03807830810546875, -0.035308837890625, -0.03253936767578125, -0.0297698974609375, -0.02700042724609375, -0.02423095703125, -0.02146148681640625, -0.0186920166015625, -0.01592254638671875, -0.013153076171875, -0.01038360595703125, -0.0076141357421875, -0.00484466552734375, -0.0020751953125, 0.00069427490234375, 0.0034637451171875, 0.00623321533203125, 0.009002685546875, 0.01177215576171875, 0.0145416259765625, 0.01731109619140625, 0.02008056640625, 0.02285003662109375, 0.0256195068359375, 0.02838897705078125, 0.031158447265625, 0.03392791748046875, 0.0366973876953125, 0.03946685791015625, 0.042236328125, 0.04500579833984375, 0.0477752685546875, 0.05054473876953125, 0.053314208984375, 0.05608367919921875, 0.0588531494140625, 0.06162261962890625, 0.06439208984375, 0.06716156005859375, 0.0699310302734375, 0.07270050048828125, 0.075469970703125, 0.07823944091796875, 0.0810089111328125, 0.08377838134765625, 0.0865478515625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 5.0, 6.0, 6.0, 2.0, 4.0, 4.0, 14.0, 11.0, 28.0, 23.0, 42.0, 80.0, 113.0, 188.0, 367.0, 742.0, 1464.0, 3583.0, 13146.0, 83725.0, 503546.0, 374936.0, 51876.0, 9243.0, 2828.0, 1198.0, 622.0, 318.0, 163.0, 84.0, 54.0, 39.0, 22.0, 24.0, 21.0, 14.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035186767578125, -0.03382730484008789, -0.03246784210205078, -0.031108379364013672, -0.029748916625976562, -0.028389453887939453, -0.027029991149902344, -0.025670528411865234, -0.024311065673828125, -0.022951602935791016, -0.021592140197753906, -0.020232677459716797, -0.018873214721679688, -0.017513751983642578, -0.01615428924560547, -0.01479482650756836, -0.01343536376953125, -0.01207590103149414, -0.010716438293457031, -0.009356975555419922, -0.007997512817382812, -0.006638050079345703, -0.005278587341308594, -0.003919124603271484, -0.002559661865234375, -0.0012001991271972656, 0.00015926361083984375, 0.0015187263488769531, 0.0028781890869140625, 0.004237651824951172, 0.005597114562988281, 0.006956577301025391, 0.0083160400390625, 0.00967550277709961, 0.011034965515136719, 0.012394428253173828, 0.013753890991210938, 0.015113353729248047, 0.016472816467285156, 0.017832279205322266, 0.019191741943359375, 0.020551204681396484, 0.021910667419433594, 0.023270130157470703, 0.024629592895507812, 0.025989055633544922, 0.02734851837158203, 0.02870798110961914, 0.03006744384765625, 0.03142690658569336, 0.03278636932373047, 0.03414583206176758, 0.03550529479980469, 0.0368647575378418, 0.038224220275878906, 0.039583683013916016, 0.040943145751953125, 0.042302608489990234, 0.043662071228027344, 0.04502153396606445, 0.04638099670410156, 0.04774045944213867, 0.04909992218017578, 0.05045938491821289, 0.05181884765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 11.0, 7.0, 6.0, 6.0, 18.0, 21.0, 28.0, 22.0, 46.0, 41.0, 51.0, 63.0, 86.0, 80.0, 67.0, 91.0, 58.0, 67.0, 50.0, 41.0, 35.0, 37.0, 17.0, 14.0, 13.0, 11.0, 2.0, 4.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.238719940185547e-06, -8.968636393547058e-06, -8.69855284690857e-06, -8.42846930027008e-06, -8.158385753631592e-06, -7.888302206993103e-06, -7.618218660354614e-06, -7.3481351137161255e-06, -7.078051567077637e-06, -6.807968020439148e-06, -6.537884473800659e-06, -6.26780092716217e-06, -5.997717380523682e-06, -5.727633833885193e-06, -5.457550287246704e-06, -5.187466740608215e-06, -4.9173831939697266e-06, -4.647299647331238e-06, -4.377216100692749e-06, -4.10713255405426e-06, -3.8370490074157715e-06, -3.5669654607772827e-06, -3.296881914138794e-06, -3.026798367500305e-06, -2.7567148208618164e-06, -2.4866312742233276e-06, -2.216547727584839e-06, -1.94646418094635e-06, -1.6763806343078613e-06, -1.4062970876693726e-06, -1.1362135410308838e-06, -8.66129994392395e-07, -5.960464477539062e-07, -3.259629011154175e-07, -5.587935447692871e-08, 2.1420419216156006e-07, 4.842877388000488e-07, 7.543712854385376e-07, 1.0244548320770264e-06, 1.2945383787155151e-06, 1.564621925354004e-06, 1.8347054719924927e-06, 2.1047890186309814e-06, 2.3748725652694702e-06, 2.644956111907959e-06, 2.9150396585464478e-06, 3.1851232051849365e-06, 3.4552067518234253e-06, 3.725290298461914e-06, 3.995373845100403e-06, 4.265457391738892e-06, 4.53554093837738e-06, 4.805624485015869e-06, 5.075708031654358e-06, 5.345791578292847e-06, 5.6158751249313354e-06, 5.885958671569824e-06, 6.156042218208313e-06, 6.426125764846802e-06, 6.6962093114852905e-06, 6.966292858123779e-06, 7.236376404762268e-06, 7.506459951400757e-06, 7.776543498039246e-06, 8.046627044677734e-06]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 4.0, 11.0, 20.0, 19.0, 29.0, 51.0, 86.0, 194.0, 441.0, 1280.0, 6875.0, 178391.0, 815947.0, 40581.0, 3134.0, 833.0, 321.0, 150.0, 79.0, 46.0, 22.0, 20.0, 6.0, 11.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0758056640625, -0.0733041763305664, -0.07080268859863281, -0.06830120086669922, -0.06579971313476562, -0.06329822540283203, -0.06079673767089844, -0.058295249938964844, -0.05579376220703125, -0.053292274475097656, -0.05079078674316406, -0.04828929901123047, -0.045787811279296875, -0.04328632354736328, -0.04078483581542969, -0.038283348083496094, -0.0357818603515625, -0.033280372619628906, -0.030778884887695312, -0.02827739715576172, -0.025775909423828125, -0.02327442169189453, -0.020772933959960938, -0.018271446228027344, -0.01576995849609375, -0.013268470764160156, -0.010766983032226562, -0.008265495300292969, -0.005764007568359375, -0.0032625198364257812, -0.0007610321044921875, 0.0017404556274414062, 0.004241943359375, 0.006743431091308594, 0.009244918823242188, 0.011746406555175781, 0.014247894287109375, 0.01674938201904297, 0.019250869750976562, 0.021752357482910156, 0.02425384521484375, 0.026755332946777344, 0.029256820678710938, 0.03175830841064453, 0.034259796142578125, 0.03676128387451172, 0.03926277160644531, 0.041764259338378906, 0.0442657470703125, 0.046767234802246094, 0.04926872253417969, 0.05177021026611328, 0.054271697998046875, 0.05677318572998047, 0.05927467346191406, 0.061776161193847656, 0.06427764892578125, 0.06677913665771484, 0.06928062438964844, 0.07178211212158203, 0.07428359985351562, 0.07678508758544922, 0.07928657531738281, 0.0817880630493164, 0.08428955078125]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 9.0, 6.0, 14.0, 16.0, 28.0, 43.0, 56.0, 64.0, 91.0, 116.0, 109.0, 116.0, 112.0, 63.0, 58.0, 34.0, 26.0, 17.0, 10.0, 8.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.077392578125, -0.07548236846923828, -0.07357215881347656, -0.07166194915771484, -0.06975173950195312, -0.0678415298461914, -0.06593132019042969, -0.06402111053466797, -0.06211090087890625, -0.06020069122314453, -0.05829048156738281, -0.056380271911621094, -0.054470062255859375, -0.052559852600097656, -0.05064964294433594, -0.04873943328857422, -0.0468292236328125, -0.04491901397705078, -0.04300880432128906, -0.041098594665527344, -0.039188385009765625, -0.037278175354003906, -0.03536796569824219, -0.03345775604248047, -0.03154754638671875, -0.02963733673095703, -0.027727127075195312, -0.025816917419433594, -0.023906707763671875, -0.021996498107910156, -0.020086288452148438, -0.01817607879638672, -0.016265869140625, -0.014355659484863281, -0.012445449829101562, -0.010535240173339844, -0.008625030517578125, -0.006714820861816406, -0.0048046112060546875, -0.0028944015502929688, -0.00098419189453125, 0.0009260177612304688, 0.0028362274169921875, 0.004746437072753906, 0.006656646728515625, 0.008566856384277344, 0.010477066040039062, 0.012387275695800781, 0.0142974853515625, 0.01620769500732422, 0.018117904663085938, 0.020028114318847656, 0.021938323974609375, 0.023848533630371094, 0.025758743286132812, 0.02766895294189453, 0.02957916259765625, 0.03148937225341797, 0.03339958190917969, 0.035309791564941406, 0.037220001220703125, 0.039130210876464844, 0.04104042053222656, 0.04295063018798828, 0.04486083984375]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 19.0, 25.0, 89.0, 220.0, 354.0, 215.0, 51.0, 26.0, 8.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.457648754119873, -1.4097726345062256, -1.3618963956832886, -1.3140202760696411, -1.2661441564559937, -1.2182679176330566, -1.1703917980194092, -1.1225156784057617, -1.0746394395828247, -1.0267633199691772, -0.978887140750885, -0.9310109615325928, -0.8831347823143005, -0.8352586030960083, -0.7873824834823608, -0.7395063042640686, -0.6916301846504211, -0.6437540054321289, -0.5958778858184814, -0.5480017066001892, -0.500125527381897, -0.4522493779659271, -0.4043732285499573, -0.35649704933166504, -0.3086208999156952, -0.26074475049972534, -0.2128685712814331, -0.16499242186546326, -0.11711625754833221, -0.06924009323120117, -0.021363943815231323, 0.026512235403060913, 0.07438838481903076, 0.1222645491361618, 0.17014071345329285, 0.2180168628692627, 0.26589304208755493, 0.3137691915035248, 0.36164534091949463, 0.40952152013778687, 0.4573976695537567, 0.5052738189697266, 0.5531499981880188, 0.601026177406311, 0.6489022970199585, 0.6967784762382507, 0.744654655456543, 0.7925307750701904, 0.8404069542884827, 0.8882831335067749, 0.9361592531204224, 0.9840354323387146, 1.0319116115570068, 1.0797877311706543, 1.1276638507843018, 1.1755400896072388, 1.2234162092208862, 1.2712923288345337, 1.3191685676574707, 1.3670446872711182, 1.4149208068847656, 1.4627970457077026, 1.51067316532135, 1.558549404144287, 1.6064255237579346]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 3.0, 1.0, 8.0, 6.0, 13.0, 9.0, 18.0, 16.0, 19.0, 22.0, 26.0, 28.0, 25.0, 30.0, 32.0, 39.0, 36.0, 37.0, 38.0, 61.0, 52.0, 48.0, 38.0, 50.0, 29.0, 39.0, 33.0, 26.0, 35.0, 25.0, 22.0, 29.0, 14.0, 16.0, 22.0, 9.0, 8.0, 9.0, 5.0, 4.0, 6.0, 3.0, 9.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44726884365081787, -0.4306333065032959, -0.4139977693557739, -0.39736223220825195, -0.38072669506073, -0.364091157913208, -0.34745562076568604, -0.33082008361816406, -0.3141845464706421, -0.2975490093231201, -0.28091347217559814, -0.26427793502807617, -0.2476423978805542, -0.23100686073303223, -0.21437132358551025, -0.19773578643798828, -0.1811002492904663, -0.16446471214294434, -0.14782917499542236, -0.1311936378479004, -0.11455810070037842, -0.09792256355285645, -0.08128702640533447, -0.0646514892578125, -0.04801595211029053, -0.031380414962768555, -0.014744877815246582, 0.0018906593322753906, 0.018526196479797363, 0.035161733627319336, 0.05179727077484131, 0.06843280792236328, 0.08506834506988525, 0.10170388221740723, 0.1183394193649292, 0.13497495651245117, 0.15161049365997314, 0.16824603080749512, 0.1848815679550171, 0.20151710510253906, 0.21815264225006104, 0.234788179397583, 0.251423716545105, 0.26805925369262695, 0.2846947908401489, 0.3013303279876709, 0.31796586513519287, 0.33460140228271484, 0.3512369394302368, 0.3678724765777588, 0.38450801372528076, 0.40114355087280273, 0.4177790880203247, 0.4344146251678467, 0.45105016231536865, 0.4676856994628906, 0.4843212366104126, 0.5009567737579346, 0.5175923109054565, 0.5342278480529785, 0.5508633852005005, 0.5674989223480225, 0.5841344594955444, 0.6007699966430664, 0.6174055337905884]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 9.0, 35.0, 279.0, 95618.0, 4097979.0, 324.0, 36.0, 11.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2025146484375, -0.16275978088378906, -0.12300491333007812, -0.08325004577636719, -0.04349517822265625, -0.0037403106689453125, 0.036014556884765625, 0.07576942443847656, 0.1155242919921875, 0.15527915954589844, 0.19503402709960938, 0.2347888946533203, 0.27454376220703125, 0.3142986297607422, 0.3540534973144531, 0.39380836486816406, 0.433563232421875, 0.47331809997558594, 0.5130729675292969, 0.5528278350830078, 0.5925827026367188, 0.6323375701904297, 0.6720924377441406, 0.7118473052978516, 0.7516021728515625, 0.7913570404052734, 0.8311119079589844, 0.8708667755126953, 0.9106216430664062, 0.9503765106201172, 0.9901313781738281, 1.029886245727539, 1.06964111328125, 1.109395980834961, 1.1491508483886719, 1.1889057159423828, 1.2286605834960938, 1.2684154510498047, 1.3081703186035156, 1.3479251861572266, 1.3876800537109375, 1.4274349212646484, 1.4671897888183594, 1.5069446563720703, 1.5466995239257812, 1.5864543914794922, 1.6262092590332031, 1.665964126586914, 1.705718994140625, 1.745473861694336, 1.7852287292480469, 1.8249835968017578, 1.8647384643554688, 1.9044933319091797, 1.9442481994628906, 1.9840030670166016, 2.0237579345703125, 2.0635128021240234, 2.1032676696777344, 2.1430225372314453, 2.1827774047851562, 2.222532272338867, 2.262287139892578, 2.302042007446289, 2.341796875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 4.0, 5.0, 5.0, 10.0, 10.0, 11.0, 13.0, 18.0, 31.0, 39.0, 48.0, 58.0, 69.0, 63.0, 75.0, 80.0, 80.0, 63.0, 73.0, 67.0, 49.0, 29.0, 22.0, 18.0, 20.0, 22.0, 7.0, 10.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03167724609375, -0.03033161163330078, -0.028985977172851562, -0.027640342712402344, -0.026294708251953125, -0.024949073791503906, -0.023603439331054688, -0.02225780487060547, -0.02091217041015625, -0.01956653594970703, -0.018220901489257812, -0.016875267028808594, -0.015529632568359375, -0.014183998107910156, -0.012838363647460938, -0.011492729187011719, -0.0101470947265625, -0.008801460266113281, -0.0074558258056640625, -0.006110191345214844, -0.004764556884765625, -0.0034189224243164062, -0.0020732879638671875, -0.0007276535034179688, 0.00061798095703125, 0.0019636154174804688, 0.0033092498779296875, 0.004654884338378906, 0.006000518798828125, 0.007346153259277344, 0.008691787719726562, 0.010037422180175781, 0.011383056640625, 0.012728691101074219, 0.014074325561523438, 0.015419960021972656, 0.016765594482421875, 0.018111228942871094, 0.019456863403320312, 0.02080249786376953, 0.02214813232421875, 0.02349376678466797, 0.024839401245117188, 0.026185035705566406, 0.027530670166015625, 0.028876304626464844, 0.030221939086914062, 0.03156757354736328, 0.0329132080078125, 0.03425884246826172, 0.03560447692871094, 0.036950111389160156, 0.038295745849609375, 0.039641380310058594, 0.04098701477050781, 0.04233264923095703, 0.04367828369140625, 0.04502391815185547, 0.04636955261230469, 0.047715187072753906, 0.049060821533203125, 0.050406455993652344, 0.05175209045410156, 0.05309772491455078, 0.054443359375]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 3.0, 6.0, 9.0, 14.0, 23.0, 43.0, 50.0, 94.0, 174.0, 426.0, 1121.0, 4411.0, 30643.0, 1098781.0, 3001169.0, 48430.0, 6283.0, 1461.0, 575.0, 249.0, 123.0, 78.0, 49.0, 29.0, 8.0, 13.0, 6.0, 5.0, 1.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1591796875, -0.15436935424804688, -0.14955902099609375, -0.14474868774414062, -0.1399383544921875, -0.13512802124023438, -0.13031768798828125, -0.12550735473632812, -0.120697021484375, -0.11588668823242188, -0.11107635498046875, -0.10626602172851562, -0.1014556884765625, -0.09664535522460938, -0.09183502197265625, -0.08702468872070312, -0.08221435546875, -0.07740402221679688, -0.07259368896484375, -0.06778335571289062, -0.0629730224609375, -0.058162689208984375, -0.05335235595703125, -0.048542022705078125, -0.043731689453125, -0.038921356201171875, -0.03411102294921875, -0.029300689697265625, -0.0244903564453125, -0.019680023193359375, -0.01486968994140625, -0.010059356689453125, -0.0052490234375, -0.000438690185546875, 0.00437164306640625, 0.009181976318359375, 0.0139923095703125, 0.018802642822265625, 0.02361297607421875, 0.028423309326171875, 0.033233642578125, 0.038043975830078125, 0.04285430908203125, 0.047664642333984375, 0.0524749755859375, 0.057285308837890625, 0.06209564208984375, 0.06690597534179688, 0.07171630859375, 0.07652664184570312, 0.08133697509765625, 0.08614730834960938, 0.0909576416015625, 0.09576797485351562, 0.10057830810546875, 0.10538864135742188, 0.110198974609375, 0.11500930786132812, 0.11981964111328125, 0.12462997436523438, 0.1294403076171875, 0.13425064086914062, 0.13906097412109375, 0.14387130737304688, 0.148681640625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 12.0, 17.0, 25.0, 47.0, 84.0, 186.0, 579.0, 1816.0, 774.0, 288.0, 109.0, 53.0, 30.0, 18.0, 5.0, 8.0, 3.0, 5.0, 6.0, 4.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.060272216796875, -0.057820796966552734, -0.05536937713623047, -0.0529179573059082, -0.05046653747558594, -0.04801511764526367, -0.045563697814941406, -0.04311227798461914, -0.040660858154296875, -0.03820943832397461, -0.035758018493652344, -0.03330659866333008, -0.030855178833007812, -0.028403759002685547, -0.02595233917236328, -0.023500919342041016, -0.02104949951171875, -0.018598079681396484, -0.01614665985107422, -0.013695240020751953, -0.011243820190429688, -0.008792400360107422, -0.006340980529785156, -0.0038895606994628906, -0.001438140869140625, 0.0010132789611816406, 0.0034646987915039062, 0.005916118621826172, 0.008367538452148438, 0.010818958282470703, 0.013270378112792969, 0.015721797943115234, 0.0181732177734375, 0.020624637603759766, 0.02307605743408203, 0.025527477264404297, 0.027978897094726562, 0.030430316925048828, 0.032881736755371094, 0.03533315658569336, 0.037784576416015625, 0.04023599624633789, 0.042687416076660156, 0.04513883590698242, 0.04759025573730469, 0.05004167556762695, 0.05249309539794922, 0.054944515228271484, 0.05739593505859375, 0.059847354888916016, 0.06229877471923828, 0.06475019454956055, 0.06720161437988281, 0.06965303421020508, 0.07210445404052734, 0.07455587387084961, 0.07700729370117188, 0.07945871353149414, 0.0819101333618164, 0.08436155319213867, 0.08681297302246094, 0.0892643928527832, 0.09171581268310547, 0.09416723251342773, 0.09661865234375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 23.0, 312.0, 565.0, 84.0, 12.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9110252857208252, -1.8704955577850342, -1.8299659490585327, -1.7894362211227417, -1.7489064931869507, -1.7083768844604492, -1.6678471565246582, -1.6273174285888672, -1.5867877006530762, -1.5462579727172852, -1.5057283639907837, -1.4651986360549927, -1.4246689081192017, -1.3841392993927002, -1.3436095714569092, -1.3030798435211182, -1.2625502347946167, -1.2220205068588257, -1.1814908981323242, -1.1409611701965332, -1.1004314422607422, -1.0599017143249512, -1.0193721055984497, -0.9788423776626587, -0.9383127093315125, -0.8977830410003662, -0.8572533130645752, -0.816723644733429, -0.7761939764022827, -0.7356642484664917, -0.6951345801353455, -0.6546049118041992, -0.6140751838684082, -0.573545515537262, -0.533015787601471, -0.4924861192703247, -0.4519564211368561, -0.41142672300338745, -0.3708970546722412, -0.3303673565387726, -0.28983765840530396, -0.24930796027183533, -0.2087782770395279, -0.16824859380722046, -0.12771889567375183, -0.0871891975402832, -0.04665951430797577, -0.006129831075668335, 0.03439986705780029, 0.07492955774068832, 0.11545924842357635, 0.1559889316558838, 0.19651862978935242, 0.23704832792282104, 0.2775779962539673, 0.3181076943874359, 0.35863739252090454, 0.39916709065437317, 0.4396967887878418, 0.48022645711898804, 0.5207561254501343, 0.5612858533859253, 0.6018155217170715, 0.6423451900482178, 0.6828749179840088]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 3.0, 7.0, 15.0, 19.0, 26.0, 21.0, 34.0, 50.0, 51.0, 59.0, 60.0, 70.0, 64.0, 79.0, 80.0, 64.0, 80.0, 49.0, 38.0, 52.0, 21.0, 23.0, 13.0, 8.0, 6.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18119663000106812, -0.17265945672988892, -0.16412228345870972, -0.15558511018753052, -0.1470479518175125, -0.1385107785463333, -0.1299736052751541, -0.12143643200397491, -0.11289926618337631, -0.10436209291219711, -0.09582492709159851, -0.08728775382041931, -0.07875058054924011, -0.07021341472864151, -0.06167624145746231, -0.05313907191157341, -0.04460190236568451, -0.03606473281979561, -0.02752756141126156, -0.01899039000272751, -0.010453220456838608, -0.001916050910949707, 0.006621122360229492, 0.015158291906118393, 0.023695461452007294, 0.032232630997896194, 0.040769800543785095, 0.049306973814964294, 0.057844143360853195, 0.0663813129067421, 0.0749184861779213, 0.0834556519985199, 0.0919928252696991, 0.1005299985408783, 0.1090671643614769, 0.1176043376326561, 0.1261415034532547, 0.1346786767244339, 0.1432158499956131, 0.1517530232667923, 0.1602901816368103, 0.1688273549079895, 0.1773645281791687, 0.1859017014503479, 0.1944388598203659, 0.2029760330915451, 0.2115132063627243, 0.2200503796339035, 0.2285875529050827, 0.2371247261762619, 0.2456618994474411, 0.2541990578174591, 0.2627362310886383, 0.2712734043598175, 0.2798105776309967, 0.2883477509021759, 0.2968849241733551, 0.3054220974445343, 0.3139592707157135, 0.3224964439868927, 0.3310336172580719, 0.3395707607269287, 0.3481079339981079, 0.3566451072692871, 0.3651822805404663]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 3.0, 5.0, 16.0, 22.0, 24.0, 44.0, 76.0, 128.0, 247.0, 639.0, 1872.0, 8000.0, 64946.0, 714664.0, 233917.0, 18529.0, 3534.0, 1049.0, 393.0, 191.0, 94.0, 52.0, 30.0, 26.0, 12.0, 10.0, 9.0, 8.0, 2.0, 2.0, 4.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.189453125, -0.18236541748046875, -0.1752777099609375, -0.16819000244140625, -0.161102294921875, -0.15401458740234375, -0.1469268798828125, -0.13983917236328125, -0.13275146484375, -0.12566375732421875, -0.1185760498046875, -0.11148834228515625, -0.104400634765625, -0.09731292724609375, -0.0902252197265625, -0.08313751220703125, -0.0760498046875, -0.06896209716796875, -0.0618743896484375, -0.05478668212890625, -0.047698974609375, -0.04061126708984375, -0.0335235595703125, -0.02643585205078125, -0.01934814453125, -0.01226043701171875, -0.0051727294921875, 0.00191497802734375, 0.009002685546875, 0.01609039306640625, 0.0231781005859375, 0.03026580810546875, 0.037353515625, 0.04444122314453125, 0.0515289306640625, 0.05861663818359375, 0.065704345703125, 0.07279205322265625, 0.0798797607421875, 0.08696746826171875, 0.09405517578125, 0.10114288330078125, 0.1082305908203125, 0.11531829833984375, 0.122406005859375, 0.12949371337890625, 0.1365814208984375, 0.14366912841796875, 0.1507568359375, 0.15784454345703125, 0.1649322509765625, 0.17201995849609375, 0.179107666015625, 0.18619537353515625, 0.1932830810546875, 0.20037078857421875, 0.20745849609375, 0.21454620361328125, 0.2216339111328125, 0.22872161865234375, 0.235809326171875, 0.24289703369140625, 0.2499847412109375, 0.25707244873046875, 0.26416015625]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 8.0, 8.0, 8.0, 26.0, 15.0, 28.0, 44.0, 39.0, 70.0, 58.0, 69.0, 80.0, 80.0, 82.0, 82.0, 64.0, 51.0, 45.0, 39.0, 24.0, 24.0, 16.0, 15.0, 9.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035552978515625, -0.03415870666503906, -0.032764434814453125, -0.03137016296386719, -0.02997589111328125, -0.028581619262695312, -0.027187347412109375, -0.025793075561523438, -0.0243988037109375, -0.023004531860351562, -0.021610260009765625, -0.020215988159179688, -0.01882171630859375, -0.017427444458007812, -0.016033172607421875, -0.014638900756835938, -0.01324462890625, -0.011850357055664062, -0.010456085205078125, -0.009061813354492188, -0.00766754150390625, -0.0062732696533203125, -0.004878997802734375, -0.0034847259521484375, -0.0020904541015625, -0.0006961822509765625, 0.000698089599609375, 0.0020923614501953125, 0.00348663330078125, 0.0048809051513671875, 0.006275177001953125, 0.0076694488525390625, 0.009063720703125, 0.010457992553710938, 0.011852264404296875, 0.013246536254882812, 0.01464080810546875, 0.016035079956054688, 0.017429351806640625, 0.018823623657226562, 0.0202178955078125, 0.021612167358398438, 0.023006439208984375, 0.024400711059570312, 0.02579498291015625, 0.027189254760742188, 0.028583526611328125, 0.029977798461914062, 0.0313720703125, 0.03276634216308594, 0.034160614013671875, 0.03555488586425781, 0.03694915771484375, 0.03834342956542969, 0.039737701416015625, 0.04113197326660156, 0.0425262451171875, 0.04392051696777344, 0.045314788818359375, 0.04670906066894531, 0.04810333251953125, 0.04949760437011719, 0.050891876220703125, 0.05228614807128906, 0.053680419921875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 6.0, 6.0, 11.0, 11.0, 12.0, 19.0, 27.0, 43.0, 57.0, 91.0, 149.0, 234.0, 466.0, 1022.0, 2931.0, 10680.0, 59474.0, 384709.0, 483494.0, 84727.0, 14373.0, 3575.0, 1168.0, 528.0, 248.0, 152.0, 100.0, 62.0, 40.0, 29.0, 33.0, 21.0, 11.0, 12.0, 10.0, 6.0, 8.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.12005615234375, -0.1161947250366211, -0.11233329772949219, -0.10847187042236328, -0.10461044311523438, -0.10074901580810547, -0.09688758850097656, -0.09302616119384766, -0.08916473388671875, -0.08530330657958984, -0.08144187927246094, -0.07758045196533203, -0.07371902465820312, -0.06985759735107422, -0.06599617004394531, -0.062134742736816406, -0.0582733154296875, -0.054411888122558594, -0.05055046081542969, -0.04668903350830078, -0.042827606201171875, -0.03896617889404297, -0.03510475158691406, -0.031243324279785156, -0.02738189697265625, -0.023520469665527344, -0.019659042358398438, -0.01579761505126953, -0.011936187744140625, -0.008074760437011719, -0.0042133331298828125, -0.00035190582275390625, 0.003509521484375, 0.007370948791503906, 0.011232376098632812, 0.015093803405761719, 0.018955230712890625, 0.02281665802001953, 0.026678085327148438, 0.030539512634277344, 0.03440093994140625, 0.038262367248535156, 0.04212379455566406, 0.04598522186279297, 0.049846649169921875, 0.05370807647705078, 0.05756950378417969, 0.061430931091308594, 0.0652923583984375, 0.0691537857055664, 0.07301521301269531, 0.07687664031982422, 0.08073806762695312, 0.08459949493408203, 0.08846092224121094, 0.09232234954833984, 0.09618377685546875, 0.10004520416259766, 0.10390663146972656, 0.10776805877685547, 0.11162948608398438, 0.11549091339111328, 0.11935234069824219, 0.1232137680053711, 0.1270751953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 7.0, 5.0, 3.0, 8.0, 4.0, 15.0, 8.0, 11.0, 17.0, 25.0, 34.0, 32.0, 28.0, 42.0, 42.0, 32.0, 41.0, 47.0, 59.0, 37.0, 49.0, 57.0, 50.0, 34.0, 41.0, 35.0, 44.0, 26.0, 22.0, 24.0, 22.0, 16.0, 15.0, 11.0, 19.0, 13.0, 10.0, 5.0, 7.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1094970703125, -0.10598182678222656, -0.10246658325195312, -0.09895133972167969, -0.09543609619140625, -0.09192085266113281, -0.08840560913085938, -0.08489036560058594, -0.0813751220703125, -0.07785987854003906, -0.07434463500976562, -0.07082939147949219, -0.06731414794921875, -0.06379890441894531, -0.060283660888671875, -0.05676841735839844, -0.053253173828125, -0.04973793029785156, -0.046222686767578125, -0.04270744323730469, -0.03919219970703125, -0.03567695617675781, -0.032161712646484375, -0.028646469116210938, -0.0251312255859375, -0.021615982055664062, -0.018100738525390625, -0.014585494995117188, -0.01107025146484375, -0.0075550079345703125, -0.004039764404296875, -0.0005245208740234375, 0.00299072265625, 0.0065059661865234375, 0.010021209716796875, 0.013536453247070312, 0.01705169677734375, 0.020566940307617188, 0.024082183837890625, 0.027597427368164062, 0.0311126708984375, 0.03462791442871094, 0.038143157958984375, 0.04165840148925781, 0.04517364501953125, 0.04868888854980469, 0.052204132080078125, 0.05571937561035156, 0.059234619140625, 0.06274986267089844, 0.06626510620117188, 0.06978034973144531, 0.07329559326171875, 0.07681083679199219, 0.08032608032226562, 0.08384132385253906, 0.0873565673828125, 0.09087181091308594, 0.09438705444335938, 0.09790229797363281, 0.10141754150390625, 0.10493278503417969, 0.10844802856445312, 0.11196327209472656, 0.115478515625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 11.0, 25.0, 41.0, 85.0, 174.0, 380.0, 817.0, 2181.0, 13170.0, 487659.0, 526003.0, 14274.0, 2218.0, 795.0, 338.0, 168.0, 96.0, 50.0, 23.0, 24.0, 10.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07147216796875, -0.0690908432006836, -0.06670951843261719, -0.06432819366455078, -0.061946868896484375, -0.05956554412841797, -0.05718421936035156, -0.054802894592285156, -0.05242156982421875, -0.050040245056152344, -0.04765892028808594, -0.04527759552001953, -0.042896270751953125, -0.04051494598388672, -0.03813362121582031, -0.035752296447753906, -0.0333709716796875, -0.030989646911621094, -0.028608322143554688, -0.02622699737548828, -0.023845672607421875, -0.02146434783935547, -0.019083023071289062, -0.016701698303222656, -0.01432037353515625, -0.011939048767089844, -0.009557723999023438, -0.007176399230957031, -0.004795074462890625, -0.0024137496948242188, -3.24249267578125e-05, 0.0023488998413085938, 0.004730224609375, 0.007111549377441406, 0.009492874145507812, 0.011874198913574219, 0.014255523681640625, 0.01663684844970703, 0.019018173217773438, 0.021399497985839844, 0.02378082275390625, 0.026162147521972656, 0.028543472290039062, 0.03092479705810547, 0.033306121826171875, 0.03568744659423828, 0.03806877136230469, 0.040450096130371094, 0.0428314208984375, 0.045212745666503906, 0.04759407043457031, 0.04997539520263672, 0.052356719970703125, 0.05473804473876953, 0.05711936950683594, 0.059500694274902344, 0.06188201904296875, 0.06426334381103516, 0.06664466857910156, 0.06902599334716797, 0.07140731811523438, 0.07378864288330078, 0.07616996765136719, 0.0785512924194336, 0.0809326171875]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 7.0, 5.0, 11.0, 19.0, 40.0, 48.0, 67.0, 94.0, 115.0, 116.0, 122.0, 112.0, 88.0, 69.0, 39.0, 16.0, 21.0, 13.0, 4.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2934207916259766e-05, -1.2516044080257416e-05, -1.2097880244255066e-05, -1.1679716408252716e-05, -1.1261552572250366e-05, -1.0843388736248016e-05, -1.0425224900245667e-05, -1.0007061064243317e-05, -9.588897228240967e-06, -9.170733392238617e-06, -8.752569556236267e-06, -8.334405720233917e-06, -7.916241884231567e-06, -7.4980780482292175e-06, -7.079914212226868e-06, -6.661750376224518e-06, -6.243586540222168e-06, -5.825422704219818e-06, -5.407258868217468e-06, -4.989095032215118e-06, -4.5709311962127686e-06, -4.152767360210419e-06, -3.734603524208069e-06, -3.316439688205719e-06, -2.898275852203369e-06, -2.4801120162010193e-06, -2.0619481801986694e-06, -1.6437843441963196e-06, -1.2256205081939697e-06, -8.074566721916199e-07, -3.8929283618927e-07, 2.8870999813079834e-08, 4.470348358154297e-07, 8.651986718177795e-07, 1.2833625078201294e-06, 1.7015263438224792e-06, 2.119690179824829e-06, 2.537854015827179e-06, 2.956017851829529e-06, 3.3741816878318787e-06, 3.7923455238342285e-06, 4.210509359836578e-06, 4.628673195838928e-06, 5.046837031841278e-06, 5.465000867843628e-06, 5.883164703845978e-06, 6.301328539848328e-06, 6.7194923758506775e-06, 7.137656211853027e-06, 7.555820047855377e-06, 7.973983883857727e-06, 8.392147719860077e-06, 8.810311555862427e-06, 9.228475391864777e-06, 9.646639227867126e-06, 1.0064803063869476e-05, 1.0482966899871826e-05, 1.0901130735874176e-05, 1.1319294571876526e-05, 1.1737458407878876e-05, 1.2155622243881226e-05, 1.2573786079883575e-05, 1.2991949915885925e-05, 1.3410113751888275e-05, 1.3828277587890625e-05]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 9.0, 4.0, 10.0, 13.0, 31.0, 37.0, 60.0, 130.0, 315.0, 1109.0, 8549.0, 699311.0, 332456.0, 5123.0, 836.0, 299.0, 131.0, 62.0, 38.0, 11.0, 9.0, 11.0, 5.0, 8.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1268310546875, -0.12357139587402344, -0.12031173706054688, -0.11705207824707031, -0.11379241943359375, -0.11053276062011719, -0.10727310180664062, -0.10401344299316406, -0.1007537841796875, -0.09749412536621094, -0.09423446655273438, -0.09097480773925781, -0.08771514892578125, -0.08445549011230469, -0.08119583129882812, -0.07793617248535156, -0.074676513671875, -0.07141685485839844, -0.06815719604492188, -0.06489753723144531, -0.06163787841796875, -0.05837821960449219, -0.055118560791015625, -0.05185890197753906, -0.0485992431640625, -0.04533958435058594, -0.042079925537109375, -0.03882026672363281, -0.03556060791015625, -0.03230094909667969, -0.029041290283203125, -0.025781631469726562, -0.02252197265625, -0.019262313842773438, -0.016002655029296875, -0.012742996215820312, -0.00948333740234375, -0.0062236785888671875, -0.002964019775390625, 0.0002956390380859375, 0.0035552978515625, 0.0068149566650390625, 0.010074615478515625, 0.013334274291992188, 0.01659393310546875, 0.019853591918945312, 0.023113250732421875, 0.026372909545898438, 0.029632568359375, 0.03289222717285156, 0.036151885986328125, 0.03941154479980469, 0.04267120361328125, 0.04593086242675781, 0.049190521240234375, 0.05245018005371094, 0.0557098388671875, 0.05896949768066406, 0.062229156494140625, 0.06548881530761719, 0.06874847412109375, 0.07200813293457031, 0.07526779174804688, 0.07852745056152344, 0.081787109375]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 1.0, 1.0, 5.0, 4.0, 4.0, 2.0, 6.0, 5.0, 11.0, 5.0, 13.0, 16.0, 21.0, 23.0, 37.0, 51.0, 73.0, 71.0, 71.0, 87.0, 81.0, 78.0, 68.0, 48.0, 48.0, 48.0, 32.0, 20.0, 14.0, 13.0, 7.0, 9.0, 3.0, 5.0, 6.0, 3.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.034576416015625, -0.03337526321411133, -0.032174110412597656, -0.030972957611083984, -0.029771804809570312, -0.02857065200805664, -0.02736949920654297, -0.026168346405029297, -0.024967193603515625, -0.023766040802001953, -0.02256488800048828, -0.02136373519897461, -0.020162582397460938, -0.018961429595947266, -0.017760276794433594, -0.016559123992919922, -0.01535797119140625, -0.014156818389892578, -0.012955665588378906, -0.011754512786865234, -0.010553359985351562, -0.00935220718383789, -0.008151054382324219, -0.006949901580810547, -0.005748748779296875, -0.004547595977783203, -0.0033464431762695312, -0.0021452903747558594, -0.0009441375732421875, 0.0002570152282714844, 0.0014581680297851562, 0.002659320831298828, 0.0038604736328125, 0.005061626434326172, 0.006262779235839844, 0.007463932037353516, 0.008665084838867188, 0.00986623764038086, 0.011067390441894531, 0.012268543243408203, 0.013469696044921875, 0.014670848846435547, 0.01587200164794922, 0.01707315444946289, 0.018274307250976562, 0.019475460052490234, 0.020676612854003906, 0.021877765655517578, 0.02307891845703125, 0.024280071258544922, 0.025481224060058594, 0.026682376861572266, 0.027883529663085938, 0.02908468246459961, 0.03028583526611328, 0.03148698806762695, 0.032688140869140625, 0.0338892936706543, 0.03509044647216797, 0.03629159927368164, 0.03749275207519531, 0.038693904876708984, 0.039895057678222656, 0.04109621047973633, 0.04229736328125]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 24.0, 131.0, 539.0, 263.0, 40.0, 9.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4021776914596558, -1.3266102075576782, -1.2510428428649902, -1.1754753589630127, -1.0999078750610352, -1.0243403911590576, -0.9487730264663696, -0.8732055425643921, -0.7976381182670593, -0.7220706939697266, -0.646503210067749, -0.5709357857704163, -0.4953683316707611, -0.41980087757110596, -0.3442334532737732, -0.26866596937179565, -0.1930985450744629, -0.11753109842538834, -0.04196365177631378, 0.033603787422180176, 0.10917124152183533, 0.18473869562149048, 0.26030611991882324, 0.3358736038208008, 0.41144102811813354, 0.4870084822177887, 0.5625759363174438, 0.6381433606147766, 0.7137107849121094, 0.7892782688140869, 0.8648456931114197, 0.9404131770133972, 1.0159804821014404, 1.091547966003418, 1.167115330696106, 1.2426828145980835, 1.318250298500061, 1.393817663192749, 1.4693851470947266, 1.544952630996704, 1.6205201148986816, 1.6960875988006592, 1.7716549634933472, 1.8472224473953247, 1.9227899312973022, 1.9983572959899902, 2.0739247798919678, 2.1494922637939453, 2.2250595092773438, 2.3006269931793213, 2.376194477081299, 2.4517617225646973, 2.527329206466675, 2.6028966903686523, 2.67846417427063, 2.7540316581726074, 2.829599142074585, 2.9051666259765625, 2.98073410987854, 3.0563015937805176, 3.131868839263916, 3.2074363231658936, 3.283003807067871, 3.3585712909698486, 3.434138774871826]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 6.0, 8.0, 7.0, 8.0, 9.0, 12.0, 18.0, 20.0, 18.0, 27.0, 27.0, 27.0, 32.0, 38.0, 42.0, 55.0, 26.0, 40.0, 60.0, 39.0, 36.0, 47.0, 40.0, 34.0, 40.0, 34.0, 33.0, 37.0, 32.0, 27.0, 20.0, 20.0, 20.0, 8.0, 13.0, 5.0, 13.0, 4.0, 4.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4833560585975647, -0.46654993295669556, -0.4497438371181488, -0.43293771147727966, -0.4161316156387329, -0.39932548999786377, -0.38251936435699463, -0.3657132387161255, -0.34890714287757874, -0.3321010172367096, -0.31529492139816284, -0.2984887957572937, -0.28168267011642456, -0.2648765742778778, -0.24807044863700867, -0.23126433789730072, -0.21445822715759277, -0.19765211641788483, -0.18084600567817688, -0.16403988003730774, -0.1472337692975998, -0.13042765855789185, -0.1136215403676033, -0.09681542217731476, -0.08000931143760681, -0.06320320069789886, -0.04639708250761032, -0.029590968042612076, -0.01278485357761383, 0.004021257162094116, 0.02082737535238266, 0.037633493542671204, 0.054439663887023926, 0.07124577462673187, 0.08805189281702042, 0.10485801100730896, 0.1216641217470169, 0.13847023248672485, 0.155276358127594, 0.17208246886730194, 0.1888885796070099, 0.20569469034671783, 0.22250080108642578, 0.23930692672729492, 0.25611305236816406, 0.2729191482067108, 0.28972527384757996, 0.3065313696861267, 0.32333749532699585, 0.340143620967865, 0.35694971680641174, 0.3737558424472809, 0.39056193828582764, 0.4073680639266968, 0.4241741895675659, 0.44098031520843506, 0.4577864110469818, 0.47459253668785095, 0.4913986325263977, 0.5082047581672668, 0.525010883808136, 0.5418169498443604, 0.5586230754852295, 0.5754292011260986, 0.5922353267669678]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 2.0, 5.0, 4.0, 6.0, 7.0, 15.0, 26.0, 29.0, 45.0, 64.0, 91.0, 129.0, 199.0, 355.0, 603.0, 1048.0, 2331.0, 5936.0, 20278.0, 129371.0, 3495508.0, 478344.0, 43069.0, 9867.0, 3459.0, 1515.0, 826.0, 408.0, 262.0, 149.0, 104.0, 70.0, 45.0, 39.0, 27.0, 12.0, 10.0, 4.0, 5.0, 7.0, 6.0, 2.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1064453125, -0.10319328308105469, -0.09994125366210938, -0.09668922424316406, -0.09343719482421875, -0.09018516540527344, -0.08693313598632812, -0.08368110656738281, -0.0804290771484375, -0.07717704772949219, -0.07392501831054688, -0.07067298889160156, -0.06742095947265625, -0.06416893005371094, -0.060916900634765625, -0.05766487121582031, -0.054412841796875, -0.05116081237792969, -0.047908782958984375, -0.04465675354003906, -0.04140472412109375, -0.03815269470214844, -0.034900665283203125, -0.03164863586425781, -0.0283966064453125, -0.025144577026367188, -0.021892547607421875, -0.018640518188476562, -0.01538848876953125, -0.012136459350585938, -0.008884429931640625, -0.0056324005126953125, -0.00238037109375, 0.0008716583251953125, 0.004123687744140625, 0.0073757171630859375, 0.01062774658203125, 0.013879776000976562, 0.017131805419921875, 0.020383834838867188, 0.0236358642578125, 0.026887893676757812, 0.030139923095703125, 0.03339195251464844, 0.03664398193359375, 0.03989601135253906, 0.043148040771484375, 0.04640007019042969, 0.049652099609375, 0.05290412902832031, 0.056156158447265625, 0.05940818786621094, 0.06266021728515625, 0.06591224670410156, 0.06916427612304688, 0.07241630554199219, 0.0756683349609375, 0.07892036437988281, 0.08217239379882812, 0.08542442321777344, 0.08867645263671875, 0.09192848205566406, 0.09518051147460938, 0.09843254089355469, 0.1016845703125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 8.0, 7.0, 7.0, 12.0, 20.0, 34.0, 32.0, 45.0, 52.0, 54.0, 62.0, 80.0, 69.0, 99.0, 81.0, 63.0, 57.0, 50.0, 33.0, 34.0, 38.0, 22.0, 14.0, 10.0, 6.0, 6.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.037322998046875, -0.03589296340942383, -0.034462928771972656, -0.033032894134521484, -0.03160285949707031, -0.03017282485961914, -0.02874279022216797, -0.027312755584716797, -0.025882720947265625, -0.024452686309814453, -0.02302265167236328, -0.02159261703491211, -0.020162582397460938, -0.018732547760009766, -0.017302513122558594, -0.015872478485107422, -0.01444244384765625, -0.013012409210205078, -0.011582374572753906, -0.010152339935302734, -0.008722305297851562, -0.007292270660400391, -0.005862236022949219, -0.004432201385498047, -0.003002166748046875, -0.0015721321105957031, -0.00014209747314453125, 0.0012879371643066406, 0.0027179718017578125, 0.004148006439208984, 0.005578041076660156, 0.007008075714111328, 0.0084381103515625, 0.009868144989013672, 0.011298179626464844, 0.012728214263916016, 0.014158248901367188, 0.01558828353881836, 0.01701831817626953, 0.018448352813720703, 0.019878387451171875, 0.021308422088623047, 0.02273845672607422, 0.02416849136352539, 0.025598526000976562, 0.027028560638427734, 0.028458595275878906, 0.029888629913330078, 0.03131866455078125, 0.03274869918823242, 0.034178733825683594, 0.035608768463134766, 0.03703880310058594, 0.03846883773803711, 0.03989887237548828, 0.04132890701293945, 0.042758941650390625, 0.0441889762878418, 0.04561901092529297, 0.04704904556274414, 0.04847908020019531, 0.049909114837646484, 0.051339149475097656, 0.05276918411254883, 0.05419921875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 12.0, 7.0, 10.0, 20.0, 36.0, 40.0, 78.0, 101.0, 212.0, 412.0, 855.0, 2107.0, 7356.0, 44187.0, 1939567.0, 2142648.0, 45150.0, 7291.0, 2194.0, 927.0, 391.0, 267.0, 126.0, 95.0, 67.0, 45.0, 22.0, 16.0, 5.0, 18.0, 7.0, 2.0, 5.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.154296875, -0.14975929260253906, -0.14522171020507812, -0.1406841278076172, -0.13614654541015625, -0.1316089630126953, -0.12707138061523438, -0.12253379821777344, -0.1179962158203125, -0.11345863342285156, -0.10892105102539062, -0.10438346862792969, -0.09984588623046875, -0.09530830383300781, -0.09077072143554688, -0.08623313903808594, -0.081695556640625, -0.07715797424316406, -0.07262039184570312, -0.06808280944824219, -0.06354522705078125, -0.05900764465332031, -0.054470062255859375, -0.04993247985839844, -0.0453948974609375, -0.04085731506347656, -0.036319732666015625, -0.03178215026855469, -0.02724456787109375, -0.022706985473632812, -0.018169403076171875, -0.013631820678710938, -0.00909423828125, -0.0045566558837890625, -1.9073486328125e-05, 0.0045185089111328125, 0.00905609130859375, 0.013593673706054688, 0.018131256103515625, 0.022668838500976562, 0.0272064208984375, 0.03174400329589844, 0.036281585693359375, 0.04081916809082031, 0.04535675048828125, 0.04989433288574219, 0.054431915283203125, 0.05896949768066406, 0.063507080078125, 0.06804466247558594, 0.07258224487304688, 0.07711982727050781, 0.08165740966796875, 0.08619499206542969, 0.09073257446289062, 0.09527015686035156, 0.0998077392578125, 0.10434532165527344, 0.10888290405273438, 0.11342048645019531, 0.11795806884765625, 0.12249565124511719, 0.12703323364257812, 0.13157081604003906, 0.1361083984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 7.0, 3.0, 9.0, 14.0, 31.0, 46.0, 121.0, 303.0, 1415.0, 1560.0, 334.0, 112.0, 68.0, 16.0, 12.0, 13.0, 3.0, 5.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0496826171875, -0.04732036590576172, -0.04495811462402344, -0.042595863342285156, -0.040233612060546875, -0.037871360778808594, -0.03550910949707031, -0.03314685821533203, -0.03078460693359375, -0.02842235565185547, -0.026060104370117188, -0.023697853088378906, -0.021335601806640625, -0.018973350524902344, -0.016611099243164062, -0.014248847961425781, -0.0118865966796875, -0.009524345397949219, -0.0071620941162109375, -0.004799842834472656, -0.002437591552734375, -7.534027099609375e-05, 0.0022869110107421875, 0.004649162292480469, 0.00701141357421875, 0.009373664855957031, 0.011735916137695312, 0.014098167419433594, 0.016460418701171875, 0.018822669982910156, 0.021184921264648438, 0.02354717254638672, 0.025909423828125, 0.02827167510986328, 0.030633926391601562, 0.032996177673339844, 0.035358428955078125, 0.037720680236816406, 0.04008293151855469, 0.04244518280029297, 0.04480743408203125, 0.04716968536376953, 0.04953193664550781, 0.051894187927246094, 0.054256439208984375, 0.056618690490722656, 0.05898094177246094, 0.06134319305419922, 0.0637054443359375, 0.06606769561767578, 0.06842994689941406, 0.07079219818115234, 0.07315444946289062, 0.0755167007446289, 0.07787895202636719, 0.08024120330810547, 0.08260345458984375, 0.08496570587158203, 0.08732795715332031, 0.0896902084350586, 0.09205245971679688, 0.09441471099853516, 0.09677696228027344, 0.09913921356201172, 0.10150146484375]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 4.0, 12.0, 29.0, 47.0, 132.0, 226.0, 238.0, 161.0, 83.0, 35.0, 12.0, 5.0, 6.0, 5.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12455452978610992, -0.11257180571556091, -0.1005890816450119, -0.08860635757446289, -0.07662363350391388, -0.06464090943336487, -0.052658192813396454, -0.04067546874284744, -0.02869274467229843, -0.01671002060174942, -0.004727298393845558, 0.007255423814058304, 0.019238147884607315, 0.031220871955156326, 0.04320359230041504, 0.05518631637096405, 0.06716904044151306, 0.07915176451206207, 0.09113448858261108, 0.1031172126531601, 0.1150999367237091, 0.12708266079425812, 0.13906538486480713, 0.15104809403419495, 0.16303083300590515, 0.17501355707645416, 0.18699628114700317, 0.19897900521755219, 0.2109617292881012, 0.2229444533586502, 0.23492717742919922, 0.24690988659858704, 0.25889262557029724, 0.27087533473968506, 0.28285807371139526, 0.2948407828807831, 0.3068235218524933, 0.3188062310218811, 0.3307889699935913, 0.3427716791629791, 0.35475441813468933, 0.36673712730407715, 0.37871986627578735, 0.39070257544517517, 0.4026853144168854, 0.4146680235862732, 0.4266507625579834, 0.4386334717273712, 0.45061618089675903, 0.46259889006614685, 0.47458162903785706, 0.4865643382072449, 0.4985470771789551, 0.5105298161506653, 0.5225124955177307, 0.5344952344894409, 0.5464779734611511, 0.5584607124328613, 0.5704433917999268, 0.582426130771637, 0.5944088697433472, 0.6063916087150574, 0.6183742880821228, 0.630357027053833, 0.6423397660255432]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 3.0, 5.0, 3.0, 8.0, 11.0, 15.0, 19.0, 31.0, 34.0, 41.0, 55.0, 61.0, 53.0, 73.0, 62.0, 64.0, 75.0, 56.0, 72.0, 63.0, 53.0, 36.0, 31.0, 21.0, 16.0, 16.0, 9.0, 10.0, 2.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.18634295463562012, -0.1795329749584198, -0.1727229803800583, -0.16591300070285797, -0.15910302102565765, -0.15229302644729614, -0.14548304677009583, -0.1386730670928955, -0.1318630874156952, -0.12505310773849487, -0.11824312061071396, -0.11143313348293304, -0.10462315380573273, -0.09781316667795181, -0.0910031795501709, -0.08419319987297058, -0.07738320529460907, -0.07057321816682816, -0.06376323848962784, -0.056953251361846924, -0.05014326795935631, -0.04333328455686569, -0.03652329742908478, -0.029713314026594162, -0.022903330624103546, -0.01609334722161293, -0.009283361956477165, -0.0024733766913414, 0.004336606711149216, 0.011146590113639832, 0.017956577241420746, 0.02476656064391136, 0.03157654404640198, 0.03838652744889259, 0.04519651085138321, 0.052006497979164124, 0.05881648138165474, 0.06562646478414536, 0.07243645191192627, 0.07924643158912659, 0.0860564187169075, 0.09286640584468842, 0.09967638552188873, 0.10648637264966965, 0.11329635977745056, 0.12010633945465088, 0.1269163191318512, 0.1337263137102127, 0.14053629338741302, 0.14734627306461334, 0.15415626764297485, 0.16096624732017517, 0.1677762269973755, 0.1745862066745758, 0.18139620125293732, 0.18820618093013763, 0.19501617550849915, 0.20182615518569946, 0.20863614976406097, 0.2154461294412613, 0.2222561091184616, 0.22906610369682312, 0.23587608337402344, 0.24268606305122375, 0.24949604272842407]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 1.0, 6.0, 8.0, 12.0, 13.0, 20.0, 25.0, 61.0, 79.0, 148.0, 251.0, 541.0, 1273.0, 4073.0, 18807.0, 139879.0, 650646.0, 199740.0, 25017.0, 5081.0, 1567.0, 597.0, 284.0, 152.0, 106.0, 56.0, 37.0, 34.0, 12.0, 11.0, 6.0, 5.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.177490234375, -0.17235755920410156, -0.16722488403320312, -0.1620922088623047, -0.15695953369140625, -0.1518268585205078, -0.14669418334960938, -0.14156150817871094, -0.1364288330078125, -0.13129615783691406, -0.12616348266601562, -0.12103080749511719, -0.11589813232421875, -0.11076545715332031, -0.10563278198242188, -0.10050010681152344, -0.095367431640625, -0.09023475646972656, -0.08510208129882812, -0.07996940612792969, -0.07483673095703125, -0.06970405578613281, -0.06457138061523438, -0.05943870544433594, -0.0543060302734375, -0.04917335510253906, -0.044040679931640625, -0.03890800476074219, -0.03377532958984375, -0.028642654418945312, -0.023509979248046875, -0.018377304077148438, -0.01324462890625, -0.008111953735351562, -0.002979278564453125, 0.0021533966064453125, 0.00728607177734375, 0.012418746948242188, 0.017551422119140625, 0.022684097290039062, 0.0278167724609375, 0.03294944763183594, 0.038082122802734375, 0.04321479797363281, 0.04834747314453125, 0.05348014831542969, 0.058612823486328125, 0.06374549865722656, 0.068878173828125, 0.07401084899902344, 0.07914352416992188, 0.08427619934082031, 0.08940887451171875, 0.09454154968261719, 0.09967422485351562, 0.10480690002441406, 0.1099395751953125, 0.11507225036621094, 0.12020492553710938, 0.1253376007080078, 0.13047027587890625, 0.1356029510498047, 0.14073562622070312, 0.14586830139160156, 0.1510009765625]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 5.0, 5.0, 7.0, 21.0, 18.0, 27.0, 35.0, 33.0, 39.0, 61.0, 70.0, 73.0, 57.0, 88.0, 58.0, 71.0, 62.0, 57.0, 50.0, 34.0, 29.0, 35.0, 19.0, 12.0, 8.0, 12.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03741455078125, -0.03600883483886719, -0.034603118896484375, -0.03319740295410156, -0.03179168701171875, -0.030385971069335938, -0.028980255126953125, -0.027574539184570312, -0.0261688232421875, -0.024763107299804688, -0.023357391357421875, -0.021951675415039062, -0.02054595947265625, -0.019140243530273438, -0.017734527587890625, -0.016328811645507812, -0.014923095703125, -0.013517379760742188, -0.012111663818359375, -0.010705947875976562, -0.00930023193359375, -0.007894515991210938, -0.006488800048828125, -0.0050830841064453125, -0.0036773681640625, -0.0022716522216796875, -0.000865936279296875, 0.0005397796630859375, 0.00194549560546875, 0.0033512115478515625, 0.004756927490234375, 0.0061626434326171875, 0.007568359375, 0.008974075317382812, 0.010379791259765625, 0.011785507202148438, 0.01319122314453125, 0.014596939086914062, 0.016002655029296875, 0.017408370971679688, 0.0188140869140625, 0.020219802856445312, 0.021625518798828125, 0.023031234741210938, 0.02443695068359375, 0.025842666625976562, 0.027248382568359375, 0.028654098510742188, 0.030059814453125, 0.03146553039550781, 0.032871246337890625, 0.03427696228027344, 0.03568267822265625, 0.03708839416503906, 0.038494110107421875, 0.03989982604980469, 0.0413055419921875, 0.04271125793457031, 0.044116973876953125, 0.04552268981933594, 0.04692840576171875, 0.04833412170410156, 0.049739837646484375, 0.05114555358886719, 0.05255126953125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 5.0, 4.0, 3.0, 7.0, 13.0, 15.0, 11.0, 17.0, 20.0, 23.0, 29.0, 57.0, 63.0, 118.0, 195.0, 382.0, 741.0, 1736.0, 4499.0, 13166.0, 44586.0, 171033.0, 439589.0, 268189.0, 72590.0, 20289.0, 6562.0, 2332.0, 1021.0, 518.0, 234.0, 146.0, 108.0, 69.0, 55.0, 30.0, 28.0, 18.0, 16.0, 10.0, 11.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.085205078125, -0.08251571655273438, -0.07982635498046875, -0.07713699340820312, -0.0744476318359375, -0.07175827026367188, -0.06906890869140625, -0.06637954711914062, -0.063690185546875, -0.061000823974609375, -0.05831146240234375, -0.055622100830078125, -0.0529327392578125, -0.050243377685546875, -0.04755401611328125, -0.044864654541015625, -0.04217529296875, -0.039485931396484375, -0.03679656982421875, -0.034107208251953125, -0.0314178466796875, -0.028728485107421875, -0.02603912353515625, -0.023349761962890625, -0.020660400390625, -0.017971038818359375, -0.01528167724609375, -0.012592315673828125, -0.0099029541015625, -0.007213592529296875, -0.00452423095703125, -0.001834869384765625, 0.0008544921875, 0.003543853759765625, 0.00623321533203125, 0.008922576904296875, 0.0116119384765625, 0.014301300048828125, 0.01699066162109375, 0.019680023193359375, 0.022369384765625, 0.025058746337890625, 0.02774810791015625, 0.030437469482421875, 0.0331268310546875, 0.035816192626953125, 0.03850555419921875, 0.041194915771484375, 0.04388427734375, 0.046573638916015625, 0.04926300048828125, 0.051952362060546875, 0.0546417236328125, 0.057331085205078125, 0.06002044677734375, 0.06270980834960938, 0.065399169921875, 0.06808853149414062, 0.07077789306640625, 0.07346725463867188, 0.0761566162109375, 0.07884597778320312, 0.08153533935546875, 0.08422470092773438, 0.0869140625]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 4.0, 3.0, 6.0, 3.0, 6.0, 10.0, 5.0, 17.0, 22.0, 22.0, 23.0, 23.0, 19.0, 22.0, 28.0, 36.0, 37.0, 40.0, 41.0, 46.0, 48.0, 31.0, 59.0, 42.0, 43.0, 41.0, 44.0, 35.0, 37.0, 33.0, 17.0, 23.0, 23.0, 19.0, 17.0, 22.0, 15.0, 11.0, 8.0, 6.0, 3.0, 7.0, 5.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.11529541015625, -0.11187458038330078, -0.10845375061035156, -0.10503292083740234, -0.10161209106445312, -0.0981912612915039, -0.09477043151855469, -0.09134960174560547, -0.08792877197265625, -0.08450794219970703, -0.08108711242675781, -0.0776662826538086, -0.07424545288085938, -0.07082462310791016, -0.06740379333496094, -0.06398296356201172, -0.0605621337890625, -0.05714130401611328, -0.05372047424316406, -0.050299644470214844, -0.046878814697265625, -0.043457984924316406, -0.04003715515136719, -0.03661632537841797, -0.03319549560546875, -0.02977466583251953, -0.026353836059570312, -0.022933006286621094, -0.019512176513671875, -0.016091346740722656, -0.012670516967773438, -0.009249687194824219, -0.005828857421875, -0.0024080276489257812, 0.0010128021240234375, 0.004433631896972656, 0.007854461669921875, 0.011275291442871094, 0.014696121215820312, 0.01811695098876953, 0.02153778076171875, 0.02495861053466797, 0.028379440307617188, 0.031800270080566406, 0.035221099853515625, 0.038641929626464844, 0.04206275939941406, 0.04548358917236328, 0.0489044189453125, 0.05232524871826172, 0.05574607849121094, 0.059166908264160156, 0.06258773803710938, 0.0660085678100586, 0.06942939758300781, 0.07285022735595703, 0.07627105712890625, 0.07969188690185547, 0.08311271667480469, 0.0865335464477539, 0.08995437622070312, 0.09337520599365234, 0.09679603576660156, 0.10021686553955078, 0.1036376953125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 3.0, 1.0, 5.0, 3.0, 7.0, 9.0, 12.0, 25.0, 24.0, 34.0, 32.0, 66.0, 94.0, 160.0, 281.0, 551.0, 1423.0, 5832.0, 72791.0, 697082.0, 251215.0, 14741.0, 2371.0, 850.0, 384.0, 197.0, 114.0, 88.0, 51.0, 24.0, 30.0, 21.0, 11.0, 12.0, 6.0, 5.0, 2.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0716552734375, -0.06970357894897461, -0.06775188446044922, -0.06580018997192383, -0.06384849548339844, -0.06189680099487305, -0.059945106506347656, -0.057993412017822266, -0.056041717529296875, -0.054090023040771484, -0.052138328552246094, -0.0501866340637207, -0.04823493957519531, -0.04628324508666992, -0.04433155059814453, -0.04237985610961914, -0.04042816162109375, -0.03847646713256836, -0.03652477264404297, -0.03457307815551758, -0.03262138366699219, -0.030669689178466797, -0.028717994689941406, -0.026766300201416016, -0.024814605712890625, -0.022862911224365234, -0.020911216735839844, -0.018959522247314453, -0.017007827758789062, -0.015056133270263672, -0.013104438781738281, -0.01115274429321289, -0.0092010498046875, -0.007249355316162109, -0.005297660827636719, -0.003345966339111328, -0.0013942718505859375, 0.0005574226379394531, 0.0025091171264648438, 0.004460811614990234, 0.006412506103515625, 0.008364200592041016, 0.010315895080566406, 0.012267589569091797, 0.014219284057617188, 0.016170978546142578, 0.01812267303466797, 0.02007436752319336, 0.02202606201171875, 0.02397775650024414, 0.02592945098876953, 0.027881145477294922, 0.029832839965820312, 0.0317845344543457, 0.033736228942871094, 0.035687923431396484, 0.037639617919921875, 0.039591312408447266, 0.041543006896972656, 0.04349470138549805, 0.04544639587402344, 0.04739809036254883, 0.04934978485107422, 0.05130147933959961, 0.053253173828125]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 3.0, 4.0, 12.0, 7.0, 18.0, 27.0, 38.0, 82.0, 79.0, 104.0, 109.0, 89.0, 111.0, 89.0, 76.0, 51.0, 39.0, 34.0, 13.0, 8.0, 6.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.59634780883789e-06, -9.213574230670929e-06, -8.830800652503967e-06, -8.448027074337006e-06, -8.065253496170044e-06, -7.682479918003082e-06, -7.299706339836121e-06, -6.916932761669159e-06, -6.534159183502197e-06, -6.151385605335236e-06, -5.768612027168274e-06, -5.385838449001312e-06, -5.003064870834351e-06, -4.620291292667389e-06, -4.237517714500427e-06, -3.8547441363334656e-06, -3.471970558166504e-06, -3.0891969799995422e-06, -2.7064234018325806e-06, -2.323649823665619e-06, -1.9408762454986572e-06, -1.5581026673316956e-06, -1.1753290891647339e-06, -7.925555109977722e-07, -4.0978193283081055e-07, -2.7008354663848877e-08, 3.557652235031128e-07, 7.385388016700745e-07, 1.1213123798370361e-06, 1.5040859580039978e-06, 1.8868595361709595e-06, 2.269633114337921e-06, 2.652406692504883e-06, 3.0351802706718445e-06, 3.417953848838806e-06, 3.800727427005768e-06, 4.1835010051727295e-06, 4.566274583339691e-06, 4.949048161506653e-06, 5.3318217396736145e-06, 5.714595317840576e-06, 6.097368896007538e-06, 6.4801424741744995e-06, 6.862916052341461e-06, 7.245689630508423e-06, 7.6284632086753845e-06, 8.011236786842346e-06, 8.394010365009308e-06, 8.77678394317627e-06, 9.159557521343231e-06, 9.542331099510193e-06, 9.925104677677155e-06, 1.0307878255844116e-05, 1.0690651834011078e-05, 1.107342541217804e-05, 1.1456198990345001e-05, 1.1838972568511963e-05, 1.2221746146678925e-05, 1.2604519724845886e-05, 1.2987293303012848e-05, 1.337006688117981e-05, 1.3752840459346771e-05, 1.4135614037513733e-05, 1.4518387615680695e-05, 1.4901161193847656e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 3.0, 11.0, 21.0, 34.0, 61.0, 134.0, 279.0, 699.0, 2057.0, 15601.0, 473873.0, 534100.0, 18189.0, 2175.0, 707.0, 290.0, 146.0, 74.0, 45.0, 23.0, 10.0, 3.0, 7.0, 0.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.06817626953125, -0.0658273696899414, -0.06347846984863281, -0.06112957000732422, -0.058780670166015625, -0.05643177032470703, -0.05408287048339844, -0.051733970642089844, -0.04938507080078125, -0.047036170959472656, -0.04468727111816406, -0.04233837127685547, -0.039989471435546875, -0.03764057159423828, -0.03529167175292969, -0.032942771911621094, -0.0305938720703125, -0.028244972229003906, -0.025896072387695312, -0.02354717254638672, -0.021198272705078125, -0.01884937286376953, -0.016500473022460938, -0.014151573181152344, -0.01180267333984375, -0.009453773498535156, -0.0071048736572265625, -0.004755973815917969, -0.002407073974609375, -5.817413330078125e-05, 0.0022907257080078125, 0.004639625549316406, 0.006988525390625, 0.009337425231933594, 0.011686325073242188, 0.014035224914550781, 0.016384124755859375, 0.01873302459716797, 0.021081924438476562, 0.023430824279785156, 0.02577972412109375, 0.028128623962402344, 0.030477523803710938, 0.03282642364501953, 0.035175323486328125, 0.03752422332763672, 0.03987312316894531, 0.042222023010253906, 0.0445709228515625, 0.046919822692871094, 0.04926872253417969, 0.05161762237548828, 0.053966522216796875, 0.05631542205810547, 0.05866432189941406, 0.061013221740722656, 0.06336212158203125, 0.06571102142333984, 0.06805992126464844, 0.07040882110595703, 0.07275772094726562, 0.07510662078857422, 0.07745552062988281, 0.0798044204711914, 0.0821533203125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 15.0, 14.0, 16.0, 35.0, 41.0, 77.0, 103.0, 116.0, 147.0, 121.0, 110.0, 75.0, 52.0, 28.0, 22.0, 13.0, 7.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0555419921875, -0.05338096618652344, -0.051219940185546875, -0.04905891418457031, -0.04689788818359375, -0.04473686218261719, -0.042575836181640625, -0.04041481018066406, -0.0382537841796875, -0.03609275817871094, -0.033931732177734375, -0.03177070617675781, -0.02960968017578125, -0.027448654174804688, -0.025287628173828125, -0.023126602172851562, -0.020965576171875, -0.018804550170898438, -0.016643524169921875, -0.014482498168945312, -0.01232147216796875, -0.010160446166992188, -0.007999420166015625, -0.0058383941650390625, -0.0036773681640625, -0.0015163421630859375, 0.000644683837890625, 0.0028057098388671875, 0.00496673583984375, 0.0071277618408203125, 0.009288787841796875, 0.011449813842773438, 0.01361083984375, 0.015771865844726562, 0.017932891845703125, 0.020093917846679688, 0.02225494384765625, 0.024415969848632812, 0.026576995849609375, 0.028738021850585938, 0.0308990478515625, 0.03306007385253906, 0.035221099853515625, 0.03738212585449219, 0.03954315185546875, 0.04170417785644531, 0.043865203857421875, 0.04602622985839844, 0.048187255859375, 0.05034828186035156, 0.052509307861328125, 0.05467033386230469, 0.05683135986328125, 0.05899238586425781, 0.061153411865234375, 0.06331443786621094, 0.0654754638671875, 0.06763648986816406, 0.06979751586914062, 0.07195854187011719, 0.07411956787109375, 0.07628059387207031, 0.07844161987304688, 0.08060264587402344, 0.082763671875]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 24.0, 52.0, 160.0, 306.0, 263.0, 126.0, 45.0, 18.0, 5.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9197190999984741, -0.8734528422355652, -0.8271865844726562, -0.7809203267097473, -0.7346540689468384, -0.6883878111839294, -0.6421215534210205, -0.5958552956581116, -0.5495890378952026, -0.5033227801322937, -0.45705652236938477, -0.41079026460647583, -0.3645240068435669, -0.31825774908065796, -0.271991491317749, -0.2257252335548401, -0.17945897579193115, -0.13319271802902222, -0.08692646026611328, -0.040660202503204346, 0.00560605525970459, 0.051872313022613525, 0.09813857078552246, 0.1444048285484314, 0.19067108631134033, 0.23693734407424927, 0.2832036018371582, 0.32946985960006714, 0.3757361173629761, 0.422002375125885, 0.46826863288879395, 0.5145348906517029, 0.5608012676239014, 0.6070675253868103, 0.6533337831497192, 0.6996000409126282, 0.7458662986755371, 0.792132556438446, 0.838398814201355, 0.8846650719642639, 0.9309313297271729, 0.9771975874900818, 1.0234638452529907, 1.0697300434112549, 1.1159963607788086, 1.1622626781463623, 1.2085288763046265, 1.2547950744628906, 1.3010613918304443, 1.347327709197998, 1.3935939073562622, 1.4398601055145264, 1.48612642288208, 1.5323927402496338, 1.578658938407898, 1.624925136566162, 1.6711914539337158, 1.7174577713012695, 1.7637239694595337, 1.8099901676177979, 1.8562564849853516, 1.9025228023529053, 1.9487890005111694, 1.9950551986694336, 2.0413215160369873]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 4.0, 1.0, 1.0, 1.0, 7.0, 2.0, 9.0, 8.0, 5.0, 10.0, 8.0, 9.0, 20.0, 16.0, 25.0, 23.0, 22.0, 25.0, 35.0, 31.0, 28.0, 35.0, 41.0, 53.0, 37.0, 42.0, 38.0, 40.0, 43.0, 24.0, 43.0, 41.0, 28.0, 38.0, 33.0, 21.0, 24.0, 26.0, 19.0, 18.0, 17.0, 9.0, 15.0, 11.0, 5.0, 7.0, 4.0, 1.0, 2.0, 3.0, 3.0, 4.0, 1.0, 1.0], "bins": [-0.5754107236862183, -0.5594831705093384, -0.5435556769371033, -0.5276281237602234, -0.5117006301879883, -0.4957730770111084, -0.4798455536365509, -0.4639180302619934, -0.4479905068874359, -0.4320629835128784, -0.4161354601383209, -0.4002079367637634, -0.38428038358688354, -0.36835289001464844, -0.35242533683776855, -0.33649781346321106, -0.32057029008865356, -0.30464276671409607, -0.2887152433395386, -0.2727877199649811, -0.2568601965904236, -0.2409326583147049, -0.2250051200389862, -0.2090775966644287, -0.19315007328987122, -0.17722254991531372, -0.16129502654075623, -0.14536748826503754, -0.12943996489048004, -0.11351244151592255, -0.09758491069078445, -0.08165737986564636, -0.06572991609573364, -0.04980238899588585, -0.033874861896038055, -0.017947334796190262, -0.0020198076963424683, 0.013907715678215027, 0.02983524650335312, 0.04576277732849121, 0.061690300703048706, 0.0776178240776062, 0.0935453549027443, 0.10947288572788239, 0.12540040910243988, 0.14132793247699738, 0.15725547075271606, 0.17318299412727356, 0.18911051750183105, 0.20503804087638855, 0.22096556425094604, 0.23689310252666473, 0.25282061100006104, 0.2687481641769409, 0.2846756875514984, 0.3006032109260559, 0.3165307343006134, 0.3324582576751709, 0.3483857810497284, 0.3643133044242859, 0.38024085760116577, 0.3961683511734009, 0.41209590435028076, 0.42802342772483826, 0.44395095109939575]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 10.0, 10.0, 16.0, 28.0, 53.0, 73.0, 174.0, 381.0, 821.0, 2277.0, 8050.0, 53420.0, 3885506.0, 220999.0, 16163.0, 3826.0, 1278.0, 610.0, 266.0, 129.0, 82.0, 47.0, 19.0, 14.0, 10.0, 6.0, 5.0, 6.0, 7.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12646484375, -0.120361328125, -0.1142578125, -0.108154296875, -0.10205078125, -0.095947265625, -0.08984375, -0.083740234375, -0.07763671875, -0.071533203125, -0.0654296875, -0.059326171875, -0.05322265625, -0.047119140625, -0.041015625, -0.034912109375, -0.02880859375, -0.022705078125, -0.0166015625, -0.010498046875, -0.00439453125, 0.001708984375, 0.0078125, 0.013916015625, 0.02001953125, 0.026123046875, 0.0322265625, 0.038330078125, 0.04443359375, 0.050537109375, 0.056640625, 0.062744140625, 0.06884765625, 0.074951171875, 0.0810546875, 0.087158203125, 0.09326171875, 0.099365234375, 0.10546875, 0.111572265625, 0.11767578125, 0.123779296875, 0.1298828125, 0.135986328125, 0.14208984375, 0.148193359375, 0.154296875, 0.160400390625, 0.16650390625, 0.172607421875, 0.1787109375, 0.184814453125, 0.19091796875, 0.197021484375, 0.203125, 0.209228515625, 0.21533203125, 0.221435546875, 0.2275390625, 0.233642578125, 0.23974609375, 0.245849609375, 0.251953125, 0.258056640625, 0.26416015625]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 9.0, 14.0, 11.0, 19.0, 17.0, 35.0, 43.0, 57.0, 51.0, 58.0, 65.0, 76.0, 72.0, 74.0, 77.0, 56.0, 49.0, 51.0, 33.0, 38.0, 20.0, 17.0, 15.0, 5.0, 10.0, 9.0, 6.0, 2.0, 1.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04052734375, -0.039058685302734375, -0.03759002685546875, -0.036121368408203125, -0.0346527099609375, -0.033184051513671875, -0.03171539306640625, -0.030246734619140625, -0.028778076171875, -0.027309417724609375, -0.02584075927734375, -0.024372100830078125, -0.0229034423828125, -0.021434783935546875, -0.01996612548828125, -0.018497467041015625, -0.01702880859375, -0.015560150146484375, -0.01409149169921875, -0.012622833251953125, -0.0111541748046875, -0.009685516357421875, -0.00821685791015625, -0.006748199462890625, -0.005279541015625, -0.003810882568359375, -0.00234222412109375, -0.000873565673828125, 0.0005950927734375, 0.002063751220703125, 0.00353240966796875, 0.005001068115234375, 0.0064697265625, 0.007938385009765625, 0.00940704345703125, 0.010875701904296875, 0.0123443603515625, 0.013813018798828125, 0.01528167724609375, 0.016750335693359375, 0.018218994140625, 0.019687652587890625, 0.02115631103515625, 0.022624969482421875, 0.0240936279296875, 0.025562286376953125, 0.02703094482421875, 0.028499603271484375, 0.02996826171875, 0.031436920166015625, 0.03290557861328125, 0.034374237060546875, 0.0358428955078125, 0.037311553955078125, 0.03878021240234375, 0.040248870849609375, 0.041717529296875, 0.043186187744140625, 0.04465484619140625, 0.046123504638671875, 0.0475921630859375, 0.049060821533203125, 0.05052947998046875, 0.051998138427734375, 0.053466796875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 4.0, 3.0, 7.0, 4.0, 8.0, 6.0, 15.0, 9.0, 20.0, 26.0, 42.0, 56.0, 89.0, 98.0, 177.0, 254.0, 449.0, 907.0, 2019.0, 5507.0, 17584.0, 87191.0, 3324005.0, 686237.0, 49790.0, 12240.0, 4023.0, 1612.0, 755.0, 409.0, 249.0, 139.0, 104.0, 75.0, 55.0, 42.0, 23.0, 18.0, 8.0, 11.0, 5.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.11456298828125, -0.11072444915771484, -0.10688591003417969, -0.10304737091064453, -0.09920883178710938, -0.09537029266357422, -0.09153175354003906, -0.0876932144165039, -0.08385467529296875, -0.0800161361694336, -0.07617759704589844, -0.07233905792236328, -0.06850051879882812, -0.06466197967529297, -0.06082344055175781, -0.056984901428222656, -0.0531463623046875, -0.049307823181152344, -0.04546928405761719, -0.04163074493408203, -0.037792205810546875, -0.03395366668701172, -0.030115127563476562, -0.026276588439941406, -0.02243804931640625, -0.018599510192871094, -0.014760971069335938, -0.010922431945800781, -0.007083892822265625, -0.0032453536987304688, 0.0005931854248046875, 0.004431724548339844, 0.008270263671875, 0.012108802795410156, 0.015947341918945312, 0.01978588104248047, 0.023624420166015625, 0.02746295928955078, 0.03130149841308594, 0.035140037536621094, 0.03897857666015625, 0.042817115783691406, 0.04665565490722656, 0.05049419403076172, 0.054332733154296875, 0.05817127227783203, 0.06200981140136719, 0.06584835052490234, 0.0696868896484375, 0.07352542877197266, 0.07736396789550781, 0.08120250701904297, 0.08504104614257812, 0.08887958526611328, 0.09271812438964844, 0.0965566635131836, 0.10039520263671875, 0.1042337417602539, 0.10807228088378906, 0.11191082000732422, 0.11574935913085938, 0.11958789825439453, 0.12342643737792969, 0.12726497650146484, 0.131103515625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 12.0, 12.0, 37.0, 100.0, 360.0, 2565.0, 696.0, 152.0, 49.0, 36.0, 20.0, 10.0, 7.0, 4.0, 2.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08538818359375, -0.08260536193847656, -0.07982254028320312, -0.07703971862792969, -0.07425689697265625, -0.07147407531738281, -0.06869125366210938, -0.06590843200683594, -0.0631256103515625, -0.06034278869628906, -0.057559967041015625, -0.05477714538574219, -0.05199432373046875, -0.04921150207519531, -0.046428680419921875, -0.04364585876464844, -0.040863037109375, -0.03808021545410156, -0.035297393798828125, -0.03251457214355469, -0.02973175048828125, -0.026948928833007812, -0.024166107177734375, -0.021383285522460938, -0.0186004638671875, -0.015817642211914062, -0.013034820556640625, -0.010251998901367188, -0.00746917724609375, -0.0046863555908203125, -0.001903533935546875, 0.0008792877197265625, 0.003662109375, 0.0064449310302734375, 0.009227752685546875, 0.012010574340820312, 0.01479339599609375, 0.017576217651367188, 0.020359039306640625, 0.023141860961914062, 0.0259246826171875, 0.028707504272460938, 0.031490325927734375, 0.03427314758300781, 0.03705596923828125, 0.03983879089355469, 0.042621612548828125, 0.04540443420410156, 0.048187255859375, 0.05097007751464844, 0.053752899169921875, 0.05653572082519531, 0.05931854248046875, 0.06210136413574219, 0.06488418579101562, 0.06766700744628906, 0.0704498291015625, 0.07323265075683594, 0.07601547241210938, 0.07879829406738281, 0.08158111572265625, 0.08436393737792969, 0.08714675903320312, 0.08992958068847656, 0.09271240234375]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 9.0, 17.0, 93.0, 247.0, 364.0, 187.0, 50.0, 13.0, 6.0, 2.0, 6.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18564081192016602, -0.1691482663154602, -0.1526557058095932, -0.1361631602048874, -0.11967060714960098, -0.10317805409431458, -0.08668550848960876, -0.07019295543432236, -0.05370040237903595, -0.03720784932374954, -0.020715299993753433, -0.004222750663757324, 0.012269802391529083, 0.02876235544681549, 0.0452549010515213, 0.06174745410680771, 0.07824000716209412, 0.09473256021738052, 0.11122511327266693, 0.12771765887737274, 0.14421021938323975, 0.16070276498794556, 0.17719531059265137, 0.19368785619735718, 0.21018041670322418, 0.22667296230793, 0.243165522813797, 0.2596580684185028, 0.2761506140232086, 0.2926431894302368, 0.3091357350349426, 0.32562828063964844, 0.34212082624435425, 0.35861337184906006, 0.37510591745376587, 0.3915984630584717, 0.4080910384654999, 0.4245835840702057, 0.4410761296749115, 0.4575686752796173, 0.4740612506866455, 0.4905537962913513, 0.5070463418960571, 0.5235388875007629, 0.5400314331054688, 0.5565240383148193, 0.5730165243148804, 0.589509129524231, 0.606001615524292, 0.6224941611289978, 0.6389867067337036, 0.6554792523384094, 0.6719717979431152, 0.6884644031524658, 0.7049568891525269, 0.7214494943618774, 0.7379420399665833, 0.7544345855712891, 0.7709271311759949, 0.7874196767807007, 0.8039122223854065, 0.8204047679901123, 0.8368973731994629, 0.8533899188041687, 0.8698824644088745]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 3.0, 2.0, 3.0, 7.0, 6.0, 6.0, 16.0, 23.0, 27.0, 32.0, 43.0, 42.0, 53.0, 62.0, 86.0, 64.0, 75.0, 74.0, 83.0, 51.0, 64.0, 36.0, 42.0, 26.0, 22.0, 14.0, 15.0, 11.0, 7.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.15102112293243408, -0.14479359984397888, -0.1385660618543625, -0.1323385238647461, -0.1261110007762909, -0.1198834702372551, -0.1136559396982193, -0.1074284091591835, -0.1012008786201477, -0.09497334808111191, -0.08874581754207611, -0.08251828700304031, -0.07629075646400452, -0.07006322592496872, -0.06383569538593292, -0.057608164846897125, -0.05138063430786133, -0.04515310376882553, -0.038925573229789734, -0.03269804269075394, -0.02647051215171814, -0.020242981612682343, -0.014015451073646545, -0.007787920534610748, -0.0015603899955749512, 0.004667140543460846, 0.010894671082496643, 0.01712220162153244, 0.023349732160568237, 0.029577262699604034, 0.03580479323863983, 0.04203232377767563, 0.048259854316711426, 0.05448738485574722, 0.06071491539478302, 0.06694244593381882, 0.07316997647285461, 0.07939750701189041, 0.08562503755092621, 0.091852568089962, 0.0980800986289978, 0.1043076291680336, 0.1105351597070694, 0.1167626902461052, 0.12299022078514099, 0.1292177438735962, 0.13544528186321259, 0.14167281985282898, 0.14790034294128418, 0.15412786602973938, 0.16035540401935577, 0.16658294200897217, 0.17281046509742737, 0.17903798818588257, 0.18526552617549896, 0.19149306416511536, 0.19772058725357056, 0.20394811034202576, 0.21017564833164215, 0.21640318632125854, 0.22263070940971375, 0.22885823249816895, 0.23508577048778534, 0.24131330847740173, 0.24754083156585693]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 3.0, 7.0, 3.0, 15.0, 17.0, 31.0, 65.0, 104.0, 197.0, 479.0, 1300.0, 4467.0, 22625.0, 182002.0, 646822.0, 163321.0, 20734.0, 4203.0, 1245.0, 492.0, 196.0, 110.0, 42.0, 35.0, 13.0, 6.0, 5.0, 7.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.166748046875, -0.16109085083007812, -0.15543365478515625, -0.14977645874023438, -0.1441192626953125, -0.13846206665039062, -0.13280487060546875, -0.12714767456054688, -0.121490478515625, -0.11583328247070312, -0.11017608642578125, -0.10451889038085938, -0.0988616943359375, -0.09320449829101562, -0.08754730224609375, -0.08189010620117188, -0.07623291015625, -0.07057571411132812, -0.06491851806640625, -0.059261322021484375, -0.0536041259765625, -0.047946929931640625, -0.04228973388671875, -0.036632537841796875, -0.030975341796875, -0.025318145751953125, -0.01966094970703125, -0.014003753662109375, -0.0083465576171875, -0.002689361572265625, 0.00296783447265625, 0.008625030517578125, 0.0142822265625, 0.019939422607421875, 0.02559661865234375, 0.031253814697265625, 0.0369110107421875, 0.042568206787109375, 0.04822540283203125, 0.053882598876953125, 0.059539794921875, 0.06519699096679688, 0.07085418701171875, 0.07651138305664062, 0.0821685791015625, 0.08782577514648438, 0.09348297119140625, 0.09914016723632812, 0.10479736328125, 0.11045455932617188, 0.11611175537109375, 0.12176895141601562, 0.1274261474609375, 0.13308334350585938, 0.13874053955078125, 0.14439773559570312, 0.150054931640625, 0.15571212768554688, 0.16136932373046875, 0.16702651977539062, 0.1726837158203125, 0.17834091186523438, 0.18399810791015625, 0.18965530395507812, 0.1953125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 6.0, 7.0, 4.0, 11.0, 9.0, 13.0, 15.0, 40.0, 32.0, 34.0, 57.0, 56.0, 59.0, 57.0, 71.0, 65.0, 79.0, 67.0, 62.0, 56.0, 46.0, 38.0, 28.0, 27.0, 16.0, 10.0, 13.0, 9.0, 4.0, 7.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041748046875, -0.04022645950317383, -0.038704872131347656, -0.037183284759521484, -0.03566169738769531, -0.03414011001586914, -0.03261852264404297, -0.031096935272216797, -0.029575347900390625, -0.028053760528564453, -0.02653217315673828, -0.02501058578491211, -0.023488998413085938, -0.021967411041259766, -0.020445823669433594, -0.018924236297607422, -0.01740264892578125, -0.015881061553955078, -0.014359474182128906, -0.012837886810302734, -0.011316299438476562, -0.00979471206665039, -0.008273124694824219, -0.006751537322998047, -0.005229949951171875, -0.003708362579345703, -0.0021867752075195312, -0.0006651878356933594, 0.0008563995361328125, 0.0023779869079589844, 0.0038995742797851562, 0.005421161651611328, 0.0069427490234375, 0.008464336395263672, 0.009985923767089844, 0.011507511138916016, 0.013029098510742188, 0.01455068588256836, 0.01607227325439453, 0.017593860626220703, 0.019115447998046875, 0.020637035369873047, 0.02215862274169922, 0.02368021011352539, 0.025201797485351562, 0.026723384857177734, 0.028244972229003906, 0.029766559600830078, 0.03128814697265625, 0.03280973434448242, 0.034331321716308594, 0.035852909088134766, 0.03737449645996094, 0.03889608383178711, 0.04041767120361328, 0.04193925857543945, 0.043460845947265625, 0.0449824333190918, 0.04650402069091797, 0.04802560806274414, 0.04954719543457031, 0.051068782806396484, 0.052590370178222656, 0.05411195755004883, 0.055633544921875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 6.0, 5.0, 11.0, 11.0, 20.0, 14.0, 27.0, 28.0, 56.0, 101.0, 112.0, 169.0, 275.0, 460.0, 918.0, 2230.0, 6566.0, 23797.0, 103216.0, 382148.0, 386574.0, 106282.0, 24233.0, 6772.0, 2275.0, 938.0, 508.0, 266.0, 173.0, 91.0, 73.0, 57.0, 45.0, 18.0, 25.0, 19.0, 10.0, 10.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.1064453125, -0.10331535339355469, -0.10018539428710938, -0.09705543518066406, -0.09392547607421875, -0.09079551696777344, -0.08766555786132812, -0.08453559875488281, -0.0814056396484375, -0.07827568054199219, -0.07514572143554688, -0.07201576232910156, -0.06888580322265625, -0.06575584411621094, -0.06262588500976562, -0.05949592590332031, -0.056365966796875, -0.05323600769042969, -0.050106048583984375, -0.04697608947753906, -0.04384613037109375, -0.04071617126464844, -0.037586212158203125, -0.03445625305175781, -0.0313262939453125, -0.028196334838867188, -0.025066375732421875, -0.021936416625976562, -0.01880645751953125, -0.015676498413085938, -0.012546539306640625, -0.009416580200195312, -0.00628662109375, -0.0031566619873046875, -2.6702880859375e-05, 0.0031032562255859375, 0.00623321533203125, 0.009363174438476562, 0.012493133544921875, 0.015623092651367188, 0.0187530517578125, 0.021883010864257812, 0.025012969970703125, 0.028142929077148438, 0.03127288818359375, 0.03440284729003906, 0.037532806396484375, 0.04066276550292969, 0.043792724609375, 0.04692268371582031, 0.050052642822265625, 0.05318260192871094, 0.05631256103515625, 0.05944252014160156, 0.06257247924804688, 0.06570243835449219, 0.0688323974609375, 0.07196235656738281, 0.07509231567382812, 0.07822227478027344, 0.08135223388671875, 0.08448219299316406, 0.08761215209960938, 0.09074211120605469, 0.0938720703125]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 0.0, 5.0, 1.0, 4.0, 9.0, 9.0, 7.0, 13.0, 13.0, 20.0, 23.0, 20.0, 14.0, 33.0, 35.0, 30.0, 49.0, 43.0, 34.0, 34.0, 41.0, 46.0, 45.0, 41.0, 62.0, 42.0, 43.0, 40.0, 28.0, 26.0, 26.0, 21.0, 15.0, 21.0, 24.0, 17.0, 8.0, 18.0, 18.0, 9.0, 2.0, 2.0, 3.0, 4.0, 0.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.125, -0.12100982666015625, -0.1170196533203125, -0.11302947998046875, -0.109039306640625, -0.10504913330078125, -0.1010589599609375, -0.09706878662109375, -0.09307861328125, -0.08908843994140625, -0.0850982666015625, -0.08110809326171875, -0.077117919921875, -0.07312774658203125, -0.0691375732421875, -0.06514739990234375, -0.0611572265625, -0.05716705322265625, -0.0531768798828125, -0.04918670654296875, -0.045196533203125, -0.04120635986328125, -0.0372161865234375, -0.03322601318359375, -0.02923583984375, -0.02524566650390625, -0.0212554931640625, -0.01726531982421875, -0.013275146484375, -0.00928497314453125, -0.0052947998046875, -0.00130462646484375, 0.002685546875, 0.00667572021484375, 0.0106658935546875, 0.01465606689453125, 0.018646240234375, 0.02263641357421875, 0.0266265869140625, 0.03061676025390625, 0.03460693359375, 0.03859710693359375, 0.0425872802734375, 0.04657745361328125, 0.050567626953125, 0.05455780029296875, 0.0585479736328125, 0.06253814697265625, 0.0665283203125, 0.07051849365234375, 0.0745086669921875, 0.07849884033203125, 0.082489013671875, 0.08647918701171875, 0.0904693603515625, 0.09445953369140625, 0.09844970703125, 0.10243988037109375, 0.1064300537109375, 0.11042022705078125, 0.114410400390625, 0.11840057373046875, 0.1223907470703125, 0.12638092041015625, 0.13037109375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 7.0, 7.0, 11.0, 16.0, 31.0, 42.0, 112.0, 223.0, 626.0, 1650.0, 8032.0, 107667.0, 777786.0, 139740.0, 9516.0, 1890.0, 641.0, 273.0, 149.0, 54.0, 29.0, 20.0, 12.0, 8.0, 5.0, 10.0, 2.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07470703125, -0.07260513305664062, -0.07050323486328125, -0.06840133666992188, -0.0662994384765625, -0.06419754028320312, -0.06209564208984375, -0.059993743896484375, -0.057891845703125, -0.055789947509765625, -0.05368804931640625, -0.051586151123046875, -0.0494842529296875, -0.047382354736328125, -0.04528045654296875, -0.043178558349609375, -0.04107666015625, -0.038974761962890625, -0.03687286376953125, -0.034770965576171875, -0.0326690673828125, -0.030567169189453125, -0.02846527099609375, -0.026363372802734375, -0.024261474609375, -0.022159576416015625, -0.02005767822265625, -0.017955780029296875, -0.0158538818359375, -0.013751983642578125, -0.01165008544921875, -0.009548187255859375, -0.0074462890625, -0.005344390869140625, -0.00324249267578125, -0.001140594482421875, 0.0009613037109375, 0.003063201904296875, 0.00516510009765625, 0.007266998291015625, 0.009368896484375, 0.011470794677734375, 0.01357269287109375, 0.015674591064453125, 0.0177764892578125, 0.019878387451171875, 0.02198028564453125, 0.024082183837890625, 0.02618408203125, 0.028285980224609375, 0.03038787841796875, 0.032489776611328125, 0.0345916748046875, 0.036693572998046875, 0.03879547119140625, 0.040897369384765625, 0.042999267578125, 0.045101165771484375, 0.04720306396484375, 0.049304962158203125, 0.0514068603515625, 0.053508758544921875, 0.05561065673828125, 0.057712554931640625, 0.059814453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 4.0, 10.0, 5.0, 12.0, 14.0, 24.0, 35.0, 50.0, 98.0, 106.0, 104.0, 127.0, 138.0, 106.0, 70.0, 43.0, 27.0, 14.0, 5.0, 10.0, 8.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0325183868408203e-05, -1.985393464565277e-05, -1.938268542289734e-05, -1.8911436200141907e-05, -1.8440186977386475e-05, -1.7968937754631042e-05, -1.749768853187561e-05, -1.7026439309120178e-05, -1.6555190086364746e-05, -1.6083940863609314e-05, -1.5612691640853882e-05, -1.514144241809845e-05, -1.4670193195343018e-05, -1.4198943972587585e-05, -1.3727694749832153e-05, -1.3256445527076721e-05, -1.2785196304321289e-05, -1.2313947081565857e-05, -1.1842697858810425e-05, -1.1371448636054993e-05, -1.090019941329956e-05, -1.0428950190544128e-05, -9.957700967788696e-06, -9.486451745033264e-06, -9.015202522277832e-06, -8.5439532995224e-06, -8.072704076766968e-06, -7.601454854011536e-06, -7.1302056312561035e-06, -6.658956408500671e-06, -6.187707185745239e-06, -5.716457962989807e-06, -5.245208740234375e-06, -4.773959517478943e-06, -4.302710294723511e-06, -3.831461071968079e-06, -3.3602118492126465e-06, -2.8889626264572144e-06, -2.4177134037017822e-06, -1.94646418094635e-06, -1.475214958190918e-06, -1.0039657354354858e-06, -5.327165126800537e-07, -6.146728992462158e-08, 4.0978193283081055e-07, 8.810311555862427e-07, 1.3522803783416748e-06, 1.823529601097107e-06, 2.294778823852539e-06, 2.766028046607971e-06, 3.2372772693634033e-06, 3.7085264921188354e-06, 4.179775714874268e-06, 4.6510249376297e-06, 5.122274160385132e-06, 5.593523383140564e-06, 6.064772605895996e-06, 6.536021828651428e-06, 7.00727105140686e-06, 7.4785202741622925e-06, 7.949769496917725e-06, 8.421018719673157e-06, 8.892267942428589e-06, 9.363517165184021e-06, 9.834766387939453e-06]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 4.0, 6.0, 3.0, 13.0, 14.0, 23.0, 35.0, 52.0, 95.0, 171.0, 309.0, 718.0, 2032.0, 9155.0, 76249.0, 534016.0, 374404.0, 42604.0, 5972.0, 1485.0, 582.0, 241.0, 147.0, 92.0, 43.0, 16.0, 23.0, 23.0, 4.0, 10.0, 7.0, 1.0, 7.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05712890625, -0.05544233322143555, -0.053755760192871094, -0.05206918716430664, -0.05038261413574219, -0.048696041107177734, -0.04700946807861328, -0.04532289505004883, -0.043636322021484375, -0.04194974899291992, -0.04026317596435547, -0.038576602935791016, -0.03689002990722656, -0.03520345687866211, -0.033516883850097656, -0.0318303108215332, -0.03014373779296875, -0.028457164764404297, -0.026770591735839844, -0.02508401870727539, -0.023397445678710938, -0.021710872650146484, -0.02002429962158203, -0.018337726593017578, -0.016651153564453125, -0.014964580535888672, -0.013278007507324219, -0.011591434478759766, -0.009904861450195312, -0.00821828842163086, -0.006531715393066406, -0.004845142364501953, -0.0031585693359375, -0.0014719963073730469, 0.00021457672119140625, 0.0019011497497558594, 0.0035877227783203125, 0.005274295806884766, 0.006960868835449219, 0.008647441864013672, 0.010334014892578125, 0.012020587921142578, 0.013707160949707031, 0.015393733978271484, 0.017080307006835938, 0.01876688003540039, 0.020453453063964844, 0.022140026092529297, 0.02382659912109375, 0.025513172149658203, 0.027199745178222656, 0.02888631820678711, 0.030572891235351562, 0.032259464263916016, 0.03394603729248047, 0.03563261032104492, 0.037319183349609375, 0.03900575637817383, 0.04069232940673828, 0.042378902435302734, 0.04406547546386719, 0.04575204849243164, 0.047438621520996094, 0.04912519454956055, 0.050811767578125]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 11.0, 14.0, 13.0, 19.0, 21.0, 36.0, 51.0, 47.0, 62.0, 79.0, 63.0, 65.0, 78.0, 73.0, 62.0, 68.0, 47.0, 43.0, 39.0, 23.0, 28.0, 15.0, 6.0, 9.0, 8.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0467529296875, -0.04545259475708008, -0.044152259826660156, -0.042851924896240234, -0.04155158996582031, -0.04025125503540039, -0.03895092010498047, -0.03765058517456055, -0.036350250244140625, -0.0350499153137207, -0.03374958038330078, -0.03244924545288086, -0.031148910522460938, -0.029848575592041016, -0.028548240661621094, -0.027247905731201172, -0.02594757080078125, -0.024647235870361328, -0.023346900939941406, -0.022046566009521484, -0.020746231079101562, -0.01944589614868164, -0.01814556121826172, -0.016845226287841797, -0.015544891357421875, -0.014244556427001953, -0.012944221496582031, -0.01164388656616211, -0.010343551635742188, -0.009043216705322266, -0.007742881774902344, -0.006442546844482422, -0.0051422119140625, -0.003841876983642578, -0.0025415420532226562, -0.0012412071228027344, 5.91278076171875e-05, 0.0013594627380371094, 0.0026597976684570312, 0.003960132598876953, 0.005260467529296875, 0.006560802459716797, 0.007861137390136719, 0.00916147232055664, 0.010461807250976562, 0.011762142181396484, 0.013062477111816406, 0.014362812042236328, 0.01566314697265625, 0.016963481903076172, 0.018263816833496094, 0.019564151763916016, 0.020864486694335938, 0.02216482162475586, 0.02346515655517578, 0.024765491485595703, 0.026065826416015625, 0.027366161346435547, 0.02866649627685547, 0.02996683120727539, 0.03126716613769531, 0.032567501068115234, 0.033867835998535156, 0.03516817092895508, 0.036468505859375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 0.0, 5.0, 8.0, 8.0, 22.0, 27.0, 49.0, 45.0, 107.0, 144.0, 138.0, 136.0, 115.0, 64.0, 56.0, 32.0, 17.0, 9.0, 13.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.40869516134262085, -0.38580700755119324, -0.362918883562088, -0.3400307297706604, -0.3171426057815552, -0.29425445199012756, -0.27136629819869995, -0.24847815930843353, -0.22559002041816711, -0.2027018815279007, -0.17981374263763428, -0.15692558884620667, -0.13403744995594025, -0.11114931106567383, -0.08826115727424622, -0.0653730183839798, -0.04248487949371338, -0.019596736878156662, 0.003291405737400055, 0.02617955207824707, 0.04906769096851349, 0.07195582985877991, 0.09484398365020752, 0.11773212254047394, 0.14062026143074036, 0.16350840032100677, 0.1863965392112732, 0.2092846930027008, 0.23217283189296722, 0.25506097078323364, 0.27794912457466125, 0.30083727836608887, 0.32372546195983887, 0.3466136157512665, 0.3695017397403717, 0.3923898935317993, 0.41527801752090454, 0.43816617131233215, 0.46105432510375977, 0.483942449092865, 0.5068305730819702, 0.5297186970710754, 0.5526068806648254, 0.5754950046539307, 0.5983831286430359, 0.6212712526321411, 0.6441594362258911, 0.6670475602149963, 0.6899357438087463, 0.7128238677978516, 0.7357120513916016, 0.7586001753807068, 0.781488299369812, 0.804376482963562, 0.8272646069526672, 0.8501527309417725, 0.8730409145355225, 0.8959290385246277, 0.9188172221183777, 0.9417053461074829, 0.9645934700965881, 0.9874815940856934, 1.0103697776794434, 1.0332579612731934, 1.0561460256576538]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 2.0, 1.0, 6.0, 15.0, 9.0, 9.0, 15.0, 16.0, 16.0, 21.0, 21.0, 24.0, 31.0, 24.0, 45.0, 36.0, 47.0, 35.0, 39.0, 47.0, 52.0, 39.0, 42.0, 40.0, 40.0, 36.0, 40.0, 29.0, 26.0, 30.0, 30.0, 25.0, 13.0, 13.0, 13.0, 9.0, 17.0, 9.0, 9.0, 7.0, 3.0, 1.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.6337622404098511, -0.6144745349884033, -0.5951868891716003, -0.5758991837501526, -0.5566115379333496, -0.5373238325119019, -0.5180361866950989, -0.4987484812736511, -0.47946080565452576, -0.4601731300354004, -0.440885454416275, -0.42159777879714966, -0.4023100733757019, -0.3830224275588989, -0.36373472213745117, -0.3444470465183258, -0.32515937089920044, -0.3058716952800751, -0.2865840196609497, -0.26729634404182434, -0.24800865352153778, -0.22872097790241241, -0.20943328738212585, -0.1901456117630005, -0.17085793614387512, -0.15157026052474976, -0.1322825849056244, -0.11299489438533783, -0.09370721876621246, -0.0744195431470871, -0.055131860077381134, -0.03584417700767517, -0.016556501388549805, 0.00273117795586586, 0.022018857300281525, 0.04130653664469719, 0.060594215989112854, 0.07988189160823822, 0.09916957467794418, 0.11845725774765015, 0.1377449333667755, 0.15703260898590088, 0.17632028460502625, 0.1956079751253128, 0.21489565074443817, 0.23418332636356354, 0.2534710168838501, 0.27275869250297546, 0.29204636812210083, 0.3113340437412262, 0.33062171936035156, 0.34990939497947693, 0.3691970705986023, 0.38848477602005005, 0.4077724516391754, 0.4270601272583008, 0.44634780287742615, 0.4656354784965515, 0.4849231541156769, 0.5042108297348022, 0.52349853515625, 0.542786180973053, 0.5620738863945007, 0.5813615322113037, 0.6006492376327515]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 5.0, 4.0, 3.0, 7.0, 13.0, 7.0, 32.0, 38.0, 65.0, 116.0, 203.0, 349.0, 734.0, 1521.0, 4419.0, 19762.0, 695051.0, 3438326.0, 25039.0, 4998.0, 1783.0, 825.0, 384.0, 210.0, 133.0, 79.0, 55.0, 44.0, 23.0, 19.0, 7.0, 10.0, 7.0, 4.0, 3.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2203369140625, -0.21422767639160156, -0.20811843872070312, -0.2020092010498047, -0.19589996337890625, -0.1897907257080078, -0.18368148803710938, -0.17757225036621094, -0.1714630126953125, -0.16535377502441406, -0.15924453735351562, -0.1531352996826172, -0.14702606201171875, -0.1409168243408203, -0.13480758666992188, -0.12869834899902344, -0.122589111328125, -0.11647987365722656, -0.11037063598632812, -0.10426139831542969, -0.09815216064453125, -0.09204292297363281, -0.08593368530273438, -0.07982444763183594, -0.0737152099609375, -0.06760597229003906, -0.061496734619140625, -0.05538749694824219, -0.04927825927734375, -0.04316902160644531, -0.037059783935546875, -0.030950546264648438, -0.02484130859375, -0.018732070922851562, -0.012622833251953125, -0.0065135955810546875, -0.00040435791015625, 0.0057048797607421875, 0.011814117431640625, 0.017923355102539062, 0.0240325927734375, 0.030141830444335938, 0.036251068115234375, 0.04236030578613281, 0.04846954345703125, 0.05457878112792969, 0.060688018798828125, 0.06679725646972656, 0.072906494140625, 0.07901573181152344, 0.08512496948242188, 0.09123420715332031, 0.09734344482421875, 0.10345268249511719, 0.10956192016601562, 0.11567115783691406, 0.1217803955078125, 0.12788963317871094, 0.13399887084960938, 0.1401081085205078, 0.14621734619140625, 0.1523265838623047, 0.15843582153320312, 0.16454505920410156, 0.170654296875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 7.0, 3.0, 11.0, 12.0, 15.0, 22.0, 25.0, 25.0, 35.0, 41.0, 47.0, 50.0, 70.0, 80.0, 70.0, 68.0, 74.0, 62.0, 53.0, 49.0, 37.0, 34.0, 31.0, 13.0, 23.0, 14.0, 8.0, 10.0, 3.0, 5.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04345703125, -0.041903018951416016, -0.04034900665283203, -0.03879499435424805, -0.03724098205566406, -0.03568696975708008, -0.034132957458496094, -0.03257894515991211, -0.031024932861328125, -0.02947092056274414, -0.027916908264160156, -0.026362895965576172, -0.024808883666992188, -0.023254871368408203, -0.02170085906982422, -0.020146846771240234, -0.01859283447265625, -0.017038822174072266, -0.015484809875488281, -0.013930797576904297, -0.012376785278320312, -0.010822772979736328, -0.009268760681152344, -0.007714748382568359, -0.006160736083984375, -0.004606723785400391, -0.0030527114868164062, -0.0014986991882324219, 5.53131103515625e-05, 0.0016093254089355469, 0.0031633377075195312, 0.004717350006103516, 0.0062713623046875, 0.007825374603271484, 0.009379386901855469, 0.010933399200439453, 0.012487411499023438, 0.014041423797607422, 0.015595436096191406, 0.01714944839477539, 0.018703460693359375, 0.02025747299194336, 0.021811485290527344, 0.023365497589111328, 0.024919509887695312, 0.026473522186279297, 0.02802753448486328, 0.029581546783447266, 0.03113555908203125, 0.032689571380615234, 0.03424358367919922, 0.0357975959777832, 0.03735160827636719, 0.03890562057495117, 0.040459632873535156, 0.04201364517211914, 0.043567657470703125, 0.04512166976928711, 0.046675682067871094, 0.04822969436645508, 0.04978370666503906, 0.05133771896362305, 0.05289173126220703, 0.054445743560791016, 0.055999755859375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 7.0, 13.0, 28.0, 28.0, 53.0, 68.0, 119.0, 199.0, 299.0, 486.0, 780.0, 1430.0, 2680.0, 5537.0, 13518.0, 47255.0, 403278.0, 3527269.0, 145245.0, 27488.0, 9342.0, 4180.0, 2104.0, 1145.0, 637.0, 422.0, 269.0, 126.0, 99.0, 60.0, 32.0, 22.0, 15.0, 16.0, 7.0, 5.0, 5.0, 5.0, 0.0, 1.0, 3.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.08441162109375, -0.08153152465820312, -0.07865142822265625, -0.07577133178710938, -0.0728912353515625, -0.07001113891601562, -0.06713104248046875, -0.06425094604492188, -0.061370849609375, -0.058490753173828125, -0.05561065673828125, -0.052730560302734375, -0.0498504638671875, -0.046970367431640625, -0.04409027099609375, -0.041210174560546875, -0.038330078125, -0.035449981689453125, -0.03256988525390625, -0.029689788818359375, -0.0268096923828125, -0.023929595947265625, -0.02104949951171875, -0.018169403076171875, -0.015289306640625, -0.012409210205078125, -0.00952911376953125, -0.006649017333984375, -0.0037689208984375, -0.000888824462890625, 0.00199127197265625, 0.004871368408203125, 0.00775146484375, 0.010631561279296875, 0.01351165771484375, 0.016391754150390625, 0.0192718505859375, 0.022151947021484375, 0.02503204345703125, 0.027912139892578125, 0.030792236328125, 0.033672332763671875, 0.03655242919921875, 0.039432525634765625, 0.0423126220703125, 0.045192718505859375, 0.04807281494140625, 0.050952911376953125, 0.0538330078125, 0.056713104248046875, 0.05959320068359375, 0.062473297119140625, 0.0653533935546875, 0.06823348999023438, 0.07111358642578125, 0.07399368286132812, 0.076873779296875, 0.07975387573242188, 0.08263397216796875, 0.08551406860351562, 0.0883941650390625, 0.09127426147460938, 0.09415435791015625, 0.09703445434570312, 0.09991455078125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 5.0, 8.0, 9.0, 18.0, 43.0, 50.0, 109.0, 345.0, 2290.0, 788.0, 211.0, 70.0, 45.0, 23.0, 13.0, 5.0, 5.0, 4.0, 5.0, 3.0, 2.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07513427734375, -0.07283782958984375, -0.0705413818359375, -0.06824493408203125, -0.065948486328125, -0.06365203857421875, -0.0613555908203125, -0.05905914306640625, -0.0567626953125, -0.05446624755859375, -0.0521697998046875, -0.04987335205078125, -0.047576904296875, -0.04528045654296875, -0.0429840087890625, -0.04068756103515625, -0.03839111328125, -0.03609466552734375, -0.0337982177734375, -0.03150177001953125, -0.029205322265625, -0.02690887451171875, -0.0246124267578125, -0.02231597900390625, -0.02001953125, -0.01772308349609375, -0.0154266357421875, -0.01313018798828125, -0.010833740234375, -0.00853729248046875, -0.0062408447265625, -0.00394439697265625, -0.00164794921875, 0.00064849853515625, 0.0029449462890625, 0.00524139404296875, 0.007537841796875, 0.00983428955078125, 0.0121307373046875, 0.01442718505859375, 0.0167236328125, 0.01902008056640625, 0.0213165283203125, 0.02361297607421875, 0.025909423828125, 0.02820587158203125, 0.0305023193359375, 0.03279876708984375, 0.03509521484375, 0.03739166259765625, 0.0396881103515625, 0.04198455810546875, 0.044281005859375, 0.04657745361328125, 0.0488739013671875, 0.05117034912109375, 0.053466796875, 0.05576324462890625, 0.0580596923828125, 0.06035614013671875, 0.062652587890625, 0.06494903564453125, 0.0672454833984375, 0.06954193115234375, 0.07183837890625]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 10.0, 6.0, 37.0, 137.0, 308.0, 311.0, 136.0, 38.0, 14.0, 7.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14066611230373383, -0.12036820501089096, -0.1000702977180481, -0.07977239042520523, -0.059474483132362366, -0.0391765758395195, -0.018878668546676636, 0.0014192312955856323, 0.021717146039009094, 0.04201505333185196, 0.062312960624694824, 0.08261086791753769, 0.10290877521038055, 0.12320668250322342, 0.14350458979606628, 0.16380248963832855, 0.18410040438175201, 0.20439830422401428, 0.22469621896743774, 0.2449941337108612, 0.26529204845428467, 0.28558993339538574, 0.3058878481388092, 0.32618576288223267, 0.34648364782333374, 0.3667815625667572, 0.38707947731018066, 0.40737736225128174, 0.4276752769947052, 0.44797319173812866, 0.46827107667922974, 0.4885689914226532, 0.5088669061660767, 0.5291647911071777, 0.5494627356529236, 0.5697606205940247, 0.5900585651397705, 0.6103564500808716, 0.6306543350219727, 0.6509522199630737, 0.6712501645088196, 0.6915480494499207, 0.7118459939956665, 0.7321438789367676, 0.7524417638778687, 0.7727397084236145, 0.7930375933647156, 0.8133355379104614, 0.8336334228515625, 0.8539313077926636, 0.8742292523384094, 0.8945271372795105, 0.9148250818252563, 0.9351229667663574, 0.9554208517074585, 0.9757187366485596, 0.9960166811943054, 1.0163146257400513, 1.0366125106811523, 1.0569103956222534, 1.0772082805633545, 1.0975061655044556, 1.1178041696548462, 1.1381020545959473, 1.1583999395370483]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 10.0, 12.0, 20.0, 29.0, 46.0, 62.0, 68.0, 91.0, 67.0, 102.0, 82.0, 85.0, 73.0, 64.0, 54.0, 54.0, 32.0, 17.0, 16.0, 9.0, 6.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26860177516937256, -0.2596263587474823, -0.25065091252326965, -0.2416754812002182, -0.23270004987716675, -0.2237246334552765, -0.21474920213222504, -0.20577377080917358, -0.19679833948612213, -0.18782290816307068, -0.17884747684001923, -0.16987204551696777, -0.16089662909507751, -0.15192118287086487, -0.1429457664489746, -0.13397033512592316, -0.1249949038028717, -0.11601947247982025, -0.1070440411567688, -0.09806861728429794, -0.08909318596124649, -0.08011775463819504, -0.07114233076572418, -0.06216689944267273, -0.05319146811962128, -0.044216036796569824, -0.03524060919880867, -0.026265179738402367, -0.017289750277996063, -0.00831431895494461, 0.0006611086428165436, 0.009636536240577698, 0.01861196756362915, 0.027587397024035454, 0.03656282648444176, 0.04553825408220291, 0.054513685405254364, 0.06348911672830582, 0.07246454060077667, 0.08143997192382812, 0.09041540324687958, 0.09939083456993103, 0.10836626589298248, 0.11734168976545334, 0.1263171136379242, 0.13529255986213684, 0.1442679762840271, 0.15324340760707855, 0.16221883893013, 0.17119427025318146, 0.1801697015762329, 0.18914513289928436, 0.19812056422233582, 0.20709598064422607, 0.21607141196727753, 0.22504684329032898, 0.23402227461338043, 0.24299770593643188, 0.25197312235832214, 0.2609485685825348, 0.26992398500442505, 0.2788994312286377, 0.28787484765052795, 0.2968502640724182, 0.30582571029663086]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 0.0, 4.0, 4.0, 7.0, 10.0, 8.0, 11.0, 17.0, 35.0, 41.0, 60.0, 90.0, 158.0, 218.0, 419.0, 908.0, 1914.0, 5083.0, 18681.0, 97577.0, 474843.0, 362557.0, 65265.0, 13284.0, 3986.0, 1636.0, 717.0, 377.0, 245.0, 138.0, 86.0, 56.0, 31.0, 20.0, 10.0, 20.0, 9.0, 10.0, 8.0, 6.0, 9.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.126220703125, -0.12185096740722656, -0.11748123168945312, -0.11311149597167969, -0.10874176025390625, -0.10437202453613281, -0.10000228881835938, -0.09563255310058594, -0.0912628173828125, -0.08689308166503906, -0.08252334594726562, -0.07815361022949219, -0.07378387451171875, -0.06941413879394531, -0.06504440307617188, -0.06067466735839844, -0.056304931640625, -0.05193519592285156, -0.047565460205078125, -0.04319572448730469, -0.03882598876953125, -0.03445625305175781, -0.030086517333984375, -0.025716781616210938, -0.0213470458984375, -0.016977310180664062, -0.012607574462890625, -0.008237838745117188, -0.00386810302734375, 0.0005016326904296875, 0.004871368408203125, 0.009241104125976562, 0.01361083984375, 0.017980575561523438, 0.022350311279296875, 0.026720046997070312, 0.03108978271484375, 0.03545951843261719, 0.039829254150390625, 0.04419898986816406, 0.0485687255859375, 0.05293846130371094, 0.057308197021484375, 0.06167793273925781, 0.06604766845703125, 0.07041740417480469, 0.07478713989257812, 0.07915687561035156, 0.083526611328125, 0.08789634704589844, 0.09226608276367188, 0.09663581848144531, 0.10100555419921875, 0.10537528991699219, 0.10974502563476562, 0.11411476135253906, 0.1184844970703125, 0.12285423278808594, 0.12722396850585938, 0.1315937042236328, 0.13596343994140625, 0.1403331756591797, 0.14470291137695312, 0.14907264709472656, 0.1534423828125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 6.0, 10.0, 12.0, 23.0, 22.0, 21.0, 35.0, 36.0, 37.0, 57.0, 54.0, 71.0, 77.0, 66.0, 76.0, 91.0, 57.0, 41.0, 46.0, 27.0, 36.0, 27.0, 13.0, 19.0, 11.0, 10.0, 11.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.04937744140625, -0.047707557678222656, -0.04603767395019531, -0.04436779022216797, -0.042697906494140625, -0.04102802276611328, -0.03935813903808594, -0.037688255310058594, -0.03601837158203125, -0.034348487854003906, -0.03267860412597656, -0.03100872039794922, -0.029338836669921875, -0.02766895294189453, -0.025999069213867188, -0.024329185485839844, -0.0226593017578125, -0.020989418029785156, -0.019319534301757812, -0.01764965057373047, -0.015979766845703125, -0.014309883117675781, -0.012639999389648438, -0.010970115661621094, -0.00930023193359375, -0.007630348205566406, -0.0059604644775390625, -0.004290580749511719, -0.002620697021484375, -0.0009508132934570312, 0.0007190704345703125, 0.0023889541625976562, 0.004058837890625, 0.005728721618652344, 0.0073986053466796875, 0.009068489074707031, 0.010738372802734375, 0.012408256530761719, 0.014078140258789062, 0.015748023986816406, 0.01741790771484375, 0.019087791442871094, 0.020757675170898438, 0.02242755889892578, 0.024097442626953125, 0.02576732635498047, 0.027437210083007812, 0.029107093811035156, 0.0307769775390625, 0.032446861267089844, 0.03411674499511719, 0.03578662872314453, 0.037456512451171875, 0.03912639617919922, 0.04079627990722656, 0.042466163635253906, 0.04413604736328125, 0.045805931091308594, 0.04747581481933594, 0.04914569854736328, 0.050815582275390625, 0.05248546600341797, 0.05415534973144531, 0.055825233459472656, 0.0574951171875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 5.0, 4.0, 5.0, 7.0, 11.0, 23.0, 24.0, 28.0, 40.0, 67.0, 75.0, 136.0, 177.0, 247.0, 454.0, 954.0, 2610.0, 8560.0, 37068.0, 205859.0, 564772.0, 181586.0, 33264.0, 7991.0, 2337.0, 917.0, 458.0, 275.0, 170.0, 126.0, 71.0, 61.0, 42.0, 28.0, 33.0, 24.0, 13.0, 10.0, 5.0, 6.0, 10.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.12841796875, -0.12479686737060547, -0.12117576599121094, -0.1175546646118164, -0.11393356323242188, -0.11031246185302734, -0.10669136047363281, -0.10307025909423828, -0.09944915771484375, -0.09582805633544922, -0.09220695495605469, -0.08858585357666016, -0.08496475219726562, -0.0813436508178711, -0.07772254943847656, -0.07410144805908203, -0.0704803466796875, -0.06685924530029297, -0.06323814392089844, -0.059617042541503906, -0.055995941162109375, -0.052374839782714844, -0.04875373840332031, -0.04513263702392578, -0.04151153564453125, -0.03789043426513672, -0.03426933288574219, -0.030648231506347656, -0.027027130126953125, -0.023406028747558594, -0.019784927368164062, -0.01616382598876953, -0.012542724609375, -0.008921623229980469, -0.0053005218505859375, -0.0016794204711914062, 0.001941680908203125, 0.005562782287597656, 0.009183883666992188, 0.012804985046386719, 0.01642608642578125, 0.02004718780517578, 0.023668289184570312, 0.027289390563964844, 0.030910491943359375, 0.034531593322753906, 0.03815269470214844, 0.04177379608154297, 0.0453948974609375, 0.04901599884033203, 0.05263710021972656, 0.056258201599121094, 0.059879302978515625, 0.06350040435791016, 0.06712150573730469, 0.07074260711669922, 0.07436370849609375, 0.07798480987548828, 0.08160591125488281, 0.08522701263427734, 0.08884811401367188, 0.0924692153930664, 0.09609031677246094, 0.09971141815185547, 0.10333251953125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 11.0, 8.0, 10.0, 17.0, 17.0, 8.0, 21.0, 20.0, 22.0, 28.0, 43.0, 29.0, 42.0, 37.0, 52.0, 36.0, 46.0, 37.0, 53.0, 41.0, 49.0, 38.0, 37.0, 32.0, 28.0, 35.0, 24.0, 29.0, 22.0, 28.0, 17.0, 17.0, 11.0, 16.0, 6.0, 9.0, 12.0, 9.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.1531982421875, -0.14877700805664062, -0.14435577392578125, -0.13993453979492188, -0.1355133056640625, -0.13109207153320312, -0.12667083740234375, -0.12224960327148438, -0.117828369140625, -0.11340713500976562, -0.10898590087890625, -0.10456466674804688, -0.1001434326171875, -0.09572219848632812, -0.09130096435546875, -0.08687973022460938, -0.08245849609375, -0.07803726196289062, -0.07361602783203125, -0.06919479370117188, -0.0647735595703125, -0.060352325439453125, -0.05593109130859375, -0.051509857177734375, -0.047088623046875, -0.042667388916015625, -0.03824615478515625, -0.033824920654296875, -0.0294036865234375, -0.024982452392578125, -0.02056121826171875, -0.016139984130859375, -0.01171875, -0.007297515869140625, -0.00287628173828125, 0.001544952392578125, 0.0059661865234375, 0.010387420654296875, 0.01480865478515625, 0.019229888916015625, 0.023651123046875, 0.028072357177734375, 0.03249359130859375, 0.036914825439453125, 0.0413360595703125, 0.045757293701171875, 0.05017852783203125, 0.054599761962890625, 0.05902099609375, 0.06344223022460938, 0.06786346435546875, 0.07228469848632812, 0.0767059326171875, 0.08112716674804688, 0.08554840087890625, 0.08996963500976562, 0.094390869140625, 0.09881210327148438, 0.10323333740234375, 0.10765457153320312, 0.1120758056640625, 0.11649703979492188, 0.12091827392578125, 0.12533950805664062, 0.1297607421875]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 2.0, 6.0, 11.0, 21.0, 23.0, 31.0, 49.0, 61.0, 121.0, 219.0, 479.0, 1252.0, 4076.0, 25207.0, 703731.0, 293907.0, 14620.0, 2943.0, 905.0, 392.0, 168.0, 118.0, 78.0, 56.0, 33.0, 13.0, 12.0, 10.0, 4.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.139404296875, -0.1359081268310547, -0.13241195678710938, -0.12891578674316406, -0.12541961669921875, -0.12192344665527344, -0.11842727661132812, -0.11493110656738281, -0.1114349365234375, -0.10793876647949219, -0.10444259643554688, -0.10094642639160156, -0.09745025634765625, -0.09395408630371094, -0.09045791625976562, -0.08696174621582031, -0.083465576171875, -0.07996940612792969, -0.07647323608398438, -0.07297706604003906, -0.06948089599609375, -0.06598472595214844, -0.062488555908203125, -0.05899238586425781, -0.0554962158203125, -0.05200004577636719, -0.048503875732421875, -0.04500770568847656, -0.04151153564453125, -0.03801536560058594, -0.034519195556640625, -0.031023025512695312, -0.02752685546875, -0.024030685424804688, -0.020534515380859375, -0.017038345336914062, -0.01354217529296875, -0.010046005249023438, -0.006549835205078125, -0.0030536651611328125, 0.0004425048828125, 0.0039386749267578125, 0.007434844970703125, 0.010931015014648438, 0.01442718505859375, 0.017923355102539062, 0.021419525146484375, 0.024915695190429688, 0.028411865234375, 0.03190803527832031, 0.035404205322265625, 0.03890037536621094, 0.04239654541015625, 0.04589271545410156, 0.049388885498046875, 0.05288505554199219, 0.0563812255859375, 0.05987739562988281, 0.06337356567382812, 0.06686973571777344, 0.07036590576171875, 0.07386207580566406, 0.07735824584960938, 0.08085441589355469, 0.0843505859375]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 1.0, 9.0, 4.0, 12.0, 12.0, 14.0, 20.0, 33.0, 51.0, 51.0, 74.0, 93.0, 106.0, 90.0, 99.0, 79.0, 50.0, 54.0, 35.0, 33.0, 19.0, 16.0, 8.0, 9.0, 10.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.043081283569336e-05, -1.0034069418907166e-05, -9.637326002120972e-06, -9.240582585334778e-06, -8.843839168548584e-06, -8.44709575176239e-06, -8.050352334976196e-06, -7.653608918190002e-06, -7.256865501403809e-06, -6.860122084617615e-06, -6.463378667831421e-06, -6.066635251045227e-06, -5.669891834259033e-06, -5.273148417472839e-06, -4.8764050006866455e-06, -4.479661583900452e-06, -4.082918167114258e-06, -3.686174750328064e-06, -3.28943133354187e-06, -2.8926879167556763e-06, -2.4959444999694824e-06, -2.0992010831832886e-06, -1.7024576663970947e-06, -1.3057142496109009e-06, -9.08970832824707e-07, -5.122274160385132e-07, -1.1548399925231934e-07, 2.812594175338745e-07, 6.780028343200684e-07, 1.0747462511062622e-06, 1.471489667892456e-06, 1.86823308467865e-06, 2.2649765014648438e-06, 2.6617199182510376e-06, 3.0584633350372314e-06, 3.4552067518234253e-06, 3.851950168609619e-06, 4.248693585395813e-06, 4.645437002182007e-06, 5.042180418968201e-06, 5.4389238357543945e-06, 5.835667252540588e-06, 6.232410669326782e-06, 6.629154086112976e-06, 7.02589750289917e-06, 7.422640919685364e-06, 7.819384336471558e-06, 8.216127753257751e-06, 8.612871170043945e-06, 9.00961458683014e-06, 9.406358003616333e-06, 9.803101420402527e-06, 1.019984483718872e-05, 1.0596588253974915e-05, 1.0993331670761108e-05, 1.1390075087547302e-05, 1.1786818504333496e-05, 1.218356192111969e-05, 1.2580305337905884e-05, 1.2977048754692078e-05, 1.3373792171478271e-05, 1.3770535588264465e-05, 1.416727900505066e-05, 1.4564022421836853e-05, 1.4960765838623047e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 0.0, 3.0, 1.0, 4.0, 4.0, 7.0, 9.0, 18.0, 26.0, 42.0, 80.0, 161.0, 304.0, 663.0, 1747.0, 6880.0, 128175.0, 873250.0, 31412.0, 3638.0, 1148.0, 480.0, 229.0, 124.0, 60.0, 40.0, 23.0, 13.0, 8.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1422119140625, -0.13840007781982422, -0.13458824157714844, -0.13077640533447266, -0.12696456909179688, -0.1231527328491211, -0.11934089660644531, -0.11552906036376953, -0.11171722412109375, -0.10790538787841797, -0.10409355163574219, -0.1002817153930664, -0.09646987915039062, -0.09265804290771484, -0.08884620666503906, -0.08503437042236328, -0.0812225341796875, -0.07741069793701172, -0.07359886169433594, -0.06978702545166016, -0.06597518920898438, -0.062163352966308594, -0.05835151672363281, -0.05453968048095703, -0.05072784423828125, -0.04691600799560547, -0.04310417175292969, -0.039292335510253906, -0.035480499267578125, -0.031668663024902344, -0.027856826782226562, -0.02404499053955078, -0.020233154296875, -0.01642131805419922, -0.012609481811523438, -0.008797645568847656, -0.004985809326171875, -0.0011739730834960938, 0.0026378631591796875, 0.006449699401855469, 0.01026153564453125, 0.014073371887207031, 0.017885208129882812, 0.021697044372558594, 0.025508880615234375, 0.029320716857910156, 0.03313255310058594, 0.03694438934326172, 0.0407562255859375, 0.04456806182861328, 0.04837989807128906, 0.052191734313964844, 0.056003570556640625, 0.059815406799316406, 0.06362724304199219, 0.06743907928466797, 0.07125091552734375, 0.07506275177001953, 0.07887458801269531, 0.0826864242553711, 0.08649826049804688, 0.09031009674072266, 0.09412193298339844, 0.09793376922607422, 0.10174560546875]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 3.0, 15.0, 37.0, 75.0, 180.0, 244.0, 220.0, 134.0, 44.0, 22.0, 8.0, 2.0, 6.0, 1.0, 0.0, 0.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.1878662109375, -0.18313312530517578, -0.17840003967285156, -0.17366695404052734, -0.16893386840820312, -0.1642007827758789, -0.1594676971435547, -0.15473461151123047, -0.15000152587890625, -0.14526844024658203, -0.1405353546142578, -0.1358022689819336, -0.13106918334960938, -0.12633609771728516, -0.12160301208496094, -0.11686992645263672, -0.1121368408203125, -0.10740375518798828, -0.10267066955566406, -0.09793758392333984, -0.09320449829101562, -0.0884714126586914, -0.08373832702636719, -0.07900524139404297, -0.07427215576171875, -0.06953907012939453, -0.06480598449707031, -0.060072898864746094, -0.055339813232421875, -0.050606727600097656, -0.04587364196777344, -0.04114055633544922, -0.036407470703125, -0.03167438507080078, -0.026941299438476562, -0.022208213806152344, -0.017475128173828125, -0.012742042541503906, -0.008008956909179688, -0.0032758712768554688, 0.00145721435546875, 0.006190299987792969, 0.010923385620117188, 0.015656471252441406, 0.020389556884765625, 0.025122642517089844, 0.029855728149414062, 0.03458881378173828, 0.0393218994140625, 0.04405498504638672, 0.04878807067871094, 0.053521156311035156, 0.058254241943359375, 0.0629873275756836, 0.06772041320800781, 0.07245349884033203, 0.07718658447265625, 0.08191967010498047, 0.08665275573730469, 0.0913858413696289, 0.09611892700195312, 0.10085201263427734, 0.10558509826660156, 0.11031818389892578, 0.11505126953125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 9.0, 22.0, 43.0, 192.0, 292.0, 281.0, 134.0, 27.0, 9.0, 4.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0013232231140137, -1.93639075756073, -1.8714582920074463, -1.8065259456634521, -1.7415934801101685, -1.6766610145568848, -1.6117286682128906, -1.546796202659607, -1.4818637371063232, -1.4169312715530396, -1.3519988059997559, -1.2870664596557617, -1.222133994102478, -1.1572015285491943, -1.0922691822052002, -1.0273367166519165, -0.9624042510986328, -0.8974717855453491, -0.8325393795967102, -0.7676069736480713, -0.7026745080947876, -0.6377420425415039, -0.572809636592865, -0.5078772306442261, -0.4429447650909424, -0.3780123293399811, -0.3130798935890198, -0.24814745783805847, -0.18321502208709717, -0.11828258633613586, -0.05335015058517456, 0.011582285165786743, 0.07651448249816895, 0.14144691824913025, 0.20637935400009155, 0.27131178975105286, 0.33624422550201416, 0.40117666125297546, 0.46610909700393677, 0.5310415029525757, 0.5959739685058594, 0.6609064340591431, 0.725838840007782, 0.7907712459564209, 0.8557037115097046, 0.9206361770629883, 0.9855685830116272, 1.0505009889602661, 1.1154334545135498, 1.1803659200668335, 1.2452983856201172, 1.3102307319641113, 1.375163197517395, 1.4400956630706787, 1.5050280094146729, 1.5699604749679565, 1.6348929405212402, 1.699825406074524, 1.7647578716278076, 1.8296902179718018, 1.8946226835250854, 1.9595551490783691, 2.0244874954223633, 2.0894200801849365, 2.1543524265289307]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 6.0, 3.0, 4.0, 6.0, 7.0, 8.0, 12.0, 17.0, 24.0, 15.0, 24.0, 32.0, 20.0, 33.0, 24.0, 43.0, 40.0, 36.0, 43.0, 36.0, 53.0, 36.0, 41.0, 45.0, 53.0, 43.0, 33.0, 40.0, 34.0, 16.0, 28.0, 29.0, 26.0, 13.0, 21.0, 14.0, 14.0, 13.0, 7.0, 4.0, 3.0, 2.0, 4.0, 3.0, 2.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.7369064092636108, -0.7143139243125916, -0.6917214393615723, -0.6691288948059082, -0.6465364098548889, -0.6239439249038696, -0.6013514399528503, -0.578758955001831, -0.556166410446167, -0.5335739254951477, -0.5109814405441284, -0.48838892579078674, -0.46579641103744507, -0.4432039260864258, -0.4206114411354065, -0.3980189263820648, -0.37542644143104553, -0.35283395648002625, -0.33024144172668457, -0.3076489567756653, -0.2850564420223236, -0.2624639570713043, -0.23987145721912384, -0.21727895736694336, -0.19468645751476288, -0.1720939576625824, -0.14950145781040192, -0.12690895795822144, -0.10431646555662155, -0.08172396570444107, -0.059131473302841187, -0.036538973450660706, -0.013946473598480225, 0.008646024391055107, 0.03123852238059044, 0.05383101850748062, 0.0764235183596611, 0.09901601821184158, 0.12160851061344147, 0.14420101046562195, 0.16679351031780243, 0.1893860101699829, 0.2119785100221634, 0.23457100987434387, 0.25716349482536316, 0.27975600957870483, 0.3023484945297241, 0.3249409794807434, 0.3475334942340851, 0.37012597918510437, 0.39271849393844604, 0.41531097888946533, 0.437903493642807, 0.4604959785938263, 0.48308849334716797, 0.5056809782981873, 0.5282734632492065, 0.5508659482002258, 0.5734584331512451, 0.5960509777069092, 0.6186434626579285, 0.6412359476089478, 0.663828432559967, 0.6864209175109863, 0.7090134620666504]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 4.0, 6.0, 10.0, 14.0, 23.0, 29.0, 56.0, 64.0, 117.0, 289.0, 683.0, 2269.0, 11099.0, 3816824.0, 348881.0, 10536.0, 2111.0, 694.0, 252.0, 96.0, 85.0, 46.0, 29.0, 19.0, 15.0, 17.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.133056640625, -0.12793540954589844, -0.12281417846679688, -0.11769294738769531, -0.11257171630859375, -0.10745048522949219, -0.10232925415039062, -0.09720802307128906, -0.0920867919921875, -0.08696556091308594, -0.08184432983398438, -0.07672309875488281, -0.07160186767578125, -0.06648063659667969, -0.061359405517578125, -0.05623817443847656, -0.051116943359375, -0.04599571228027344, -0.040874481201171875, -0.03575325012207031, -0.03063201904296875, -0.025510787963867188, -0.020389556884765625, -0.015268325805664062, -0.0101470947265625, -0.0050258636474609375, 9.5367431640625e-05, 0.0052165985107421875, 0.01033782958984375, 0.015459060668945312, 0.020580291748046875, 0.025701522827148438, 0.03082275390625, 0.03594398498535156, 0.041065216064453125, 0.04618644714355469, 0.05130767822265625, 0.05642890930175781, 0.061550140380859375, 0.06667137145996094, 0.0717926025390625, 0.07691383361816406, 0.08203506469726562, 0.08715629577636719, 0.09227752685546875, 0.09739875793457031, 0.10251998901367188, 0.10764122009277344, 0.112762451171875, 0.11788368225097656, 0.12300491333007812, 0.1281261444091797, 0.13324737548828125, 0.1383686065673828, 0.14348983764648438, 0.14861106872558594, 0.1537322998046875, 0.15885353088378906, 0.16397476196289062, 0.1690959930419922, 0.17421722412109375, 0.1793384552001953, 0.18445968627929688, 0.18958091735839844, 0.1947021484375]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 11.0, 15.0, 22.0, 23.0, 25.0, 26.0, 41.0, 34.0, 53.0, 62.0, 72.0, 66.0, 74.0, 66.0, 70.0, 59.0, 41.0, 35.0, 35.0, 28.0, 32.0, 22.0, 21.0, 17.0, 12.0, 10.0, 5.0, 2.0, 0.0, 4.0, 7.0, 1.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.049713134765625, -0.048044681549072266, -0.04637622833251953, -0.0447077751159668, -0.04303932189941406, -0.04137086868286133, -0.039702415466308594, -0.03803396224975586, -0.036365509033203125, -0.03469705581665039, -0.033028602600097656, -0.03136014938354492, -0.029691696166992188, -0.028023242950439453, -0.02635478973388672, -0.024686336517333984, -0.02301788330078125, -0.021349430084228516, -0.01968097686767578, -0.018012523651123047, -0.016344070434570312, -0.014675617218017578, -0.013007164001464844, -0.01133871078491211, -0.009670257568359375, -0.00800180435180664, -0.006333351135253906, -0.004664897918701172, -0.0029964447021484375, -0.0013279914855957031, 0.00034046173095703125, 0.0020089149475097656, 0.0036773681640625, 0.005345821380615234, 0.007014274597167969, 0.008682727813720703, 0.010351181030273438, 0.012019634246826172, 0.013688087463378906, 0.01535654067993164, 0.017024993896484375, 0.01869344711303711, 0.020361900329589844, 0.022030353546142578, 0.023698806762695312, 0.025367259979248047, 0.02703571319580078, 0.028704166412353516, 0.03037261962890625, 0.032041072845458984, 0.03370952606201172, 0.03537797927856445, 0.03704643249511719, 0.03871488571166992, 0.040383338928222656, 0.04205179214477539, 0.043720245361328125, 0.04538869857788086, 0.047057151794433594, 0.04872560501098633, 0.05039405822753906, 0.0520625114440918, 0.05373096466064453, 0.055399417877197266, 0.05706787109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 1.0, 3.0, 6.0, 6.0, 8.0, 11.0, 9.0, 19.0, 25.0, 35.0, 51.0, 83.0, 112.0, 150.0, 189.0, 305.0, 451.0, 658.0, 1108.0, 2147.0, 4763.0, 12466.0, 55153.0, 3924670.0, 155912.0, 21872.0, 6991.0, 3006.0, 1530.0, 811.0, 542.0, 362.0, 233.0, 171.0, 133.0, 85.0, 53.0, 48.0, 27.0, 25.0, 20.0, 12.0, 8.0, 6.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.074462890625, -0.0718698501586914, -0.06927680969238281, -0.06668376922607422, -0.06409072875976562, -0.06149768829345703, -0.05890464782714844, -0.056311607360839844, -0.05371856689453125, -0.051125526428222656, -0.04853248596191406, -0.04593944549560547, -0.043346405029296875, -0.04075336456298828, -0.03816032409667969, -0.035567283630371094, -0.0329742431640625, -0.030381202697753906, -0.027788162231445312, -0.02519512176513672, -0.022602081298828125, -0.02000904083251953, -0.017416000366210938, -0.014822959899902344, -0.01222991943359375, -0.009636878967285156, -0.0070438385009765625, -0.004450798034667969, -0.001857757568359375, 0.0007352828979492188, 0.0033283233642578125, 0.005921363830566406, 0.008514404296875, 0.011107444763183594, 0.013700485229492188, 0.01629352569580078, 0.018886566162109375, 0.02147960662841797, 0.024072647094726562, 0.026665687561035156, 0.02925872802734375, 0.031851768493652344, 0.03444480895996094, 0.03703784942626953, 0.039630889892578125, 0.04222393035888672, 0.04481697082519531, 0.047410011291503906, 0.0500030517578125, 0.052596092224121094, 0.05518913269042969, 0.05778217315673828, 0.060375213623046875, 0.06296825408935547, 0.06556129455566406, 0.06815433502197266, 0.07074737548828125, 0.07334041595458984, 0.07593345642089844, 0.07852649688720703, 0.08111953735351562, 0.08371257781982422, 0.08630561828613281, 0.0888986587524414, 0.09149169921875]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 5.0, 4.0, 4.0, 7.0, 11.0, 8.0, 20.0, 25.0, 60.0, 130.0, 3237.0, 338.0, 101.0, 51.0, 24.0, 13.0, 14.0, 6.0, 3.0, 8.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.02044677734375, -0.019876956939697266, -0.01930713653564453, -0.018737316131591797, -0.018167495727539062, -0.017597675323486328, -0.017027854919433594, -0.01645803451538086, -0.015888214111328125, -0.01531839370727539, -0.014748573303222656, -0.014178752899169922, -0.013608932495117188, -0.013039112091064453, -0.012469291687011719, -0.011899471282958984, -0.01132965087890625, -0.010759830474853516, -0.010190010070800781, -0.009620189666748047, -0.009050369262695312, -0.008480548858642578, -0.007910728454589844, -0.007340908050537109, -0.006771087646484375, -0.006201267242431641, -0.005631446838378906, -0.005061626434326172, -0.0044918060302734375, -0.003921985626220703, -0.0033521652221679688, -0.0027823448181152344, -0.0022125244140625, -0.0016427040100097656, -0.0010728836059570312, -0.0005030632019042969, 6.67572021484375e-05, 0.0006365776062011719, 0.0012063980102539062, 0.0017762184143066406, 0.002346038818359375, 0.0029158592224121094, 0.0034856796264648438, 0.004055500030517578, 0.0046253204345703125, 0.005195140838623047, 0.005764961242675781, 0.006334781646728516, 0.00690460205078125, 0.007474422454833984, 0.008044242858886719, 0.008614063262939453, 0.009183883666992188, 0.009753704071044922, 0.010323524475097656, 0.01089334487915039, 0.011463165283203125, 0.01203298568725586, 0.012602806091308594, 0.013172626495361328, 0.013742446899414062, 0.014312267303466797, 0.014882087707519531, 0.015451908111572266, 0.016021728515625]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 8.0, 11.0, 25.0, 55.0, 106.0, 140.0, 180.0, 163.0, 111.0, 101.0, 49.0, 25.0, 16.0, 7.0, 7.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0], "bins": [-0.1572781205177307, -0.15407098829746246, -0.1508638560771942, -0.14765672385692596, -0.14444959163665771, -0.14124245941638947, -0.13803532719612122, -0.13482818007469177, -0.13162106275558472, -0.12841393053531647, -0.12520679831504822, -0.12199966609477997, -0.11879253387451172, -0.11558540165424347, -0.11237826198339462, -0.10917112976312637, -0.10596399009227753, -0.10275685787200928, -0.09954972565174103, -0.09634259343147278, -0.09313546121120453, -0.08992832899093628, -0.08672118932008743, -0.08351405709981918, -0.08030692487955093, -0.07709979265928268, -0.07389266043901443, -0.07068552821874619, -0.06747838854789734, -0.06427125632762909, -0.06106412410736084, -0.05785699188709259, -0.054649852216243744, -0.051442719995975494, -0.048235587775707245, -0.0450284518301487, -0.04182131960988045, -0.0386141873896122, -0.03540705144405365, -0.0321999192237854, -0.02899278700351715, -0.0257856547832489, -0.022578520700335503, -0.019371386617422104, -0.016164254397153854, -0.012957122176885605, -0.009749988093972206, -0.006542854011058807, -0.003335721790790558, -0.00012858863919973373, 0.0030785445123910904, 0.0062856776639819145, 0.009492810815572739, 0.012699943035840988, 0.015907077118754387, 0.019114211201667786, 0.022321343421936035, 0.025528475642204285, 0.028735609725117683, 0.03194274380803108, 0.03514987602829933, 0.03835700824856758, 0.04156414419412613, 0.04477127641439438, 0.04797840863466263]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 6.0, 11.0, 10.0, 11.0, 17.0, 20.0, 16.0, 32.0, 47.0, 23.0, 28.0, 44.0, 48.0, 40.0, 43.0, 39.0, 43.0, 55.0, 48.0, 37.0, 32.0, 62.0, 46.0, 34.0, 27.0, 36.0, 30.0, 19.0, 17.0, 16.0, 16.0, 8.0, 8.0, 9.0, 8.0, 4.0, 4.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02952110767364502, -0.028329428285360336, -0.027137748897075653, -0.02594606950879097, -0.024754390120506287, -0.023562710732221603, -0.02237103134393692, -0.021179351955652237, -0.019987672567367554, -0.01879599317908287, -0.017604313790798187, -0.016412634402513504, -0.01522095501422882, -0.014029275625944138, -0.012837596237659454, -0.011645916849374771, -0.010454237461090088, -0.009262558072805405, -0.008070878684520721, -0.006879199296236038, -0.005687519907951355, -0.004495840519666672, -0.0033041611313819885, -0.0021124817430973053, -0.0009208023548126221, 0.00027087703347206116, 0.0014625564217567444, 0.0026542358100414276, 0.003845915198326111, 0.005037594586610794, 0.006229273974895477, 0.0074209533631801605, 0.008612632751464844, 0.009804312139749527, 0.01099599152803421, 0.012187670916318893, 0.013379350304603577, 0.01457102969288826, 0.015762709081172943, 0.016954388469457626, 0.01814606785774231, 0.019337747246026993, 0.020529426634311676, 0.02172110602259636, 0.022912785410881042, 0.024104464799165726, 0.02529614418745041, 0.026487823575735092, 0.027679502964019775, 0.02887118235230446, 0.030062861740589142, 0.031254541128873825, 0.03244622051715851, 0.03363789990544319, 0.034829579293727875, 0.03602125868201256, 0.03721293807029724, 0.038404617458581924, 0.03959629684686661, 0.04078797623515129, 0.041979655623435974, 0.04317133501172066, 0.04436301440000534, 0.045554693788290024, 0.04674637317657471]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 12.0, 12.0, 21.0, 44.0, 78.0, 149.0, 390.0, 827.0, 2803.0, 12691.0, 77747.0, 453112.0, 416448.0, 68784.0, 11446.0, 2502.0, 857.0, 321.0, 145.0, 76.0, 29.0, 23.0, 14.0, 9.0, 4.0, 3.0, 2.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1712646484375, -0.16663169860839844, -0.16199874877929688, -0.1573657989501953, -0.15273284912109375, -0.1480998992919922, -0.14346694946289062, -0.13883399963378906, -0.1342010498046875, -0.12956809997558594, -0.12493515014648438, -0.12030220031738281, -0.11566925048828125, -0.11103630065917969, -0.10640335083007812, -0.10177040100097656, -0.097137451171875, -0.09250450134277344, -0.08787155151367188, -0.08323860168457031, -0.07860565185546875, -0.07397270202636719, -0.06933975219726562, -0.06470680236816406, -0.0600738525390625, -0.05544090270996094, -0.050807952880859375, -0.04617500305175781, -0.04154205322265625, -0.03690910339355469, -0.032276153564453125, -0.027643203735351562, -0.02301025390625, -0.018377304077148438, -0.013744354248046875, -0.009111404418945312, -0.00447845458984375, 0.0001544952392578125, 0.004787445068359375, 0.009420394897460938, 0.0140533447265625, 0.018686294555664062, 0.023319244384765625, 0.027952194213867188, 0.03258514404296875, 0.03721809387207031, 0.041851043701171875, 0.04648399353027344, 0.051116943359375, 0.05574989318847656, 0.060382843017578125, 0.06501579284667969, 0.06964874267578125, 0.07428169250488281, 0.07891464233398438, 0.08354759216308594, 0.0881805419921875, 0.09281349182128906, 0.09744644165039062, 0.10207939147949219, 0.10671234130859375, 0.11134529113769531, 0.11597824096679688, 0.12061119079589844, 0.125244140625]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 3.0, 3.0, 7.0, 8.0, 16.0, 19.0, 10.0, 28.0, 26.0, 40.0, 36.0, 47.0, 61.0, 57.0, 75.0, 62.0, 67.0, 62.0, 66.0, 54.0, 41.0, 37.0, 29.0, 29.0, 34.0, 15.0, 17.0, 16.0, 13.0, 10.0, 5.0, 2.0, 3.0, 1.0, 3.0, 4.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049774169921875, -0.04807472229003906, -0.046375274658203125, -0.04467582702636719, -0.04297637939453125, -0.04127693176269531, -0.039577484130859375, -0.03787803649902344, -0.0361785888671875, -0.03447914123535156, -0.032779693603515625, -0.031080245971679688, -0.02938079833984375, -0.027681350708007812, -0.025981903076171875, -0.024282455444335938, -0.0225830078125, -0.020883560180664062, -0.019184112548828125, -0.017484664916992188, -0.01578521728515625, -0.014085769653320312, -0.012386322021484375, -0.010686874389648438, -0.0089874267578125, -0.0072879791259765625, -0.005588531494140625, -0.0038890838623046875, -0.00218963623046875, -0.0004901885986328125, 0.001209259033203125, 0.0029087066650390625, 0.004608154296875, 0.0063076019287109375, 0.008007049560546875, 0.009706497192382812, 0.01140594482421875, 0.013105392456054688, 0.014804840087890625, 0.016504287719726562, 0.0182037353515625, 0.019903182983398438, 0.021602630615234375, 0.023302078247070312, 0.02500152587890625, 0.026700973510742188, 0.028400421142578125, 0.030099868774414062, 0.03179931640625, 0.03349876403808594, 0.035198211669921875, 0.03689765930175781, 0.03859710693359375, 0.04029655456542969, 0.041996002197265625, 0.04369544982910156, 0.0453948974609375, 0.04709434509277344, 0.048793792724609375, 0.05049324035644531, 0.05219268798828125, 0.05389213562011719, 0.055591583251953125, 0.05729103088378906, 0.058990478515625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 4.0, 5.0, 2.0, 10.0, 8.0, 9.0, 18.0, 17.0, 24.0, 24.0, 52.0, 62.0, 81.0, 109.0, 151.0, 236.0, 478.0, 1095.0, 3405.0, 15948.0, 98833.0, 540309.0, 325900.0, 48902.0, 8884.0, 2170.0, 779.0, 357.0, 201.0, 140.0, 91.0, 71.0, 42.0, 40.0, 18.0, 20.0, 20.0, 13.0, 10.0, 4.0, 2.0, 5.0, 2.0, 4.0, 1.0, 2.0, 4.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.107666015625, -0.10392951965332031, -0.10019302368164062, -0.09645652770996094, -0.09272003173828125, -0.08898353576660156, -0.08524703979492188, -0.08151054382324219, -0.0777740478515625, -0.07403755187988281, -0.07030105590820312, -0.06656455993652344, -0.06282806396484375, -0.05909156799316406, -0.055355072021484375, -0.05161857604980469, -0.047882080078125, -0.04414558410644531, -0.040409088134765625, -0.03667259216308594, -0.03293609619140625, -0.029199600219726562, -0.025463104248046875, -0.021726608276367188, -0.0179901123046875, -0.014253616333007812, -0.010517120361328125, -0.0067806243896484375, -0.00304412841796875, 0.0006923675537109375, 0.004428863525390625, 0.008165359497070312, 0.01190185546875, 0.015638351440429688, 0.019374847412109375, 0.023111343383789062, 0.02684783935546875, 0.030584335327148438, 0.034320831298828125, 0.03805732727050781, 0.0417938232421875, 0.04553031921386719, 0.049266815185546875, 0.05300331115722656, 0.05673980712890625, 0.06047630310058594, 0.06421279907226562, 0.06794929504394531, 0.071685791015625, 0.07542228698730469, 0.07915878295898438, 0.08289527893066406, 0.08663177490234375, 0.09036827087402344, 0.09410476684570312, 0.09784126281738281, 0.1015777587890625, 0.10531425476074219, 0.10905075073242188, 0.11278724670410156, 0.11652374267578125, 0.12026023864746094, 0.12399673461914062, 0.1277332305908203, 0.1314697265625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 7.0, 8.0, 6.0, 9.0, 8.0, 19.0, 12.0, 26.0, 16.0, 23.0, 30.0, 22.0, 36.0, 39.0, 34.0, 51.0, 48.0, 59.0, 38.0, 42.0, 54.0, 43.0, 45.0, 41.0, 40.0, 39.0, 29.0, 36.0, 24.0, 33.0, 19.0, 17.0, 7.0, 13.0, 10.0, 3.0, 3.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.1605224609375, -0.15557861328125, -0.150634765625, -0.14569091796875, -0.1407470703125, -0.13580322265625, -0.130859375, -0.12591552734375, -0.1209716796875, -0.11602783203125, -0.111083984375, -0.10614013671875, -0.1011962890625, -0.09625244140625, -0.09130859375, -0.08636474609375, -0.0814208984375, -0.07647705078125, -0.071533203125, -0.06658935546875, -0.0616455078125, -0.05670166015625, -0.0517578125, -0.04681396484375, -0.0418701171875, -0.03692626953125, -0.031982421875, -0.02703857421875, -0.0220947265625, -0.01715087890625, -0.01220703125, -0.00726318359375, -0.0023193359375, 0.00262451171875, 0.007568359375, 0.01251220703125, 0.0174560546875, 0.02239990234375, 0.02734375, 0.03228759765625, 0.0372314453125, 0.04217529296875, 0.047119140625, 0.05206298828125, 0.0570068359375, 0.06195068359375, 0.06689453125, 0.07183837890625, 0.0767822265625, 0.08172607421875, 0.086669921875, 0.09161376953125, 0.0965576171875, 0.10150146484375, 0.1064453125, 0.11138916015625, 0.1163330078125, 0.12127685546875, 0.126220703125, 0.13116455078125, 0.1361083984375, 0.14105224609375, 0.14599609375, 0.15093994140625, 0.1558837890625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 6.0, 5.0, 11.0, 17.0, 25.0, 39.0, 63.0, 80.0, 195.0, 347.0, 667.0, 1536.0, 3981.0, 12697.0, 55261.0, 314772.0, 524387.0, 103273.0, 21295.0, 5816.0, 2151.0, 942.0, 450.0, 241.0, 114.0, 70.0, 50.0, 24.0, 18.0, 12.0, 4.0, 7.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.05084228515625, -0.0496370792388916, -0.0484318733215332, -0.047226667404174805, -0.046021461486816406, -0.04481625556945801, -0.04361104965209961, -0.04240584373474121, -0.04120063781738281, -0.039995431900024414, -0.038790225982666016, -0.03758502006530762, -0.03637981414794922, -0.03517460823059082, -0.03396940231323242, -0.03276419639587402, -0.031558990478515625, -0.030353784561157227, -0.029148578643798828, -0.02794337272644043, -0.02673816680908203, -0.025532960891723633, -0.024327754974365234, -0.023122549057006836, -0.021917343139648438, -0.02071213722229004, -0.01950693130493164, -0.018301725387573242, -0.017096519470214844, -0.015891313552856445, -0.014686107635498047, -0.013480901718139648, -0.01227569580078125, -0.011070489883422852, -0.009865283966064453, -0.008660078048706055, -0.007454872131347656, -0.006249666213989258, -0.005044460296630859, -0.003839254379272461, -0.0026340484619140625, -0.001428842544555664, -0.00022363662719726562, 0.0009815692901611328, 0.0021867752075195312, 0.0033919811248779297, 0.004597187042236328, 0.0058023929595947266, 0.007007598876953125, 0.008212804794311523, 0.009418010711669922, 0.01062321662902832, 0.011828422546386719, 0.013033628463745117, 0.014238834381103516, 0.015444040298461914, 0.016649246215820312, 0.01785445213317871, 0.01905965805053711, 0.020264863967895508, 0.021470069885253906, 0.022675275802612305, 0.023880481719970703, 0.0250856876373291, 0.0262908935546875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 3.0, 11.0, 6.0, 15.0, 22.0, 19.0, 31.0, 32.0, 43.0, 35.0, 51.0, 74.0, 66.0, 64.0, 83.0, 67.0, 63.0, 58.0, 62.0, 40.0, 24.0, 25.0, 25.0, 11.0, 9.0, 7.0, 12.0, 11.0, 3.0, 3.0, 7.0, 3.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.344650268554688e-06, -8.083879947662354e-06, -7.82310962677002e-06, -7.5623393058776855e-06, -7.3015689849853516e-06, -7.040798664093018e-06, -6.780028343200684e-06, -6.51925802230835e-06, -6.258487701416016e-06, -5.997717380523682e-06, -5.736947059631348e-06, -5.476176738739014e-06, -5.21540641784668e-06, -4.954636096954346e-06, -4.693865776062012e-06, -4.433095455169678e-06, -4.172325134277344e-06, -3.91155481338501e-06, -3.6507844924926758e-06, -3.390014171600342e-06, -3.129243850708008e-06, -2.868473529815674e-06, -2.60770320892334e-06, -2.346932888031006e-06, -2.086162567138672e-06, -1.8253922462463379e-06, -1.564621925354004e-06, -1.30385160446167e-06, -1.043081283569336e-06, -7.82310962677002e-07, -5.21540641784668e-07, -2.60770320892334e-07, 0.0, 2.60770320892334e-07, 5.21540641784668e-07, 7.82310962677002e-07, 1.043081283569336e-06, 1.30385160446167e-06, 1.564621925354004e-06, 1.8253922462463379e-06, 2.086162567138672e-06, 2.346932888031006e-06, 2.60770320892334e-06, 2.868473529815674e-06, 3.129243850708008e-06, 3.390014171600342e-06, 3.6507844924926758e-06, 3.91155481338501e-06, 4.172325134277344e-06, 4.433095455169678e-06, 4.693865776062012e-06, 4.954636096954346e-06, 5.21540641784668e-06, 5.476176738739014e-06, 5.736947059631348e-06, 5.997717380523682e-06, 6.258487701416016e-06, 6.51925802230835e-06, 6.780028343200684e-06, 7.040798664093018e-06, 7.3015689849853516e-06, 7.5623393058776855e-06, 7.82310962677002e-06, 8.083879947662354e-06, 8.344650268554688e-06]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 4.0, 8.0, 12.0, 22.0, 19.0, 41.0, 71.0, 114.0, 235.0, 632.0, 2130.0, 10820.0, 94862.0, 679564.0, 232177.0, 22572.0, 3632.0, 936.0, 324.0, 159.0, 65.0, 51.0, 34.0, 27.0, 18.0, 10.0, 4.0, 5.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.049407958984375, -0.0476231575012207, -0.045838356018066406, -0.04405355453491211, -0.04226875305175781, -0.040483951568603516, -0.03869915008544922, -0.03691434860229492, -0.035129547119140625, -0.03334474563598633, -0.03155994415283203, -0.029775142669677734, -0.027990341186523438, -0.02620553970336914, -0.024420738220214844, -0.022635936737060547, -0.02085113525390625, -0.019066333770751953, -0.017281532287597656, -0.01549673080444336, -0.013711929321289062, -0.011927127838134766, -0.010142326354980469, -0.008357524871826172, -0.006572723388671875, -0.004787921905517578, -0.0030031204223632812, -0.0012183189392089844, 0.0005664825439453125, 0.0023512840270996094, 0.004136085510253906, 0.005920886993408203, 0.0077056884765625, 0.009490489959716797, 0.011275291442871094, 0.01306009292602539, 0.014844894409179688, 0.016629695892333984, 0.01841449737548828, 0.020199298858642578, 0.021984100341796875, 0.023768901824951172, 0.02555370330810547, 0.027338504791259766, 0.029123306274414062, 0.03090810775756836, 0.032692909240722656, 0.03447771072387695, 0.03626251220703125, 0.03804731369018555, 0.039832115173339844, 0.04161691665649414, 0.04340171813964844, 0.045186519622802734, 0.04697132110595703, 0.04875612258911133, 0.050540924072265625, 0.05232572555541992, 0.05411052703857422, 0.055895328521728516, 0.05768013000488281, 0.05946493148803711, 0.061249732971191406, 0.0630345344543457, 0.0648193359375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 1.0, 6.0, 4.0, 5.0, 5.0, 7.0, 10.0, 17.0, 24.0, 14.0, 20.0, 33.0, 31.0, 45.0, 60.0, 70.0, 47.0, 63.0, 79.0, 63.0, 74.0, 47.0, 47.0, 38.0, 35.0, 36.0, 30.0, 19.0, 19.0, 14.0, 13.0, 4.0, 7.0, 4.0, 3.0, 3.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.035675048828125, -0.0345916748046875, -0.03350830078125, -0.0324249267578125, -0.031341552734375, -0.0302581787109375, -0.0291748046875, -0.0280914306640625, -0.027008056640625, -0.0259246826171875, -0.02484130859375, -0.0237579345703125, -0.022674560546875, -0.0215911865234375, -0.0205078125, -0.0194244384765625, -0.018341064453125, -0.0172576904296875, -0.01617431640625, -0.0150909423828125, -0.014007568359375, -0.0129241943359375, -0.0118408203125, -0.0107574462890625, -0.009674072265625, -0.0085906982421875, -0.00750732421875, -0.0064239501953125, -0.005340576171875, -0.0042572021484375, -0.003173828125, -0.0020904541015625, -0.001007080078125, 7.62939453125e-05, 0.00115966796875, 0.0022430419921875, 0.003326416015625, 0.0044097900390625, 0.0054931640625, 0.0065765380859375, 0.007659912109375, 0.0087432861328125, 0.00982666015625, 0.0109100341796875, 0.011993408203125, 0.0130767822265625, 0.01416015625, 0.0152435302734375, 0.016326904296875, 0.0174102783203125, 0.01849365234375, 0.0195770263671875, 0.020660400390625, 0.0217437744140625, 0.0228271484375, 0.0239105224609375, 0.024993896484375, 0.0260772705078125, 0.02716064453125, 0.0282440185546875, 0.029327392578125, 0.0304107666015625, 0.031494140625, 0.0325775146484375, 0.033660888671875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 5.0, 8.0, 31.0, 81.0, 155.0, 251.0, 246.0, 145.0, 53.0, 24.0, 10.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5174418687820435, -0.46977996826171875, -0.42211806774139404, -0.37445613741874695, -0.32679423689842224, -0.27913233637809753, -0.23147040605545044, -0.18380850553512573, -0.13614660501480103, -0.08848469704389572, -0.04082278907299042, 0.006839126348495483, 0.05450102686882019, 0.1021629273891449, 0.149824857711792, 0.1974867582321167, 0.2451486587524414, 0.2928105592727661, 0.3404724597930908, 0.3881343901157379, 0.4357962906360626, 0.48345819115638733, 0.5311201214790344, 0.5787820219993591, 0.6264439225196838, 0.6741058230400085, 0.7217677235603333, 0.7694296836853027, 0.8170915842056274, 0.8647534847259521, 0.9124153852462769, 0.9600772857666016, 1.0077390670776367, 1.0554009675979614, 1.1030628681182861, 1.1507247686386108, 1.1983866691589355, 1.2460485696792603, 1.293710470199585, 1.3413724899291992, 1.3890342712402344, 1.436696171760559, 1.4843580722808838, 1.5320199728012085, 1.5796818733215332, 1.627343773841858, 1.6750056743621826, 1.7226676940917969, 1.7703295946121216, 1.8179914951324463, 1.865653395652771, 1.9133152961730957, 1.9609771966934204, 2.008639097213745, 2.0563011169433594, 2.1039628982543945, 2.151624917984009, 2.199286937713623, 2.246948719024658, 2.2946107387542725, 2.3422725200653076, 2.389934539794922, 2.437596321105957, 2.4852583408355713, 2.5329201221466064]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 4.0, 3.0, 2.0, 5.0, 7.0, 2.0, 5.0, 5.0, 9.0, 11.0, 8.0, 15.0, 9.0, 12.0, 19.0, 27.0, 20.0, 25.0, 10.0, 39.0, 34.0, 32.0, 48.0, 43.0, 40.0, 50.0, 48.0, 39.0, 43.0, 30.0, 43.0, 36.0, 23.0, 33.0, 32.0, 30.0, 21.0, 22.0, 17.0, 17.0, 19.0, 19.0, 11.0, 6.0, 6.0, 10.0, 5.0, 5.0, 4.0, 5.0, 2.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.6328861713409424, -0.6122980713844299, -0.5917100310325623, -0.5711219310760498, -0.5505338311195374, -0.5299457311630249, -0.5093576908111572, -0.4887695908546448, -0.4681815207004547, -0.44759345054626465, -0.4270053505897522, -0.40641728043556213, -0.38582921028137207, -0.3652411103248596, -0.34465304017066956, -0.3240649700164795, -0.30347687005996704, -0.282888799905777, -0.2623006999492645, -0.24171262979507446, -0.2211245447397232, -0.20053645968437195, -0.17994838953018188, -0.15936030447483063, -0.13877221941947937, -0.11818413436412811, -0.09759605675935745, -0.07700797915458679, -0.056419894099235535, -0.03583180904388428, -0.015243731439113617, 0.0053443461656570435, 0.025932490825653076, 0.046520572155714035, 0.067108653485775, 0.08769673109054565, 0.10828481614589691, 0.12887290120124817, 0.14946097135543823, 0.1700490564107895, 0.19063714146614075, 0.211225226521492, 0.23181331157684326, 0.2524013817310333, 0.2729894518852234, 0.29357755184173584, 0.3141656219959259, 0.33475369215011597, 0.3553417921066284, 0.3759298622608185, 0.39651796221733093, 0.417106032371521, 0.43769413232803345, 0.4582822024822235, 0.4788702726364136, 0.499458372592926, 0.5200464725494385, 0.5406345725059509, 0.5612226128578186, 0.581810712814331, 0.6023988127708435, 0.622986912727356, 0.6435749530792236, 0.6641630530357361, 0.6847510933876038]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 6.0, 7.0, 11.0, 16.0, 22.0, 33.0, 55.0, 89.0, 130.0, 203.0, 399.0, 761.0, 1695.0, 5115.0, 20670.0, 3899504.0, 242060.0, 16201.0, 4204.0, 1542.0, 646.0, 350.0, 186.0, 133.0, 79.0, 44.0, 39.0, 24.0, 20.0, 7.0, 7.0, 9.0, 7.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.11590576171875, -0.11248970031738281, -0.10907363891601562, -0.10565757751464844, -0.10224151611328125, -0.09882545471191406, -0.09540939331054688, -0.09199333190917969, -0.0885772705078125, -0.08516120910644531, -0.08174514770507812, -0.07832908630371094, -0.07491302490234375, -0.07149696350097656, -0.06808090209960938, -0.06466484069824219, -0.061248779296875, -0.05783271789550781, -0.054416656494140625, -0.05100059509277344, -0.04758453369140625, -0.04416847229003906, -0.040752410888671875, -0.03733634948730469, -0.0339202880859375, -0.030504226684570312, -0.027088165283203125, -0.023672103881835938, -0.02025604248046875, -0.016839981079101562, -0.013423919677734375, -0.010007858276367188, -0.006591796875, -0.0031757354736328125, 0.000240325927734375, 0.0036563873291015625, 0.00707244873046875, 0.010488510131835938, 0.013904571533203125, 0.017320632934570312, 0.0207366943359375, 0.024152755737304688, 0.027568817138671875, 0.030984878540039062, 0.03440093994140625, 0.03781700134277344, 0.041233062744140625, 0.04464912414550781, 0.048065185546875, 0.05148124694824219, 0.054897308349609375, 0.05831336975097656, 0.06172943115234375, 0.06514549255371094, 0.06856155395507812, 0.07197761535644531, 0.0753936767578125, 0.07880973815917969, 0.08222579956054688, 0.08564186096191406, 0.08905792236328125, 0.09247398376464844, 0.09589004516601562, 0.09930610656738281, 0.10272216796875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 10.0, 10.0, 14.0, 12.0, 21.0, 25.0, 31.0, 23.0, 36.0, 39.0, 50.0, 54.0, 64.0, 77.0, 63.0, 64.0, 67.0, 66.0, 52.0, 42.0, 39.0, 34.0, 23.0, 21.0, 13.0, 17.0, 9.0, 8.0, 5.0, 6.0, 2.0, 4.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05035400390625, -0.04865598678588867, -0.046957969665527344, -0.045259952545166016, -0.04356193542480469, -0.04186391830444336, -0.04016590118408203, -0.0384678840637207, -0.036769866943359375, -0.03507184982299805, -0.03337383270263672, -0.03167581558227539, -0.029977798461914062, -0.028279781341552734, -0.026581764221191406, -0.024883747100830078, -0.02318572998046875, -0.021487712860107422, -0.019789695739746094, -0.018091678619384766, -0.016393661499023438, -0.01469564437866211, -0.012997627258300781, -0.011299610137939453, -0.009601593017578125, -0.007903575897216797, -0.006205558776855469, -0.004507541656494141, -0.0028095245361328125, -0.0011115074157714844, 0.0005865097045898438, 0.002284526824951172, 0.0039825439453125, 0.005680561065673828, 0.007378578186035156, 0.009076595306396484, 0.010774612426757812, 0.01247262954711914, 0.014170646667480469, 0.015868663787841797, 0.017566680908203125, 0.019264698028564453, 0.02096271514892578, 0.02266073226928711, 0.024358749389648438, 0.026056766510009766, 0.027754783630371094, 0.029452800750732422, 0.03115081787109375, 0.03284883499145508, 0.034546852111816406, 0.036244869232177734, 0.03794288635253906, 0.03964090347290039, 0.04133892059326172, 0.04303693771362305, 0.044734954833984375, 0.0464329719543457, 0.04813098907470703, 0.04982900619506836, 0.05152702331542969, 0.053225040435791016, 0.054923057556152344, 0.05662107467651367, 0.058319091796875]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 5.0, 8.0, 13.0, 13.0, 26.0, 37.0, 40.0, 68.0, 70.0, 98.0, 165.0, 206.0, 337.0, 407.0, 597.0, 871.0, 1288.0, 2194.0, 3909.0, 8529.0, 22577.0, 88795.0, 3846554.0, 162547.0, 31587.0, 11014.0, 4966.0, 2540.0, 1493.0, 998.0, 678.0, 482.0, 324.0, 240.0, 188.0, 129.0, 74.0, 62.0, 57.0, 29.0, 17.0, 15.0, 13.0, 13.0, 6.0, 2.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0565185546875, -0.05488729476928711, -0.05325603485107422, -0.05162477493286133, -0.04999351501464844, -0.04836225509643555, -0.046730995178222656, -0.045099735260009766, -0.043468475341796875, -0.041837215423583984, -0.040205955505371094, -0.0385746955871582, -0.03694343566894531, -0.03531217575073242, -0.03368091583251953, -0.03204965591430664, -0.03041839599609375, -0.02878713607788086, -0.02715587615966797, -0.025524616241455078, -0.023893356323242188, -0.022262096405029297, -0.020630836486816406, -0.018999576568603516, -0.017368316650390625, -0.015737056732177734, -0.014105796813964844, -0.012474536895751953, -0.010843276977539062, -0.009212017059326172, -0.007580757141113281, -0.005949497222900391, -0.0043182373046875, -0.0026869773864746094, -0.0010557174682617188, 0.0005755424499511719, 0.0022068023681640625, 0.003838062286376953, 0.005469322204589844, 0.007100582122802734, 0.008731842041015625, 0.010363101959228516, 0.011994361877441406, 0.013625621795654297, 0.015256881713867188, 0.016888141632080078, 0.01851940155029297, 0.02015066146850586, 0.02178192138671875, 0.02341318130493164, 0.02504444122314453, 0.026675701141357422, 0.028306961059570312, 0.029938220977783203, 0.031569480895996094, 0.033200740814208984, 0.034832000732421875, 0.036463260650634766, 0.038094520568847656, 0.03972578048706055, 0.04135704040527344, 0.04298830032348633, 0.04461956024169922, 0.04625082015991211, 0.047882080078125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 4.0, 4.0, 10.0, 20.0, 14.0, 20.0, 39.0, 62.0, 90.0, 329.0, 3157.0, 142.0, 65.0, 32.0, 21.0, 21.0, 8.0, 7.0, 3.0, 7.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0147705078125, -0.014296770095825195, -0.01382303237915039, -0.013349294662475586, -0.012875556945800781, -0.012401819229125977, -0.011928081512451172, -0.011454343795776367, -0.010980606079101562, -0.010506868362426758, -0.010033130645751953, -0.009559392929077148, -0.009085655212402344, -0.008611917495727539, -0.008138179779052734, -0.00766444206237793, -0.007190704345703125, -0.00671696662902832, -0.006243228912353516, -0.005769491195678711, -0.005295753479003906, -0.0048220157623291016, -0.004348278045654297, -0.003874540328979492, -0.0034008026123046875, -0.002927064895629883, -0.002453327178955078, -0.0019795894622802734, -0.0015058517456054688, -0.001032114028930664, -0.0005583763122558594, -8.463859558105469e-05, 0.00038909912109375, 0.0008628368377685547, 0.0013365745544433594, 0.001810312271118164, 0.0022840499877929688, 0.0027577877044677734, 0.003231525421142578, 0.003705263137817383, 0.0041790008544921875, 0.004652738571166992, 0.005126476287841797, 0.0056002140045166016, 0.006073951721191406, 0.006547689437866211, 0.007021427154541016, 0.00749516487121582, 0.007968902587890625, 0.00844264030456543, 0.008916378021240234, 0.009390115737915039, 0.009863853454589844, 0.010337591171264648, 0.010811328887939453, 0.011285066604614258, 0.011758804321289062, 0.012232542037963867, 0.012706279754638672, 0.013180017471313477, 0.013653755187988281, 0.014127492904663086, 0.01460123062133789, 0.015074968338012695, 0.0155487060546875]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 8.0, 16.0, 23.0, 41.0, 66.0, 119.0, 202.0, 164.0, 140.0, 109.0, 66.0, 31.0, 16.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.16769087314605713, -0.16424518823623657, -0.16079950332641602, -0.15735380351543427, -0.1539081186056137, -0.15046243369579315, -0.1470167338848114, -0.14357104897499084, -0.1401253640651703, -0.13667967915534973, -0.13323399424552917, -0.12978829443454742, -0.12634260952472687, -0.12289692461490631, -0.11945123225450516, -0.116005539894104, -0.11255985498428345, -0.10911417007446289, -0.10566847771406174, -0.10222278535366058, -0.09877710044384003, -0.09533141553401947, -0.09188572317361832, -0.08844003081321716, -0.0849943459033966, -0.08154866099357605, -0.0781029686331749, -0.07465727627277374, -0.07121159136295319, -0.06776590645313263, -0.06432021409273148, -0.06087452545762062, -0.05742884427309036, -0.05398315563797951, -0.05053746700286865, -0.0470917783677578, -0.04364608973264694, -0.04020040109753609, -0.03675471246242523, -0.03330902382731438, -0.02986333519220352, -0.026417646557092667, -0.02297195792198181, -0.019526269286870956, -0.0160805806517601, -0.012634892016649246, -0.009189203381538391, -0.005743514746427536, -0.002297826111316681, 0.0011478625237941742, 0.004593551158905029, 0.008039239794015884, 0.01148492842912674, 0.014930617064237595, 0.01837630569934845, 0.021821994334459305, 0.02526768296957016, 0.028713371604681015, 0.03215906023979187, 0.035604748874902725, 0.03905043751001358, 0.042496126145124435, 0.04594181478023529, 0.049387503415346146, 0.052833192050457]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 13.0, 9.0, 10.0, 21.0, 18.0, 19.0, 26.0, 20.0, 28.0, 21.0, 32.0, 28.0, 47.0, 37.0, 37.0, 34.0, 45.0, 41.0, 41.0, 30.0, 46.0, 33.0, 28.0, 41.0, 28.0, 46.0, 32.0, 31.0, 30.0, 21.0, 25.0, 19.0, 11.0, 12.0, 9.0, 7.0, 11.0, 2.0, 1.0, 6.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.03432697057723999, -0.033227089792490005, -0.03212720900774002, -0.031027331948280334, -0.02992745116353035, -0.028827570378780365, -0.02772769145667553, -0.026627812534570694, -0.02552793174982071, -0.024428050965070724, -0.02332817204296589, -0.022228293120861053, -0.02112841233611107, -0.020028531551361084, -0.01892865262925625, -0.017828773707151413, -0.016728892922401428, -0.015629012137651443, -0.014529133215546608, -0.013429253362119198, -0.012329373508691788, -0.011229493655264378, -0.010129613801836967, -0.009029733948409557, -0.007929854094982147, -0.006829974241554737, -0.005730094388127327, -0.004630214534699917, -0.0035303346812725067, -0.0024304548278450966, -0.0013305749744176865, -0.00023069512099027634, 0.0008691847324371338, 0.001969064585864544, 0.003068944439291954, 0.004168824292719364, 0.005268704146146774, 0.006368583999574184, 0.0074684638530015945, 0.008568343706429005, 0.009668223559856415, 0.010768103413283825, 0.011867983266711235, 0.012967863120138645, 0.014067742973566055, 0.015167622826993465, 0.016267502680420876, 0.01736738160252571, 0.018467262387275696, 0.01956714317202568, 0.020667022094130516, 0.02176690101623535, 0.022866781800985336, 0.02396666258573532, 0.025066541507840157, 0.026166420429944992, 0.027266301214694977, 0.02836618199944496, 0.029466060921549797, 0.030565939843654633, 0.03166582062840462, 0.0327657014131546, 0.03386557847261429, 0.03496545925736427, 0.03606534004211426]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 1.0, 3.0, 4.0, 8.0, 8.0, 8.0, 22.0, 26.0, 65.0, 94.0, 154.0, 264.0, 512.0, 1131.0, 2909.0, 8601.0, 31617.0, 136245.0, 451622.0, 312634.0, 74966.0, 18451.0, 5422.0, 1922.0, 879.0, 442.0, 242.0, 93.0, 63.0, 59.0, 32.0, 24.0, 9.0, 3.0, 11.0, 6.0, 4.0, 1.0, 3.0, 3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08837890625, -0.08508110046386719, -0.08178329467773438, -0.07848548889160156, -0.07518768310546875, -0.07188987731933594, -0.06859207153320312, -0.06529426574707031, -0.0619964599609375, -0.05869865417480469, -0.055400848388671875, -0.05210304260253906, -0.04880523681640625, -0.04550743103027344, -0.042209625244140625, -0.03891181945800781, -0.035614013671875, -0.03231620788574219, -0.029018402099609375, -0.025720596313476562, -0.02242279052734375, -0.019124984741210938, -0.015827178955078125, -0.012529373168945312, -0.0092315673828125, -0.0059337615966796875, -0.002635955810546875, 0.0006618499755859375, 0.00395965576171875, 0.0072574615478515625, 0.010555267333984375, 0.013853073120117188, 0.01715087890625, 0.020448684692382812, 0.023746490478515625, 0.027044296264648438, 0.03034210205078125, 0.03363990783691406, 0.036937713623046875, 0.04023551940917969, 0.0435333251953125, 0.04683113098144531, 0.050128936767578125, 0.05342674255371094, 0.05672454833984375, 0.06002235412597656, 0.06332015991210938, 0.06661796569824219, 0.069915771484375, 0.07321357727050781, 0.07651138305664062, 0.07980918884277344, 0.08310699462890625, 0.08640480041503906, 0.08970260620117188, 0.09300041198730469, 0.0962982177734375, 0.09959602355957031, 0.10289382934570312, 0.10619163513183594, 0.10948944091796875, 0.11278724670410156, 0.11608505249023438, 0.11938285827636719, 0.1226806640625]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 5.0, 9.0, 3.0, 9.0, 15.0, 10.0, 28.0, 33.0, 35.0, 17.0, 45.0, 45.0, 58.0, 66.0, 64.0, 65.0, 59.0, 77.0, 56.0, 62.0, 44.0, 36.0, 30.0, 31.0, 25.0, 21.0, 15.0, 11.0, 9.0, 6.0, 6.0, 4.0, 2.0, 2.0, 1.0, 2.0, 2.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.05133056640625, -0.049622535705566406, -0.04791450500488281, -0.04620647430419922, -0.044498443603515625, -0.04279041290283203, -0.04108238220214844, -0.039374351501464844, -0.03766632080078125, -0.035958290100097656, -0.03425025939941406, -0.03254222869873047, -0.030834197998046875, -0.02912616729736328, -0.027418136596679688, -0.025710105895996094, -0.0240020751953125, -0.022294044494628906, -0.020586013793945312, -0.01887798309326172, -0.017169952392578125, -0.015461921691894531, -0.013753890991210938, -0.012045860290527344, -0.01033782958984375, -0.008629798889160156, -0.0069217681884765625, -0.005213737487792969, -0.003505706787109375, -0.0017976760864257812, -8.96453857421875e-05, 0.0016183853149414062, 0.003326416015625, 0.005034446716308594, 0.0067424774169921875, 0.008450508117675781, 0.010158538818359375, 0.011866569519042969, 0.013574600219726562, 0.015282630920410156, 0.01699066162109375, 0.018698692321777344, 0.020406723022460938, 0.02211475372314453, 0.023822784423828125, 0.02553081512451172, 0.027238845825195312, 0.028946876525878906, 0.0306549072265625, 0.032362937927246094, 0.03407096862792969, 0.03577899932861328, 0.037487030029296875, 0.03919506072998047, 0.04090309143066406, 0.042611122131347656, 0.04431915283203125, 0.046027183532714844, 0.04773521423339844, 0.04944324493408203, 0.051151275634765625, 0.05285930633544922, 0.05456733703613281, 0.056275367736816406, 0.0579833984375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 10.0, 10.0, 15.0, 14.0, 18.0, 34.0, 48.0, 68.0, 76.0, 115.0, 198.0, 342.0, 685.0, 1676.0, 5038.0, 20860.0, 134832.0, 640358.0, 204387.0, 29213.0, 6516.0, 2084.0, 872.0, 406.0, 203.0, 146.0, 96.0, 53.0, 45.0, 31.0, 28.0, 15.0, 9.0, 16.0, 11.0, 5.0, 2.0, 11.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10137939453125, -0.09783458709716797, -0.09428977966308594, -0.0907449722290039, -0.08720016479492188, -0.08365535736083984, -0.08011054992675781, -0.07656574249267578, -0.07302093505859375, -0.06947612762451172, -0.06593132019042969, -0.062386512756347656, -0.058841705322265625, -0.055296897888183594, -0.05175209045410156, -0.04820728302001953, -0.0446624755859375, -0.04111766815185547, -0.03757286071777344, -0.034028053283691406, -0.030483245849609375, -0.026938438415527344, -0.023393630981445312, -0.01984882354736328, -0.01630401611328125, -0.012759208679199219, -0.009214401245117188, -0.005669593811035156, -0.002124786376953125, 0.0014200210571289062, 0.0049648284912109375, 0.008509635925292969, 0.012054443359375, 0.015599250793457031, 0.019144058227539062, 0.022688865661621094, 0.026233673095703125, 0.029778480529785156, 0.03332328796386719, 0.03686809539794922, 0.04041290283203125, 0.04395771026611328, 0.04750251770019531, 0.051047325134277344, 0.054592132568359375, 0.058136940002441406, 0.06168174743652344, 0.06522655487060547, 0.0687713623046875, 0.07231616973876953, 0.07586097717285156, 0.0794057846069336, 0.08295059204101562, 0.08649539947509766, 0.09004020690917969, 0.09358501434326172, 0.09712982177734375, 0.10067462921142578, 0.10421943664550781, 0.10776424407958984, 0.11130905151367188, 0.1148538589477539, 0.11839866638183594, 0.12194347381591797, 0.12548828125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 6.0, 10.0, 14.0, 9.0, 14.0, 13.0, 20.0, 23.0, 20.0, 18.0, 22.0, 38.0, 31.0, 30.0, 44.0, 45.0, 44.0, 43.0, 41.0, 34.0, 59.0, 42.0, 48.0, 31.0, 45.0, 37.0, 31.0, 30.0, 33.0, 15.0, 20.0, 16.0, 19.0, 12.0, 12.0, 9.0, 4.0, 3.0, 0.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1378173828125, -0.13333892822265625, -0.1288604736328125, -0.12438201904296875, -0.119903564453125, -0.11542510986328125, -0.1109466552734375, -0.10646820068359375, -0.10198974609375, -0.09751129150390625, -0.0930328369140625, -0.08855438232421875, -0.084075927734375, -0.07959747314453125, -0.0751190185546875, -0.07064056396484375, -0.066162109375, -0.06168365478515625, -0.0572052001953125, -0.05272674560546875, -0.048248291015625, -0.04376983642578125, -0.0392913818359375, -0.03481292724609375, -0.03033447265625, -0.02585601806640625, -0.0213775634765625, -0.01689910888671875, -0.012420654296875, -0.00794219970703125, -0.0034637451171875, 0.00101470947265625, 0.0054931640625, 0.00997161865234375, 0.0144500732421875, 0.01892852783203125, 0.023406982421875, 0.02788543701171875, 0.0323638916015625, 0.03684234619140625, 0.04132080078125, 0.04579925537109375, 0.0502777099609375, 0.05475616455078125, 0.059234619140625, 0.06371307373046875, 0.0681915283203125, 0.07266998291015625, 0.0771484375, 0.08162689208984375, 0.0861053466796875, 0.09058380126953125, 0.095062255859375, 0.09954071044921875, 0.1040191650390625, 0.10849761962890625, 0.11297607421875, 0.11745452880859375, 0.1219329833984375, 0.12641143798828125, 0.130889892578125, 0.13536834716796875, 0.1398468017578125, 0.14432525634765625, 0.1488037109375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 4.0, 1.0, 9.0, 15.0, 13.0, 18.0, 27.0, 54.0, 92.0, 165.0, 280.0, 734.0, 2148.0, 8495.0, 70467.0, 790568.0, 156875.0, 14055.0, 2924.0, 892.0, 363.0, 150.0, 88.0, 54.0, 25.0, 13.0, 14.0, 6.0, 4.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06549072265625, -0.06360006332397461, -0.06170940399169922, -0.05981874465942383, -0.05792808532714844, -0.05603742599487305, -0.054146766662597656, -0.052256107330322266, -0.050365447998046875, -0.048474788665771484, -0.046584129333496094, -0.0446934700012207, -0.04280281066894531, -0.04091215133666992, -0.03902149200439453, -0.03713083267211914, -0.03524017333984375, -0.03334951400756836, -0.03145885467529297, -0.029568195343017578, -0.027677536010742188, -0.025786876678466797, -0.023896217346191406, -0.022005558013916016, -0.020114898681640625, -0.018224239349365234, -0.016333580017089844, -0.014442920684814453, -0.012552261352539062, -0.010661602020263672, -0.008770942687988281, -0.006880283355712891, -0.0049896240234375, -0.0030989646911621094, -0.0012083053588867188, 0.0006823539733886719, 0.0025730133056640625, 0.004463672637939453, 0.006354331970214844, 0.008244991302490234, 0.010135650634765625, 0.012026309967041016, 0.013916969299316406, 0.015807628631591797, 0.017698287963867188, 0.019588947296142578, 0.02147960662841797, 0.02337026596069336, 0.02526092529296875, 0.02715158462524414, 0.02904224395751953, 0.030932903289794922, 0.03282356262207031, 0.0347142219543457, 0.036604881286621094, 0.038495540618896484, 0.040386199951171875, 0.042276859283447266, 0.044167518615722656, 0.04605817794799805, 0.04794883728027344, 0.04983949661254883, 0.05173015594482422, 0.05362081527709961, 0.055511474609375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 4.0, 9.0, 16.0, 13.0, 16.0, 26.0, 37.0, 44.0, 52.0, 66.0, 78.0, 76.0, 113.0, 83.0, 94.0, 54.0, 60.0, 40.0, 37.0, 27.0, 20.0, 10.0, 6.0, 9.0, 4.0, 2.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.033348083496094e-06, -6.723217666149139e-06, -6.413087248802185e-06, -6.102956831455231e-06, -5.792826414108276e-06, -5.482695996761322e-06, -5.172565579414368e-06, -4.862435162067413e-06, -4.552304744720459e-06, -4.242174327373505e-06, -3.93204391002655e-06, -3.621913492679596e-06, -3.3117830753326416e-06, -3.0016526579856873e-06, -2.691522240638733e-06, -2.3813918232917786e-06, -2.0712614059448242e-06, -1.7611309885978699e-06, -1.4510005712509155e-06, -1.1408701539039612e-06, -8.307397365570068e-07, -5.206093192100525e-07, -2.1047890186309814e-07, 9.96515154838562e-08, 4.0978193283081055e-07, 7.199123501777649e-07, 1.0300427675247192e-06, 1.3401731848716736e-06, 1.650303602218628e-06, 1.9604340195655823e-06, 2.2705644369125366e-06, 2.580694854259491e-06, 2.8908252716064453e-06, 3.2009556889533997e-06, 3.511086106300354e-06, 3.821216523647308e-06, 4.131346940994263e-06, 4.441477358341217e-06, 4.751607775688171e-06, 5.061738193035126e-06, 5.37186861038208e-06, 5.6819990277290344e-06, 5.992129445075989e-06, 6.302259862422943e-06, 6.6123902797698975e-06, 6.922520697116852e-06, 7.232651114463806e-06, 7.5427815318107605e-06, 7.852911949157715e-06, 8.16304236650467e-06, 8.473172783851624e-06, 8.783303201198578e-06, 9.093433618545532e-06, 9.403564035892487e-06, 9.713694453239441e-06, 1.0023824870586395e-05, 1.033395528793335e-05, 1.0644085705280304e-05, 1.0954216122627258e-05, 1.1264346539974213e-05, 1.1574476957321167e-05, 1.1884607374668121e-05, 1.2194737792015076e-05, 1.250486820936203e-05, 1.2814998626708984e-05]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 3.0, 0.0, 4.0, 7.0, 9.0, 11.0, 29.0, 38.0, 72.0, 131.0, 301.0, 720.0, 2119.0, 12765.0, 262804.0, 729538.0, 34343.0, 3796.0, 1050.0, 394.0, 174.0, 124.0, 45.0, 29.0, 18.0, 15.0, 11.0, 4.0, 3.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08245849609375, -0.08011531829833984, -0.07777214050292969, -0.07542896270751953, -0.07308578491210938, -0.07074260711669922, -0.06839942932128906, -0.0660562515258789, -0.06371307373046875, -0.061369895935058594, -0.05902671813964844, -0.05668354034423828, -0.054340362548828125, -0.05199718475341797, -0.04965400695800781, -0.047310829162597656, -0.0449676513671875, -0.042624473571777344, -0.04028129577636719, -0.03793811798095703, -0.035594940185546875, -0.03325176239013672, -0.030908584594726562, -0.028565406799316406, -0.02622222900390625, -0.023879051208496094, -0.021535873413085938, -0.01919269561767578, -0.016849517822265625, -0.014506340026855469, -0.012163162231445312, -0.009819984436035156, -0.007476806640625, -0.005133628845214844, -0.0027904510498046875, -0.00044727325439453125, 0.001895904541015625, 0.004239082336425781, 0.0065822601318359375, 0.008925437927246094, 0.01126861572265625, 0.013611793518066406, 0.015954971313476562, 0.01829814910888672, 0.020641326904296875, 0.02298450469970703, 0.025327682495117188, 0.027670860290527344, 0.0300140380859375, 0.032357215881347656, 0.03470039367675781, 0.03704357147216797, 0.039386749267578125, 0.04172992706298828, 0.04407310485839844, 0.046416282653808594, 0.04875946044921875, 0.051102638244628906, 0.05344581604003906, 0.05578899383544922, 0.058132171630859375, 0.06047534942626953, 0.06281852722167969, 0.06516170501708984, 0.0675048828125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 1.0, 1.0, 5.0, 4.0, 14.0, 8.0, 34.0, 59.0, 88.0, 117.0, 160.0, 161.0, 132.0, 85.0, 47.0, 43.0, 20.0, 9.0, 4.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.095458984375, -0.09273529052734375, -0.0900115966796875, -0.08728790283203125, -0.084564208984375, -0.08184051513671875, -0.0791168212890625, -0.07639312744140625, -0.07366943359375, -0.07094573974609375, -0.0682220458984375, -0.06549835205078125, -0.062774658203125, -0.06005096435546875, -0.0573272705078125, -0.05460357666015625, -0.0518798828125, -0.04915618896484375, -0.0464324951171875, -0.04370880126953125, -0.040985107421875, -0.03826141357421875, -0.0355377197265625, -0.03281402587890625, -0.03009033203125, -0.02736663818359375, -0.0246429443359375, -0.02191925048828125, -0.019195556640625, -0.01647186279296875, -0.0137481689453125, -0.01102447509765625, -0.00830078125, -0.00557708740234375, -0.0028533935546875, -0.00012969970703125, 0.002593994140625, 0.00531768798828125, 0.0080413818359375, 0.01076507568359375, 0.01348876953125, 0.01621246337890625, 0.0189361572265625, 0.02165985107421875, 0.024383544921875, 0.02710723876953125, 0.0298309326171875, 0.03255462646484375, 0.0352783203125, 0.03800201416015625, 0.0407257080078125, 0.04344940185546875, 0.046173095703125, 0.04889678955078125, 0.0516204833984375, 0.05434417724609375, 0.05706787109375, 0.05979156494140625, 0.0625152587890625, 0.06523895263671875, 0.067962646484375, 0.07068634033203125, 0.0734100341796875, 0.07613372802734375, 0.078857421875]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 21.0, 80.0, 208.0, 328.0, 250.0, 82.0, 22.0, 7.0, 6.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4775189459323883, -0.4145411550998688, -0.35156339406967163, -0.2885856032371521, -0.22560781240463257, -0.16263002157211304, -0.0996522605419159, -0.03667446970939636, 0.02630332112312317, 0.0892811045050621, 0.15225888788700104, 0.21523666381835938, 0.2782144546508789, 0.34119224548339844, 0.4041700065135956, 0.4671477973461151, 0.530125617980957, 0.5931034088134766, 0.6560811996459961, 0.7190589904785156, 0.7820367813110352, 0.8450145721435547, 0.9079923033714294, 0.970970094203949, 1.0339478254318237, 1.0969256162643433, 1.1599034070968628, 1.2228811979293823, 1.2858589887619019, 1.3488367795944214, 1.4118144512176514, 1.474792242050171, 1.5377700328826904, 1.60074782371521, 1.6637256145477295, 1.726703405380249, 1.7896811962127686, 1.852658987045288, 1.9156367778778076, 1.9786145687103271, 2.0415923595428467, 2.104570150375366, 2.1675479412078857, 2.2305257320404053, 2.293503522872925, 2.3564813137054443, 2.419459104537964, 2.4824368953704834, 2.545414447784424, 2.6083922386169434, 2.671370029449463, 2.7343478202819824, 2.797325611114502, 2.8603034019470215, 2.923281192779541, 2.9862589836120605, 3.04923677444458, 3.1122145652770996, 3.175192356109619, 3.2381701469421387, 3.301147937774658, 3.3641257286071777, 3.4271035194396973, 3.490081310272217, 3.5530591011047363]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 5.0, 9.0, 13.0, 7.0, 12.0, 24.0, 10.0, 26.0, 31.0, 35.0, 43.0, 38.0, 56.0, 50.0, 49.0, 51.0, 77.0, 54.0, 55.0, 55.0, 69.0, 47.0, 44.0, 29.0, 23.0, 18.0, 14.0, 10.0, 12.0, 7.0, 9.0, 6.0, 3.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8222468495368958, -0.7931749820709229, -0.76410311460495, -0.735031247138977, -0.7059594392776489, -0.6768875122070312, -0.6478157043457031, -0.6187438368797302, -0.5896719694137573, -0.5606001019477844, -0.5315282344818115, -0.5024563670158386, -0.4733845293521881, -0.4443126618862152, -0.4152408242225647, -0.3861689567565918, -0.3570970892906189, -0.328025221824646, -0.2989533543586731, -0.2698815166950226, -0.24080964922904968, -0.21173778176307678, -0.18266592919826508, -0.15359407663345337, -0.12452220916748047, -0.09545034915208817, -0.06637848913669586, -0.03730662912130356, -0.008234769105911255, 0.020837098360061646, 0.04990895092487335, 0.07898080348968506, 0.10805261135101318, 0.13712447881698608, 0.1661963313817978, 0.1952681839466095, 0.2243400514125824, 0.2534119188785553, 0.2824837565422058, 0.3115556240081787, 0.3406274914741516, 0.3696993589401245, 0.3987712264060974, 0.4278430640697479, 0.4569149315357208, 0.4859867990016937, 0.5150586366653442, 0.5441305041313171, 0.57320237159729, 0.6022742390632629, 0.6313461065292358, 0.6604179739952087, 0.6894898414611816, 0.7185616493225098, 0.7476335167884827, 0.7767053842544556, 0.8057772517204285, 0.8348491191864014, 0.8639209866523743, 0.8929928541183472, 0.9220646619796753, 0.951136589050293, 0.9802083969116211, 1.0092802047729492, 1.038352131843567]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 15.0, 21.0, 35.0, 55.0, 69.0, 127.0, 299.0, 1804.0, 4109490.0, 80534.0, 1280.0, 221.0, 102.0, 66.0, 41.0, 36.0, 22.0, 21.0, 11.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.389892578125, -0.3759346008300781, -0.36197662353515625, -0.3480186462402344, -0.3340606689453125, -0.3201026916503906, -0.30614471435546875, -0.2921867370605469, -0.278228759765625, -0.2642707824707031, -0.25031280517578125, -0.23635482788085938, -0.2223968505859375, -0.20843887329101562, -0.19448089599609375, -0.18052291870117188, -0.16656494140625, -0.15260696411132812, -0.13864898681640625, -0.12469100952148438, -0.1107330322265625, -0.09677505493164062, -0.08281707763671875, -0.06885910034179688, -0.054901123046875, -0.040943145751953125, -0.02698516845703125, -0.013027191162109375, 0.0009307861328125, 0.014888763427734375, 0.02884674072265625, 0.042804718017578125, 0.0567626953125, 0.07072067260742188, 0.08467864990234375, 0.09863662719726562, 0.1125946044921875, 0.12655258178710938, 0.14051055908203125, 0.15446853637695312, 0.168426513671875, 0.18238449096679688, 0.19634246826171875, 0.21030044555664062, 0.2242584228515625, 0.23821640014648438, 0.25217437744140625, 0.2661323547363281, 0.28009033203125, 0.2940483093261719, 0.30800628662109375, 0.3219642639160156, 0.3359222412109375, 0.3498802185058594, 0.36383819580078125, 0.3777961730957031, 0.391754150390625, 0.4057121276855469, 0.41967010498046875, 0.4336280822753906, 0.4475860595703125, 0.4615440368652344, 0.47550201416015625, 0.4894599914550781, 0.50341796875]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 9.0, 11.0, 11.0, 12.0, 23.0, 27.0, 31.0, 33.0, 33.0, 38.0, 47.0, 52.0, 67.0, 56.0, 74.0, 59.0, 65.0, 54.0, 47.0, 47.0, 38.0, 34.0, 28.0, 22.0, 15.0, 14.0, 6.0, 10.0, 13.0, 2.0, 6.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0489501953125, -0.047292232513427734, -0.04563426971435547, -0.0439763069152832, -0.04231834411621094, -0.04066038131713867, -0.039002418518066406, -0.03734445571899414, -0.035686492919921875, -0.03402853012084961, -0.032370567321777344, -0.030712604522705078, -0.029054641723632812, -0.027396678924560547, -0.02573871612548828, -0.024080753326416016, -0.02242279052734375, -0.020764827728271484, -0.01910686492919922, -0.017448902130126953, -0.015790939331054688, -0.014132976531982422, -0.012475013732910156, -0.01081705093383789, -0.009159088134765625, -0.007501125335693359, -0.005843162536621094, -0.004185199737548828, -0.0025272369384765625, -0.0008692741394042969, 0.0007886886596679688, 0.0024466514587402344, 0.0041046142578125, 0.005762577056884766, 0.007420539855957031, 0.009078502655029297, 0.010736465454101562, 0.012394428253173828, 0.014052391052246094, 0.01571035385131836, 0.017368316650390625, 0.01902627944946289, 0.020684242248535156, 0.022342205047607422, 0.024000167846679688, 0.025658130645751953, 0.02731609344482422, 0.028974056243896484, 0.03063201904296875, 0.032289981842041016, 0.03394794464111328, 0.03560590744018555, 0.03726387023925781, 0.03892183303833008, 0.040579795837402344, 0.04223775863647461, 0.043895721435546875, 0.04555368423461914, 0.047211647033691406, 0.04886960983276367, 0.05052757263183594, 0.0521855354309082, 0.05384349822998047, 0.055501461029052734, 0.057159423828125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 3.0, 5.0, 6.0, 8.0, 7.0, 9.0, 16.0, 17.0, 19.0, 22.0, 29.0, 34.0, 39.0, 64.0, 89.0, 111.0, 223.0, 484.0, 1473.0, 6204.0, 51677.0, 4098783.0, 28561.0, 4125.0, 1242.0, 408.0, 178.0, 108.0, 63.0, 55.0, 49.0, 32.0, 35.0, 24.0, 26.0, 14.0, 16.0, 13.0, 6.0, 5.0, 4.0, 2.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09625244140625, -0.09246158599853516, -0.08867073059082031, -0.08487987518310547, -0.08108901977539062, -0.07729816436767578, -0.07350730895996094, -0.0697164535522461, -0.06592559814453125, -0.062134742736816406, -0.05834388732910156, -0.05455303192138672, -0.050762176513671875, -0.04697132110595703, -0.04318046569824219, -0.039389610290527344, -0.0355987548828125, -0.031807899475097656, -0.028017044067382812, -0.02422618865966797, -0.020435333251953125, -0.01664447784423828, -0.012853622436523438, -0.009062767028808594, -0.00527191162109375, -0.0014810562133789062, 0.0023097991943359375, 0.006100654602050781, 0.009891510009765625, 0.013682365417480469, 0.017473220825195312, 0.021264076232910156, 0.025054931640625, 0.028845787048339844, 0.03263664245605469, 0.03642749786376953, 0.040218353271484375, 0.04400920867919922, 0.04780006408691406, 0.051590919494628906, 0.05538177490234375, 0.059172630310058594, 0.06296348571777344, 0.06675434112548828, 0.07054519653320312, 0.07433605194091797, 0.07812690734863281, 0.08191776275634766, 0.0857086181640625, 0.08949947357177734, 0.09329032897949219, 0.09708118438720703, 0.10087203979492188, 0.10466289520263672, 0.10845375061035156, 0.1122446060180664, 0.11603546142578125, 0.1198263168334961, 0.12361717224121094, 0.12740802764892578, 0.13119888305664062, 0.13498973846435547, 0.1387805938720703, 0.14257144927978516, 0.1463623046875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 5.0, 11.0, 39.0, 95.0, 3774.0, 107.0, 28.0, 11.0, 5.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05419921875, -0.05285978317260742, -0.051520347595214844, -0.050180912017822266, -0.04884147644042969, -0.04750204086303711, -0.04616260528564453, -0.04482316970825195, -0.043483734130859375, -0.0421442985534668, -0.04080486297607422, -0.03946542739868164, -0.03812599182128906, -0.036786556243896484, -0.035447120666503906, -0.03410768508911133, -0.03276824951171875, -0.03142881393432617, -0.030089378356933594, -0.028749942779541016, -0.027410507202148438, -0.02607107162475586, -0.02473163604736328, -0.023392200469970703, -0.022052764892578125, -0.020713329315185547, -0.01937389373779297, -0.01803445816040039, -0.016695022583007812, -0.015355587005615234, -0.014016151428222656, -0.012676715850830078, -0.0113372802734375, -0.009997844696044922, -0.008658409118652344, -0.007318973541259766, -0.0059795379638671875, -0.004640102386474609, -0.0033006668090820312, -0.001961231231689453, -0.000621795654296875, 0.0007176399230957031, 0.0020570755004882812, 0.0033965110778808594, 0.0047359466552734375, 0.006075382232666016, 0.007414817810058594, 0.008754253387451172, 0.01009368896484375, 0.011433124542236328, 0.012772560119628906, 0.014111995697021484, 0.015451431274414062, 0.01679086685180664, 0.01813030242919922, 0.019469738006591797, 0.020809173583984375, 0.022148609161376953, 0.02348804473876953, 0.02482748031616211, 0.026166915893554688, 0.027506351470947266, 0.028845787048339844, 0.030185222625732422, 0.031524658203125]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 9.0, 19.0, 53.0, 81.0, 215.0, 300.0, 204.0, 82.0, 29.0, 9.0, 4.0, 4.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20182916522026062, -0.1971951574087143, -0.19256114959716797, -0.18792714178562164, -0.18329313397407532, -0.178659126162529, -0.17402511835098267, -0.16939109563827515, -0.16475710272789001, -0.1601230949163437, -0.15548908710479736, -0.15085507929325104, -0.1462210714817047, -0.1415870636701584, -0.13695305585861206, -0.13231903314590454, -0.12768502533435822, -0.12305101752281189, -0.11841700971126556, -0.11378300189971924, -0.10914899408817291, -0.10451498627662659, -0.09988097101449966, -0.09524696320295334, -0.09061295539140701, -0.08597894757986069, -0.08134493976831436, -0.07671093195676804, -0.07207691669464111, -0.06744290888309479, -0.06280890107154846, -0.058174893260002136, -0.053540877997875214, -0.04890687018632889, -0.04427286237478256, -0.03963885083794594, -0.03500484302639961, -0.030370835214853287, -0.025736825540661812, -0.021102815866470337, -0.01646880805492401, -0.011834799312055111, -0.007200790569186211, -0.0025667818263173103, 0.00206722691655159, 0.006701234728097916, 0.01133524440228939, 0.015969254076480865, 0.02060326188802719, 0.025237269699573517, 0.029871279373764992, 0.03450528904795647, 0.03913929685950279, 0.04377330467104912, 0.04840731620788574, 0.05304132401943207, 0.057675331830978394, 0.06230933964252472, 0.06694334745407104, 0.07157735526561737, 0.0762113630771637, 0.08084537088871002, 0.08547938615083694, 0.09011339396238327, 0.0947474017739296]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 0.0, 9.0, 6.0, 3.0, 5.0, 9.0, 10.0, 14.0, 14.0, 27.0, 18.0, 21.0, 28.0, 28.0, 37.0, 43.0, 49.0, 43.0, 51.0, 29.0, 33.0, 45.0, 42.0, 47.0, 39.0, 43.0, 38.0, 46.0, 24.0, 38.0, 29.0, 25.0, 21.0, 14.0, 11.0, 13.0, 11.0, 11.0, 8.0, 3.0, 5.0, 2.0, 5.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.03876698017120361, -0.0374857559800148, -0.03620453178882599, -0.034923311322927475, -0.03364208713173866, -0.03236086294054985, -0.031079640612006187, -0.029798418283462524, -0.028517194092273712, -0.0272359699010849, -0.025954747572541237, -0.024673525243997574, -0.02339230105280876, -0.02211107686161995, -0.020829854533076286, -0.019548632204532623, -0.01826740801334381, -0.016986183822155, -0.015704961493611336, -0.014423738233745098, -0.01314251497387886, -0.011861291714012623, -0.010580068454146385, -0.009298845194280148, -0.00801762193441391, -0.006736398674547672, -0.005455175414681435, -0.004173952154815197, -0.0028927288949489594, -0.0016115056350827217, -0.00033028237521648407, 0.0009509408846497536, 0.002232164144515991, 0.003513387404382229, 0.0047946106642484665, 0.006075833924114704, 0.007357057183980942, 0.00863828044384718, 0.009919503703713417, 0.011200726963579655, 0.012481950223445892, 0.01376317348331213, 0.015044396743178368, 0.01632561907172203, 0.017606843262910843, 0.018888067454099655, 0.020169289782643318, 0.02145051211118698, 0.022731736302375793, 0.024012960493564606, 0.02529418282210827, 0.026575405150651932, 0.027856629341840744, 0.029137853533029556, 0.03041907586157322, 0.03170029819011688, 0.032981522381305695, 0.03426274657249451, 0.03554397076368332, 0.03682519122958183, 0.038106415420770645, 0.03938763961195946, 0.04066886007785797, 0.04195008426904678, 0.043231308460235596]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 6.0, 3.0, 7.0, 12.0, 11.0, 11.0, 16.0, 24.0, 22.0, 46.0, 58.0, 101.0, 137.0, 247.0, 341.0, 495.0, 917.0, 1610.0, 3240.0, 9732.0, 71605.0, 657578.0, 268472.0, 23135.0, 5298.0, 2260.0, 1203.0, 707.0, 439.0, 257.0, 166.0, 120.0, 82.0, 47.0, 27.0, 40.0, 15.0, 24.0, 11.0, 7.0, 6.0, 6.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.157958984375, -0.15282249450683594, -0.14768600463867188, -0.1425495147705078, -0.13741302490234375, -0.1322765350341797, -0.12714004516601562, -0.12200355529785156, -0.1168670654296875, -0.11173057556152344, -0.10659408569335938, -0.10145759582519531, -0.09632110595703125, -0.09118461608886719, -0.08604812622070312, -0.08091163635253906, -0.075775146484375, -0.07063865661621094, -0.06550216674804688, -0.06036567687988281, -0.05522918701171875, -0.05009269714355469, -0.044956207275390625, -0.03981971740722656, -0.0346832275390625, -0.029546737670898438, -0.024410247802734375, -0.019273757934570312, -0.01413726806640625, -0.009000778198242188, -0.003864288330078125, 0.0012722015380859375, 0.00640869140625, 0.011545181274414062, 0.016681671142578125, 0.021818161010742188, 0.02695465087890625, 0.03209114074707031, 0.037227630615234375, 0.04236412048339844, 0.0475006103515625, 0.05263710021972656, 0.057773590087890625, 0.06291007995605469, 0.06804656982421875, 0.07318305969238281, 0.07831954956054688, 0.08345603942871094, 0.088592529296875, 0.09372901916503906, 0.09886550903320312, 0.10400199890136719, 0.10913848876953125, 0.11427497863769531, 0.11941146850585938, 0.12454795837402344, 0.1296844482421875, 0.13482093811035156, 0.13995742797851562, 0.1450939178466797, 0.15023040771484375, 0.1553668975830078, 0.16050338745117188, 0.16563987731933594, 0.1707763671875]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 7.0, 7.0, 8.0, 10.0, 15.0, 16.0, 31.0, 31.0, 32.0, 32.0, 35.0, 43.0, 47.0, 56.0, 64.0, 70.0, 61.0, 67.0, 55.0, 44.0, 35.0, 47.0, 43.0, 31.0, 24.0, 18.0, 13.0, 9.0, 12.0, 11.0, 8.0, 2.0, 3.0, 4.0, 0.0, 3.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.050323486328125, -0.04863882064819336, -0.04695415496826172, -0.04526948928833008, -0.04358482360839844, -0.0419001579284668, -0.040215492248535156, -0.038530826568603516, -0.036846160888671875, -0.035161495208740234, -0.033476829528808594, -0.03179216384887695, -0.030107498168945312, -0.028422832489013672, -0.02673816680908203, -0.02505350112915039, -0.02336883544921875, -0.02168416976928711, -0.01999950408935547, -0.018314838409423828, -0.016630172729492188, -0.014945507049560547, -0.013260841369628906, -0.011576175689697266, -0.009891510009765625, -0.008206844329833984, -0.006522178649902344, -0.004837512969970703, -0.0031528472900390625, -0.0014681816101074219, 0.00021648406982421875, 0.0019011497497558594, 0.0035858154296875, 0.005270481109619141, 0.006955146789550781, 0.008639812469482422, 0.010324478149414062, 0.012009143829345703, 0.013693809509277344, 0.015378475189208984, 0.017063140869140625, 0.018747806549072266, 0.020432472229003906, 0.022117137908935547, 0.023801803588867188, 0.025486469268798828, 0.02717113494873047, 0.02885580062866211, 0.03054046630859375, 0.03222513198852539, 0.03390979766845703, 0.03559446334838867, 0.03727912902832031, 0.03896379470825195, 0.040648460388183594, 0.042333126068115234, 0.044017791748046875, 0.045702457427978516, 0.047387123107910156, 0.0490717887878418, 0.05075645446777344, 0.05244112014770508, 0.05412578582763672, 0.05581045150756836, 0.0574951171875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 8.0, 10.0, 8.0, 25.0, 26.0, 39.0, 72.0, 119.0, 164.0, 243.0, 416.0, 742.0, 1295.0, 2663.0, 7590.0, 83881.0, 887213.0, 52465.0, 6274.0, 2327.0, 1229.0, 690.0, 374.0, 252.0, 145.0, 111.0, 55.0, 41.0, 26.0, 16.0, 12.0, 8.0, 7.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.1956787109375, -0.18924903869628906, -0.18281936645507812, -0.1763896942138672, -0.16996002197265625, -0.1635303497314453, -0.15710067749023438, -0.15067100524902344, -0.1442413330078125, -0.13781166076660156, -0.13138198852539062, -0.12495231628417969, -0.11852264404296875, -0.11209297180175781, -0.10566329956054688, -0.09923362731933594, -0.092803955078125, -0.08637428283691406, -0.07994461059570312, -0.07351493835449219, -0.06708526611328125, -0.06065559387207031, -0.054225921630859375, -0.04779624938964844, -0.0413665771484375, -0.03493690490722656, -0.028507232666015625, -0.022077560424804688, -0.01564788818359375, -0.009218215942382812, -0.002788543701171875, 0.0036411285400390625, 0.01007080078125, 0.016500473022460938, 0.022930145263671875, 0.029359817504882812, 0.03578948974609375, 0.04221916198730469, 0.048648834228515625, 0.05507850646972656, 0.0615081787109375, 0.06793785095214844, 0.07436752319335938, 0.08079719543457031, 0.08722686767578125, 0.09365653991699219, 0.10008621215820312, 0.10651588439941406, 0.112945556640625, 0.11937522888183594, 0.12580490112304688, 0.1322345733642578, 0.13866424560546875, 0.1450939178466797, 0.15152359008789062, 0.15795326232910156, 0.1643829345703125, 0.17081260681152344, 0.17724227905273438, 0.1836719512939453, 0.19010162353515625, 0.1965312957763672, 0.20296096801757812, 0.20939064025878906, 0.2158203125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 0.0, 4.0, 4.0, 6.0, 7.0, 3.0, 14.0, 16.0, 14.0, 26.0, 25.0, 29.0, 34.0, 39.0, 44.0, 44.0, 42.0, 54.0, 50.0, 46.0, 50.0, 50.0, 47.0, 45.0, 42.0, 40.0, 39.0, 38.0, 22.0, 28.0, 17.0, 14.0, 17.0, 11.0, 6.0, 9.0, 9.0, 3.0, 2.0, 1.0, 3.0, 6.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.1978759765625, -0.19192886352539062, -0.18598175048828125, -0.18003463745117188, -0.1740875244140625, -0.16814041137695312, -0.16219329833984375, -0.15624618530273438, -0.150299072265625, -0.14435195922851562, -0.13840484619140625, -0.13245773315429688, -0.1265106201171875, -0.12056350708007812, -0.11461639404296875, -0.10866928100585938, -0.10272216796875, -0.09677505493164062, -0.09082794189453125, -0.08488082885742188, -0.0789337158203125, -0.07298660278320312, -0.06703948974609375, -0.061092376708984375, -0.055145263671875, -0.049198150634765625, -0.04325103759765625, -0.037303924560546875, -0.0313568115234375, -0.025409698486328125, -0.01946258544921875, -0.013515472412109375, -0.007568359375, -0.001621246337890625, 0.00432586669921875, 0.010272979736328125, 0.0162200927734375, 0.022167205810546875, 0.02811431884765625, 0.034061431884765625, 0.040008544921875, 0.045955657958984375, 0.05190277099609375, 0.057849884033203125, 0.0637969970703125, 0.06974411010742188, 0.07569122314453125, 0.08163833618164062, 0.08758544921875, 0.09353256225585938, 0.09947967529296875, 0.10542678833007812, 0.1113739013671875, 0.11732101440429688, 0.12326812744140625, 0.12921524047851562, 0.135162353515625, 0.14110946655273438, 0.14705657958984375, 0.15300369262695312, 0.1589508056640625, 0.16489791870117188, 0.17084503173828125, 0.17679214477539062, 0.1827392578125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 2.0, 8.0, 5.0, 7.0, 12.0, 24.0, 46.0, 82.0, 160.0, 398.0, 1205.0, 4353.0, 45686.0, 952661.0, 37894.0, 4030.0, 1131.0, 468.0, 200.0, 88.0, 39.0, 32.0, 17.0, 4.0, 7.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06964111328125, -0.0665426254272461, -0.06344413757324219, -0.06034564971923828, -0.057247161865234375, -0.05414867401123047, -0.05105018615722656, -0.047951698303222656, -0.04485321044921875, -0.041754722595214844, -0.03865623474121094, -0.03555774688720703, -0.032459259033203125, -0.02936077117919922, -0.026262283325195312, -0.023163795471191406, -0.0200653076171875, -0.016966819763183594, -0.013868331909179688, -0.010769844055175781, -0.007671356201171875, -0.004572868347167969, -0.0014743804931640625, 0.0016241073608398438, 0.00472259521484375, 0.007821083068847656, 0.010919570922851562, 0.014018058776855469, 0.017116546630859375, 0.02021503448486328, 0.023313522338867188, 0.026412010192871094, 0.029510498046875, 0.032608985900878906, 0.03570747375488281, 0.03880596160888672, 0.041904449462890625, 0.04500293731689453, 0.04810142517089844, 0.051199913024902344, 0.05429840087890625, 0.057396888732910156, 0.06049537658691406, 0.06359386444091797, 0.06669235229492188, 0.06979084014892578, 0.07288932800292969, 0.0759878158569336, 0.0790863037109375, 0.0821847915649414, 0.08528327941894531, 0.08838176727294922, 0.09148025512695312, 0.09457874298095703, 0.09767723083496094, 0.10077571868896484, 0.10387420654296875, 0.10697269439697266, 0.11007118225097656, 0.11316967010498047, 0.11626815795898438, 0.11936664581298828, 0.12246513366699219, 0.1255636215209961, 0.128662109375]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 29.0, 70.0, 132.0, 269.0, 238.0, 156.0, 68.0, 22.0, 10.0, 2.0, 3.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5676021575927734e-05, -1.4804303646087646e-05, -1.3932585716247559e-05, -1.306086778640747e-05, -1.2189149856567383e-05, -1.1317431926727295e-05, -1.0445713996887207e-05, -9.573996067047119e-06, -8.702278137207031e-06, -7.830560207366943e-06, -6.9588422775268555e-06, -6.087124347686768e-06, -5.21540641784668e-06, -4.343688488006592e-06, -3.471970558166504e-06, -2.600252628326416e-06, -1.7285346984863281e-06, -8.568167686462402e-07, 1.4901161193847656e-08, 8.866190910339355e-07, 1.7583370208740234e-06, 2.6300549507141113e-06, 3.5017728805541992e-06, 4.373490810394287e-06, 5.245208740234375e-06, 6.116926670074463e-06, 6.988644599914551e-06, 7.860362529754639e-06, 8.732080459594727e-06, 9.603798389434814e-06, 1.0475516319274902e-05, 1.134723424911499e-05, 1.2218952178955078e-05, 1.3090670108795166e-05, 1.3962388038635254e-05, 1.4834105968475342e-05, 1.570582389831543e-05, 1.6577541828155518e-05, 1.7449259757995605e-05, 1.8320977687835693e-05, 1.919269561767578e-05, 2.006441354751587e-05, 2.0936131477355957e-05, 2.1807849407196045e-05, 2.2679567337036133e-05, 2.355128526687622e-05, 2.442300319671631e-05, 2.5294721126556396e-05, 2.6166439056396484e-05, 2.7038156986236572e-05, 2.790987491607666e-05, 2.8781592845916748e-05, 2.9653310775756836e-05, 3.0525028705596924e-05, 3.139674663543701e-05, 3.22684645652771e-05, 3.314018249511719e-05, 3.4011900424957275e-05, 3.488361835479736e-05, 3.575533628463745e-05, 3.662705421447754e-05, 3.749877214431763e-05, 3.8370490074157715e-05, 3.92422080039978e-05, 4.011392593383789e-05]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 6.0, 8.0, 11.0, 15.0, 17.0, 20.0, 44.0, 78.0, 131.0, 292.0, 633.0, 1561.0, 5405.0, 59101.0, 945697.0, 29452.0, 3943.0, 1217.0, 453.0, 212.0, 90.0, 67.0, 32.0, 21.0, 14.0, 10.0, 5.0, 4.0, 3.0, 4.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.09735107421875, -0.09392356872558594, -0.09049606323242188, -0.08706855773925781, -0.08364105224609375, -0.08021354675292969, -0.07678604125976562, -0.07335853576660156, -0.0699310302734375, -0.06650352478027344, -0.06307601928710938, -0.05964851379394531, -0.05622100830078125, -0.05279350280761719, -0.049365997314453125, -0.04593849182128906, -0.042510986328125, -0.03908348083496094, -0.035655975341796875, -0.03222846984863281, -0.02880096435546875, -0.025373458862304688, -0.021945953369140625, -0.018518447875976562, -0.0150909423828125, -0.011663436889648438, -0.008235931396484375, -0.0048084259033203125, -0.00138092041015625, 0.0020465850830078125, 0.005474090576171875, 0.008901596069335938, 0.0123291015625, 0.015756607055664062, 0.019184112548828125, 0.022611618041992188, 0.02603912353515625, 0.029466629028320312, 0.032894134521484375, 0.03632164001464844, 0.0397491455078125, 0.04317665100097656, 0.046604156494140625, 0.05003166198730469, 0.05345916748046875, 0.05688667297363281, 0.060314178466796875, 0.06374168395996094, 0.067169189453125, 0.07059669494628906, 0.07402420043945312, 0.07745170593261719, 0.08087921142578125, 0.08430671691894531, 0.08773422241210938, 0.09116172790527344, 0.0945892333984375, 0.09801673889160156, 0.10144424438476562, 0.10487174987792969, 0.10829925537109375, 0.11172676086425781, 0.11515426635742188, 0.11858177185058594, 0.12200927734375]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 11.0, 9.0, 47.0, 169.0, 362.0, 238.0, 79.0, 22.0, 9.0, 8.0, 8.0, 6.0, 6.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.279541015625, -0.27266693115234375, -0.2657928466796875, -0.25891876220703125, -0.252044677734375, -0.24517059326171875, -0.2382965087890625, -0.23142242431640625, -0.22454833984375, -0.21767425537109375, -0.2108001708984375, -0.20392608642578125, -0.197052001953125, -0.19017791748046875, -0.1833038330078125, -0.17642974853515625, -0.1695556640625, -0.16268157958984375, -0.1558074951171875, -0.14893341064453125, -0.142059326171875, -0.13518524169921875, -0.1283111572265625, -0.12143707275390625, -0.11456298828125, -0.10768890380859375, -0.1008148193359375, -0.09394073486328125, -0.087066650390625, -0.08019256591796875, -0.0733184814453125, -0.06644439697265625, -0.0595703125, -0.05269622802734375, -0.0458221435546875, -0.03894805908203125, -0.032073974609375, -0.02519989013671875, -0.0183258056640625, -0.01145172119140625, -0.00457763671875, 0.00229644775390625, 0.0091705322265625, 0.01604461669921875, 0.022918701171875, 0.02979278564453125, 0.0366668701171875, 0.04354095458984375, 0.0504150390625, 0.05728912353515625, 0.0641632080078125, 0.07103729248046875, 0.077911376953125, 0.08478546142578125, 0.0916595458984375, 0.09853363037109375, 0.10540771484375, 0.11228179931640625, 0.1191558837890625, 0.12602996826171875, 0.132904052734375, 0.13977813720703125, 0.1466522216796875, 0.15352630615234375, 0.160400390625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 5.0, 18.0, 57.0, 161.0, 438.0, 271.0, 49.0, 11.0, 3.0, 1.0, 1.0, 2.0], "bins": [-5.338333606719971, -5.2444539070129395, -5.15057373046875, -5.056694030761719, -4.9628143310546875, -4.868934631347656, -4.775054454803467, -4.6811747550964355, -4.587295055389404, -4.493415355682373, -4.399535179138184, -4.305655479431152, -4.211775779724121, -4.11789608001709, -4.0240159034729, -3.930136203765869, -3.836256504058838, -3.7423765659332275, -3.6484968662261963, -3.554616928100586, -3.4607372283935547, -3.3668572902679443, -3.272977590560913, -3.1790976524353027, -3.0852177143096924, -2.991337776184082, -2.897458076477051, -2.8035781383514404, -2.709698438644409, -2.615818500518799, -2.5219388008117676, -2.4280588626861572, -2.334179401397705, -2.2402994632720947, -2.1464197635650635, -2.052539825439453, -1.9586601257324219, -1.864780306816101, -1.7709004878997803, -1.67702054977417, -1.5831406116485596, -1.4892607927322388, -1.395380973815918, -1.3015011548995972, -1.2076213359832764, -1.1137415170669556, -1.0198616981506348, -0.9259818196296692, -0.8321020603179932, -0.7382222414016724, -0.6443424224853516, -0.5504626035690308, -0.4565827548503876, -0.3627029359340668, -0.2688230872154236, -0.17494326829910278, -0.08106344938278198, 0.012816376984119415, 0.10669620335102081, 0.2005760371685028, 0.2944558560848236, 0.3883356750011444, 0.4822155237197876, 0.5760953426361084, 0.6699751615524292]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 2.0, 1.0, 4.0, 13.0, 7.0, 19.0, 17.0, 18.0, 33.0, 27.0, 31.0, 29.0, 43.0, 56.0, 47.0, 42.0, 59.0, 59.0, 54.0, 57.0, 55.0, 56.0, 41.0, 48.0, 20.0, 28.0, 34.0, 25.0, 16.0, 12.0, 16.0, 6.0, 8.0, 6.0, 2.0, 6.0, 0.0, 5.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0266449451446533, -0.9956722259521484, -0.9646994471549988, -0.9337267279624939, -0.9027539491653442, -0.8717812299728394, -0.8408085107803345, -0.8098357319831848, -0.7788629531860352, -0.7478902339935303, -0.7169174551963806, -0.6859447360038757, -0.6549719572067261, -0.6239992380142212, -0.5930265188217163, -0.5620537400245667, -0.5310810208320618, -0.5001083016395569, -0.4691355228424072, -0.43816280364990234, -0.4071900248527527, -0.3762173056602478, -0.34524455666542053, -0.31427180767059326, -0.283299058675766, -0.2523263096809387, -0.22135356068611145, -0.19038082659244537, -0.1594080775976181, -0.12843532860279083, -0.09746259450912476, -0.06648984551429749, -0.035517096519470215, -0.004544351249933243, 0.02642839401960373, 0.0574011355638504, 0.08837388455867767, 0.11934663355350494, 0.15031936764717102, 0.1812921166419983, 0.21226486563682556, 0.24323761463165283, 0.2742103636264801, 0.3051831126213074, 0.33615583181381226, 0.3671286106109619, 0.3981013298034668, 0.42907407879829407, 0.46004682779312134, 0.4910195767879486, 0.5219923257827759, 0.5529650449752808, 0.5839378237724304, 0.6149105429649353, 0.645883321762085, 0.6768560409545898, 0.7078287601470947, 0.7388014793395996, 0.7697742581367493, 0.8007469773292542, 0.8317197561264038, 0.8626924753189087, 0.8936651945114136, 0.9246379733085632, 0.9556107521057129]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 4.0, 2.0, 2.0, 4.0, 5.0, 3.0, 2.0, 5.0, 9.0, 7.0, 20.0, 17.0, 25.0, 25.0, 33.0, 35.0, 72.0, 140.0, 368.0, 1372.0, 14321.0, 4157750.0, 17698.0, 1580.0, 353.0, 148.0, 89.0, 42.0, 40.0, 30.0, 24.0, 15.0, 12.0, 7.0, 11.0, 7.0, 2.0, 2.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.251708984375, -0.24288558959960938, -0.23406219482421875, -0.22523880004882812, -0.2164154052734375, -0.20759201049804688, -0.19876861572265625, -0.18994522094726562, -0.181121826171875, -0.17229843139648438, -0.16347503662109375, -0.15465164184570312, -0.1458282470703125, -0.13700485229492188, -0.12818145751953125, -0.11935806274414062, -0.11053466796875, -0.10171127319335938, -0.09288787841796875, -0.08406448364257812, -0.0752410888671875, -0.06641769409179688, -0.05759429931640625, -0.048770904541015625, -0.039947509765625, -0.031124114990234375, -0.02230072021484375, -0.013477325439453125, -0.0046539306640625, 0.004169464111328125, 0.01299285888671875, 0.021816253662109375, 0.0306396484375, 0.039463043212890625, 0.04828643798828125, 0.057109832763671875, 0.0659332275390625, 0.07475662231445312, 0.08358001708984375, 0.09240341186523438, 0.101226806640625, 0.11005020141601562, 0.11887359619140625, 0.12769699096679688, 0.1365203857421875, 0.14534378051757812, 0.15416717529296875, 0.16299057006835938, 0.17181396484375, 0.18063735961914062, 0.18946075439453125, 0.19828414916992188, 0.2071075439453125, 0.21593093872070312, 0.22475433349609375, 0.23357772827148438, 0.242401123046875, 0.2512245178222656, 0.26004791259765625, 0.2688713073730469, 0.2776947021484375, 0.2865180969238281, 0.29534149169921875, 0.3041648864746094, 0.31298828125]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 4.0, 4.0, 2.0, 1.0, 3.0, 14.0, 13.0, 10.0, 14.0, 34.0, 21.0, 44.0, 36.0, 40.0, 46.0, 45.0, 59.0, 69.0, 68.0, 64.0, 51.0, 53.0, 51.0, 44.0, 34.0, 37.0, 34.0, 31.0, 19.0, 12.0, 11.0, 13.0, 6.0, 6.0, 4.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.05218505859375, -0.050490379333496094, -0.04879570007324219, -0.04710102081298828, -0.045406341552734375, -0.04371166229248047, -0.04201698303222656, -0.040322303771972656, -0.03862762451171875, -0.036932945251464844, -0.03523826599121094, -0.03354358673095703, -0.031848907470703125, -0.03015422821044922, -0.028459548950195312, -0.026764869689941406, -0.0250701904296875, -0.023375511169433594, -0.021680831909179688, -0.01998615264892578, -0.018291473388671875, -0.01659679412841797, -0.014902114868164062, -0.013207435607910156, -0.01151275634765625, -0.009818077087402344, -0.008123397827148438, -0.006428718566894531, -0.004734039306640625, -0.0030393600463867188, -0.0013446807861328125, 0.00034999847412109375, 0.002044677734375, 0.0037393569946289062, 0.0054340362548828125, 0.007128715515136719, 0.008823394775390625, 0.010518074035644531, 0.012212753295898438, 0.013907432556152344, 0.01560211181640625, 0.017296791076660156, 0.018991470336914062, 0.02068614959716797, 0.022380828857421875, 0.02407550811767578, 0.025770187377929688, 0.027464866638183594, 0.0291595458984375, 0.030854225158691406, 0.03254890441894531, 0.03424358367919922, 0.035938262939453125, 0.03763294219970703, 0.03932762145996094, 0.041022300720214844, 0.04271697998046875, 0.044411659240722656, 0.04610633850097656, 0.04780101776123047, 0.049495697021484375, 0.05119037628173828, 0.05288505554199219, 0.054579734802246094, 0.0562744140625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 5.0, 5.0, 5.0, 4.0, 12.0, 12.0, 11.0, 21.0, 38.0, 33.0, 63.0, 69.0, 89.0, 119.0, 167.0, 189.0, 235.0, 335.0, 571.0, 1225.0, 4746.0, 106444.0, 4065747.0, 9831.0, 1787.0, 773.0, 419.0, 295.0, 230.0, 177.0, 144.0, 127.0, 86.0, 69.0, 42.0, 35.0, 32.0, 23.0, 15.0, 15.0, 14.0, 9.0, 8.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.226806640625, -0.21903228759765625, -0.2112579345703125, -0.20348358154296875, -0.195709228515625, -0.18793487548828125, -0.1801605224609375, -0.17238616943359375, -0.16461181640625, -0.15683746337890625, -0.1490631103515625, -0.14128875732421875, -0.133514404296875, -0.12574005126953125, -0.1179656982421875, -0.11019134521484375, -0.1024169921875, -0.09464263916015625, -0.0868682861328125, -0.07909393310546875, -0.071319580078125, -0.06354522705078125, -0.0557708740234375, -0.04799652099609375, -0.04022216796875, -0.03244781494140625, -0.0246734619140625, -0.01689910888671875, -0.009124755859375, -0.00135040283203125, 0.0064239501953125, 0.01419830322265625, 0.02197265625, 0.02974700927734375, 0.0375213623046875, 0.04529571533203125, 0.053070068359375, 0.06084442138671875, 0.0686187744140625, 0.07639312744140625, 0.08416748046875, 0.09194183349609375, 0.0997161865234375, 0.10749053955078125, 0.115264892578125, 0.12303924560546875, 0.1308135986328125, 0.13858795166015625, 0.1463623046875, 0.15413665771484375, 0.1619110107421875, 0.16968536376953125, 0.177459716796875, 0.18523406982421875, 0.1930084228515625, 0.20078277587890625, 0.20855712890625, 0.21633148193359375, 0.2241058349609375, 0.23188018798828125, 0.239654541015625, 0.24742889404296875, 0.2552032470703125, 0.26297760009765625, 0.270751953125]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 7.0, 22.0, 230.0, 3741.0, 59.0, 13.0, 9.0, 5.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1343994140625, -0.1286163330078125, -0.122833251953125, -0.1170501708984375, -0.11126708984375, -0.1054840087890625, -0.099700927734375, -0.0939178466796875, -0.088134765625, -0.0823516845703125, -0.076568603515625, -0.0707855224609375, -0.06500244140625, -0.0592193603515625, -0.053436279296875, -0.0476531982421875, -0.0418701171875, -0.0360870361328125, -0.030303955078125, -0.0245208740234375, -0.01873779296875, -0.0129547119140625, -0.007171630859375, -0.0013885498046875, 0.00439453125, 0.0101776123046875, 0.015960693359375, 0.0217437744140625, 0.02752685546875, 0.0333099365234375, 0.039093017578125, 0.0448760986328125, 0.0506591796875, 0.0564422607421875, 0.062225341796875, 0.0680084228515625, 0.07379150390625, 0.0795745849609375, 0.085357666015625, 0.0911407470703125, 0.096923828125, 0.1027069091796875, 0.108489990234375, 0.1142730712890625, 0.12005615234375, 0.1258392333984375, 0.131622314453125, 0.1374053955078125, 0.1431884765625, 0.1489715576171875, 0.154754638671875, 0.1605377197265625, 0.16632080078125, 0.1721038818359375, 0.177886962890625, 0.1836700439453125, 0.189453125, 0.1952362060546875, 0.201019287109375, 0.2068023681640625, 0.21258544921875, 0.2183685302734375, 0.224151611328125, 0.2299346923828125, 0.2357177734375]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 8.0, 5.0, 12.0, 14.0, 11.0, 25.0, 35.0, 52.0, 78.0, 84.0, 146.0, 129.0, 128.0, 81.0, 65.0, 51.0, 33.0, 13.0, 10.0, 10.0, 4.0, 5.0, 3.0, 1.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.12511499226093292, -0.11744730919599533, -0.10977963358163834, -0.10211195051670074, -0.09444427490234375, -0.08677659183740616, -0.07910890877246857, -0.07144123315811157, -0.06377355009317398, -0.05610587075352669, -0.048438191413879395, -0.0407705083489418, -0.03310282900929451, -0.025435149669647217, -0.017767466604709625, -0.010099787265062332, -0.002432107925415039, 0.005235572345554829, 0.012903252616524696, 0.02057093381881714, 0.028238613158464432, 0.035906292498111725, 0.043573975563049316, 0.05124165490269661, 0.0589093342423439, 0.0665770173072815, 0.07424469292163849, 0.08191237598657608, 0.08958005905151367, 0.09724773466587067, 0.10491541773080826, 0.11258310079574585, 0.12025076150894165, 0.12791843712329865, 0.13558612763881683, 0.14325380325317383, 0.15092147886753082, 0.15858915448188782, 0.166256844997406, 0.173924520611763, 0.18159219622612, 0.189259871840477, 0.19692756235599518, 0.20459523797035217, 0.21226291358470917, 0.21993058919906616, 0.22759827971458435, 0.23526595532894135, 0.24293364584445953, 0.25060132145881653, 0.2582690119743347, 0.2659366726875305, 0.2736043632030487, 0.2812720537185669, 0.2889397144317627, 0.2966074049472809, 0.3042750954627991, 0.31194278597831726, 0.31961044669151306, 0.32727813720703125, 0.33494582772254944, 0.34261348843574524, 0.3502811789512634, 0.3579488694667816, 0.3656165301799774]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 16.0, 19.0, 20.0, 30.0, 47.0, 67.0, 102.0, 94.0, 95.0, 122.0, 81.0, 75.0, 69.0, 54.0, 30.0, 28.0, 17.0, 10.0, 7.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42266297340393066, -0.41019269824028015, -0.39772242307662964, -0.3852521777153015, -0.372781902551651, -0.3603116273880005, -0.34784135222435, -0.33537107706069946, -0.32290083169937134, -0.3104305565357208, -0.2979602813720703, -0.2854900360107422, -0.2730197608470917, -0.26054948568344116, -0.24807921051979065, -0.23560893535614014, -0.22313866019248962, -0.2106683850288391, -0.1981981247663498, -0.18572784960269928, -0.17325758934020996, -0.16078731417655945, -0.14831703901290894, -0.13584676384925842, -0.1233765035867691, -0.11090623587369919, -0.09843596816062927, -0.08596569299697876, -0.07349542528390884, -0.06102515757083893, -0.048554882407188416, -0.0360846146941185, -0.023614346981048584, -0.011144077405333519, 0.001326192170381546, 0.01379646360874176, 0.026266731321811676, 0.03873699903488159, 0.051207274198532104, 0.06367754191160202, 0.07614780962467194, 0.08861807733774185, 0.10108834505081177, 0.11355862021446228, 0.1260288953781128, 0.1384991556406021, 0.15096943080425262, 0.16343969106674194, 0.17590996623039246, 0.18838024139404297, 0.2008505016565323, 0.2133207768201828, 0.22579103708267212, 0.23826131224632263, 0.25073158740997314, 0.26320186257362366, 0.27567213773727417, 0.2881424129009247, 0.3006126880645752, 0.3130829334259033, 0.32555320858955383, 0.33802348375320435, 0.35049375891685486, 0.36296403408050537, 0.3754342794418335]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 4.0, 9.0, 8.0, 12.0, 14.0, 16.0, 22.0, 35.0, 36.0, 68.0, 94.0, 181.0, 275.0, 441.0, 841.0, 1623.0, 3600.0, 8231.0, 20828.0, 56972.0, 172894.0, 377085.0, 262768.0, 89526.0, 31150.0, 11867.0, 5010.0, 2296.0, 1151.0, 587.0, 308.0, 189.0, 115.0, 83.0, 66.0, 32.0, 33.0, 22.0, 12.0, 10.0, 5.0, 7.0, 9.0, 7.0, 4.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0648193359375, -0.0626373291015625, -0.060455322265625, -0.0582733154296875, -0.05609130859375, -0.0539093017578125, -0.051727294921875, -0.0495452880859375, -0.04736328125, -0.0451812744140625, -0.042999267578125, -0.0408172607421875, -0.03863525390625, -0.0364532470703125, -0.034271240234375, -0.0320892333984375, -0.0299072265625, -0.0277252197265625, -0.025543212890625, -0.0233612060546875, -0.02117919921875, -0.0189971923828125, -0.016815185546875, -0.0146331787109375, -0.012451171875, -0.0102691650390625, -0.008087158203125, -0.0059051513671875, -0.00372314453125, -0.0015411376953125, 0.000640869140625, 0.0028228759765625, 0.0050048828125, 0.0071868896484375, 0.009368896484375, 0.0115509033203125, 0.01373291015625, 0.0159149169921875, 0.018096923828125, 0.0202789306640625, 0.0224609375, 0.0246429443359375, 0.026824951171875, 0.0290069580078125, 0.03118896484375, 0.0333709716796875, 0.035552978515625, 0.0377349853515625, 0.0399169921875, 0.0420989990234375, 0.044281005859375, 0.0464630126953125, 0.04864501953125, 0.0508270263671875, 0.053009033203125, 0.0551910400390625, 0.057373046875, 0.0595550537109375, 0.061737060546875, 0.0639190673828125, 0.06610107421875, 0.0682830810546875, 0.070465087890625, 0.0726470947265625, 0.0748291015625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 6.0, 3.0, 8.0, 14.0, 10.0, 14.0, 19.0, 27.0, 32.0, 30.0, 40.0, 40.0, 67.0, 61.0, 51.0, 56.0, 57.0, 60.0, 61.0, 63.0, 42.0, 38.0, 33.0, 36.0, 24.0, 29.0, 13.0, 13.0, 13.0, 9.0, 5.0, 9.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.052093505859375, -0.050377845764160156, -0.04866218566894531, -0.04694652557373047, -0.045230865478515625, -0.04351520538330078, -0.04179954528808594, -0.040083885192871094, -0.03836822509765625, -0.036652565002441406, -0.03493690490722656, -0.03322124481201172, -0.031505584716796875, -0.02978992462158203, -0.028074264526367188, -0.026358604431152344, -0.0246429443359375, -0.022927284240722656, -0.021211624145507812, -0.01949596405029297, -0.017780303955078125, -0.01606464385986328, -0.014348983764648438, -0.012633323669433594, -0.01091766357421875, -0.009202003479003906, -0.0074863433837890625, -0.005770683288574219, -0.004055023193359375, -0.0023393630981445312, -0.0006237030029296875, 0.0010919570922851562, 0.0028076171875, 0.004523277282714844, 0.0062389373779296875, 0.007954597473144531, 0.009670257568359375, 0.011385917663574219, 0.013101577758789062, 0.014817237854003906, 0.01653289794921875, 0.018248558044433594, 0.019964218139648438, 0.02167987823486328, 0.023395538330078125, 0.02511119842529297, 0.026826858520507812, 0.028542518615722656, 0.0302581787109375, 0.031973838806152344, 0.03368949890136719, 0.03540515899658203, 0.037120819091796875, 0.03883647918701172, 0.04055213928222656, 0.042267799377441406, 0.04398345947265625, 0.045699119567871094, 0.04741477966308594, 0.04913043975830078, 0.050846099853515625, 0.05256175994873047, 0.05427742004394531, 0.055993080139160156, 0.057708740234375]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 7.0, 10.0, 18.0, 26.0, 46.0, 155.0, 301.0, 904.0, 5185.0, 219801.0, 807336.0, 12437.0, 1528.0, 430.0, 203.0, 78.0, 45.0, 25.0, 15.0, 5.0, 2.0, 1.0, 1.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1988525390625, -0.1898784637451172, -0.18090438842773438, -0.17193031311035156, -0.16295623779296875, -0.15398216247558594, -0.14500808715820312, -0.1360340118408203, -0.1270599365234375, -0.11808586120605469, -0.10911178588867188, -0.10013771057128906, -0.09116363525390625, -0.08218955993652344, -0.07321548461914062, -0.06424140930175781, -0.055267333984375, -0.04629325866699219, -0.037319183349609375, -0.028345108032226562, -0.01937103271484375, -0.010396957397460938, -0.001422882080078125, 0.0075511932373046875, 0.0165252685546875, 0.025499343872070312, 0.034473419189453125, 0.04344749450683594, 0.05242156982421875, 0.06139564514160156, 0.07036972045898438, 0.07934379577636719, 0.08831787109375, 0.09729194641113281, 0.10626602172851562, 0.11524009704589844, 0.12421417236328125, 0.13318824768066406, 0.14216232299804688, 0.1511363983154297, 0.1601104736328125, 0.1690845489501953, 0.17805862426757812, 0.18703269958496094, 0.19600677490234375, 0.20498085021972656, 0.21395492553710938, 0.2229290008544922, 0.231903076171875, 0.2408771514892578, 0.24985122680664062, 0.25882530212402344, 0.26779937744140625, 0.27677345275878906, 0.2857475280761719, 0.2947216033935547, 0.3036956787109375, 0.3126697540283203, 0.3216438293457031, 0.33061790466308594, 0.33959197998046875, 0.34856605529785156, 0.3575401306152344, 0.3665142059326172, 0.37548828125]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 7.0, 7.0, 13.0, 25.0, 39.0, 33.0, 42.0, 41.0, 63.0, 73.0, 80.0, 67.0, 73.0, 59.0, 69.0, 57.0, 48.0, 39.0, 50.0, 24.0, 25.0, 23.0, 18.0, 10.0, 6.0, 5.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.145263671875, -0.1371612548828125, -0.129058837890625, -0.1209564208984375, -0.11285400390625, -0.1047515869140625, -0.096649169921875, -0.0885467529296875, -0.0804443359375, -0.0723419189453125, -0.064239501953125, -0.0561370849609375, -0.04803466796875, -0.0399322509765625, -0.031829833984375, -0.0237274169921875, -0.015625, -0.0075225830078125, 0.000579833984375, 0.0086822509765625, 0.01678466796875, 0.0248870849609375, 0.032989501953125, 0.0410919189453125, 0.0491943359375, 0.0572967529296875, 0.065399169921875, 0.0735015869140625, 0.08160400390625, 0.0897064208984375, 0.097808837890625, 0.1059112548828125, 0.114013671875, 0.1221160888671875, 0.130218505859375, 0.1383209228515625, 0.14642333984375, 0.1545257568359375, 0.162628173828125, 0.1707305908203125, 0.1788330078125, 0.1869354248046875, 0.195037841796875, 0.2031402587890625, 0.21124267578125, 0.2193450927734375, 0.227447509765625, 0.2355499267578125, 0.24365234375, 0.2517547607421875, 0.259857177734375, 0.2679595947265625, 0.27606201171875, 0.2841644287109375, 0.292266845703125, 0.3003692626953125, 0.3084716796875, 0.3165740966796875, 0.324676513671875, 0.3327789306640625, 0.34088134765625, 0.3489837646484375, 0.357086181640625, 0.3651885986328125, 0.373291015625]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 3.0, 1.0, 9.0, 0.0, 3.0, 8.0, 6.0, 12.0, 8.0, 17.0, 30.0, 31.0, 42.0, 79.0, 110.0, 233.0, 404.0, 882.0, 2311.0, 7772.0, 40765.0, 380911.0, 544707.0, 55374.0, 9969.0, 2762.0, 1033.0, 452.0, 237.0, 123.0, 83.0, 42.0, 38.0, 22.0, 15.0, 20.0, 10.0, 7.0, 5.0, 5.0, 8.0, 5.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.035736083984375, -0.03468751907348633, -0.033638954162597656, -0.032590389251708984, -0.03154182434082031, -0.03049325942993164, -0.02944469451904297, -0.028396129608154297, -0.027347564697265625, -0.026298999786376953, -0.02525043487548828, -0.02420186996459961, -0.023153305053710938, -0.022104740142822266, -0.021056175231933594, -0.020007610321044922, -0.01895904541015625, -0.017910480499267578, -0.016861915588378906, -0.015813350677490234, -0.014764785766601562, -0.01371622085571289, -0.012667655944824219, -0.011619091033935547, -0.010570526123046875, -0.009521961212158203, -0.008473396301269531, -0.007424831390380859, -0.0063762664794921875, -0.005327701568603516, -0.004279136657714844, -0.003230571746826172, -0.0021820068359375, -0.0011334419250488281, -8.487701416015625e-05, 0.0009636878967285156, 0.0020122528076171875, 0.0030608177185058594, 0.004109382629394531, 0.005157947540283203, 0.006206512451171875, 0.007255077362060547, 0.008303642272949219, 0.00935220718383789, 0.010400772094726562, 0.011449337005615234, 0.012497901916503906, 0.013546466827392578, 0.01459503173828125, 0.015643596649169922, 0.016692161560058594, 0.017740726470947266, 0.018789291381835938, 0.01983785629272461, 0.02088642120361328, 0.021934986114501953, 0.022983551025390625, 0.024032115936279297, 0.02508068084716797, 0.02612924575805664, 0.027177810668945312, 0.028226375579833984, 0.029274940490722656, 0.030323505401611328, 0.0313720703125]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 7.0, 5.0, 8.0, 7.0, 15.0, 15.0, 20.0, 24.0, 20.0, 33.0, 38.0, 44.0, 49.0, 73.0, 82.0, 70.0, 71.0, 60.0, 65.0, 62.0, 50.0, 32.0, 27.0, 30.0, 25.0, 15.0, 9.0, 14.0, 3.0, 4.0, 10.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.106231689453125e-06, -7.874332368373871e-06, -7.642433047294617e-06, -7.4105337262153625e-06, -7.178634405136108e-06, -6.946735084056854e-06, -6.7148357629776e-06, -6.482936441898346e-06, -6.251037120819092e-06, -6.019137799739838e-06, -5.7872384786605835e-06, -5.555339157581329e-06, -5.323439836502075e-06, -5.091540515422821e-06, -4.859641194343567e-06, -4.627741873264313e-06, -4.395842552185059e-06, -4.1639432311058044e-06, -3.93204391002655e-06, -3.700144588947296e-06, -3.468245267868042e-06, -3.236345946788788e-06, -3.0044466257095337e-06, -2.7725473046302795e-06, -2.5406479835510254e-06, -2.3087486624717712e-06, -2.076849341392517e-06, -1.844950020313263e-06, -1.6130506992340088e-06, -1.3811513781547546e-06, -1.1492520570755005e-06, -9.173527359962463e-07, -6.854534149169922e-07, -4.5355409383773804e-07, -2.2165477275848389e-07, 1.0244548320770264e-08, 2.421438694000244e-07, 4.7404319047927856e-07, 7.059425115585327e-07, 9.378418326377869e-07, 1.169741153717041e-06, 1.4016404747962952e-06, 1.6335397958755493e-06, 1.8654391169548035e-06, 2.0973384380340576e-06, 2.3292377591133118e-06, 2.561137080192566e-06, 2.79303640127182e-06, 3.0249357223510742e-06, 3.2568350434303284e-06, 3.4887343645095825e-06, 3.7206336855888367e-06, 3.952533006668091e-06, 4.184432327747345e-06, 4.416331648826599e-06, 4.648230969905853e-06, 4.880130290985107e-06, 5.1120296120643616e-06, 5.343928933143616e-06, 5.57582825422287e-06, 5.807727575302124e-06, 6.039626896381378e-06, 6.271526217460632e-06, 6.5034255385398865e-06, 6.735324859619141e-06]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 7.0, 5.0, 4.0, 10.0, 23.0, 49.0, 110.0, 289.0, 1014.0, 7510.0, 402208.0, 625601.0, 9927.0, 1206.0, 366.0, 122.0, 55.0, 25.0, 14.0, 9.0, 4.0, 2.0, 0.0, 2.0, 2.0, 3.0, 0.0, 3.0], "bins": [-0.1236572265625, -0.12102890014648438, -0.11840057373046875, -0.11577224731445312, -0.1131439208984375, -0.11051559448242188, -0.10788726806640625, -0.10525894165039062, -0.102630615234375, -0.10000228881835938, -0.09737396240234375, -0.09474563598632812, -0.0921173095703125, -0.08948898315429688, -0.08686065673828125, -0.08423233032226562, -0.08160400390625, -0.07897567749023438, -0.07634735107421875, -0.07371902465820312, -0.0710906982421875, -0.06846237182617188, -0.06583404541015625, -0.06320571899414062, -0.060577392578125, -0.057949066162109375, -0.05532073974609375, -0.052692413330078125, -0.0500640869140625, -0.047435760498046875, -0.04480743408203125, -0.042179107666015625, -0.03955078125, -0.036922454833984375, -0.03429412841796875, -0.031665802001953125, -0.0290374755859375, -0.026409149169921875, -0.02378082275390625, -0.021152496337890625, -0.018524169921875, -0.015895843505859375, -0.01326751708984375, -0.010639190673828125, -0.0080108642578125, -0.005382537841796875, -0.00275421142578125, -0.000125885009765625, 0.00250244140625, 0.005130767822265625, 0.00775909423828125, 0.010387420654296875, 0.0130157470703125, 0.015644073486328125, 0.01827239990234375, 0.020900726318359375, 0.023529052734375, 0.026157379150390625, 0.02878570556640625, 0.031414031982421875, 0.0340423583984375, 0.036670684814453125, 0.03929901123046875, 0.041927337646484375, 0.0445556640625]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 6.0, 5.0, 21.0, 24.0, 55.0, 77.0, 125.0, 155.0, 164.0, 136.0, 94.0, 63.0, 26.0, 23.0, 11.0, 13.0, 3.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.049774169921875, -0.04752206802368164, -0.04526996612548828, -0.04301786422729492, -0.04076576232910156, -0.0385136604309082, -0.036261558532714844, -0.034009456634521484, -0.031757354736328125, -0.029505252838134766, -0.027253150939941406, -0.025001049041748047, -0.022748947143554688, -0.020496845245361328, -0.01824474334716797, -0.01599264144897461, -0.01374053955078125, -0.01148843765258789, -0.009236335754394531, -0.006984233856201172, -0.0047321319580078125, -0.002480030059814453, -0.00022792816162109375, 0.0020241737365722656, 0.004276275634765625, 0.006528377532958984, 0.008780479431152344, 0.011032581329345703, 0.013284683227539062, 0.015536785125732422, 0.01778888702392578, 0.02004098892211914, 0.0222930908203125, 0.02454519271850586, 0.02679729461669922, 0.029049396514892578, 0.03130149841308594, 0.0335536003112793, 0.035805702209472656, 0.038057804107666016, 0.040309906005859375, 0.042562007904052734, 0.044814109802246094, 0.04706621170043945, 0.04931831359863281, 0.05157041549682617, 0.05382251739501953, 0.05607461929321289, 0.05832672119140625, 0.06057882308959961, 0.06283092498779297, 0.06508302688598633, 0.06733512878417969, 0.06958723068237305, 0.0718393325805664, 0.07409143447875977, 0.07634353637695312, 0.07859563827514648, 0.08084774017333984, 0.0830998420715332, 0.08535194396972656, 0.08760404586791992, 0.08985614776611328, 0.09210824966430664, 0.0943603515625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 6.0, 9.0, 23.0, 58.0, 216.0, 338.0, 247.0, 73.0, 33.0, 7.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.349781036376953, -3.2847836017608643, -3.2197864055633545, -3.1547889709472656, -3.089791774749756, -3.024794340133667, -2.9597971439361572, -2.8947997093200684, -2.8298025131225586, -2.7648050785064697, -2.69980788230896, -2.634810447692871, -2.5698132514953613, -2.5048158168792725, -2.4398186206817627, -2.374821186065674, -2.309823989868164, -2.244826555252075, -2.1798293590545654, -2.1148319244384766, -2.049834728240967, -1.9848374128341675, -1.9198400974273682, -1.8548426628112793, -1.7898452281951904, -1.7248479127883911, -1.6598505973815918, -1.5948532819747925, -1.5298559665679932, -1.4648586511611938, -1.3998613357543945, -1.3348639011383057, -1.269866943359375, -1.2048696279525757, -1.1398723125457764, -1.074874997138977, -1.0098776817321777, -0.9448803663253784, -0.8798829913139343, -0.814885675907135, -0.7498883008956909, -0.6848909854888916, -0.6198936700820923, -0.554896354675293, -0.48989900946617126, -0.42490169405937195, -0.35990434885025024, -0.2949070334434509, -0.2299097180366516, -0.1649124026298523, -0.09991507232189178, -0.034917742013931274, 0.030079573392868042, 0.09507688879966736, 0.16007423400878906, 0.22507154941558838, 0.2900688648223877, 0.355066180229187, 0.42006349563598633, 0.48506084084510803, 0.550058126449585, 0.6150554418563843, 0.6800528168678284, 0.7450501322746277, 0.810047447681427]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 3.0, 2.0, 5.0, 9.0, 9.0, 14.0, 15.0, 18.0, 18.0, 23.0, 24.0, 21.0, 29.0, 37.0, 34.0, 42.0, 53.0, 54.0, 35.0, 46.0, 54.0, 49.0, 38.0, 53.0, 41.0, 31.0, 27.0, 28.0, 29.0, 23.0, 23.0, 22.0, 16.0, 9.0, 11.0, 4.0, 5.0, 7.0, 5.0, 6.0, 3.0, 6.0, 5.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.7380832433700562, -0.7149181962013245, -0.6917531490325928, -0.6685881018638611, -0.6454230546951294, -0.6222580075263977, -0.599092960357666, -0.5759279131889343, -0.5527628660202026, -0.529597818851471, -0.5064327716827393, -0.48326772451400757, -0.4601026773452759, -0.4369376301765442, -0.4137725830078125, -0.3906075358390808, -0.36744245886802673, -0.34427741169929504, -0.32111236453056335, -0.29794731736183167, -0.2747822701931, -0.2516172230243683, -0.2284521609544754, -0.2052871137857437, -0.18212206661701202, -0.15895701944828033, -0.13579197227954865, -0.11262691766023636, -0.08946187049150467, -0.06629682332277298, -0.04313176870346069, -0.019966721534729004, 0.0031983256340026855, 0.026363374665379524, 0.04952842369675636, 0.07269347459077835, 0.09585852175951004, 0.11902356892824173, 0.14218862354755402, 0.1653536707162857, 0.1885187178850174, 0.21168376505374908, 0.23484881222248077, 0.25801387429237366, 0.28117892146110535, 0.30434396862983704, 0.3275090157985687, 0.3506740629673004, 0.3738391101360321, 0.3970041573047638, 0.4201692044734955, 0.4433342516422272, 0.46649929881095886, 0.48966434597969055, 0.5128294229507446, 0.5359944701194763, 0.559159517288208, 0.5823245644569397, 0.6054896116256714, 0.6286546587944031, 0.6518197059631348, 0.6749847531318665, 0.6981498003005981, 0.7213148474693298, 0.7444798946380615]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [8.0, 19.0, 81.0, 421.0, 3111.0, 93025.0, 4080810.0, 15218.0, 1322.0, 216.0, 46.0, 11.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059112548828125, -0.04972028732299805, -0.040328025817871094, -0.03093576431274414, -0.021543502807617188, -0.012151241302490234, -0.0027589797973632812, 0.006633281707763672, 0.016025543212890625, 0.025417804718017578, 0.03481006622314453, 0.044202327728271484, 0.05359458923339844, 0.06298685073852539, 0.07237911224365234, 0.0817713737487793, 0.09116363525390625, 0.1005558967590332, 0.10994815826416016, 0.11934041976928711, 0.12873268127441406, 0.13812494277954102, 0.14751720428466797, 0.15690946578979492, 0.16630172729492188, 0.17569398880004883, 0.18508625030517578, 0.19447851181030273, 0.2038707733154297, 0.21326303482055664, 0.2226552963256836, 0.23204755783081055, 0.2414398193359375, 0.25083208084106445, 0.2602243423461914, 0.26961660385131836, 0.2790088653564453, 0.28840112686157227, 0.2977933883666992, 0.30718564987182617, 0.3165779113769531, 0.3259701728820801, 0.33536243438720703, 0.344754695892334, 0.35414695739746094, 0.3635392189025879, 0.37293148040771484, 0.3823237419128418, 0.39171600341796875, 0.4011082649230957, 0.41050052642822266, 0.4198927879333496, 0.42928504943847656, 0.4386773109436035, 0.44806957244873047, 0.4574618339538574, 0.4668540954589844, 0.47624635696411133, 0.4856386184692383, 0.49503087997436523, 0.5044231414794922, 0.5138154029846191, 0.5232076644897461, 0.532599925994873, 0.5419921875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 3.0, 4.0, 5.0, 6.0, 9.0, 14.0, 24.0, 21.0, 25.0, 42.0, 39.0, 31.0, 46.0, 51.0, 58.0, 55.0, 53.0, 75.0, 67.0, 52.0, 47.0, 50.0, 43.0, 29.0, 34.0, 17.0, 16.0, 23.0, 12.0, 16.0, 7.0, 7.0, 4.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.04498291015625, -0.043379783630371094, -0.04177665710449219, -0.04017353057861328, -0.038570404052734375, -0.03696727752685547, -0.03536415100097656, -0.033761024475097656, -0.03215789794921875, -0.030554771423339844, -0.028951644897460938, -0.02734851837158203, -0.025745391845703125, -0.02414226531982422, -0.022539138793945312, -0.020936012268066406, -0.0193328857421875, -0.017729759216308594, -0.016126632690429688, -0.014523506164550781, -0.012920379638671875, -0.011317253112792969, -0.009714126586914062, -0.008111000061035156, -0.00650787353515625, -0.004904747009277344, -0.0033016204833984375, -0.0016984939575195312, -9.5367431640625e-05, 0.0015077590942382812, 0.0031108856201171875, 0.004714012145996094, 0.006317138671875, 0.007920265197753906, 0.009523391723632812, 0.011126518249511719, 0.012729644775390625, 0.014332771301269531, 0.015935897827148438, 0.017539024353027344, 0.01914215087890625, 0.020745277404785156, 0.022348403930664062, 0.02395153045654297, 0.025554656982421875, 0.02715778350830078, 0.028760910034179688, 0.030364036560058594, 0.0319671630859375, 0.033570289611816406, 0.03517341613769531, 0.03677654266357422, 0.038379669189453125, 0.03998279571533203, 0.04158592224121094, 0.043189048767089844, 0.04479217529296875, 0.046395301818847656, 0.04799842834472656, 0.04960155487060547, 0.051204681396484375, 0.05280780792236328, 0.05441093444824219, 0.056014060974121094, 0.0576171875]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 5.0, 1.0, 2.0, 3.0, 3.0, 12.0, 9.0, 10.0, 18.0, 24.0, 32.0, 47.0, 71.0, 124.0, 338.0, 1335.0, 8354.0, 91088.0, 3985235.0, 96428.0, 8822.0, 1485.0, 426.0, 166.0, 69.0, 47.0, 39.0, 28.0, 12.0, 19.0, 13.0, 6.0, 7.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14404296875, -0.1386089324951172, -0.13317489624023438, -0.12774085998535156, -0.12230682373046875, -0.11687278747558594, -0.11143875122070312, -0.10600471496582031, -0.1005706787109375, -0.09513664245605469, -0.08970260620117188, -0.08426856994628906, -0.07883453369140625, -0.07340049743652344, -0.06796646118164062, -0.06253242492675781, -0.057098388671875, -0.05166435241699219, -0.046230316162109375, -0.04079627990722656, -0.03536224365234375, -0.029928207397460938, -0.024494171142578125, -0.019060134887695312, -0.0136260986328125, -0.008192062377929688, -0.002758026123046875, 0.0026760101318359375, 0.00811004638671875, 0.013544082641601562, 0.018978118896484375, 0.024412155151367188, 0.02984619140625, 0.03528022766113281, 0.040714263916015625, 0.04614830017089844, 0.05158233642578125, 0.05701637268066406, 0.062450408935546875, 0.06788444519042969, 0.0733184814453125, 0.07875251770019531, 0.08418655395507812, 0.08962059020996094, 0.09505462646484375, 0.10048866271972656, 0.10592269897460938, 0.11135673522949219, 0.116790771484375, 0.12222480773925781, 0.12765884399414062, 0.13309288024902344, 0.13852691650390625, 0.14396095275878906, 0.14939498901367188, 0.1548290252685547, 0.1602630615234375, 0.1656970977783203, 0.17113113403320312, 0.17656517028808594, 0.18199920654296875, 0.18743324279785156, 0.19286727905273438, 0.1983013153076172, 0.2037353515625]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 1.0, 3.0, 2.0, 5.0, 9.0, 5.0, 8.0, 8.0, 11.0, 10.0, 14.0, 31.0, 41.0, 52.0, 97.0, 227.0, 616.0, 1348.0, 829.0, 343.0, 143.0, 71.0, 32.0, 38.0, 25.0, 17.0, 22.0, 11.0, 14.0, 7.0, 5.0, 8.0, 6.0, 5.0, 5.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0850830078125, -0.08211708068847656, -0.07915115356445312, -0.07618522644042969, -0.07321929931640625, -0.07025337219238281, -0.06728744506835938, -0.06432151794433594, -0.0613555908203125, -0.05838966369628906, -0.055423736572265625, -0.05245780944824219, -0.04949188232421875, -0.04652595520019531, -0.043560028076171875, -0.04059410095214844, -0.037628173828125, -0.03466224670410156, -0.031696319580078125, -0.028730392456054688, -0.02576446533203125, -0.022798538208007812, -0.019832611083984375, -0.016866683959960938, -0.0139007568359375, -0.010934829711914062, -0.007968902587890625, -0.0050029754638671875, -0.00203704833984375, 0.0009288787841796875, 0.003894805908203125, 0.0068607330322265625, 0.00982666015625, 0.012792587280273438, 0.015758514404296875, 0.018724441528320312, 0.02169036865234375, 0.024656295776367188, 0.027622222900390625, 0.030588150024414062, 0.0335540771484375, 0.03652000427246094, 0.039485931396484375, 0.04245185852050781, 0.04541778564453125, 0.04838371276855469, 0.051349639892578125, 0.05431556701660156, 0.057281494140625, 0.06024742126464844, 0.06321334838867188, 0.06617927551269531, 0.06914520263671875, 0.07211112976074219, 0.07507705688476562, 0.07804298400878906, 0.0810089111328125, 0.08397483825683594, 0.08694076538085938, 0.08990669250488281, 0.09287261962890625, 0.09583854675292969, 0.09880447387695312, 0.10177040100097656, 0.104736328125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 9.0, 49.0, 298.0, 461.0, 131.0, 31.0, 14.0, 3.0, 0.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0118188858032227, -1.945077657699585, -1.8783365488052368, -1.8115953207015991, -1.744854211807251, -1.6781129837036133, -1.6113717555999756, -1.5446306467056274, -1.4778895378112793, -1.4111483097076416, -1.3444072008132935, -1.2776659727096558, -1.2109248638153076, -1.14418363571167, -1.0774424076080322, -1.010701298713684, -0.9439600706100464, -0.8772189021110535, -0.8104777336120605, -0.7437365055084229, -0.6769953966140747, -0.610254168510437, -0.5435130000114441, -0.47677183151245117, -0.41003066301345825, -0.34328949451446533, -0.2765483260154724, -0.2098071277141571, -0.14306595921516418, -0.07632479071617126, -0.009583592414855957, 0.05715757608413696, 0.12389874458312988, 0.1906399130821228, 0.2573810815811157, 0.32412227988243103, 0.39086344838142395, 0.45760461688041687, 0.5243458151817322, 0.5910869836807251, 0.657828152179718, 0.7245693206787109, 0.7913104891777039, 0.8580516576766968, 0.9247928857803345, 0.9915339946746826, 1.0582752227783203, 1.125016450881958, 1.1917575597763062, 1.2584987878799438, 1.325239896774292, 1.3919811248779297, 1.4587222337722778, 1.5254634618759155, 1.5922045707702637, 1.6589457988739014, 1.725687026977539, 1.7924282550811768, 1.859169363975525, 1.9259105920791626, 1.9926517009735107, 2.0593929290771484, 2.126134157180786, 2.192875385284424, 2.2596163749694824]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 5.0, 7.0, 2.0, 2.0, 9.0, 3.0, 8.0, 9.0, 14.0, 10.0, 24.0, 24.0, 28.0, 30.0, 36.0, 29.0, 49.0, 51.0, 42.0, 45.0, 49.0, 52.0, 44.0, 53.0, 56.0, 45.0, 30.0, 30.0, 50.0, 35.0, 27.0, 23.0, 12.0, 17.0, 11.0, 8.0, 9.0, 7.0, 8.0, 3.0, 4.0, 6.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41751956939697266, -0.40398627519607544, -0.3904529809951782, -0.376919686794281, -0.3633863627910614, -0.3498530685901642, -0.33631977438926697, -0.32278648018836975, -0.30925315618515015, -0.29571986198425293, -0.2821865677833557, -0.2686532735824585, -0.2551199495792389, -0.24158665537834167, -0.22805336117744446, -0.21452006697654724, -0.20098677277565002, -0.1874534785747528, -0.1739201694726944, -0.16038687527179718, -0.14685356616973877, -0.13332027196884155, -0.11978697776794434, -0.10625367611646652, -0.09272037446498871, -0.0791870728135109, -0.06565377116203308, -0.052120476961135864, -0.03858717530965805, -0.025053873658180237, -0.01152057945728302, 0.0020127221941947937, 0.015546023845672607, 0.029079323634505272, 0.042612623423337936, 0.05614592134952545, 0.06967922300100327, 0.08321252465248108, 0.0967458188533783, 0.11027912050485611, 0.12381242215633392, 0.13734571635723114, 0.15087902545928955, 0.16441231966018677, 0.17794561386108398, 0.1914789229631424, 0.2050122171640396, 0.21854552626609802, 0.23207882046699524, 0.24561211466789246, 0.2591454088687897, 0.2726787328720093, 0.2862120270729065, 0.2997453212738037, 0.3132786154747009, 0.32681190967559814, 0.34034520387649536, 0.3538784980773926, 0.3674117922782898, 0.380945086479187, 0.3944784104824066, 0.40801170468330383, 0.42154499888420105, 0.43507829308509827, 0.44861161708831787]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 10.0, 16.0, 17.0, 44.0, 95.0, 478.0, 3338.0, 44188.0, 676851.0, 306493.0, 15177.0, 1452.0, 241.0, 52.0, 21.0, 15.0, 8.0, 2.0, 5.0, 6.0, 6.0, 3.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-0.2462158203125, -0.23987197875976562, -0.23352813720703125, -0.22718429565429688, -0.2208404541015625, -0.21449661254882812, -0.20815277099609375, -0.20180892944335938, -0.195465087890625, -0.18912124633789062, -0.18277740478515625, -0.17643356323242188, -0.1700897216796875, -0.16374588012695312, -0.15740203857421875, -0.15105819702148438, -0.14471435546875, -0.13837051391601562, -0.13202667236328125, -0.12568283081054688, -0.1193389892578125, -0.11299514770507812, -0.10665130615234375, -0.10030746459960938, -0.093963623046875, -0.08761978149414062, -0.08127593994140625, -0.07493209838867188, -0.0685882568359375, -0.062244415283203125, -0.05590057373046875, -0.049556732177734375, -0.043212890625, -0.036869049072265625, -0.03052520751953125, -0.024181365966796875, -0.0178375244140625, -0.011493682861328125, -0.00514984130859375, 0.001194000244140625, 0.007537841796875, 0.013881683349609375, 0.02022552490234375, 0.026569366455078125, 0.0329132080078125, 0.039257049560546875, 0.04560089111328125, 0.051944732666015625, 0.05828857421875, 0.06463241577148438, 0.07097625732421875, 0.07732009887695312, 0.0836639404296875, 0.09000778198242188, 0.09635162353515625, 0.10269546508789062, 0.109039306640625, 0.11538314819335938, 0.12172698974609375, 0.12807083129882812, 0.1344146728515625, 0.14075851440429688, 0.14710235595703125, 0.15344619750976562, 0.1597900390625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 5.0, 0.0, 2.0, 7.0, 9.0, 11.0, 11.0, 19.0, 25.0, 35.0, 34.0, 26.0, 45.0, 34.0, 60.0, 57.0, 72.0, 62.0, 72.0, 56.0, 52.0, 58.0, 31.0, 38.0, 32.0, 26.0, 28.0, 22.0, 21.0, 5.0, 13.0, 10.0, 8.0, 5.0, 4.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0501708984375, -0.04849815368652344, -0.046825408935546875, -0.04515266418457031, -0.04347991943359375, -0.04180717468261719, -0.040134429931640625, -0.03846168518066406, -0.0367889404296875, -0.03511619567871094, -0.033443450927734375, -0.03177070617675781, -0.03009796142578125, -0.028425216674804688, -0.026752471923828125, -0.025079727172851562, -0.023406982421875, -0.021734237670898438, -0.020061492919921875, -0.018388748168945312, -0.01671600341796875, -0.015043258666992188, -0.013370513916015625, -0.011697769165039062, -0.0100250244140625, -0.008352279663085938, -0.006679534912109375, -0.0050067901611328125, -0.00333404541015625, -0.0016613006591796875, 1.1444091796875e-05, 0.0016841888427734375, 0.00335693359375, 0.0050296783447265625, 0.006702423095703125, 0.008375167846679688, 0.01004791259765625, 0.011720657348632812, 0.013393402099609375, 0.015066146850585938, 0.0167388916015625, 0.018411636352539062, 0.020084381103515625, 0.021757125854492188, 0.02342987060546875, 0.025102615356445312, 0.026775360107421875, 0.028448104858398438, 0.030120849609375, 0.03179359436035156, 0.033466339111328125, 0.03513908386230469, 0.03681182861328125, 0.03848457336425781, 0.040157318115234375, 0.04183006286621094, 0.0435028076171875, 0.04517555236816406, 0.046848297119140625, 0.04852104187011719, 0.05019378662109375, 0.05186653137207031, 0.053539276123046875, 0.05521202087402344, 0.056884765625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 4.0, 8.0, 6.0, 7.0, 8.0, 13.0, 14.0, 18.0, 29.0, 43.0, 64.0, 109.0, 134.0, 226.0, 413.0, 675.0, 1387.0, 3393.0, 15041.0, 150681.0, 738714.0, 118695.0, 12529.0, 3145.0, 1304.0, 707.0, 410.0, 251.0, 165.0, 110.0, 85.0, 44.0, 28.0, 30.0, 15.0, 8.0, 11.0, 7.0, 5.0, 6.0, 4.0, 2.0, 2.0, 4.0, 0.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.1229248046875, -0.11901664733886719, -0.11510848999023438, -0.11120033264160156, -0.10729217529296875, -0.10338401794433594, -0.09947586059570312, -0.09556770324707031, -0.0916595458984375, -0.08775138854980469, -0.08384323120117188, -0.07993507385253906, -0.07602691650390625, -0.07211875915527344, -0.06821060180664062, -0.06430244445800781, -0.060394287109375, -0.05648612976074219, -0.052577972412109375, -0.04866981506347656, -0.04476165771484375, -0.04085350036621094, -0.036945343017578125, -0.03303718566894531, -0.0291290283203125, -0.025220870971679688, -0.021312713623046875, -0.017404556274414062, -0.01349639892578125, -0.009588241577148438, -0.005680084228515625, -0.0017719268798828125, 0.00213623046875, 0.0060443878173828125, 0.009952545166015625, 0.013860702514648438, 0.01776885986328125, 0.021677017211914062, 0.025585174560546875, 0.029493331909179688, 0.0334014892578125, 0.03730964660644531, 0.041217803955078125, 0.04512596130371094, 0.04903411865234375, 0.05294227600097656, 0.056850433349609375, 0.06075859069824219, 0.064666748046875, 0.06857490539550781, 0.07248306274414062, 0.07639122009277344, 0.08029937744140625, 0.08420753479003906, 0.08811569213867188, 0.09202384948730469, 0.0959320068359375, 0.09984016418457031, 0.10374832153320312, 0.10765647888183594, 0.11156463623046875, 0.11547279357910156, 0.11938095092773438, 0.12328910827636719, 0.127197265625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 10.0, 8.0, 4.0, 13.0, 8.0, 20.0, 17.0, 27.0, 29.0, 42.0, 29.0, 29.0, 38.0, 48.0, 47.0, 41.0, 59.0, 51.0, 55.0, 56.0, 46.0, 40.0, 39.0, 36.0, 32.0, 28.0, 29.0, 26.0, 25.0, 15.0, 9.0, 17.0, 6.0, 4.0, 5.0, 4.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.134033203125, -0.12881088256835938, -0.12358856201171875, -0.11836624145507812, -0.1131439208984375, -0.10792160034179688, -0.10269927978515625, -0.09747695922851562, -0.092254638671875, -0.08703231811523438, -0.08180999755859375, -0.07658767700195312, -0.0713653564453125, -0.06614303588867188, -0.06092071533203125, -0.055698394775390625, -0.05047607421875, -0.045253753662109375, -0.04003143310546875, -0.034809112548828125, -0.0295867919921875, -0.024364471435546875, -0.01914215087890625, -0.013919830322265625, -0.008697509765625, -0.003475189208984375, 0.00174713134765625, 0.006969451904296875, 0.0121917724609375, 0.017414093017578125, 0.02263641357421875, 0.027858734130859375, 0.0330810546875, 0.038303375244140625, 0.04352569580078125, 0.048748016357421875, 0.0539703369140625, 0.059192657470703125, 0.06441497802734375, 0.06963729858398438, 0.074859619140625, 0.08008193969726562, 0.08530426025390625, 0.09052658081054688, 0.0957489013671875, 0.10097122192382812, 0.10619354248046875, 0.11141586303710938, 0.11663818359375, 0.12186050415039062, 0.12708282470703125, 0.13230514526367188, 0.1375274658203125, 0.14274978637695312, 0.14797210693359375, 0.15319442749023438, 0.158416748046875, 0.16363906860351562, 0.16886138916015625, 0.17408370971679688, 0.1793060302734375, 0.18452835083007812, 0.18975067138671875, 0.19497299194335938, 0.2001953125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 5.0, 3.0, 3.0, 4.0, 12.0, 2.0, 18.0, 15.0, 14.0, 22.0, 35.0, 50.0, 88.0, 106.0, 166.0, 258.0, 446.0, 787.0, 1562.0, 4034.0, 12028.0, 65545.0, 704380.0, 223090.0, 24409.0, 6361.0, 2471.0, 1081.0, 588.0, 331.0, 221.0, 124.0, 84.0, 62.0, 39.0, 24.0, 16.0, 17.0, 15.0, 11.0, 13.0, 12.0, 2.0, 4.0, 1.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.037811279296875, -0.03649568557739258, -0.035180091857910156, -0.033864498138427734, -0.03254890441894531, -0.03123331069946289, -0.02991771697998047, -0.028602123260498047, -0.027286529541015625, -0.025970935821533203, -0.02465534210205078, -0.02333974838256836, -0.022024154663085938, -0.020708560943603516, -0.019392967224121094, -0.018077373504638672, -0.01676177978515625, -0.015446186065673828, -0.014130592346191406, -0.012814998626708984, -0.011499404907226562, -0.01018381118774414, -0.008868217468261719, -0.007552623748779297, -0.006237030029296875, -0.004921436309814453, -0.0036058425903320312, -0.0022902488708496094, -0.0009746551513671875, 0.0003409385681152344, 0.0016565322875976562, 0.002972126007080078, 0.0042877197265625, 0.005603313446044922, 0.006918907165527344, 0.008234500885009766, 0.009550094604492188, 0.01086568832397461, 0.012181282043457031, 0.013496875762939453, 0.014812469482421875, 0.016128063201904297, 0.01744365692138672, 0.01875925064086914, 0.020074844360351562, 0.021390438079833984, 0.022706031799316406, 0.024021625518798828, 0.02533721923828125, 0.026652812957763672, 0.027968406677246094, 0.029284000396728516, 0.030599594116210938, 0.03191518783569336, 0.03323078155517578, 0.0345463752746582, 0.035861968994140625, 0.03717756271362305, 0.03849315643310547, 0.03980875015258789, 0.04112434387207031, 0.042439937591552734, 0.043755531311035156, 0.04507112503051758, 0.04638671875]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 2.0, 1.0, 9.0, 11.0, 16.0, 23.0, 40.0, 62.0, 110.0, 153.0, 161.0, 128.0, 108.0, 58.0, 31.0, 31.0, 11.0, 13.0, 11.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.633167266845703e-05, -1.5757977962493896e-05, -1.5184283256530762e-05, -1.4610588550567627e-05, -1.4036893844604492e-05, -1.3463199138641357e-05, -1.2889504432678223e-05, -1.2315809726715088e-05, -1.1742115020751953e-05, -1.1168420314788818e-05, -1.0594725608825684e-05, -1.0021030902862549e-05, -9.447336196899414e-06, -8.87364149093628e-06, -8.299946784973145e-06, -7.72625207901001e-06, -7.152557373046875e-06, -6.57886266708374e-06, -6.0051679611206055e-06, -5.431473255157471e-06, -4.857778549194336e-06, -4.284083843231201e-06, -3.7103891372680664e-06, -3.1366944313049316e-06, -2.562999725341797e-06, -1.989305019378662e-06, -1.4156103134155273e-06, -8.419156074523926e-07, -2.682209014892578e-07, 3.0547380447387695e-07, 8.791685104370117e-07, 1.4528632164001465e-06, 2.0265579223632812e-06, 2.600252628326416e-06, 3.1739473342895508e-06, 3.7476420402526855e-06, 4.32133674621582e-06, 4.895031452178955e-06, 5.46872615814209e-06, 6.042420864105225e-06, 6.616115570068359e-06, 7.189810276031494e-06, 7.763504981994629e-06, 8.337199687957764e-06, 8.910894393920898e-06, 9.484589099884033e-06, 1.0058283805847168e-05, 1.0631978511810303e-05, 1.1205673217773438e-05, 1.1779367923736572e-05, 1.2353062629699707e-05, 1.2926757335662842e-05, 1.3500452041625977e-05, 1.4074146747589111e-05, 1.4647841453552246e-05, 1.5221536159515381e-05, 1.5795230865478516e-05, 1.636892557144165e-05, 1.6942620277404785e-05, 1.751631498336792e-05, 1.8090009689331055e-05, 1.866370439529419e-05, 1.9237399101257324e-05, 1.981109380722046e-05, 2.0384788513183594e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 7.0, 9.0, 9.0, 9.0, 7.0, 15.0, 21.0, 38.0, 54.0, 103.0, 161.0, 325.0, 836.0, 2564.0, 13773.0, 296698.0, 702404.0, 25807.0, 3732.0, 1055.0, 438.0, 205.0, 95.0, 75.0, 41.0, 18.0, 17.0, 19.0, 12.0, 7.0, 5.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.057373046875, -0.055403709411621094, -0.05343437194824219, -0.05146503448486328, -0.049495697021484375, -0.04752635955810547, -0.04555702209472656, -0.043587684631347656, -0.04161834716796875, -0.039649009704589844, -0.03767967224121094, -0.03571033477783203, -0.033740997314453125, -0.03177165985107422, -0.029802322387695312, -0.027832984924316406, -0.0258636474609375, -0.023894309997558594, -0.021924972534179688, -0.01995563507080078, -0.017986297607421875, -0.01601696014404297, -0.014047622680664062, -0.012078285217285156, -0.01010894775390625, -0.008139610290527344, -0.0061702728271484375, -0.004200935363769531, -0.002231597900390625, -0.00026226043701171875, 0.0017070770263671875, 0.0036764144897460938, 0.005645751953125, 0.007615089416503906, 0.009584426879882812, 0.011553764343261719, 0.013523101806640625, 0.015492439270019531, 0.017461776733398438, 0.019431114196777344, 0.02140045166015625, 0.023369789123535156, 0.025339126586914062, 0.02730846405029297, 0.029277801513671875, 0.03124713897705078, 0.03321647644042969, 0.035185813903808594, 0.0371551513671875, 0.039124488830566406, 0.04109382629394531, 0.04306316375732422, 0.045032501220703125, 0.04700183868408203, 0.04897117614746094, 0.050940513610839844, 0.05290985107421875, 0.054879188537597656, 0.05684852600097656, 0.05881786346435547, 0.060787200927734375, 0.06275653839111328, 0.06472587585449219, 0.0666952133178711, 0.06866455078125]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 3.0, 2.0, 2.0, 5.0, 5.0, 4.0, 13.0, 15.0, 14.0, 26.0, 35.0, 41.0, 61.0, 75.0, 76.0, 96.0, 97.0, 74.0, 100.0, 64.0, 37.0, 40.0, 33.0, 24.0, 21.0, 12.0, 6.0, 8.0, 8.0, 3.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.046600341796875, -0.04509925842285156, -0.043598175048828125, -0.04209709167480469, -0.04059600830078125, -0.03909492492675781, -0.037593841552734375, -0.03609275817871094, -0.0345916748046875, -0.03309059143066406, -0.031589508056640625, -0.030088424682617188, -0.02858734130859375, -0.027086257934570312, -0.025585174560546875, -0.024084091186523438, -0.0225830078125, -0.021081924438476562, -0.019580841064453125, -0.018079757690429688, -0.01657867431640625, -0.015077590942382812, -0.013576507568359375, -0.012075424194335938, -0.0105743408203125, -0.009073257446289062, -0.007572174072265625, -0.0060710906982421875, -0.00457000732421875, -0.0030689239501953125, -0.001567840576171875, -6.67572021484375e-05, 0.001434326171875, 0.0029354095458984375, 0.004436492919921875, 0.0059375762939453125, 0.00743865966796875, 0.008939743041992188, 0.010440826416015625, 0.011941909790039062, 0.0134429931640625, 0.014944076538085938, 0.016445159912109375, 0.017946243286132812, 0.01944732666015625, 0.020948410034179688, 0.022449493408203125, 0.023950576782226562, 0.02545166015625, 0.026952743530273438, 0.028453826904296875, 0.029954910278320312, 0.03145599365234375, 0.03295707702636719, 0.034458160400390625, 0.03595924377441406, 0.0374603271484375, 0.03896141052246094, 0.040462493896484375, 0.04196357727050781, 0.04346466064453125, 0.04496574401855469, 0.046466827392578125, 0.04796791076660156, 0.049468994140625]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 3.0, 9.0, 13.0, 67.0, 464.0, 427.0, 25.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.944953441619873, -2.8362271785736084, -2.727501153945923, -2.618774890899658, -2.5100488662719727, -2.401322603225708, -2.2925965785980225, -2.183870315551758, -2.0751442909240723, -1.9664181470870972, -1.857692003250122, -1.748965859413147, -1.6402397155761719, -1.5315134525299072, -1.4227874279022217, -1.314061164855957, -1.205335021018982, -1.0966088771820068, -0.9878827333450317, -0.8791565895080566, -0.7704304456710815, -0.6617042422294617, -0.5529780983924866, -0.4442519545555115, -0.3355258107185364, -0.22679966688156128, -0.11807350814342499, -0.009347349405288696, 0.0993787944316864, 0.2081049680709839, 0.316831111907959, 0.4255572557449341, 0.5342833995819092, 0.6430095434188843, 0.7517356872558594, 0.8604618310928345, 0.9691879749298096, 1.0779142379760742, 1.1866402626037598, 1.2953665256500244, 1.40409255027771, 1.512818694114685, 1.6215448379516602, 1.7302709817886353, 1.8389971256256104, 1.947723388671875, 2.0564494132995605, 2.165175676345825, 2.27390193939209, 2.3826282024383545, 2.49135422706604, 2.6000804901123047, 2.7088065147399902, 2.817532777786255, 2.9262588024139404, 3.034985065460205, 3.1437110900878906, 3.2524373531341553, 3.361163377761841, 3.4698896408081055, 3.578615665435791, 3.6873419284820557, 3.796067953109741, 3.904794216156006, 4.013520240783691]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 4.0, 9.0, 6.0, 6.0, 6.0, 6.0, 10.0, 12.0, 12.0, 26.0, 24.0, 19.0, 26.0, 33.0, 24.0, 21.0, 32.0, 32.0, 37.0, 51.0, 37.0, 49.0, 34.0, 44.0, 51.0, 42.0, 31.0, 34.0, 29.0, 35.0, 23.0, 33.0, 20.0, 26.0, 22.0, 14.0, 15.0, 13.0, 11.0, 5.0, 12.0, 8.0, 4.0, 4.0, 3.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6095308065414429, -0.592193603515625, -0.5748564004898071, -0.5575191974639893, -0.5401819944381714, -0.5228447914123535, -0.5055075883865356, -0.4881703555583954, -0.4708331525325775, -0.45349594950675964, -0.4361587464809418, -0.4188215434551239, -0.40148431062698364, -0.38414710760116577, -0.3668099045753479, -0.34947270154953003, -0.33213549852371216, -0.3147982954978943, -0.2974610924720764, -0.28012388944625854, -0.2627866864204407, -0.2454494684934616, -0.22811225056648254, -0.21077504754066467, -0.1934378445148468, -0.17610064148902893, -0.15876343846321106, -0.141426220536232, -0.12408901751041412, -0.10675181448459625, -0.08941460400819778, -0.07207739353179932, -0.054740190505981445, -0.037402983754873276, -0.020065777003765106, -0.0027285702526569366, 0.014608636498451233, 0.031945839524269104, 0.04928305000066757, 0.06662026047706604, 0.08395746350288391, 0.10129466652870178, 0.11863187700510025, 0.13596908748149872, 0.1533062905073166, 0.17064349353313446, 0.18798071146011353, 0.2053179144859314, 0.22265511751174927, 0.23999232053756714, 0.257329523563385, 0.2746667265892029, 0.29200392961502075, 0.3093411326408386, 0.3266783654689789, 0.34401556849479675, 0.3613527715206146, 0.3786899745464325, 0.39602717757225037, 0.41336438059806824, 0.4307016134262085, 0.44803881645202637, 0.46537601947784424, 0.4827132225036621, 0.50005042552948]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 19.0, 70.0, 344.0, 4192672.0, 975.0, 167.0, 33.0, 9.0, 3.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.00390625, -0.79583740234375, -0.5877685546875, -0.37969970703125, -0.171630859375, 0.03643798828125, 0.2445068359375, 0.45257568359375, 0.66064453125, 0.86871337890625, 1.0767822265625, 1.28485107421875, 1.492919921875, 1.70098876953125, 1.9090576171875, 2.11712646484375, 2.3251953125, 2.53326416015625, 2.7413330078125, 2.94940185546875, 3.157470703125, 3.36553955078125, 3.5736083984375, 3.78167724609375, 3.98974609375, 4.19781494140625, 4.4058837890625, 4.61395263671875, 4.822021484375, 5.03009033203125, 5.2381591796875, 5.44622802734375, 5.654296875, 5.86236572265625, 6.0704345703125, 6.27850341796875, 6.486572265625, 6.69464111328125, 6.9027099609375, 7.11077880859375, 7.31884765625, 7.52691650390625, 7.7349853515625, 7.94305419921875, 8.151123046875, 8.35919189453125, 8.5672607421875, 8.77532958984375, 8.9833984375, 9.19146728515625, 9.3995361328125, 9.60760498046875, 9.815673828125, 10.02374267578125, 10.2318115234375, 10.43988037109375, 10.64794921875, 10.85601806640625, 11.0640869140625, 11.27215576171875, 11.480224609375, 11.68829345703125, 11.8963623046875, 12.10443115234375, 12.3125]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 2.0, 5.0, 6.0, 9.0, 9.0, 9.0, 18.0, 11.0, 27.0, 23.0, 37.0, 41.0, 49.0, 59.0, 63.0, 63.0, 72.0, 62.0, 65.0, 52.0, 57.0, 48.0, 40.0, 31.0, 34.0, 27.0, 21.0, 15.0, 12.0, 7.0, 7.0, 5.0, 3.0, 3.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.049346923828125, -0.047707557678222656, -0.04606819152832031, -0.04442882537841797, -0.042789459228515625, -0.04115009307861328, -0.03951072692871094, -0.037871360778808594, -0.03623199462890625, -0.034592628479003906, -0.03295326232910156, -0.03131389617919922, -0.029674530029296875, -0.02803516387939453, -0.026395797729492188, -0.024756431579589844, -0.0231170654296875, -0.021477699279785156, -0.019838333129882812, -0.01819896697998047, -0.016559600830078125, -0.014920234680175781, -0.013280868530273438, -0.011641502380371094, -0.01000213623046875, -0.008362770080566406, -0.0067234039306640625, -0.005084037780761719, -0.003444671630859375, -0.0018053054809570312, -0.0001659393310546875, 0.0014734268188476562, 0.00311279296875, 0.004752159118652344, 0.0063915252685546875, 0.008030891418457031, 0.009670257568359375, 0.011309623718261719, 0.012948989868164062, 0.014588356018066406, 0.01622772216796875, 0.017867088317871094, 0.019506454467773438, 0.02114582061767578, 0.022785186767578125, 0.02442455291748047, 0.026063919067382812, 0.027703285217285156, 0.0293426513671875, 0.030982017517089844, 0.03262138366699219, 0.03426074981689453, 0.035900115966796875, 0.03753948211669922, 0.03917884826660156, 0.040818214416503906, 0.04245758056640625, 0.044096946716308594, 0.04573631286621094, 0.04737567901611328, 0.049015045166015625, 0.05065441131591797, 0.05229377746582031, 0.053933143615722656, 0.055572509765625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 5.0, 2.0, 7.0, 5.0, 10.0, 14.0, 15.0, 37.0, 116.0, 212.0, 577.0, 1977.0, 11927.0, 209122.0, 3910618.0, 52027.0, 5713.0, 1179.0, 373.0, 167.0, 84.0, 44.0, 18.0, 12.0, 10.0, 5.0, 4.0, 2.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1319580078125, -0.12674331665039062, -0.12152862548828125, -0.11631393432617188, -0.1110992431640625, -0.10588455200195312, -0.10066986083984375, -0.09545516967773438, -0.090240478515625, -0.08502578735351562, -0.07981109619140625, -0.07459640502929688, -0.0693817138671875, -0.06416702270507812, -0.05895233154296875, -0.053737640380859375, -0.04852294921875, -0.043308258056640625, -0.03809356689453125, -0.032878875732421875, -0.0276641845703125, -0.022449493408203125, -0.01723480224609375, -0.012020111083984375, -0.006805419921875, -0.001590728759765625, 0.00362396240234375, 0.008838653564453125, 0.0140533447265625, 0.019268035888671875, 0.02448272705078125, 0.029697418212890625, 0.034912109375, 0.040126800537109375, 0.04534149169921875, 0.050556182861328125, 0.0557708740234375, 0.060985565185546875, 0.06620025634765625, 0.07141494750976562, 0.076629638671875, 0.08184432983398438, 0.08705902099609375, 0.09227371215820312, 0.0974884033203125, 0.10270309448242188, 0.10791778564453125, 0.11313247680664062, 0.11834716796875, 0.12356185913085938, 0.12877655029296875, 0.13399124145507812, 0.1392059326171875, 0.14442062377929688, 0.14963531494140625, 0.15485000610351562, 0.160064697265625, 0.16527938842773438, 0.17049407958984375, 0.17570877075195312, 0.1809234619140625, 0.18613815307617188, 0.19135284423828125, 0.19656753540039062, 0.2017822265625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 3.0, 8.0, 9.0, 12.0, 12.0, 24.0, 34.0, 76.0, 202.0, 564.0, 1493.0, 1007.0, 345.0, 121.0, 62.0, 39.0, 16.0, 12.0, 14.0, 10.0, 6.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0833740234375, -0.07953643798828125, -0.0756988525390625, -0.07186126708984375, -0.068023681640625, -0.06418609619140625, -0.0603485107421875, -0.05651092529296875, -0.05267333984375, -0.04883575439453125, -0.0449981689453125, -0.04116058349609375, -0.037322998046875, -0.03348541259765625, -0.0296478271484375, -0.02581024169921875, -0.02197265625, -0.01813507080078125, -0.0142974853515625, -0.01045989990234375, -0.006622314453125, -0.00278472900390625, 0.0010528564453125, 0.00489044189453125, 0.00872802734375, 0.01256561279296875, 0.0164031982421875, 0.02024078369140625, 0.024078369140625, 0.02791595458984375, 0.0317535400390625, 0.03559112548828125, 0.0394287109375, 0.04326629638671875, 0.0471038818359375, 0.05094146728515625, 0.054779052734375, 0.05861663818359375, 0.0624542236328125, 0.06629180908203125, 0.07012939453125, 0.07396697998046875, 0.0778045654296875, 0.08164215087890625, 0.085479736328125, 0.08931732177734375, 0.0931549072265625, 0.09699249267578125, 0.100830078125, 0.10466766357421875, 0.1085052490234375, 0.11234283447265625, 0.116180419921875, 0.12001800537109375, 0.1238555908203125, 0.12769317626953125, 0.13153076171875, 0.13536834716796875, 0.1392059326171875, 0.14304351806640625, 0.146881103515625, 0.15071868896484375, 0.1545562744140625, 0.15839385986328125, 0.1622314453125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 4.0, 5.0, 12.0, 23.0, 101.0, 302.0, 405.0, 127.0, 23.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.4253435134887695, -3.362220048904419, -3.2990965843200684, -3.2359731197357178, -3.172849655151367, -3.1097264289855957, -3.046602964401245, -2.9834794998168945, -2.920356035232544, -2.8572325706481934, -2.7941091060638428, -2.730985641479492, -2.6678624153137207, -2.60473895072937, -2.5416154861450195, -2.478492021560669, -2.4153685569763184, -2.3522450923919678, -2.289121627807617, -2.2259981632232666, -2.162874698638916, -2.0997514724731445, -2.036628007888794, -1.9735045433044434, -1.9103810787200928, -1.8472576141357422, -1.7841341495513916, -1.7210108041763306, -1.65788733959198, -1.5947638750076294, -1.5316405296325684, -1.4685170650482178, -1.4053937196731567, -1.3422702550888062, -1.2791469097137451, -1.2160234451293945, -1.152899980545044, -1.0897765159606934, -1.0266530513763428, -0.9635297060012817, -0.9004062414169312, -0.8372827768325806, -0.7741593718528748, -0.711035966873169, -0.6479125022888184, -0.5847890377044678, -0.521665632724762, -0.45854219794273376, -0.39541876316070557, -0.33229532837867737, -0.26917189359664917, -0.20604845881462097, -0.14292502403259277, -0.07980158925056458, -0.016678154468536377, 0.04644528031349182, 0.10956871509552002, 0.17269214987754822, 0.23581558465957642, 0.2989390194416046, 0.3620624542236328, 0.425185889005661, 0.4883093237876892, 0.551432728767395, 0.6145561933517456]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 10.0, 6.0, 10.0, 12.0, 15.0, 30.0, 27.0, 38.0, 62.0, 70.0, 81.0, 81.0, 87.0, 92.0, 69.0, 70.0, 47.0, 43.0, 39.0, 34.0, 16.0, 15.0, 15.0, 9.0, 9.0, 3.0, 1.0, 6.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6648352742195129, -0.6417621970176697, -0.6186891794204712, -0.5956161022186279, -0.5725430846214294, -0.5494700074195862, -0.5263969898223877, -0.5033239126205444, -0.48025086522102356, -0.4571778178215027, -0.4341047704219818, -0.41103172302246094, -0.3879586458206177, -0.3648856282234192, -0.3418125510215759, -0.31873950362205505, -0.2956664562225342, -0.2725934088230133, -0.24952036142349243, -0.22644729912281036, -0.2033742517232895, -0.18030120432376862, -0.15722814202308655, -0.13415509462356567, -0.1110820472240448, -0.08800899982452393, -0.06493594497442245, -0.041862890124320984, -0.01878984272480011, 0.004283204674720764, 0.027356266975402832, 0.050429314374923706, 0.0735023021697998, 0.09657534956932068, 0.11964840441942215, 0.14272145926952362, 0.1657945066690445, 0.18886755406856537, 0.21194061636924744, 0.2350136637687683, 0.2580867111682892, 0.28115975856781006, 0.30423280596733093, 0.3273058533668518, 0.35037893056869507, 0.37345194816589355, 0.3965250253677368, 0.4195980727672577, 0.44267112016677856, 0.46574416756629944, 0.4888172149658203, 0.5118902921676636, 0.5349633097648621, 0.5580363869667053, 0.5811094045639038, 0.6041824817657471, 0.6272555589675903, 0.6503286361694336, 0.6734016537666321, 0.6964747309684753, 0.7195477485656738, 0.7426208257675171, 0.7656939029693604, 0.7887669205665588, 0.8118399381637573]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 2.0, 6.0, 12.0, 10.0, 38.0, 130.0, 466.0, 2491.0, 187528.0, 852295.0, 4594.0, 659.0, 179.0, 80.0, 19.0, 13.0, 4.0, 3.0, 5.0, 3.0, 5.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.51416015625, -0.49448394775390625, -0.4748077392578125, -0.45513153076171875, -0.435455322265625, -0.41577911376953125, -0.3961029052734375, -0.37642669677734375, -0.35675048828125, -0.33707427978515625, -0.3173980712890625, -0.29772186279296875, -0.278045654296875, -0.25836944580078125, -0.2386932373046875, -0.21901702880859375, -0.1993408203125, -0.17966461181640625, -0.1599884033203125, -0.14031219482421875, -0.120635986328125, -0.10095977783203125, -0.0812835693359375, -0.06160736083984375, -0.04193115234375, -0.02225494384765625, -0.0025787353515625, 0.01709747314453125, 0.036773681640625, 0.05644989013671875, 0.0761260986328125, 0.09580230712890625, 0.115478515625, 0.13515472412109375, 0.1548309326171875, 0.17450714111328125, 0.194183349609375, 0.21385955810546875, 0.2335357666015625, 0.25321197509765625, 0.27288818359375, 0.29256439208984375, 0.3122406005859375, 0.33191680908203125, 0.351593017578125, 0.37126922607421875, 0.3909454345703125, 0.41062164306640625, 0.4302978515625, 0.44997406005859375, 0.4696502685546875, 0.48932647705078125, 0.509002685546875, 0.5286788940429688, 0.5483551025390625, 0.5680313110351562, 0.58770751953125, 0.6073837280273438, 0.6270599365234375, 0.6467361450195312, 0.666412353515625, 0.6860885620117188, 0.7057647705078125, 0.7254409790039062, 0.7451171875]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 5.0, 3.0, 3.0, 14.0, 9.0, 11.0, 20.0, 31.0, 30.0, 36.0, 31.0, 52.0, 54.0, 68.0, 61.0, 62.0, 73.0, 62.0, 49.0, 51.0, 62.0, 53.0, 33.0, 27.0, 16.0, 23.0, 13.0, 8.0, 6.0, 7.0, 4.0, 6.0, 5.0, 4.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.05694580078125, -0.055173397064208984, -0.05340099334716797, -0.05162858963012695, -0.04985618591308594, -0.04808378219604492, -0.046311378479003906, -0.04453897476196289, -0.042766571044921875, -0.04099416732788086, -0.039221763610839844, -0.03744935989379883, -0.03567695617675781, -0.0339045524597168, -0.03213214874267578, -0.030359745025634766, -0.02858734130859375, -0.026814937591552734, -0.02504253387451172, -0.023270130157470703, -0.021497726440429688, -0.019725322723388672, -0.017952919006347656, -0.01618051528930664, -0.014408111572265625, -0.01263570785522461, -0.010863304138183594, -0.009090900421142578, -0.0073184967041015625, -0.005546092987060547, -0.0037736892700195312, -0.0020012855529785156, -0.0002288818359375, 0.0015435218811035156, 0.0033159255981445312, 0.005088329315185547, 0.0068607330322265625, 0.008633136749267578, 0.010405540466308594, 0.01217794418334961, 0.013950347900390625, 0.01572275161743164, 0.017495155334472656, 0.019267559051513672, 0.021039962768554688, 0.022812366485595703, 0.02458477020263672, 0.026357173919677734, 0.02812957763671875, 0.029901981353759766, 0.03167438507080078, 0.0334467887878418, 0.03521919250488281, 0.03699159622192383, 0.038763999938964844, 0.04053640365600586, 0.042308807373046875, 0.04408121109008789, 0.045853614807128906, 0.04762601852416992, 0.04939842224121094, 0.05117082595825195, 0.05294322967529297, 0.054715633392333984, 0.056488037109375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 4.0, 7.0, 16.0, 14.0, 21.0, 30.0, 40.0, 106.0, 201.0, 447.0, 1204.0, 4245.0, 45388.0, 936242.0, 53861.0, 4503.0, 1305.0, 486.0, 198.0, 92.0, 48.0, 30.0, 15.0, 11.0, 10.0, 7.0, 4.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3076171875, -0.29753875732421875, -0.2874603271484375, -0.27738189697265625, -0.267303466796875, -0.25722503662109375, -0.2471466064453125, -0.23706817626953125, -0.22698974609375, -0.21691131591796875, -0.2068328857421875, -0.19675445556640625, -0.186676025390625, -0.17659759521484375, -0.1665191650390625, -0.15644073486328125, -0.1463623046875, -0.13628387451171875, -0.1262054443359375, -0.11612701416015625, -0.106048583984375, -0.09597015380859375, -0.0858917236328125, -0.07581329345703125, -0.06573486328125, -0.05565643310546875, -0.0455780029296875, -0.03549957275390625, -0.025421142578125, -0.01534271240234375, -0.0052642822265625, 0.00481414794921875, 0.014892578125, 0.02497100830078125, 0.0350494384765625, 0.04512786865234375, 0.055206298828125, 0.06528472900390625, 0.0753631591796875, 0.08544158935546875, 0.09552001953125, 0.10559844970703125, 0.1156768798828125, 0.12575531005859375, 0.135833740234375, 0.14591217041015625, 0.1559906005859375, 0.16606903076171875, 0.1761474609375, 0.18622589111328125, 0.1963043212890625, 0.20638275146484375, 0.216461181640625, 0.22653961181640625, 0.2366180419921875, 0.24669647216796875, 0.25677490234375, 0.26685333251953125, 0.2769317626953125, 0.28701019287109375, 0.297088623046875, 0.30716705322265625, 0.3172454833984375, 0.32732391357421875, 0.33740234375]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 7.0, 4.0, 6.0, 8.0, 10.0, 13.0, 22.0, 29.0, 28.0, 28.0, 37.0, 45.0, 46.0, 64.0, 51.0, 68.0, 84.0, 59.0, 61.0, 53.0, 41.0, 53.0, 48.0, 21.0, 24.0, 20.0, 15.0, 13.0, 12.0, 10.0, 5.0, 8.0, 6.0, 4.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2242431640625, -0.2177257537841797, -0.21120834350585938, -0.20469093322753906, -0.19817352294921875, -0.19165611267089844, -0.18513870239257812, -0.1786212921142578, -0.1721038818359375, -0.1655864715576172, -0.15906906127929688, -0.15255165100097656, -0.14603424072265625, -0.13951683044433594, -0.13299942016601562, -0.1264820098876953, -0.119964599609375, -0.11344718933105469, -0.10692977905273438, -0.10041236877441406, -0.09389495849609375, -0.08737754821777344, -0.08086013793945312, -0.07434272766113281, -0.0678253173828125, -0.06130790710449219, -0.054790496826171875, -0.04827308654785156, -0.04175567626953125, -0.03523826599121094, -0.028720855712890625, -0.022203445434570312, -0.01568603515625, -0.009168624877929688, -0.002651214599609375, 0.0038661956787109375, 0.01038360595703125, 0.016901016235351562, 0.023418426513671875, 0.029935836791992188, 0.0364532470703125, 0.04297065734863281, 0.049488067626953125, 0.05600547790527344, 0.06252288818359375, 0.06904029846191406, 0.07555770874023438, 0.08207511901855469, 0.088592529296875, 0.09510993957519531, 0.10162734985351562, 0.10814476013183594, 0.11466217041015625, 0.12117958068847656, 0.12769699096679688, 0.1342144012451172, 0.1407318115234375, 0.1472492218017578, 0.15376663208007812, 0.16028404235839844, 0.16680145263671875, 0.17331886291503906, 0.17983627319335938, 0.1863536834716797, 0.19287109375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 8.0, 7.0, 4.0, 6.0, 15.0, 9.0, 19.0, 47.0, 62.0, 103.0, 226.0, 387.0, 915.0, 2630.0, 10563.0, 684243.0, 335669.0, 9459.0, 2431.0, 852.0, 413.0, 194.0, 103.0, 64.0, 41.0, 25.0, 12.0, 15.0, 15.0, 5.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.307861328125, -0.298797607421875, -0.28973388671875, -0.280670166015625, -0.2716064453125, -0.262542724609375, -0.25347900390625, -0.244415283203125, -0.2353515625, -0.226287841796875, -0.21722412109375, -0.208160400390625, -0.1990966796875, -0.190032958984375, -0.18096923828125, -0.171905517578125, -0.162841796875, -0.153778076171875, -0.14471435546875, -0.135650634765625, -0.1265869140625, -0.117523193359375, -0.10845947265625, -0.099395751953125, -0.09033203125, -0.081268310546875, -0.07220458984375, -0.063140869140625, -0.0540771484375, -0.045013427734375, -0.03594970703125, -0.026885986328125, -0.017822265625, -0.008758544921875, 0.00030517578125, 0.009368896484375, 0.0184326171875, 0.027496337890625, 0.03656005859375, 0.045623779296875, 0.0546875, 0.063751220703125, 0.07281494140625, 0.081878662109375, 0.0909423828125, 0.100006103515625, 0.10906982421875, 0.118133544921875, 0.127197265625, 0.136260986328125, 0.14532470703125, 0.154388427734375, 0.1634521484375, 0.172515869140625, 0.18157958984375, 0.190643310546875, 0.19970703125, 0.208770751953125, 0.21783447265625, 0.226898193359375, 0.2359619140625, 0.245025634765625, 0.25408935546875, 0.263153076171875, 0.272216796875]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 3.0, 4.0, 5.0, 5.0, 6.0, 22.0, 57.0, 284.0, 445.0, 110.0, 31.0, 12.0, 4.0, 8.0, 0.0, 2.0, 4.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.860494613647461e-05, -6.588175892829895e-05, -6.315857172012329e-05, -6.043538451194763e-05, -5.771219730377197e-05, -5.4989010095596313e-05, -5.2265822887420654e-05, -4.9542635679244995e-05, -4.6819448471069336e-05, -4.409626126289368e-05, -4.137307405471802e-05, -3.864988684654236e-05, -3.59266996383667e-05, -3.320351243019104e-05, -3.048032522201538e-05, -2.775713801383972e-05, -2.5033950805664062e-05, -2.2310763597488403e-05, -1.9587576389312744e-05, -1.6864389181137085e-05, -1.4141201972961426e-05, -1.1418014764785767e-05, -8.694827556610107e-06, -5.971640348434448e-06, -3.248453140258789e-06, -5.252659320831299e-07, 2.1979212760925293e-06, 4.9211084842681885e-06, 7.644295692443848e-06, 1.0367482900619507e-05, 1.3090670108795166e-05, 1.5813857316970825e-05, 1.8537044525146484e-05, 2.1260231733322144e-05, 2.3983418941497803e-05, 2.6706606149673462e-05, 2.942979335784912e-05, 3.215298056602478e-05, 3.487616777420044e-05, 3.75993549823761e-05, 4.032254219055176e-05, 4.304572939872742e-05, 4.5768916606903076e-05, 4.8492103815078735e-05, 5.1215291023254395e-05, 5.3938478231430054e-05, 5.666166543960571e-05, 5.938485264778137e-05, 6.210803985595703e-05, 6.483122706413269e-05, 6.755441427230835e-05, 7.027760148048401e-05, 7.300078868865967e-05, 7.572397589683533e-05, 7.844716310501099e-05, 8.117035031318665e-05, 8.38935375213623e-05, 8.661672472953796e-05, 8.933991193771362e-05, 9.206309914588928e-05, 9.478628635406494e-05, 9.75094735622406e-05, 0.00010023266077041626, 0.00010295584797859192, 0.00010567903518676758]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 1.0, 2.0, 2.0, 2.0, 7.0, 8.0, 17.0, 13.0, 24.0, 32.0, 33.0, 69.0, 114.0, 280.0, 679.0, 2211.0, 11949.0, 781305.0, 240581.0, 8399.0, 1768.0, 548.0, 209.0, 114.0, 59.0, 46.0, 23.0, 22.0, 12.0, 8.0, 7.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2437744140625, -0.2365856170654297, -0.22939682006835938, -0.22220802307128906, -0.21501922607421875, -0.20783042907714844, -0.20064163208007812, -0.1934528350830078, -0.1862640380859375, -0.1790752410888672, -0.17188644409179688, -0.16469764709472656, -0.15750885009765625, -0.15032005310058594, -0.14313125610351562, -0.1359424591064453, -0.128753662109375, -0.12156486511230469, -0.11437606811523438, -0.10718727111816406, -0.09999847412109375, -0.09280967712402344, -0.08562088012695312, -0.07843208312988281, -0.0712432861328125, -0.06405448913574219, -0.056865692138671875, -0.04967689514160156, -0.04248809814453125, -0.03529930114746094, -0.028110504150390625, -0.020921707153320312, -0.01373291015625, -0.0065441131591796875, 0.000644683837890625, 0.007833480834960938, 0.01502227783203125, 0.022211074829101562, 0.029399871826171875, 0.03658866882324219, 0.0437774658203125, 0.05096626281738281, 0.058155059814453125, 0.06534385681152344, 0.07253265380859375, 0.07972145080566406, 0.08691024780273438, 0.09409904479980469, 0.101287841796875, 0.10847663879394531, 0.11566543579101562, 0.12285423278808594, 0.13004302978515625, 0.13723182678222656, 0.14442062377929688, 0.1516094207763672, 0.1587982177734375, 0.1659870147705078, 0.17317581176757812, 0.18036460876464844, 0.18755340576171875, 0.19474220275878906, 0.20193099975585938, 0.2091197967529297, 0.21630859375]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 1.0, 8.0, 6.0, 2.0, 10.0, 9.0, 13.0, 17.0, 15.0, 27.0, 78.0, 140.0, 167.0, 173.0, 132.0, 77.0, 36.0, 29.0, 15.0, 10.0, 3.0, 12.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.16357421875, -0.1593770980834961, -0.1551799774169922, -0.15098285675048828, -0.14678573608398438, -0.14258861541748047, -0.13839149475097656, -0.13419437408447266, -0.12999725341796875, -0.12580013275146484, -0.12160301208496094, -0.11740589141845703, -0.11320877075195312, -0.10901165008544922, -0.10481452941894531, -0.1006174087524414, -0.0964202880859375, -0.0922231674194336, -0.08802604675292969, -0.08382892608642578, -0.07963180541992188, -0.07543468475341797, -0.07123756408691406, -0.06704044342041016, -0.06284332275390625, -0.058646202087402344, -0.05444908142089844, -0.05025196075439453, -0.046054840087890625, -0.04185771942138672, -0.03766059875488281, -0.033463478088378906, -0.029266357421875, -0.025069236755371094, -0.020872116088867188, -0.01667499542236328, -0.012477874755859375, -0.008280754089355469, -0.0040836334228515625, 0.00011348724365234375, 0.00431060791015625, 0.008507728576660156, 0.012704849243164062, 0.01690196990966797, 0.021099090576171875, 0.02529621124267578, 0.029493331909179688, 0.033690452575683594, 0.0378875732421875, 0.042084693908691406, 0.04628181457519531, 0.05047893524169922, 0.054676055908203125, 0.05887317657470703, 0.06307029724121094, 0.06726741790771484, 0.07146453857421875, 0.07566165924072266, 0.07985877990722656, 0.08405590057373047, 0.08825302124023438, 0.09245014190673828, 0.09664726257324219, 0.1008443832397461, 0.10504150390625]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 8.0, 60.0, 441.0, 323.0, 91.0, 38.0, 21.0, 15.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.546508550643921, -1.3895516395568848, -1.2325947284698486, -1.0756378173828125, -0.9186809659004211, -0.761724054813385, -0.6047672033309937, -0.4478102922439575, -0.2908533811569214, -0.13389648497104645, 0.02306041121482849, 0.18001729249954224, 0.33697420358657837, 0.4939311146736145, 0.6508879661560059, 0.807844877243042, 0.9648017883300781, 1.1217586994171143, 1.2787156105041504, 1.4356725215911865, 1.5926294326782227, 1.7495863437652588, 1.9065431356430054, 2.063499927520752, 2.220457077026367, 2.3774139881134033, 2.5343708992004395, 2.6913278102874756, 2.8482847213745117, 3.005241632461548, 3.162198543548584, 3.319155216217041, 3.476111888885498, 3.633068799972534, 3.7900257110595703, 3.9469826221466064, 4.103939533233643, 4.2608962059021, 4.417853355407715, 4.574810028076172, 4.731767177581787, 4.888723850250244, 5.045680999755859, 5.202637672424316, 5.359594821929932, 5.516551494598389, 5.673508644104004, 5.830465316772461, 5.987421989440918, 6.144378662109375, 6.30133581161499, 6.458292484283447, 6.6152496337890625, 6.7722063064575195, 6.929163455963135, 7.086120128631592, 7.243077278137207, 7.400033950805664, 7.556991100311279, 7.713947772979736, 7.870904922485352, 8.027861595153809, 8.184818267822266, 8.341775894165039, 8.498732566833496]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 6.0, 5.0, 4.0, 10.0, 13.0, 12.0, 15.0, 14.0, 17.0, 24.0, 30.0, 30.0, 26.0, 38.0, 32.0, 40.0, 36.0, 56.0, 58.0, 72.0, 63.0, 49.0, 46.0, 54.0, 30.0, 27.0, 28.0, 29.0, 25.0, 16.0, 22.0, 13.0, 13.0, 11.0, 5.0, 9.0, 7.0, 5.0, 5.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-1.0033349990844727, -0.9756072759628296, -0.9478794932365417, -0.9201517701148987, -0.8924240469932556, -0.8646962642669678, -0.8369685411453247, -0.8092408180236816, -0.7815130949020386, -0.7537853717803955, -0.7260575890541077, -0.6983298659324646, -0.6706021428108215, -0.6428743600845337, -0.6151466369628906, -0.5874189138412476, -0.5596911311149597, -0.5319634079933167, -0.5042356252670288, -0.47650790214538574, -0.4487801790237427, -0.4210524260997772, -0.39332467317581177, -0.3655969500541687, -0.33786919713020325, -0.3101414442062378, -0.2824137210845947, -0.2546859681606293, -0.226958230137825, -0.19923049211502075, -0.1715027391910553, -0.14377500116825104, -0.11604732275009155, -0.08831958472728729, -0.060591839253902435, -0.03286409378051758, -0.005136355757713318, 0.022591382265090942, 0.050319135189056396, 0.07804687321186066, 0.10577461123466492, 0.13350234925746918, 0.16123008728027344, 0.1889578402042389, 0.21668557822704315, 0.2444133162498474, 0.27214106917381287, 0.2998688220977783, 0.3275965452194214, 0.35532429814338684, 0.3830520212650299, 0.41077977418899536, 0.4385074973106384, 0.4662352502346039, 0.49396300315856934, 0.5216907262802124, 0.5494184494018555, 0.5771461725234985, 0.6048739552497864, 0.6326016783714294, 0.6603294014930725, 0.6880571842193604, 0.7157849073410034, 0.7435126304626465, 0.7712404131889343]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 7.0, 8.0, 19.0, 66.0, 187.0, 2128.0, 4190329.0, 1276.0, 168.0, 54.0, 37.0, 7.0, 7.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44287109375, -0.40727996826171875, -0.3716888427734375, -0.33609771728515625, -0.300506591796875, -0.26491546630859375, -0.2293243408203125, -0.19373321533203125, -0.15814208984375, -0.12255096435546875, -0.0869598388671875, -0.05136871337890625, -0.015777587890625, 0.01981353759765625, 0.0554046630859375, 0.09099578857421875, 0.1265869140625, 0.16217803955078125, 0.1977691650390625, 0.23336029052734375, 0.268951416015625, 0.30454254150390625, 0.3401336669921875, 0.37572479248046875, 0.41131591796875, 0.44690704345703125, 0.4824981689453125, 0.5180892944335938, 0.553680419921875, 0.5892715454101562, 0.6248626708984375, 0.6604537963867188, 0.696044921875, 0.7316360473632812, 0.7672271728515625, 0.8028182983398438, 0.838409423828125, 0.8740005493164062, 0.9095916748046875, 0.9451828002929688, 0.98077392578125, 1.0163650512695312, 1.0519561767578125, 1.0875473022460938, 1.123138427734375, 1.1587295532226562, 1.1943206787109375, 1.2299118041992188, 1.2655029296875, 1.3010940551757812, 1.3366851806640625, 1.3722763061523438, 1.407867431640625, 1.4434585571289062, 1.4790496826171875, 1.5146408081054688, 1.55023193359375, 1.5858230590820312, 1.6214141845703125, 1.6570053100585938, 1.692596435546875, 1.7281875610351562, 1.7637786865234375, 1.7993698120117188, 1.8349609375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 1.0, 5.0, 12.0, 9.0, 9.0, 12.0, 17.0, 20.0, 19.0, 34.0, 38.0, 35.0, 41.0, 62.0, 58.0, 62.0, 64.0, 57.0, 64.0, 63.0, 49.0, 61.0, 46.0, 37.0, 18.0, 24.0, 18.0, 13.0, 12.0, 11.0, 8.0, 2.0, 4.0, 3.0, 3.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0447998046875, -0.04319572448730469, -0.041591644287109375, -0.03998756408691406, -0.03838348388671875, -0.03677940368652344, -0.035175323486328125, -0.03357124328613281, -0.0319671630859375, -0.030363082885742188, -0.028759002685546875, -0.027154922485351562, -0.02555084228515625, -0.023946762084960938, -0.022342681884765625, -0.020738601684570312, -0.019134521484375, -0.017530441284179688, -0.015926361083984375, -0.014322280883789062, -0.01271820068359375, -0.011114120483398438, -0.009510040283203125, -0.007905960083007812, -0.0063018798828125, -0.0046977996826171875, -0.003093719482421875, -0.0014896392822265625, 0.00011444091796875, 0.0017185211181640625, 0.003322601318359375, 0.0049266815185546875, 0.00653076171875, 0.008134841918945312, 0.009738922119140625, 0.011343002319335938, 0.01294708251953125, 0.014551162719726562, 0.016155242919921875, 0.017759323120117188, 0.0193634033203125, 0.020967483520507812, 0.022571563720703125, 0.024175643920898438, 0.02577972412109375, 0.027383804321289062, 0.028987884521484375, 0.030591964721679688, 0.032196044921875, 0.03380012512207031, 0.035404205322265625, 0.03700828552246094, 0.03861236572265625, 0.04021644592285156, 0.041820526123046875, 0.04342460632324219, 0.0450286865234375, 0.04663276672363281, 0.048236846923828125, 0.04984092712402344, 0.05144500732421875, 0.05304908752441406, 0.054653167724609375, 0.05625724792480469, 0.057861328125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 8.0, 10.0, 18.0, 23.0, 23.0, 46.0, 53.0, 80.0, 144.0, 414.0, 1723.0, 226477.0, 3962280.0, 2418.0, 322.0, 111.0, 60.0, 29.0, 16.0, 15.0, 7.0, 5.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.41748046875, -0.39942169189453125, -0.3813629150390625, -0.36330413818359375, -0.345245361328125, -0.32718658447265625, -0.3091278076171875, -0.29106903076171875, -0.27301025390625, -0.25495147705078125, -0.2368927001953125, -0.21883392333984375, -0.200775146484375, -0.18271636962890625, -0.1646575927734375, -0.14659881591796875, -0.1285400390625, -0.11048126220703125, -0.0924224853515625, -0.07436370849609375, -0.056304931640625, -0.03824615478515625, -0.0201873779296875, -0.00212860107421875, 0.01593017578125, 0.03398895263671875, 0.0520477294921875, 0.07010650634765625, 0.088165283203125, 0.10622406005859375, 0.1242828369140625, 0.14234161376953125, 0.160400390625, 0.17845916748046875, 0.1965179443359375, 0.21457672119140625, 0.232635498046875, 0.25069427490234375, 0.2687530517578125, 0.28681182861328125, 0.30487060546875, 0.32292938232421875, 0.3409881591796875, 0.35904693603515625, 0.377105712890625, 0.39516448974609375, 0.4132232666015625, 0.43128204345703125, 0.4493408203125, 0.46739959716796875, 0.4854583740234375, 0.5035171508789062, 0.521575927734375, 0.5396347045898438, 0.5576934814453125, 0.5757522583007812, 0.59381103515625, 0.6118698120117188, 0.6299285888671875, 0.6479873657226562, 0.666046142578125, 0.6841049194335938, 0.7021636962890625, 0.7202224731445312, 0.73828125]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 10.0, 7.0, 21.0, 35.0, 113.0, 408.0, 2069.0, 1069.0, 205.0, 77.0, 32.0, 21.0, 8.0, 2.0, 3.0, 2.0, 1.0], "bins": [-0.49755859375, -0.48830509185791016, -0.4790515899658203, -0.46979808807373047, -0.4605445861816406, -0.4512910842895508, -0.44203758239746094, -0.4327840805053711, -0.42353057861328125, -0.4142770767211914, -0.40502357482910156, -0.3957700729370117, -0.3865165710449219, -0.37726306915283203, -0.3680095672607422, -0.35875606536865234, -0.3495025634765625, -0.34024906158447266, -0.3309955596923828, -0.32174205780029297, -0.3124885559082031, -0.3032350540161133, -0.29398155212402344, -0.2847280502319336, -0.27547454833984375, -0.2662210464477539, -0.25696754455566406, -0.24771404266357422, -0.23846054077148438, -0.22920703887939453, -0.2199535369873047, -0.21070003509521484, -0.201446533203125, -0.19219303131103516, -0.1829395294189453, -0.17368602752685547, -0.16443252563476562, -0.15517902374267578, -0.14592552185058594, -0.1366720199584961, -0.12741851806640625, -0.1181650161743164, -0.10891151428222656, -0.09965801239013672, -0.09040451049804688, -0.08115100860595703, -0.07189750671386719, -0.06264400482177734, -0.0533905029296875, -0.044137001037597656, -0.03488349914550781, -0.02562999725341797, -0.016376495361328125, -0.007122993469238281, 0.0021305084228515625, 0.011384010314941406, 0.02063751220703125, 0.029891014099121094, 0.03914451599121094, 0.04839801788330078, 0.057651519775390625, 0.06690502166748047, 0.07615852355957031, 0.08541202545166016, 0.09466552734375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 4.0, 4.0, 5.0, 2.0, 8.0, 7.0, 12.0, 11.0, 20.0, 22.0, 33.0, 42.0, 69.0, 95.0, 122.0, 189.0, 138.0, 98.0, 44.0, 25.0, 20.0, 15.0, 10.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-2.2066240310668945, -2.1593518257141113, -2.1120798587799072, -2.064807653427124, -2.01753568649292, -1.9702634811401367, -1.922991394996643, -1.8757193088531494, -1.8284471035003662, -1.7811750173568726, -1.733902931213379, -1.6866307258605957, -1.639358639717102, -1.5920865535736084, -1.5448144674301147, -1.497542381286621, -1.450270175933838, -1.4029980897903442, -1.3557260036468506, -1.3084537982940674, -1.2611817121505737, -1.21390962600708, -1.1666375398635864, -1.1193654537200928, -1.0720933675765991, -1.0248212814331055, -0.977549135684967, -0.9302770495414734, -0.883004903793335, -0.8357328176498413, -0.7884607315063477, -0.7411885857582092, -0.693916380405426, -0.6466442942619324, -0.599372148513794, -0.5521000623703003, -0.5048279166221619, -0.4575558304786682, -0.4102837145328522, -0.36301159858703613, -0.3157394826412201, -0.26846736669540405, -0.221195250749588, -0.17392314970493317, -0.12665103375911713, -0.07937891781330109, -0.03210681676864624, 0.0151652991771698, 0.06243741512298584, 0.10970953106880188, 0.15698164701461792, 0.20425374805927277, 0.25152587890625, 0.29879796504974365, 0.3460700809955597, 0.39334219694137573, 0.4406143128871918, 0.4878864288330078, 0.5351585149765015, 0.5824306607246399, 0.6297027468681335, 0.676974892616272, 0.7242469787597656, 0.7715190649032593, 0.8187912106513977]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 10.0, 3.0, 5.0, 4.0, 3.0, 8.0, 12.0, 14.0, 25.0, 27.0, 28.0, 24.0, 35.0, 27.0, 38.0, 45.0, 41.0, 38.0, 46.0, 54.0, 50.0, 43.0, 43.0, 50.0, 41.0, 35.0, 35.0, 35.0, 30.0, 20.0, 20.0, 16.0, 25.0, 8.0, 11.0, 9.0, 7.0, 9.0, 8.0, 3.0, 3.0, 6.0, 4.0, 4.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.8549874424934387, -0.8260473012924194, -0.7971072196960449, -0.7681670784950256, -0.7392269968986511, -0.7102868556976318, -0.6813467741012573, -0.652406632900238, -0.6234664916992188, -0.5945263504981995, -0.565586268901825, -0.5366461277008057, -0.5077060461044312, -0.47876590490341187, -0.44982579350471497, -0.42088568210601807, -0.39194560050964355, -0.36300548911094666, -0.33406537771224976, -0.30512523651123047, -0.27618515491485596, -0.24724502861499786, -0.21830490231513977, -0.18936479091644287, -0.16042467951774597, -0.13148456811904907, -0.10254444926977158, -0.07360433042049408, -0.04466421902179718, -0.01572410762310028, 0.013216018676757812, 0.04215613007545471, 0.07109618186950684, 0.10003629326820374, 0.12897640466690063, 0.15791653096675873, 0.18685664236545563, 0.21579675376415253, 0.24473688006401062, 0.2736769914627075, 0.3026171028614044, 0.3315572142601013, 0.3604973256587982, 0.3894374370574951, 0.4183775782585144, 0.4473176598548889, 0.4762578010559082, 0.5051978826522827, 0.534138023853302, 0.5630781650543213, 0.5920182466506958, 0.6209583878517151, 0.6498984694480896, 0.6788386106491089, 0.7077786922454834, 0.7367188334465027, 0.765658974647522, 0.7945991158485413, 0.8235391974449158, 0.8524793386459351, 0.8814194202423096, 0.9103595614433289, 0.9392997026443481, 0.9682397842407227, 0.9971798658370972]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 7.0, 4.0, 10.0, 14.0, 21.0, 34.0, 72.0, 127.0, 380.0, 1185.0, 4292.0, 19141.0, 111617.0, 548642.0, 303483.0, 46592.0, 9443.0, 2401.0, 650.0, 219.0, 95.0, 43.0, 27.0, 11.0, 14.0, 6.0, 4.0, 8.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.190185546875, -0.1845531463623047, -0.17892074584960938, -0.17328834533691406, -0.16765594482421875, -0.16202354431152344, -0.15639114379882812, -0.1507587432861328, -0.1451263427734375, -0.1394939422607422, -0.13386154174804688, -0.12822914123535156, -0.12259674072265625, -0.11696434020996094, -0.11133193969726562, -0.10569953918457031, -0.100067138671875, -0.09443473815917969, -0.08880233764648438, -0.08316993713378906, -0.07753753662109375, -0.07190513610839844, -0.06627273559570312, -0.06064033508300781, -0.0550079345703125, -0.04937553405761719, -0.043743133544921875, -0.03811073303222656, -0.03247833251953125, -0.026845932006835938, -0.021213531494140625, -0.015581130981445312, -0.00994873046875, -0.0043163299560546875, 0.001316070556640625, 0.0069484710693359375, 0.01258087158203125, 0.018213272094726562, 0.023845672607421875, 0.029478073120117188, 0.0351104736328125, 0.04074287414550781, 0.046375274658203125, 0.05200767517089844, 0.05764007568359375, 0.06327247619628906, 0.06890487670898438, 0.07453727722167969, 0.080169677734375, 0.08580207824707031, 0.09143447875976562, 0.09706687927246094, 0.10269927978515625, 0.10833168029785156, 0.11396408081054688, 0.11959648132324219, 0.1252288818359375, 0.1308612823486328, 0.13649368286132812, 0.14212608337402344, 0.14775848388671875, 0.15339088439941406, 0.15902328491210938, 0.1646556854248047, 0.1702880859375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 7.0, 5.0, 6.0, 9.0, 11.0, 18.0, 20.0, 26.0, 29.0, 37.0, 39.0, 41.0, 49.0, 46.0, 57.0, 50.0, 46.0, 65.0, 48.0, 54.0, 35.0, 38.0, 44.0, 39.0, 35.0, 27.0, 23.0, 17.0, 19.0, 8.0, 8.0, 9.0, 5.0, 11.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05364990234375, -0.05171680450439453, -0.04978370666503906, -0.047850608825683594, -0.045917510986328125, -0.043984413146972656, -0.04205131530761719, -0.04011821746826172, -0.03818511962890625, -0.03625202178955078, -0.03431892395019531, -0.032385826110839844, -0.030452728271484375, -0.028519630432128906, -0.026586532592773438, -0.02465343475341797, -0.0227203369140625, -0.02078723907470703, -0.018854141235351562, -0.016921043395996094, -0.014987945556640625, -0.013054847717285156, -0.011121749877929688, -0.009188652038574219, -0.00725555419921875, -0.005322456359863281, -0.0033893585205078125, -0.0014562606811523438, 0.000476837158203125, 0.0024099349975585938, 0.0043430328369140625, 0.006276130676269531, 0.008209228515625, 0.010142326354980469, 0.012075424194335938, 0.014008522033691406, 0.015941619873046875, 0.017874717712402344, 0.019807815551757812, 0.02174091339111328, 0.02367401123046875, 0.02560710906982422, 0.027540206909179688, 0.029473304748535156, 0.031406402587890625, 0.033339500427246094, 0.03527259826660156, 0.03720569610595703, 0.0391387939453125, 0.04107189178466797, 0.04300498962402344, 0.044938087463378906, 0.046871185302734375, 0.048804283142089844, 0.05073738098144531, 0.05267047882080078, 0.05460357666015625, 0.05653667449951172, 0.05846977233886719, 0.060402870178222656, 0.062335968017578125, 0.0642690658569336, 0.06620216369628906, 0.06813526153564453, 0.070068359375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 7.0, 7.0, 11.0, 19.0, 29.0, 35.0, 59.0, 126.0, 262.0, 625.0, 1761.0, 6729.0, 55382.0, 932728.0, 42165.0, 5887.0, 1580.0, 587.0, 260.0, 108.0, 68.0, 35.0, 20.0, 9.0, 10.0, 10.0, 6.0, 8.0, 2.0, 8.0, 2.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.47802734375, -0.4632987976074219, -0.44857025146484375, -0.4338417053222656, -0.4191131591796875, -0.4043846130371094, -0.38965606689453125, -0.3749275207519531, -0.360198974609375, -0.3454704284667969, -0.33074188232421875, -0.3160133361816406, -0.3012847900390625, -0.2865562438964844, -0.27182769775390625, -0.2570991516113281, -0.24237060546875, -0.22764205932617188, -0.21291351318359375, -0.19818496704101562, -0.1834564208984375, -0.16872787475585938, -0.15399932861328125, -0.13927078247070312, -0.124542236328125, -0.10981369018554688, -0.09508514404296875, -0.08035659790039062, -0.0656280517578125, -0.050899505615234375, -0.03617095947265625, -0.021442413330078125, -0.0067138671875, 0.008014678955078125, 0.02274322509765625, 0.037471771240234375, 0.0522003173828125, 0.06692886352539062, 0.08165740966796875, 0.09638595581054688, 0.111114501953125, 0.12584304809570312, 0.14057159423828125, 0.15530014038085938, 0.1700286865234375, 0.18475723266601562, 0.19948577880859375, 0.21421432495117188, 0.22894287109375, 0.24367141723632812, 0.25839996337890625, 0.2731285095214844, 0.2878570556640625, 0.3025856018066406, 0.31731414794921875, 0.3320426940917969, 0.346771240234375, 0.3614997863769531, 0.37622833251953125, 0.3909568786621094, 0.4056854248046875, 0.4204139709472656, 0.43514251708984375, 0.4498710632324219, 0.464599609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 2.0, 5.0, 1.0, 5.0, 5.0, 3.0, 7.0, 6.0, 9.0, 12.0, 11.0, 31.0, 29.0, 40.0, 44.0, 51.0, 60.0, 65.0, 90.0, 80.0, 62.0, 80.0, 56.0, 57.0, 41.0, 24.0, 35.0, 23.0, 17.0, 10.0, 10.0, 5.0, 9.0, 4.0, 3.0, 2.0, 4.0, 3.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.359130859375, -0.3468818664550781, -0.33463287353515625, -0.3223838806152344, -0.3101348876953125, -0.2978858947753906, -0.28563690185546875, -0.2733879089355469, -0.261138916015625, -0.24888992309570312, -0.23664093017578125, -0.22439193725585938, -0.2121429443359375, -0.19989395141601562, -0.18764495849609375, -0.17539596557617188, -0.16314697265625, -0.15089797973632812, -0.13864898681640625, -0.12639999389648438, -0.1141510009765625, -0.10190200805664062, -0.08965301513671875, -0.07740402221679688, -0.065155029296875, -0.052906036376953125, -0.04065704345703125, -0.028408050537109375, -0.0161590576171875, -0.003910064697265625, 0.00833892822265625, 0.020587921142578125, 0.0328369140625, 0.045085906982421875, 0.05733489990234375, 0.06958389282226562, 0.0818328857421875, 0.09408187866210938, 0.10633087158203125, 0.11857986450195312, 0.130828857421875, 0.14307785034179688, 0.15532684326171875, 0.16757583618164062, 0.1798248291015625, 0.19207382202148438, 0.20432281494140625, 0.21657180786132812, 0.22882080078125, 0.24106979370117188, 0.25331878662109375, 0.2655677795410156, 0.2778167724609375, 0.2900657653808594, 0.30231475830078125, 0.3145637512207031, 0.326812744140625, 0.3390617370605469, 0.35131072998046875, 0.3635597229003906, 0.3758087158203125, 0.3880577087402344, 0.40030670166015625, 0.4125556945800781, 0.4248046875]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 1.0, 3.0, 8.0, 8.0, 8.0, 19.0, 17.0, 38.0, 61.0, 83.0, 151.0, 245.0, 422.0, 806.0, 1561.0, 3510.0, 9322.0, 32484.0, 930115.0, 49275.0, 12018.0, 4361.0, 1898.0, 950.0, 505.0, 271.0, 149.0, 98.0, 57.0, 39.0, 15.0, 19.0, 12.0, 11.0, 11.0, 3.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.352783203125, -0.3416252136230469, -0.33046722412109375, -0.3193092346191406, -0.3081512451171875, -0.2969932556152344, -0.28583526611328125, -0.2746772766113281, -0.263519287109375, -0.2523612976074219, -0.24120330810546875, -0.23004531860351562, -0.2188873291015625, -0.20772933959960938, -0.19657135009765625, -0.18541336059570312, -0.17425537109375, -0.16309738159179688, -0.15193939208984375, -0.14078140258789062, -0.1296234130859375, -0.11846542358398438, -0.10730743408203125, -0.09614944458007812, -0.084991455078125, -0.07383346557617188, -0.06267547607421875, -0.051517486572265625, -0.0403594970703125, -0.029201507568359375, -0.01804351806640625, -0.006885528564453125, 0.0042724609375, 0.015430450439453125, 0.02658843994140625, 0.037746429443359375, 0.0489044189453125, 0.060062408447265625, 0.07122039794921875, 0.08237838745117188, 0.093536376953125, 0.10469436645507812, 0.11585235595703125, 0.12701034545898438, 0.1381683349609375, 0.14932632446289062, 0.16048431396484375, 0.17164230346679688, 0.18280029296875, 0.19395828247070312, 0.20511627197265625, 0.21627426147460938, 0.2274322509765625, 0.23859024047851562, 0.24974822998046875, 0.2609062194824219, 0.272064208984375, 0.2832221984863281, 0.29438018798828125, 0.3055381774902344, 0.3166961669921875, 0.3278541564941406, 0.33901214599609375, 0.3501701354980469, 0.361328125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 6.0, 10.0, 5.0, 8.0, 8.0, 27.0, 169.0, 588.0, 75.0, 30.0, 17.0, 11.0, 9.0, 9.0, 9.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0001919269561767578, -0.00018705148249864578, -0.00018217600882053375, -0.00017730053514242172, -0.0001724250614643097, -0.00016754958778619766, -0.00016267411410808563, -0.0001577986404299736, -0.00015292316675186157, -0.00014804769307374954, -0.0001431722193956375, -0.00013829674571752548, -0.00013342127203941345, -0.00012854579836130142, -0.0001236703246831894, -0.00011879485100507736, -0.00011391937732696533, -0.0001090439036488533, -0.00010416842997074127, -9.929295629262924e-05, -9.441748261451721e-05, -8.954200893640518e-05, -8.466653525829315e-05, -7.979106158018112e-05, -7.491558790206909e-05, -7.004011422395706e-05, -6.516464054584503e-05, -6.0289166867733e-05, -5.541369318962097e-05, -5.053821951150894e-05, -4.566274583339691e-05, -4.078727215528488e-05, -3.591179847717285e-05, -3.103632479906082e-05, -2.616085112094879e-05, -2.128537744283676e-05, -1.640990376472473e-05, -1.1534430086612701e-05, -6.658956408500671e-06, -1.7834827303886414e-06, 3.0919909477233887e-06, 7.967464625835419e-06, 1.2842938303947449e-05, 1.771841198205948e-05, 2.259388566017151e-05, 2.746935933828354e-05, 3.234483301639557e-05, 3.72203066945076e-05, 4.209578037261963e-05, 4.697125405073166e-05, 5.184672772884369e-05, 5.672220140695572e-05, 6.159767508506775e-05, 6.647314876317978e-05, 7.134862244129181e-05, 7.622409611940384e-05, 8.109956979751587e-05, 8.59750434756279e-05, 9.085051715373993e-05, 9.572599083185196e-05, 0.00010060146450996399, 0.00010547693818807602, 0.00011035241186618805, 0.00011522788554430008, 0.00012010335922241211]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 6.0, 9.0, 7.0, 11.0, 14.0, 34.0, 57.0, 122.0, 323.0, 698.0, 1890.0, 5910.0, 23523.0, 940992.0, 58676.0, 11110.0, 3226.0, 1135.0, 465.0, 157.0, 73.0, 43.0, 18.0, 12.0, 7.0, 5.0, 3.0, 6.0, 2.0, 3.0, 3.0, 5.0, 2.0, 0.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.468994140625, -0.4554939270019531, -0.44199371337890625, -0.4284934997558594, -0.4149932861328125, -0.4014930725097656, -0.38799285888671875, -0.3744926452636719, -0.360992431640625, -0.3474922180175781, -0.33399200439453125, -0.3204917907714844, -0.3069915771484375, -0.2934913635253906, -0.27999114990234375, -0.2664909362792969, -0.25299072265625, -0.23949050903320312, -0.22599029541015625, -0.21249008178710938, -0.1989898681640625, -0.18548965454101562, -0.17198944091796875, -0.15848922729492188, -0.144989013671875, -0.13148880004882812, -0.11798858642578125, -0.10448837280273438, -0.0909881591796875, -0.07748794555664062, -0.06398773193359375, -0.050487518310546875, -0.0369873046875, -0.023487091064453125, -0.00998687744140625, 0.003513336181640625, 0.0170135498046875, 0.030513763427734375, 0.04401397705078125, 0.057514190673828125, 0.071014404296875, 0.08451461791992188, 0.09801483154296875, 0.11151504516601562, 0.1250152587890625, 0.13851547241210938, 0.15201568603515625, 0.16551589965820312, 0.17901611328125, 0.19251632690429688, 0.20601654052734375, 0.21951675415039062, 0.2330169677734375, 0.24651718139648438, 0.26001739501953125, 0.2735176086425781, 0.287017822265625, 0.3005180358886719, 0.31401824951171875, 0.3275184631347656, 0.3410186767578125, 0.3545188903808594, 0.36801910400390625, 0.3815193176269531, 0.39501953125]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 1.0, 0.0, 0.0, 7.0, 4.0, 3.0, 4.0, 3.0, 1.0, 7.0, 3.0, 10.0, 5.0, 10.0, 13.0, 19.0, 53.0, 269.0, 383.0, 98.0, 24.0, 8.0, 7.0, 8.0, 4.0, 10.0, 12.0, 6.0, 5.0, 5.0, 4.0, 0.0, 3.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.275146484375, -0.2657127380371094, -0.25627899169921875, -0.24684524536132812, -0.2374114990234375, -0.22797775268554688, -0.21854400634765625, -0.20911026000976562, -0.199676513671875, -0.19024276733398438, -0.18080902099609375, -0.17137527465820312, -0.1619415283203125, -0.15250778198242188, -0.14307403564453125, -0.13364028930664062, -0.12420654296875, -0.11477279663085938, -0.10533905029296875, -0.09590530395507812, -0.0864715576171875, -0.07703781127929688, -0.06760406494140625, -0.058170318603515625, -0.048736572265625, -0.039302825927734375, -0.02986907958984375, -0.020435333251953125, -0.0110015869140625, -0.001567840576171875, 0.00786590576171875, 0.017299652099609375, 0.0267333984375, 0.036167144775390625, 0.04560089111328125, 0.055034637451171875, 0.0644683837890625, 0.07390213012695312, 0.08333587646484375, 0.09276962280273438, 0.102203369140625, 0.11163711547851562, 0.12107086181640625, 0.13050460815429688, 0.1399383544921875, 0.14937210083007812, 0.15880584716796875, 0.16823959350585938, 0.17767333984375, 0.18710708618164062, 0.19654083251953125, 0.20597457885742188, 0.2154083251953125, 0.22484207153320312, 0.23427581787109375, 0.24370956420898438, 0.253143310546875, 0.2625770568847656, 0.27201080322265625, 0.2814445495605469, 0.2908782958984375, 0.3003120422363281, 0.30974578857421875, 0.3191795349121094, 0.32861328125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 3.0, 10.0, 14.0, 46.0, 135.0, 351.0, 191.0, 99.0, 53.0, 39.0, 22.0, 12.0, 5.0, 8.0, 5.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.3017144203186035, -6.13893985748291, -5.976165771484375, -5.813391208648682, -5.650616645812988, -5.487842082977295, -5.325067520141602, -5.162293434143066, -4.999518871307373, -4.83674430847168, -4.6739702224731445, -4.511195659637451, -4.348421096801758, -4.1856465339660645, -4.022871971130371, -3.860097885131836, -3.6973233222961426, -3.534548759460449, -3.371774435043335, -3.2090001106262207, -3.0462255477905273, -2.883450984954834, -2.7206766605377197, -2.5579023361206055, -2.395127773284912, -2.2323532104492188, -2.0695788860321045, -1.9068044424057007, -1.7440299987792969, -1.581255555152893, -1.4184811115264893, -1.2557066679000854, -1.0929317474365234, -0.9301573038101196, -0.7673828601837158, -0.604608416557312, -0.4418339729309082, -0.2790595293045044, -0.11628508567810059, 0.04648935794830322, 0.20926380157470703, 0.37203824520111084, 0.5348126888275146, 0.6975871324539185, 0.8603615760803223, 1.023136019706726, 1.1859104633331299, 1.3486849069595337, 1.5114593505859375, 1.6742337942123413, 1.8370082378387451, 1.999782681465149, 2.1625571250915527, 2.325331687927246, 2.4881060123443604, 2.6508803367614746, 2.813654899597168, 2.9764294624328613, 3.1392037868499756, 3.30197811126709, 3.464752674102783, 3.6275272369384766, 3.790301561355591, 3.953075885772705, 4.115850448608398]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 11.0, 5.0, 9.0, 10.0, 9.0, 16.0, 10.0, 13.0, 18.0, 18.0, 24.0, 29.0, 33.0, 25.0, 43.0, 39.0, 47.0, 70.0, 80.0, 82.0, 55.0, 54.0, 35.0, 34.0, 44.0, 21.0, 33.0, 24.0, 22.0, 18.0, 15.0, 19.0, 10.0, 8.0, 4.0, 5.0, 5.0, 2.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.168922185897827, -2.105311155319214, -2.0416998863220215, -1.9780888557434082, -1.9144777059555054, -1.8508665561676025, -1.7872555255889893, -1.7236443758010864, -1.6600332260131836, -1.5964220762252808, -1.532810926437378, -1.4691998958587646, -1.4055887460708618, -1.341977596282959, -1.2783665657043457, -1.2147554159164429, -1.15114426612854, -1.0875331163406372, -1.0239219665527344, -0.9603109359741211, -0.8966997861862183, -0.8330886363983154, -0.7694775462150574, -0.7058664560317993, -0.6422553062438965, -0.5786441564559937, -0.5150330662727356, -0.45142194628715515, -0.3878108263015747, -0.32419970631599426, -0.2605885863304138, -0.19697746634483337, -0.13336610794067383, -0.06975498795509338, -0.0061438679695129395, 0.057467252016067505, 0.12107837200164795, 0.1846894919872284, 0.24830061197280884, 0.3119117319583893, 0.3755228519439697, 0.43913397192955017, 0.5027450919151306, 0.5663561820983887, 0.6299673318862915, 0.6935784816741943, 0.7571895718574524, 0.8208006620407104, 0.8844118118286133, 0.9480229616165161, 1.011634111404419, 1.0752451419830322, 1.138856291770935, 1.202467441558838, 1.2660784721374512, 1.329689621925354, 1.3933007717132568, 1.4569119215011597, 1.5205230712890625, 1.5841341018676758, 1.6477452516555786, 1.7113564014434814, 1.7749674320220947, 1.8385785818099976, 1.9021897315979004]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 9.0, 8.0, 10.0, 21.0, 31.0, 43.0, 59.0, 84.0, 117.0, 262.0, 876.0, 6951.0, 1045055.0, 3128134.0, 10734.0, 1134.0, 332.0, 137.0, 79.0, 60.0, 54.0, 29.0, 21.0, 13.0, 12.0, 10.0, 7.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.291259765625, -0.2791633605957031, -0.26706695556640625, -0.2549705505371094, -0.2428741455078125, -0.23077774047851562, -0.21868133544921875, -0.20658493041992188, -0.194488525390625, -0.18239212036132812, -0.17029571533203125, -0.15819931030273438, -0.1461029052734375, -0.13400650024414062, -0.12191009521484375, -0.10981369018554688, -0.09771728515625, -0.08562088012695312, -0.07352447509765625, -0.061428070068359375, -0.0493316650390625, -0.037235260009765625, -0.02513885498046875, -0.013042449951171875, -0.000946044921875, 0.011150360107421875, 0.02324676513671875, 0.035343170166015625, 0.0474395751953125, 0.059535980224609375, 0.07163238525390625, 0.08372879028320312, 0.0958251953125, 0.10792160034179688, 0.12001800537109375, 0.13211441040039062, 0.1442108154296875, 0.15630722045898438, 0.16840362548828125, 0.18050003051757812, 0.192596435546875, 0.20469284057617188, 0.21678924560546875, 0.22888565063476562, 0.2409820556640625, 0.2530784606933594, 0.26517486572265625, 0.2772712707519531, 0.28936767578125, 0.3014640808105469, 0.31356048583984375, 0.3256568908691406, 0.3377532958984375, 0.3498497009277344, 0.36194610595703125, 0.3740425109863281, 0.386138916015625, 0.3982353210449219, 0.41033172607421875, 0.4224281311035156, 0.4345245361328125, 0.4466209411621094, 0.45871734619140625, 0.4708137512207031, 0.48291015625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 2.0, 13.0, 9.0, 13.0, 13.0, 19.0, 27.0, 31.0, 43.0, 49.0, 51.0, 59.0, 62.0, 58.0, 66.0, 70.0, 65.0, 51.0, 40.0, 53.0, 36.0, 34.0, 28.0, 38.0, 13.0, 4.0, 5.0, 12.0, 9.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06463623046875, -0.06211662292480469, -0.059597015380859375, -0.05707740783691406, -0.05455780029296875, -0.05203819274902344, -0.049518585205078125, -0.04699897766113281, -0.0444793701171875, -0.04195976257324219, -0.039440155029296875, -0.03692054748535156, -0.03440093994140625, -0.03188133239746094, -0.029361724853515625, -0.026842117309570312, -0.024322509765625, -0.021802902221679688, -0.019283294677734375, -0.016763687133789062, -0.01424407958984375, -0.011724472045898438, -0.009204864501953125, -0.0066852569580078125, -0.0041656494140625, -0.0016460418701171875, 0.000873565673828125, 0.0033931732177734375, 0.00591278076171875, 0.008432388305664062, 0.010951995849609375, 0.013471603393554688, 0.0159912109375, 0.018510818481445312, 0.021030426025390625, 0.023550033569335938, 0.02606964111328125, 0.028589248657226562, 0.031108856201171875, 0.03362846374511719, 0.0361480712890625, 0.03866767883300781, 0.041187286376953125, 0.04370689392089844, 0.04622650146484375, 0.04874610900878906, 0.051265716552734375, 0.05378532409667969, 0.056304931640625, 0.05882453918457031, 0.061344146728515625, 0.06386375427246094, 0.06638336181640625, 0.06890296936035156, 0.07142257690429688, 0.07394218444824219, 0.0764617919921875, 0.07898139953613281, 0.08150100708007812, 0.08402061462402344, 0.08654022216796875, 0.08905982971191406, 0.09157943725585938, 0.09409904479980469, 0.09661865234375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 2.0, 7.0, 10.0, 14.0, 21.0, 22.0, 54.0, 59.0, 107.0, 168.0, 388.0, 837.0, 3642.0, 71662.0, 4086783.0, 26928.0, 2073.0, 605.0, 267.0, 177.0, 110.0, 90.0, 79.0, 45.0, 36.0, 30.0, 15.0, 13.0, 13.0, 10.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.455078125, -0.4364166259765625, -0.417755126953125, -0.3990936279296875, -0.38043212890625, -0.3617706298828125, -0.343109130859375, -0.3244476318359375, -0.3057861328125, -0.2871246337890625, -0.268463134765625, -0.2498016357421875, -0.23114013671875, -0.2124786376953125, -0.193817138671875, -0.1751556396484375, -0.156494140625, -0.1378326416015625, -0.119171142578125, -0.1005096435546875, -0.08184814453125, -0.0631866455078125, -0.044525146484375, -0.0258636474609375, -0.0072021484375, 0.0114593505859375, 0.030120849609375, 0.0487823486328125, 0.06744384765625, 0.0861053466796875, 0.104766845703125, 0.1234283447265625, 0.14208984375, 0.1607513427734375, 0.179412841796875, 0.1980743408203125, 0.21673583984375, 0.2353973388671875, 0.254058837890625, 0.2727203369140625, 0.2913818359375, 0.3100433349609375, 0.328704833984375, 0.3473663330078125, 0.36602783203125, 0.3846893310546875, 0.403350830078125, 0.4220123291015625, 0.440673828125, 0.4593353271484375, 0.477996826171875, 0.4966583251953125, 0.51531982421875, 0.5339813232421875, 0.552642822265625, 0.5713043212890625, 0.5899658203125, 0.6086273193359375, 0.627288818359375, 0.6459503173828125, 0.66461181640625, 0.6832733154296875, 0.701934814453125, 0.7205963134765625, 0.7392578125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 7.0, 8.0, 11.0, 15.0, 30.0, 56.0, 129.0, 766.0, 2055.0, 712.0, 174.0, 56.0, 27.0, 18.0, 8.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2327880859375, -0.2186908721923828, -0.20459365844726562, -0.19049644470214844, -0.17639923095703125, -0.16230201721191406, -0.14820480346679688, -0.1341075897216797, -0.1200103759765625, -0.10591316223144531, -0.09181594848632812, -0.07771873474121094, -0.06362152099609375, -0.04952430725097656, -0.035427093505859375, -0.021329879760742188, -0.007232666015625, 0.0068645477294921875, 0.020961761474609375, 0.03505897521972656, 0.04915618896484375, 0.06325340270996094, 0.07735061645507812, 0.09144783020019531, 0.1055450439453125, 0.11964225769042969, 0.13373947143554688, 0.14783668518066406, 0.16193389892578125, 0.17603111267089844, 0.19012832641601562, 0.2042255401611328, 0.21832275390625, 0.2324199676513672, 0.24651718139648438, 0.26061439514160156, 0.27471160888671875, 0.28880882263183594, 0.3029060363769531, 0.3170032501220703, 0.3311004638671875, 0.3451976776123047, 0.3592948913574219, 0.37339210510253906, 0.38748931884765625, 0.40158653259277344, 0.4156837463378906, 0.4297809600830078, 0.443878173828125, 0.4579753875732422, 0.4720726013183594, 0.48616981506347656, 0.5002670288085938, 0.5143642425537109, 0.5284614562988281, 0.5425586700439453, 0.5566558837890625, 0.5707530975341797, 0.5848503112792969, 0.5989475250244141, 0.6130447387695312, 0.6271419525146484, 0.6412391662597656, 0.6553363800048828, 0.66943359375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 7.0, 7.0, 40.0, 141.0, 371.0, 300.0, 88.0, 19.0, 16.0, 12.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.645979404449463, -4.472877025604248, -4.299775123596191, -4.126672744750977, -3.953570604324341, -3.780468463897705, -3.6073663234710693, -3.4342641830444336, -3.2611618041992188, -3.088059663772583, -2.9149575233459473, -2.7418551445007324, -2.5687530040740967, -2.395650863647461, -2.222548723220825, -2.0494465827941895, -1.8763444423675537, -1.703242301940918, -1.5301400423049927, -1.357037901878357, -1.1839356422424316, -1.010833501815796, -0.8377313613891602, -0.6646291017532349, -0.4915269613265991, -0.3184247612953186, -0.14532259106636047, 0.027779579162597656, 0.20088177919387817, 0.3739839792251587, 0.5470861196517944, 0.7201883792877197, 0.8932905197143555, 1.0663926601409912, 1.2394949197769165, 1.4125970602035522, 1.5856993198394775, 1.7588014602661133, 1.931903600692749, 2.1050057411193848, 2.2781081199645996, 2.4512102603912354, 2.624312400817871, 2.797414779663086, 2.9705169200897217, 3.1436190605163574, 3.316721200942993, 3.489823341369629, 3.6629254817962646, 3.8360276222229004, 4.009130001068115, 4.182231903076172, 4.355334281921387, 4.528436660766602, 4.701538562774658, 4.874640941619873, 5.04774284362793, 5.2208452224731445, 5.393947124481201, 5.567049503326416, 5.740151405334473, 5.9132537841796875, 6.086356163024902, 6.259458065032959, 6.432560443878174]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 6.0, 7.0, 4.0, 12.0, 11.0, 16.0, 8.0, 12.0, 21.0, 19.0, 31.0, 33.0, 24.0, 36.0, 45.0, 42.0, 54.0, 59.0, 45.0, 48.0, 44.0, 44.0, 50.0, 38.0, 47.0, 31.0, 32.0, 37.0, 30.0, 16.0, 16.0, 19.0, 13.0, 9.0, 11.0, 12.0, 7.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0], "bins": [-1.215989112854004, -1.1820282936096191, -1.1480674743652344, -1.1141066551208496, -1.0801459550857544, -1.0461851358413696, -1.0122243165969849, -0.9782634973526001, -0.9443026781082153, -0.9103418588638306, -0.8763810992240906, -0.8424202799797058, -0.808459460735321, -0.774498701095581, -0.7405378818511963, -0.7065770626068115, -0.6726163029670715, -0.6386554837226868, -0.6046947240829468, -0.570733904838562, -0.5367730855941772, -0.5028122663497925, -0.4688515067100525, -0.4348906874656677, -0.40092989802360535, -0.36696910858154297, -0.3330082893371582, -0.2990474998950958, -0.26508671045303345, -0.23112589120864868, -0.1971651017665863, -0.16320429742336273, -0.12924343347549438, -0.09528262913227081, -0.06132183223962784, -0.027361035346984863, 0.0065997689962387085, 0.04056057333946228, 0.07452136278152466, 0.10848216712474823, 0.1424429714679718, 0.17640377581119537, 0.21036458015441895, 0.24432536959648132, 0.2782861590385437, 0.31224697828292847, 0.34620776772499084, 0.3801685571670532, 0.414129376411438, 0.44809016585350037, 0.48205098509788513, 0.5160117745399475, 0.5499725937843323, 0.5839333534240723, 0.617894172668457, 0.6518549919128418, 0.6858158111572266, 0.7197766304016113, 0.7537373900413513, 0.7876982092857361, 0.8216590285301208, 0.8556197881698608, 0.8895806074142456, 0.9235414266586304, 0.9575021862983704]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 5.0, 4.0, 3.0, 11.0, 15.0, 15.0, 34.0, 43.0, 78.0, 95.0, 184.0, 245.0, 392.0, 775.0, 1391.0, 2803.0, 6081.0, 14586.0, 39670.0, 125463.0, 371719.0, 325774.0, 102616.0, 33147.0, 12614.0, 5262.0, 2501.0, 1246.0, 729.0, 418.0, 232.0, 165.0, 85.0, 55.0, 30.0, 22.0, 18.0, 12.0, 16.0, 5.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1578369140625, -0.15256118774414062, -0.14728546142578125, -0.14200973510742188, -0.1367340087890625, -0.13145828247070312, -0.12618255615234375, -0.12090682983398438, -0.115631103515625, -0.11035537719726562, -0.10507965087890625, -0.09980392456054688, -0.0945281982421875, -0.08925247192382812, -0.08397674560546875, -0.07870101928710938, -0.07342529296875, -0.06814956665039062, -0.06287384033203125, -0.057598114013671875, -0.0523223876953125, -0.047046661376953125, -0.04177093505859375, -0.036495208740234375, -0.031219482421875, -0.025943756103515625, -0.02066802978515625, -0.015392303466796875, -0.0101165771484375, -0.004840850830078125, 0.00043487548828125, 0.005710601806640625, 0.010986328125, 0.016262054443359375, 0.02153778076171875, 0.026813507080078125, 0.0320892333984375, 0.037364959716796875, 0.04264068603515625, 0.047916412353515625, 0.053192138671875, 0.058467864990234375, 0.06374359130859375, 0.06901931762695312, 0.0742950439453125, 0.07957077026367188, 0.08484649658203125, 0.09012222290039062, 0.09539794921875, 0.10067367553710938, 0.10594940185546875, 0.11122512817382812, 0.1165008544921875, 0.12177658081054688, 0.12705230712890625, 0.13232803344726562, 0.137603759765625, 0.14287948608398438, 0.14815521240234375, 0.15343093872070312, 0.1587066650390625, 0.16398239135742188, 0.16925811767578125, 0.17453384399414062, 0.1798095703125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 5.0, 3.0, 8.0, 9.0, 12.0, 12.0, 16.0, 20.0, 22.0, 20.0, 29.0, 42.0, 42.0, 46.0, 40.0, 53.0, 62.0, 69.0, 50.0, 58.0, 52.0, 45.0, 46.0, 46.0, 38.0, 41.0, 17.0, 20.0, 20.0, 19.0, 11.0, 3.0, 6.0, 3.0, 4.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.08795166015625, -0.08519935607910156, -0.08244705200195312, -0.07969474792480469, -0.07694244384765625, -0.07419013977050781, -0.07143783569335938, -0.06868553161621094, -0.0659332275390625, -0.06318092346191406, -0.060428619384765625, -0.05767631530761719, -0.05492401123046875, -0.05217170715332031, -0.049419403076171875, -0.04666709899902344, -0.043914794921875, -0.04116249084472656, -0.038410186767578125, -0.03565788269042969, -0.03290557861328125, -0.030153274536132812, -0.027400970458984375, -0.024648666381835938, -0.0218963623046875, -0.019144058227539062, -0.016391754150390625, -0.013639450073242188, -0.01088714599609375, -0.008134841918945312, -0.005382537841796875, -0.0026302337646484375, 0.0001220703125, 0.0028743743896484375, 0.005626678466796875, 0.008378982543945312, 0.01113128662109375, 0.013883590698242188, 0.016635894775390625, 0.019388198852539062, 0.0221405029296875, 0.024892807006835938, 0.027645111083984375, 0.030397415161132812, 0.03314971923828125, 0.03590202331542969, 0.038654327392578125, 0.04140663146972656, 0.044158935546875, 0.04691123962402344, 0.049663543701171875, 0.05241584777832031, 0.05516815185546875, 0.05792045593261719, 0.060672760009765625, 0.06342506408691406, 0.0661773681640625, 0.06892967224121094, 0.07168197631835938, 0.07443428039550781, 0.07718658447265625, 0.07993888854980469, 0.08269119262695312, 0.08544349670410156, 0.08819580078125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 8.0, 8.0, 6.0, 9.0, 16.0, 28.0, 50.0, 56.0, 88.0, 118.0, 183.0, 312.0, 525.0, 993.0, 1928.0, 4649.0, 17066.0, 120437.0, 769635.0, 107641.0, 16070.0, 4636.0, 1886.0, 906.0, 504.0, 273.0, 174.0, 126.0, 60.0, 51.0, 26.0, 20.0, 12.0, 18.0, 13.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.33203125, -0.3199462890625, -0.307861328125, -0.2957763671875, -0.28369140625, -0.2716064453125, -0.259521484375, -0.2474365234375, -0.2353515625, -0.2232666015625, -0.211181640625, -0.1990966796875, -0.18701171875, -0.1749267578125, -0.162841796875, -0.1507568359375, -0.138671875, -0.1265869140625, -0.114501953125, -0.1024169921875, -0.09033203125, -0.0782470703125, -0.066162109375, -0.0540771484375, -0.0419921875, -0.0299072265625, -0.017822265625, -0.0057373046875, 0.00634765625, 0.0184326171875, 0.030517578125, 0.0426025390625, 0.0546875, 0.0667724609375, 0.078857421875, 0.0909423828125, 0.10302734375, 0.1151123046875, 0.127197265625, 0.1392822265625, 0.1513671875, 0.1634521484375, 0.175537109375, 0.1876220703125, 0.19970703125, 0.2117919921875, 0.223876953125, 0.2359619140625, 0.248046875, 0.2601318359375, 0.272216796875, 0.2843017578125, 0.29638671875, 0.3084716796875, 0.320556640625, 0.3326416015625, 0.3447265625, 0.3568115234375, 0.368896484375, 0.3809814453125, 0.39306640625, 0.4051513671875, 0.417236328125, 0.4293212890625, 0.44140625]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 5.0, 2.0, 6.0, 9.0, 12.0, 21.0, 13.0, 21.0, 31.0, 29.0, 36.0, 42.0, 57.0, 60.0, 63.0, 56.0, 62.0, 70.0, 62.0, 68.0, 51.0, 45.0, 32.0, 30.0, 27.0, 23.0, 22.0, 8.0, 12.0, 7.0, 8.0, 0.0, 7.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.368408203125, -0.3539848327636719, -0.33956146240234375, -0.3251380920410156, -0.3107147216796875, -0.2962913513183594, -0.28186798095703125, -0.2674446105957031, -0.253021240234375, -0.23859786987304688, -0.22417449951171875, -0.20975112915039062, -0.1953277587890625, -0.18090438842773438, -0.16648101806640625, -0.15205764770507812, -0.13763427734375, -0.12321090698242188, -0.10878753662109375, -0.09436416625976562, -0.0799407958984375, -0.06551742553710938, -0.05109405517578125, -0.036670684814453125, -0.022247314453125, -0.007823944091796875, 0.00659942626953125, 0.021022796630859375, 0.0354461669921875, 0.049869537353515625, 0.06429290771484375, 0.07871627807617188, 0.0931396484375, 0.10756301879882812, 0.12198638916015625, 0.13640975952148438, 0.1508331298828125, 0.16525650024414062, 0.17967987060546875, 0.19410324096679688, 0.208526611328125, 0.22294998168945312, 0.23737335205078125, 0.2517967224121094, 0.2662200927734375, 0.2806434631347656, 0.29506683349609375, 0.3094902038574219, 0.32391357421875, 0.3383369445800781, 0.35276031494140625, 0.3671836853027344, 0.3816070556640625, 0.3960304260253906, 0.41045379638671875, 0.4248771667480469, 0.439300537109375, 0.4537239074707031, 0.46814727783203125, 0.4825706481933594, 0.4969940185546875, 0.5114173889160156, 0.5258407592773438, 0.5402641296386719, 0.5546875]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 5.0, 9.0, 13.0, 11.0, 23.0, 26.0, 32.0, 56.0, 87.0, 165.0, 272.0, 495.0, 967.0, 1815.0, 3995.0, 10021.0, 26370.0, 111240.0, 748111.0, 102271.0, 25308.0, 9348.0, 3964.0, 1832.0, 933.0, 489.0, 276.0, 150.0, 81.0, 58.0, 31.0, 26.0, 30.0, 16.0, 12.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1552734375, -0.15034103393554688, -0.14540863037109375, -0.14047622680664062, -0.1355438232421875, -0.13061141967773438, -0.12567901611328125, -0.12074661254882812, -0.115814208984375, -0.11088180541992188, -0.10594940185546875, -0.10101699829101562, -0.0960845947265625, -0.09115219116210938, -0.08621978759765625, -0.08128738403320312, -0.07635498046875, -0.07142257690429688, -0.06649017333984375, -0.061557769775390625, -0.0566253662109375, -0.051692962646484375, -0.04676055908203125, -0.041828155517578125, -0.036895751953125, -0.031963348388671875, -0.02703094482421875, -0.022098541259765625, -0.0171661376953125, -0.012233734130859375, -0.00730133056640625, -0.002368927001953125, 0.0025634765625, 0.007495880126953125, 0.01242828369140625, 0.017360687255859375, 0.0222930908203125, 0.027225494384765625, 0.03215789794921875, 0.037090301513671875, 0.042022705078125, 0.046955108642578125, 0.05188751220703125, 0.056819915771484375, 0.0617523193359375, 0.06668472290039062, 0.07161712646484375, 0.07654953002929688, 0.08148193359375, 0.08641433715820312, 0.09134674072265625, 0.09627914428710938, 0.1012115478515625, 0.10614395141601562, 0.11107635498046875, 0.11600875854492188, 0.120941162109375, 0.12587356567382812, 0.13080596923828125, 0.13573837280273438, 0.1406707763671875, 0.14560317993164062, 0.15053558349609375, 0.15546798706054688, 0.160400390625]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 8.0, 4.0, 8.0, 7.0, 8.0, 7.0, 20.0, 31.0, 74.0, 191.0, 359.0, 143.0, 42.0, 29.0, 17.0, 8.0, 6.0, 8.0, 5.0, 3.0, 4.0, 5.0, 3.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.00015997886657714844, -0.00015591364353895187, -0.0001518484205007553, -0.00014778319746255875, -0.00014371797442436218, -0.00013965275138616562, -0.00013558752834796906, -0.0001315223053097725, -0.00012745708227157593, -0.00012339185923337936, -0.0001193266361951828, -0.00011526141315698624, -0.00011119619011878967, -0.00010713096708059311, -0.00010306574404239655, -9.900052100419998e-05, -9.493529796600342e-05, -9.087007492780685e-05, -8.680485188961029e-05, -8.273962885141373e-05, -7.867440581321716e-05, -7.46091827750206e-05, -7.054395973682404e-05, -6.647873669862747e-05, -6.241351366043091e-05, -5.8348290622234344e-05, -5.428306758403778e-05, -5.021784454584122e-05, -4.615262150764465e-05, -4.208739846944809e-05, -3.8022175431251526e-05, -3.395695239305496e-05, -2.98917293548584e-05, -2.5826506316661835e-05, -2.176128327846527e-05, -1.7696060240268707e-05, -1.3630837202072144e-05, -9.56561416387558e-06, -5.500391125679016e-06, -1.4351680874824524e-06, 2.6300549507141113e-06, 6.695277988910675e-06, 1.0760501027107239e-05, 1.4825724065303802e-05, 1.8890947103500366e-05, 2.295617014169693e-05, 2.7021393179893494e-05, 3.108661621809006e-05, 3.515183925628662e-05, 3.9217062294483185e-05, 4.328228533267975e-05, 4.734750837087631e-05, 5.1412731409072876e-05, 5.547795444726944e-05, 5.9543177485466003e-05, 6.360840052366257e-05, 6.767362356185913e-05, 7.17388466000557e-05, 7.580406963825226e-05, 7.986929267644882e-05, 8.393451571464539e-05, 8.799973875284195e-05, 9.206496179103851e-05, 9.613018482923508e-05, 0.00010019540786743164]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 5.0, 4.0, 4.0, 6.0, 6.0, 5.0, 9.0, 17.0, 34.0, 41.0, 64.0, 101.0, 171.0, 294.0, 528.0, 976.0, 2370.0, 6235.0, 20705.0, 114079.0, 790266.0, 85718.0, 17408.0, 5379.0, 2039.0, 945.0, 456.0, 256.0, 146.0, 95.0, 62.0, 47.0, 29.0, 17.0, 12.0, 11.0, 13.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1951904296875, -0.18917274475097656, -0.18315505981445312, -0.1771373748779297, -0.17111968994140625, -0.1651020050048828, -0.15908432006835938, -0.15306663513183594, -0.1470489501953125, -0.14103126525878906, -0.13501358032226562, -0.1289958953857422, -0.12297821044921875, -0.11696052551269531, -0.11094284057617188, -0.10492515563964844, -0.098907470703125, -0.09288978576660156, -0.08687210083007812, -0.08085441589355469, -0.07483673095703125, -0.06881904602050781, -0.06280136108398438, -0.05678367614746094, -0.0507659912109375, -0.04474830627441406, -0.038730621337890625, -0.03271293640136719, -0.02669525146484375, -0.020677566528320312, -0.014659881591796875, -0.008642196655273438, -0.00262451171875, 0.0033931732177734375, 0.009410858154296875, 0.015428543090820312, 0.02144622802734375, 0.027463912963867188, 0.033481597900390625, 0.03949928283691406, 0.0455169677734375, 0.05153465270996094, 0.057552337646484375, 0.06357002258300781, 0.06958770751953125, 0.07560539245605469, 0.08162307739257812, 0.08764076232910156, 0.093658447265625, 0.09967613220214844, 0.10569381713867188, 0.11171150207519531, 0.11772918701171875, 0.12374687194824219, 0.12976455688476562, 0.13578224182128906, 0.1417999267578125, 0.14781761169433594, 0.15383529663085938, 0.1598529815673828, 0.16587066650390625, 0.1718883514404297, 0.17790603637695312, 0.18392372131347656, 0.18994140625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 5.0, 5.0, 10.0, 10.0, 11.0, 20.0, 13.0, 29.0, 43.0, 56.0, 91.0, 118.0, 146.0, 123.0, 93.0, 63.0, 25.0, 17.0, 25.0, 17.0, 11.0, 7.0, 19.0, 7.0, 3.0, 5.0, 1.0, 3.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1597900390625, -0.15436935424804688, -0.14894866943359375, -0.14352798461914062, -0.1381072998046875, -0.13268661499023438, -0.12726593017578125, -0.12184524536132812, -0.116424560546875, -0.11100387573242188, -0.10558319091796875, -0.10016250610351562, -0.0947418212890625, -0.08932113647460938, -0.08390045166015625, -0.07847976684570312, -0.07305908203125, -0.06763839721679688, -0.06221771240234375, -0.056797027587890625, -0.0513763427734375, -0.045955657958984375, -0.04053497314453125, -0.035114288330078125, -0.029693603515625, -0.024272918701171875, -0.01885223388671875, -0.013431549072265625, -0.0080108642578125, -0.002590179443359375, 0.00283050537109375, 0.008251190185546875, 0.013671875, 0.019092559814453125, 0.02451324462890625, 0.029933929443359375, 0.0353546142578125, 0.040775299072265625, 0.04619598388671875, 0.051616668701171875, 0.057037353515625, 0.062458038330078125, 0.06787872314453125, 0.07329940795898438, 0.0787200927734375, 0.08414077758789062, 0.08956146240234375, 0.09498214721679688, 0.10040283203125, 0.10582351684570312, 0.11124420166015625, 0.11666488647460938, 0.1220855712890625, 0.12750625610351562, 0.13292694091796875, 0.13834762573242188, 0.143768310546875, 0.14918899536132812, 0.15460968017578125, 0.16003036499023438, 0.1654510498046875, 0.17087173461914062, 0.17629241943359375, 0.18171310424804688, 0.1871337890625]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 6.0, 4.0, 12.0, 13.0, 22.0, 34.0, 46.0, 113.0, 232.0, 304.0, 123.0, 57.0, 23.0, 11.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-6.898059844970703, -6.752254962921143, -6.60645055770874, -6.46064567565918, -6.314840793609619, -6.169035911560059, -6.023231506347656, -5.877426624298096, -5.731621742248535, -5.585816860198975, -5.440012454986572, -5.294207572937012, -5.148402690887451, -5.002597808837891, -4.856793403625488, -4.710988521575928, -4.565184116363525, -4.419379234313965, -4.2735748291015625, -4.127769947052002, -3.9819650650024414, -3.83616042137146, -3.6903557777404785, -3.544550895690918, -3.3987462520599365, -3.252941608428955, -3.1071367263793945, -2.961332082748413, -2.8155274391174316, -2.669722557067871, -2.5239179134368896, -2.378113269805908, -2.2323081493377686, -2.086503505706787, -1.9406986236572266, -1.7948939800262451, -1.6490892171859741, -1.5032844543457031, -1.3574798107147217, -1.2116750478744507, -1.0658702850341797, -0.9200655221939087, -0.7742608189582825, -0.6284561157226562, -0.48265135288238525, -0.33684659004211426, -0.19104188680648804, -0.045237183570861816, 0.10056757926940918, 0.2463723123073578, 0.3921770453453064, 0.5379817485809326, 0.6837865114212036, 0.8295912742614746, 0.9753959774971008, 1.121200680732727, 1.267005443572998, 1.412810206413269, 1.55861496925354, 1.7044196128845215, 1.8502243757247925, 1.9960291385650635, 2.141833782196045, 2.2876386642456055, 2.433443307876587]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 6.0, 6.0, 4.0, 13.0, 13.0, 9.0, 11.0, 18.0, 25.0, 34.0, 31.0, 34.0, 45.0, 36.0, 44.0, 61.0, 112.0, 88.0, 70.0, 58.0, 41.0, 30.0, 27.0, 29.0, 31.0, 25.0, 17.0, 16.0, 12.0, 7.0, 12.0, 7.0, 10.0, 6.0, 4.0, 3.0, 4.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7468786239624023, -2.6706655025482178, -2.594452381134033, -2.5182390213012695, -2.442025899887085, -2.3658127784729004, -2.289599657058716, -2.2133865356445312, -2.1371734142303467, -2.060960292816162, -1.984747052192688, -1.9085339307785034, -1.8323208093643188, -1.7561075687408447, -1.6798944473266602, -1.6036813259124756, -1.5274680852890015, -1.451254963874817, -1.3750417232513428, -1.2988286018371582, -1.2226154804229736, -1.146402359008789, -1.070189118385315, -0.9939759969711304, -0.917762815952301, -0.8415496349334717, -0.7653365135192871, -0.6891233325004578, -0.6129101514816284, -0.5366970300674438, -0.4604838490486145, -0.38427072763442993, -0.3080575466156006, -0.23184439539909363, -0.15563122928142548, -0.07941806316375732, -0.003204911947250366, 0.07300823926925659, 0.14922142028808594, 0.2254345417022705, 0.30164772272109985, 0.3778608739376068, 0.45407402515411377, 0.5302872061729431, 0.6065003871917725, 0.682713508605957, 0.7589266896247864, 0.835139811038971, 0.9113529920578003, 0.9875661730766296, 1.063779354095459, 1.1399924755096436, 1.2162055969238281, 1.2924187183380127, 1.3686319589614868, 1.4448450803756714, 1.5210583209991455, 1.59727144241333, 1.6734846830368042, 1.7496978044509888, 1.8259109258651733, 1.9021241664886475, 1.978337287902832, 2.0545504093170166, 2.130763530731201]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 6.0, 6.0, 6.0, 7.0, 17.0, 25.0, 37.0, 71.0, 134.0, 267.0, 602.0, 1259.0, 3170.0, 9751.0, 47332.0, 731510.0, 3165692.0, 202302.0, 22006.0, 5946.0, 2200.0, 912.0, 483.0, 225.0, 121.0, 66.0, 39.0, 29.0, 26.0, 12.0, 13.0, 4.0, 1.0, 2.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1785888671875, -0.17249488830566406, -0.16640090942382812, -0.1603069305419922, -0.15421295166015625, -0.1481189727783203, -0.14202499389648438, -0.13593101501464844, -0.1298370361328125, -0.12374305725097656, -0.11764907836914062, -0.11155509948730469, -0.10546112060546875, -0.09936714172363281, -0.09327316284179688, -0.08717918395996094, -0.081085205078125, -0.07499122619628906, -0.06889724731445312, -0.06280326843261719, -0.05670928955078125, -0.05061531066894531, -0.044521331787109375, -0.03842735290527344, -0.0323333740234375, -0.026239395141601562, -0.020145416259765625, -0.014051437377929688, -0.00795745849609375, -0.0018634796142578125, 0.004230499267578125, 0.010324478149414062, 0.01641845703125, 0.022512435913085938, 0.028606414794921875, 0.03470039367675781, 0.04079437255859375, 0.04688835144042969, 0.052982330322265625, 0.05907630920410156, 0.0651702880859375, 0.07126426696777344, 0.07735824584960938, 0.08345222473144531, 0.08954620361328125, 0.09564018249511719, 0.10173416137695312, 0.10782814025878906, 0.113922119140625, 0.12001609802246094, 0.12611007690429688, 0.1322040557861328, 0.13829803466796875, 0.1443920135498047, 0.15048599243164062, 0.15657997131347656, 0.1626739501953125, 0.16876792907714844, 0.17486190795898438, 0.1809558868408203, 0.18704986572265625, 0.1931438446044922, 0.19923782348632812, 0.20533180236816406, 0.21142578125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 1.0, 4.0, 7.0, 4.0, 9.0, 10.0, 10.0, 15.0, 14.0, 24.0, 24.0, 35.0, 45.0, 37.0, 48.0, 50.0, 53.0, 53.0, 68.0, 38.0, 56.0, 48.0, 49.0, 50.0, 42.0, 44.0, 32.0, 24.0, 25.0, 21.0, 14.0, 12.0, 8.0, 5.0, 2.0, 5.0, 10.0, 7.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.09490966796875, -0.09186553955078125, -0.0888214111328125, -0.08577728271484375, -0.082733154296875, -0.07968902587890625, -0.0766448974609375, -0.07360076904296875, -0.070556640625, -0.06751251220703125, -0.0644683837890625, -0.06142425537109375, -0.058380126953125, -0.05533599853515625, -0.0522918701171875, -0.04924774169921875, -0.04620361328125, -0.04315948486328125, -0.0401153564453125, -0.03707122802734375, -0.034027099609375, -0.03098297119140625, -0.0279388427734375, -0.02489471435546875, -0.0218505859375, -0.01880645751953125, -0.0157623291015625, -0.01271820068359375, -0.009674072265625, -0.00662994384765625, -0.0035858154296875, -0.00054168701171875, 0.00250244140625, 0.00554656982421875, 0.0085906982421875, 0.01163482666015625, 0.014678955078125, 0.01772308349609375, 0.0207672119140625, 0.02381134033203125, 0.02685546875, 0.02989959716796875, 0.0329437255859375, 0.03598785400390625, 0.039031982421875, 0.04207611083984375, 0.0451202392578125, 0.04816436767578125, 0.05120849609375, 0.05425262451171875, 0.0572967529296875, 0.06034088134765625, 0.063385009765625, 0.06642913818359375, 0.0694732666015625, 0.07251739501953125, 0.0755615234375, 0.07860565185546875, 0.0816497802734375, 0.08469390869140625, 0.087738037109375, 0.09078216552734375, 0.0938262939453125, 0.09687042236328125, 0.09991455078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 5.0, 1.0, 8.0, 8.0, 21.0, 35.0, 61.0, 116.0, 167.0, 237.0, 442.0, 1247.0, 74743.0, 4112175.0, 3625.0, 664.0, 282.0, 194.0, 118.0, 69.0, 26.0, 25.0, 14.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.3623046875, -1.32000732421875, -1.2777099609375, -1.23541259765625, -1.193115234375, -1.15081787109375, -1.1085205078125, -1.06622314453125, -1.02392578125, -0.98162841796875, -0.9393310546875, -0.89703369140625, -0.854736328125, -0.81243896484375, -0.7701416015625, -0.72784423828125, -0.685546875, -0.64324951171875, -0.6009521484375, -0.55865478515625, -0.516357421875, -0.47406005859375, -0.4317626953125, -0.38946533203125, -0.34716796875, -0.30487060546875, -0.2625732421875, -0.22027587890625, -0.177978515625, -0.13568115234375, -0.0933837890625, -0.05108642578125, -0.0087890625, 0.03350830078125, 0.0758056640625, 0.11810302734375, 0.160400390625, 0.20269775390625, 0.2449951171875, 0.28729248046875, 0.32958984375, 0.37188720703125, 0.4141845703125, 0.45648193359375, 0.498779296875, 0.54107666015625, 0.5833740234375, 0.62567138671875, 0.66796875, 0.71026611328125, 0.7525634765625, 0.79486083984375, 0.837158203125, 0.87945556640625, 0.9217529296875, 0.96405029296875, 1.00634765625, 1.04864501953125, 1.0909423828125, 1.13323974609375, 1.175537109375, 1.21783447265625, 1.2601318359375, 1.30242919921875, 1.3447265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 10.0, 78.0, 713.0, 2937.0, 257.0, 58.0, 26.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2529296875, -1.21533203125, -1.177734375, -1.14013671875, -1.1025390625, -1.06494140625, -1.02734375, -0.98974609375, -0.9521484375, -0.91455078125, -0.876953125, -0.83935546875, -0.8017578125, -0.76416015625, -0.7265625, -0.68896484375, -0.6513671875, -0.61376953125, -0.576171875, -0.53857421875, -0.5009765625, -0.46337890625, -0.42578125, -0.38818359375, -0.3505859375, -0.31298828125, -0.275390625, -0.23779296875, -0.2001953125, -0.16259765625, -0.125, -0.08740234375, -0.0498046875, -0.01220703125, 0.025390625, 0.06298828125, 0.1005859375, 0.13818359375, 0.17578125, 0.21337890625, 0.2509765625, 0.28857421875, 0.326171875, 0.36376953125, 0.4013671875, 0.43896484375, 0.4765625, 0.51416015625, 0.5517578125, 0.58935546875, 0.626953125, 0.66455078125, 0.7021484375, 0.73974609375, 0.77734375, 0.81494140625, 0.8525390625, 0.89013671875, 0.927734375, 0.96533203125, 1.0029296875, 1.04052734375, 1.078125, 1.11572265625, 1.1533203125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 8.0, 15.0, 25.0, 62.0, 269.0, 386.0, 181.0, 36.0, 14.0, 6.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.843277931213379, -9.615950584411621, -9.38862419128418, -9.161296844482422, -8.933969497680664, -8.706643104553223, -8.479315757751465, -8.251989364624023, -8.024662017822266, -7.797335147857666, -7.570007801055908, -7.342680931091309, -7.115354061126709, -6.888027191162109, -6.660699844360352, -6.433372974395752, -6.206046104431152, -5.978719234466553, -5.751391887664795, -5.524065017700195, -5.296738147735596, -5.069411277770996, -4.842083930969238, -4.614757061004639, -4.387429714202881, -4.160102844238281, -3.9327757358551025, -3.705448627471924, -3.478121757507324, -3.2507946491241455, -3.023467540740967, -2.796140670776367, -2.5688138008117676, -2.341486692428589, -2.1141598224639893, -1.8868327140808105, -1.659505844116211, -1.4321787357330322, -1.204851746559143, -0.9775247573852539, -0.7501977682113647, -0.5228707790374756, -0.29554376006126404, -0.06821674108505249, 0.15911024808883667, 0.3864372968673706, 0.6137642860412598, 0.8410912752151489, 1.068418264389038, 1.2957452535629272, 1.5230722427368164, 1.7503993511199951, 1.9777262210845947, 2.2050533294677734, 2.432380199432373, 2.6597073078155518, 2.8870344161987305, 3.114361524581909, 3.341688394546509, 3.5690155029296875, 3.796342372894287, 4.023669242858887, 4.2509965896606445, 4.478323459625244, 4.705650329589844]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 6.0, 7.0, 12.0, 20.0, 20.0, 32.0, 43.0, 51.0, 56.0, 64.0, 94.0, 52.0, 92.0, 70.0, 72.0, 70.0, 56.0, 40.0, 36.0, 34.0, 21.0, 23.0, 9.0, 12.0, 7.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.7021191120147705, -1.633888840675354, -1.5656585693359375, -1.4974281787872314, -1.429197907447815, -1.3609676361083984, -1.2927372455596924, -1.2245069742202759, -1.1562767028808594, -1.0880464315414429, -1.0198161602020264, -0.9515857696533203, -0.8833554983139038, -0.8151252269744873, -0.746894896030426, -0.6786645650863647, -0.6104342937469482, -0.5422040224075317, -0.47397369146347046, -0.40574339032173157, -0.3375130891799927, -0.2692827880382538, -0.2010524868965149, -0.132822185754776, -0.06459188461303711, 0.0036384165287017822, 0.07186871767044067, 0.14009901881217957, 0.20832931995391846, 0.27655962109565735, 0.34478992223739624, 0.41302022337913513, 0.4812507629394531, 0.5494810342788696, 0.6177113652229309, 0.6859416961669922, 0.7541719675064087, 0.8224022388458252, 0.8906325697898865, 0.9588629007339478, 1.0270931720733643, 1.0953234434127808, 1.1635537147521973, 1.2317841053009033, 1.3000143766403198, 1.3682446479797363, 1.4364750385284424, 1.5047053098678589, 1.5729355812072754, 1.641165852546692, 1.7093961238861084, 1.7776265144348145, 1.845856785774231, 1.9140870571136475, 1.9823174476623535, 2.0505475997924805, 2.1187779903411865, 2.1870083808898926, 2.2552385330200195, 2.3234689235687256, 2.3916993141174316, 2.4599294662475586, 2.5281598567962646, 2.5963900089263916, 2.6646203994750977]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 13.0, 9.0, 15.0, 17.0, 23.0, 44.0, 60.0, 96.0, 140.0, 206.0, 371.0, 633.0, 1120.0, 1865.0, 3424.0, 6504.0, 12909.0, 26919.0, 58129.0, 125485.0, 236573.0, 265698.0, 162310.0, 76136.0, 35052.0, 16623.0, 8171.0, 4238.0, 2401.0, 1342.0, 772.0, 472.0, 282.0, 173.0, 116.0, 75.0, 44.0, 28.0, 18.0, 17.0, 10.0, 9.0, 7.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11474609375, -0.11081314086914062, -0.10688018798828125, -0.10294723510742188, -0.0990142822265625, -0.09508132934570312, -0.09114837646484375, -0.08721542358398438, -0.083282470703125, -0.07934951782226562, -0.07541656494140625, -0.07148361206054688, -0.0675506591796875, -0.06361770629882812, -0.05968475341796875, -0.055751800537109375, -0.05181884765625, -0.047885894775390625, -0.04395294189453125, -0.040019989013671875, -0.0360870361328125, -0.032154083251953125, -0.02822113037109375, -0.024288177490234375, -0.020355224609375, -0.016422271728515625, -0.01248931884765625, -0.008556365966796875, -0.0046234130859375, -0.000690460205078125, 0.00324249267578125, 0.007175445556640625, 0.0111083984375, 0.015041351318359375, 0.01897430419921875, 0.022907257080078125, 0.0268402099609375, 0.030773162841796875, 0.03470611572265625, 0.038639068603515625, 0.042572021484375, 0.046504974365234375, 0.05043792724609375, 0.054370880126953125, 0.0583038330078125, 0.062236785888671875, 0.06616973876953125, 0.07010269165039062, 0.07403564453125, 0.07796859741210938, 0.08190155029296875, 0.08583450317382812, 0.0897674560546875, 0.09370040893554688, 0.09763336181640625, 0.10156631469726562, 0.105499267578125, 0.10943222045898438, 0.11336517333984375, 0.11729812622070312, 0.1212310791015625, 0.12516403198242188, 0.12909698486328125, 0.13302993774414062, 0.136962890625]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 13.0, 23.0, 18.0, 30.0, 28.0, 26.0, 35.0, 43.0, 49.0, 65.0, 55.0, 61.0, 61.0, 59.0, 68.0, 63.0, 61.0, 55.0, 30.0, 44.0, 27.0, 21.0, 17.0, 10.0, 12.0, 9.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.11090087890625, -0.10689067840576172, -0.10288047790527344, -0.09887027740478516, -0.09486007690429688, -0.0908498764038086, -0.08683967590332031, -0.08282947540283203, -0.07881927490234375, -0.07480907440185547, -0.07079887390136719, -0.0667886734008789, -0.06277847290039062, -0.058768272399902344, -0.05475807189941406, -0.05074787139892578, -0.0467376708984375, -0.04272747039794922, -0.03871726989746094, -0.034707069396972656, -0.030696868896484375, -0.026686668395996094, -0.022676467895507812, -0.01866626739501953, -0.01465606689453125, -0.010645866394042969, -0.0066356658935546875, -0.0026254653930664062, 0.001384735107421875, 0.005394935607910156, 0.009405136108398438, 0.013415336608886719, 0.017425537109375, 0.02143573760986328, 0.025445938110351562, 0.029456138610839844, 0.033466339111328125, 0.037476539611816406, 0.04148674011230469, 0.04549694061279297, 0.04950714111328125, 0.05351734161376953, 0.05752754211425781, 0.061537742614746094, 0.06554794311523438, 0.06955814361572266, 0.07356834411621094, 0.07757854461669922, 0.0815887451171875, 0.08559894561767578, 0.08960914611816406, 0.09361934661865234, 0.09762954711914062, 0.1016397476196289, 0.10564994812011719, 0.10966014862060547, 0.11367034912109375, 0.11768054962158203, 0.12169075012207031, 0.1257009506225586, 0.12971115112304688, 0.13372135162353516, 0.13773155212402344, 0.14174175262451172, 0.145751953125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 4.0, 7.0, 14.0, 9.0, 16.0, 10.0, 32.0, 49.0, 68.0, 104.0, 175.0, 243.0, 446.0, 802.0, 1557.0, 3504.0, 9523.0, 32713.0, 142850.0, 589768.0, 200668.0, 45371.0, 12267.0, 4226.0, 1856.0, 950.0, 482.0, 293.0, 167.0, 120.0, 62.0, 57.0, 36.0, 31.0, 25.0, 11.0, 9.0, 4.0, 6.0, 7.0, 10.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.343505859375, -0.3346099853515625, -0.325714111328125, -0.3168182373046875, -0.30792236328125, -0.2990264892578125, -0.290130615234375, -0.2812347412109375, -0.2723388671875, -0.2634429931640625, -0.254547119140625, -0.2456512451171875, -0.23675537109375, -0.2278594970703125, -0.218963623046875, -0.2100677490234375, -0.201171875, -0.1922760009765625, -0.183380126953125, -0.1744842529296875, -0.16558837890625, -0.1566925048828125, -0.147796630859375, -0.1389007568359375, -0.1300048828125, -0.1211090087890625, -0.112213134765625, -0.1033172607421875, -0.09442138671875, -0.0855255126953125, -0.076629638671875, -0.0677337646484375, -0.058837890625, -0.0499420166015625, -0.041046142578125, -0.0321502685546875, -0.02325439453125, -0.0143585205078125, -0.005462646484375, 0.0034332275390625, 0.0123291015625, 0.0212249755859375, 0.030120849609375, 0.0390167236328125, 0.04791259765625, 0.0568084716796875, 0.065704345703125, 0.0746002197265625, 0.08349609375, 0.0923919677734375, 0.101287841796875, 0.1101837158203125, 0.11907958984375, 0.1279754638671875, 0.136871337890625, 0.1457672119140625, 0.1546630859375, 0.1635589599609375, 0.172454833984375, 0.1813507080078125, 0.19024658203125, 0.1991424560546875, 0.208038330078125, 0.2169342041015625, 0.225830078125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 6.0, 5.0, 4.0, 8.0, 14.0, 11.0, 17.0, 22.0, 17.0, 30.0, 23.0, 27.0, 37.0, 35.0, 38.0, 58.0, 48.0, 53.0, 49.0, 65.0, 57.0, 47.0, 38.0, 51.0, 32.0, 30.0, 26.0, 27.0, 20.0, 17.0, 11.0, 12.0, 14.0, 14.0, 6.0, 5.0, 8.0, 3.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.431884765625, -0.4180145263671875, -0.404144287109375, -0.3902740478515625, -0.37640380859375, -0.3625335693359375, -0.348663330078125, -0.3347930908203125, -0.3209228515625, -0.3070526123046875, -0.293182373046875, -0.2793121337890625, -0.26544189453125, -0.2515716552734375, -0.237701416015625, -0.2238311767578125, -0.2099609375, -0.1960906982421875, -0.182220458984375, -0.1683502197265625, -0.15447998046875, -0.1406097412109375, -0.126739501953125, -0.1128692626953125, -0.0989990234375, -0.0851287841796875, -0.071258544921875, -0.0573883056640625, -0.04351806640625, -0.0296478271484375, -0.015777587890625, -0.0019073486328125, 0.011962890625, 0.0258331298828125, 0.039703369140625, 0.0535736083984375, 0.06744384765625, 0.0813140869140625, 0.095184326171875, 0.1090545654296875, 0.1229248046875, 0.1367950439453125, 0.150665283203125, 0.1645355224609375, 0.17840576171875, 0.1922760009765625, 0.206146240234375, 0.2200164794921875, 0.23388671875, 0.2477569580078125, 0.261627197265625, 0.2754974365234375, 0.28936767578125, 0.3032379150390625, 0.317108154296875, 0.3309783935546875, 0.3448486328125, 0.3587188720703125, 0.372589111328125, 0.3864593505859375, 0.40032958984375, 0.4141998291015625, 0.428070068359375, 0.4419403076171875, 0.455810546875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 5.0, 0.0, 5.0, 5.0, 14.0, 20.0, 30.0, 34.0, 56.0, 108.0, 186.0, 297.0, 450.0, 741.0, 1295.0, 2432.0, 4762.0, 9908.0, 22852.0, 60076.0, 224239.0, 560238.0, 98849.0, 33870.0, 14130.0, 6602.0, 3227.0, 1757.0, 881.0, 566.0, 344.0, 204.0, 127.0, 84.0, 48.0, 41.0, 21.0, 13.0, 14.0, 8.0, 7.0, 4.0, 1.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1268310546875, -0.12248992919921875, -0.1181488037109375, -0.11380767822265625, -0.109466552734375, -0.10512542724609375, -0.1007843017578125, -0.09644317626953125, -0.09210205078125, -0.08776092529296875, -0.0834197998046875, -0.07907867431640625, -0.074737548828125, -0.07039642333984375, -0.0660552978515625, -0.06171417236328125, -0.057373046875, -0.05303192138671875, -0.0486907958984375, -0.04434967041015625, -0.040008544921875, -0.03566741943359375, -0.0313262939453125, -0.02698516845703125, -0.02264404296875, -0.01830291748046875, -0.0139617919921875, -0.00962066650390625, -0.005279541015625, -0.00093841552734375, 0.0034027099609375, 0.00774383544921875, 0.0120849609375, 0.01642608642578125, 0.0207672119140625, 0.02510833740234375, 0.029449462890625, 0.03379058837890625, 0.0381317138671875, 0.04247283935546875, 0.04681396484375, 0.05115509033203125, 0.0554962158203125, 0.05983734130859375, 0.064178466796875, 0.06851959228515625, 0.0728607177734375, 0.07720184326171875, 0.08154296875, 0.08588409423828125, 0.0902252197265625, 0.09456634521484375, 0.098907470703125, 0.10324859619140625, 0.1075897216796875, 0.11193084716796875, 0.11627197265625, 0.12061309814453125, 0.1249542236328125, 0.12929534912109375, 0.133636474609375, 0.13797760009765625, 0.1423187255859375, 0.14665985107421875, 0.1510009765625]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 4.0, 5.0, 6.0, 6.0, 4.0, 10.0, 7.0, 18.0, 15.0, 23.0, 17.0, 44.0, 63.0, 76.0, 92.0, 121.0, 143.0, 75.0, 80.0, 51.0, 34.0, 29.0, 17.0, 12.0, 11.0, 10.0, 6.0, 8.0, 4.0, 6.0, 6.0, 5.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.253885269165039e-05, -7.02710822224617e-05, -6.800331175327301e-05, -6.573554128408432e-05, -6.346777081489563e-05, -6.120000034570694e-05, -5.893222987651825e-05, -5.666445940732956e-05, -5.439668893814087e-05, -5.212891846895218e-05, -4.986114799976349e-05, -4.75933775305748e-05, -4.532560706138611e-05, -4.305783659219742e-05, -4.079006612300873e-05, -3.852229565382004e-05, -3.625452518463135e-05, -3.398675471544266e-05, -3.171898424625397e-05, -2.9451213777065277e-05, -2.7183443307876587e-05, -2.4915672838687897e-05, -2.2647902369499207e-05, -2.0380131900310516e-05, -1.8112361431121826e-05, -1.5844590961933136e-05, -1.3576820492744446e-05, -1.1309050023555756e-05, -9.041279554367065e-06, -6.773509085178375e-06, -4.505738615989685e-06, -2.237968146800995e-06, 2.9802322387695312e-08, 2.2975727915763855e-06, 4.565343260765076e-06, 6.833113729953766e-06, 9.100884199142456e-06, 1.1368654668331146e-05, 1.3636425137519836e-05, 1.5904195606708527e-05, 1.8171966075897217e-05, 2.0439736545085907e-05, 2.2707507014274597e-05, 2.4975277483463287e-05, 2.7243047952651978e-05, 2.9510818421840668e-05, 3.177858889102936e-05, 3.404635936021805e-05, 3.631412982940674e-05, 3.858190029859543e-05, 4.084967076778412e-05, 4.311744123697281e-05, 4.53852117061615e-05, 4.765298217535019e-05, 4.992075264453888e-05, 5.218852311372757e-05, 5.445629358291626e-05, 5.672406405210495e-05, 5.899183452129364e-05, 6.125960499048233e-05, 6.352737545967102e-05, 6.579514592885971e-05, 6.80629163980484e-05, 7.033068686723709e-05, 7.259845733642578e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 8.0, 4.0, 2.0, 13.0, 8.0, 8.0, 25.0, 19.0, 45.0, 76.0, 145.0, 202.0, 361.0, 759.0, 1508.0, 3440.0, 8663.0, 25459.0, 92459.0, 622167.0, 220397.0, 47693.0, 15028.0, 5584.0, 2263.0, 1000.0, 515.0, 267.0, 169.0, 93.0, 67.0, 35.0, 17.0, 18.0, 16.0, 10.0, 12.0, 7.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.186767578125, -0.18106651306152344, -0.17536544799804688, -0.1696643829345703, -0.16396331787109375, -0.1582622528076172, -0.15256118774414062, -0.14686012268066406, -0.1411590576171875, -0.13545799255371094, -0.12975692749023438, -0.12405586242675781, -0.11835479736328125, -0.11265373229980469, -0.10695266723632812, -0.10125160217285156, -0.095550537109375, -0.08984947204589844, -0.08414840698242188, -0.07844734191894531, -0.07274627685546875, -0.06704521179199219, -0.061344146728515625, -0.05564308166503906, -0.0499420166015625, -0.04424095153808594, -0.038539886474609375, -0.03283882141113281, -0.02713775634765625, -0.021436691284179688, -0.015735626220703125, -0.010034561157226562, -0.00433349609375, 0.0013675689697265625, 0.007068634033203125, 0.012769699096679688, 0.01847076416015625, 0.024171829223632812, 0.029872894287109375, 0.03557395935058594, 0.0412750244140625, 0.04697608947753906, 0.052677154541015625, 0.05837821960449219, 0.06407928466796875, 0.06978034973144531, 0.07548141479492188, 0.08118247985839844, 0.086883544921875, 0.09258460998535156, 0.09828567504882812, 0.10398674011230469, 0.10968780517578125, 0.11538887023925781, 0.12108993530273438, 0.12679100036621094, 0.1324920654296875, 0.13819313049316406, 0.14389419555664062, 0.1495952606201172, 0.15529632568359375, 0.1609973907470703, 0.16669845581054688, 0.17239952087402344, 0.1781005859375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 6.0, 9.0, 8.0, 11.0, 15.0, 21.0, 17.0, 20.0, 33.0, 30.0, 49.0, 52.0, 48.0, 85.0, 78.0, 73.0, 69.0, 48.0, 60.0, 57.0, 44.0, 27.0, 29.0, 15.0, 18.0, 15.0, 11.0, 6.0, 8.0, 5.0, 5.0, 4.0, 3.0, 4.0, 5.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.1456298828125, -0.1414785385131836, -0.1373271942138672, -0.13317584991455078, -0.12902450561523438, -0.12487316131591797, -0.12072181701660156, -0.11657047271728516, -0.11241912841796875, -0.10826778411865234, -0.10411643981933594, -0.09996509552001953, -0.09581375122070312, -0.09166240692138672, -0.08751106262207031, -0.0833597183227539, -0.0792083740234375, -0.0750570297241211, -0.07090568542480469, -0.06675434112548828, -0.06260299682617188, -0.05845165252685547, -0.05430030822753906, -0.050148963928222656, -0.04599761962890625, -0.041846275329589844, -0.03769493103027344, -0.03354358673095703, -0.029392242431640625, -0.02524089813232422, -0.021089553833007812, -0.016938209533691406, -0.012786865234375, -0.008635520935058594, -0.0044841766357421875, -0.00033283233642578125, 0.003818511962890625, 0.007969856262207031, 0.012121200561523438, 0.016272544860839844, 0.02042388916015625, 0.024575233459472656, 0.028726577758789062, 0.03287792205810547, 0.037029266357421875, 0.04118061065673828, 0.04533195495605469, 0.049483299255371094, 0.0536346435546875, 0.057785987854003906, 0.06193733215332031, 0.06608867645263672, 0.07024002075195312, 0.07439136505126953, 0.07854270935058594, 0.08269405364990234, 0.08684539794921875, 0.09099674224853516, 0.09514808654785156, 0.09929943084716797, 0.10345077514648438, 0.10760211944580078, 0.11175346374511719, 0.1159048080444336, 0.12005615234375]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 4.0, 6.0, 9.0, 14.0, 31.0, 59.0, 93.0, 154.0, 303.0, 145.0, 99.0, 43.0, 23.0, 9.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.1723456382751465, -4.047217845916748, -3.9220902919769287, -3.7969627380371094, -3.671834945678711, -3.5467071533203125, -3.421579599380493, -3.296452045440674, -3.1713242530822754, -3.046196460723877, -2.9210689067840576, -2.7959413528442383, -2.67081356048584, -2.5456857681274414, -2.420558214187622, -2.2954306602478027, -2.1703028678894043, -2.045175075531006, -1.9200475215911865, -1.7949198484420776, -1.6697921752929688, -1.5446645021438599, -1.419536828994751, -1.294409155845642, -1.1692814826965332, -1.0441538095474243, -0.9190261363983154, -0.7938984632492065, -0.6687707901000977, -0.5436431169509888, -0.4185154438018799, -0.293387770652771, -0.1682596206665039, -0.04313194751739502, 0.08199572563171387, 0.20712339878082275, 0.33225107192993164, 0.4573787450790405, 0.5825064182281494, 0.7076340913772583, 0.8327617645263672, 0.9578894376754761, 1.083017110824585, 1.2081447839736938, 1.3332724571228027, 1.4584001302719116, 1.5835278034210205, 1.7086554765701294, 1.8337831497192383, 1.9589108228683472, 2.084038496017456, 2.2091660499572754, 2.334293842315674, 2.4594216346740723, 2.5845491886138916, 2.709676742553711, 2.8348045349121094, 2.959932327270508, 3.085059881210327, 3.2101874351501465, 3.335315227508545, 3.4604430198669434, 3.5855705738067627, 3.710698127746582, 3.8358259201049805]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 2.0, 4.0, 5.0, 14.0, 8.0, 10.0, 17.0, 15.0, 18.0, 14.0, 16.0, 31.0, 31.0, 28.0, 27.0, 39.0, 30.0, 58.0, 64.0, 89.0, 93.0, 56.0, 40.0, 34.0, 38.0, 27.0, 18.0, 23.0, 23.0, 30.0, 18.0, 18.0, 14.0, 10.0, 6.0, 12.0, 5.0, 3.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 4.0], "bins": [-2.333367347717285, -2.2659389972686768, -2.1985104084014893, -2.131082057952881, -2.0636537075042725, -1.9962252378463745, -1.9287967681884766, -1.8613684177398682, -1.7939399480819702, -1.7265114784240723, -1.6590831279754639, -1.591654658317566, -1.524226188659668, -1.4567978382110596, -1.3893693685531616, -1.3219408988952637, -1.2545125484466553, -1.1870840787887573, -1.119655728340149, -1.052227258682251, -0.9847988486289978, -0.9173704385757446, -0.8499419689178467, -0.7825135588645935, -0.7150851488113403, -0.6476567387580872, -0.580228328704834, -0.512799859046936, -0.44537144899368286, -0.3779430389404297, -0.3105145990848541, -0.24308615922927856, -0.1756579875946045, -0.10822956264019012, -0.04080113768577576, 0.02662728726863861, 0.09405571222305298, 0.16148412227630615, 0.2289125621318817, 0.2963410019874573, 0.36376941204071045, 0.4311978220939636, 0.4986262619495392, 0.5660547018051147, 0.6334831118583679, 0.7009115219116211, 0.768339991569519, 0.8357684016227722, 0.9031968116760254, 0.9706252217292786, 1.0380536317825317, 1.1054821014404297, 1.172910451889038, 1.240338921546936, 1.307767391204834, 1.3751957416534424, 1.4426242113113403, 1.5100526809692383, 1.5774810314178467, 1.6449095010757446, 1.7123379707336426, 1.779766321182251, 1.847194790840149, 1.9146232604980469, 1.9820516109466553]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 6.0, 5.0, 9.0, 15.0, 24.0, 51.0, 77.0, 124.0, 218.0, 364.0, 597.0, 1160.0, 2436.0, 5793.0, 16995.0, 69843.0, 722678.0, 2929457.0, 377827.0, 45456.0, 12039.0, 4638.0, 2126.0, 1023.0, 555.0, 287.0, 182.0, 104.0, 77.0, 36.0, 27.0, 21.0, 10.0, 7.0, 7.0, 5.0, 5.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177978515625, -0.1719207763671875, -0.165863037109375, -0.1598052978515625, -0.15374755859375, -0.1476898193359375, -0.141632080078125, -0.1355743408203125, -0.1295166015625, -0.1234588623046875, -0.117401123046875, -0.1113433837890625, -0.10528564453125, -0.0992279052734375, -0.093170166015625, -0.0871124267578125, -0.0810546875, -0.0749969482421875, -0.068939208984375, -0.0628814697265625, -0.05682373046875, -0.0507659912109375, -0.044708251953125, -0.0386505126953125, -0.0325927734375, -0.0265350341796875, -0.020477294921875, -0.0144195556640625, -0.00836181640625, -0.0023040771484375, 0.003753662109375, 0.0098114013671875, 0.015869140625, 0.0219268798828125, 0.027984619140625, 0.0340423583984375, 0.04010009765625, 0.0461578369140625, 0.052215576171875, 0.0582733154296875, 0.0643310546875, 0.0703887939453125, 0.076446533203125, 0.0825042724609375, 0.08856201171875, 0.0946197509765625, 0.100677490234375, 0.1067352294921875, 0.11279296875, 0.1188507080078125, 0.124908447265625, 0.1309661865234375, 0.13702392578125, 0.1430816650390625, 0.149139404296875, 0.1551971435546875, 0.1612548828125, 0.1673126220703125, 0.173370361328125, 0.1794281005859375, 0.18548583984375, 0.1915435791015625, 0.197601318359375, 0.2036590576171875, 0.209716796875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 3.0, 3.0, 5.0, 11.0, 16.0, 21.0, 16.0, 31.0, 30.0, 29.0, 29.0, 55.0, 57.0, 57.0, 56.0, 41.0, 52.0, 49.0, 59.0, 50.0, 43.0, 45.0, 33.0, 45.0, 40.0, 19.0, 29.0, 16.0, 20.0, 8.0, 8.0, 7.0, 0.0, 5.0, 5.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08685302734375, -0.08333873748779297, -0.07982444763183594, -0.0763101577758789, -0.07279586791992188, -0.06928157806396484, -0.06576728820800781, -0.06225299835205078, -0.05873870849609375, -0.05522441864013672, -0.05171012878417969, -0.048195838928222656, -0.044681549072265625, -0.041167259216308594, -0.03765296936035156, -0.03413867950439453, -0.0306243896484375, -0.02711009979248047, -0.023595809936523438, -0.020081520080566406, -0.016567230224609375, -0.013052940368652344, -0.009538650512695312, -0.006024360656738281, -0.00251007080078125, 0.0010042190551757812, 0.0045185089111328125, 0.008032798767089844, 0.011547088623046875, 0.015061378479003906, 0.018575668334960938, 0.02208995819091797, 0.025604248046875, 0.02911853790283203, 0.03263282775878906, 0.036147117614746094, 0.039661407470703125, 0.043175697326660156, 0.04668998718261719, 0.05020427703857422, 0.05371856689453125, 0.05723285675048828, 0.06074714660644531, 0.06426143646240234, 0.06777572631835938, 0.0712900161743164, 0.07480430603027344, 0.07831859588623047, 0.0818328857421875, 0.08534717559814453, 0.08886146545410156, 0.0923757553100586, 0.09589004516601562, 0.09940433502197266, 0.10291862487792969, 0.10643291473388672, 0.10994720458984375, 0.11346149444580078, 0.11697578430175781, 0.12049007415771484, 0.12400436401367188, 0.1275186538696289, 0.13103294372558594, 0.13454723358154297, 0.1380615234375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 7.0, 5.0, 5.0, 12.0, 25.0, 44.0, 77.0, 151.0, 276.0, 563.0, 1973.0, 15882.0, 4000880.0, 167530.0, 5020.0, 999.0, 376.0, 203.0, 115.0, 68.0, 32.0, 25.0, 9.0, 6.0, 5.0, 2.0, 6.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0966796875, -1.0632171630859375, -1.029754638671875, -0.9962921142578125, -0.96282958984375, -0.9293670654296875, -0.895904541015625, -0.8624420166015625, -0.8289794921875, -0.7955169677734375, -0.762054443359375, -0.7285919189453125, -0.69512939453125, -0.6616668701171875, -0.628204345703125, -0.5947418212890625, -0.561279296875, -0.5278167724609375, -0.494354248046875, -0.4608917236328125, -0.42742919921875, -0.3939666748046875, -0.360504150390625, -0.3270416259765625, -0.2935791015625, -0.2601165771484375, -0.226654052734375, -0.1931915283203125, -0.15972900390625, -0.1262664794921875, -0.092803955078125, -0.0593414306640625, -0.02587890625, 0.0075836181640625, 0.041046142578125, 0.0745086669921875, 0.10797119140625, 0.1414337158203125, 0.174896240234375, 0.2083587646484375, 0.2418212890625, 0.2752838134765625, 0.308746337890625, 0.3422088623046875, 0.37567138671875, 0.4091339111328125, 0.442596435546875, 0.4760589599609375, 0.509521484375, 0.5429840087890625, 0.576446533203125, 0.6099090576171875, 0.64337158203125, 0.6768341064453125, 0.710296630859375, 0.7437591552734375, 0.7772216796875, 0.8106842041015625, 0.844146728515625, 0.8776092529296875, 0.91107177734375, 0.9445343017578125, 0.977996826171875, 1.0114593505859375, 1.044921875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 0.0, 2.0, 4.0, 7.0, 8.0, 9.0, 10.0, 22.0, 27.0, 42.0, 103.0, 245.0, 676.0, 1384.0, 947.0, 306.0, 126.0, 79.0, 25.0, 17.0, 13.0, 13.0, 3.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.410400390625, -0.3949546813964844, -0.37950897216796875, -0.3640632629394531, -0.3486175537109375, -0.3331718444824219, -0.31772613525390625, -0.3022804260253906, -0.286834716796875, -0.2713890075683594, -0.25594329833984375, -0.24049758911132812, -0.2250518798828125, -0.20960617065429688, -0.19416046142578125, -0.17871475219726562, -0.16326904296875, -0.14782333374023438, -0.13237762451171875, -0.11693191528320312, -0.1014862060546875, -0.08604049682617188, -0.07059478759765625, -0.055149078369140625, -0.039703369140625, -0.024257659912109375, -0.00881195068359375, 0.006633758544921875, 0.0220794677734375, 0.037525177001953125, 0.05297088623046875, 0.06841659545898438, 0.0838623046875, 0.09930801391601562, 0.11475372314453125, 0.13019943237304688, 0.1456451416015625, 0.16109085083007812, 0.17653656005859375, 0.19198226928710938, 0.207427978515625, 0.22287368774414062, 0.23831939697265625, 0.2537651062011719, 0.2692108154296875, 0.2846565246582031, 0.30010223388671875, 0.3155479431152344, 0.33099365234375, 0.3464393615722656, 0.36188507080078125, 0.3773307800292969, 0.3927764892578125, 0.4082221984863281, 0.42366790771484375, 0.4391136169433594, 0.454559326171875, 0.4700050354003906, 0.48545074462890625, 0.5008964538574219, 0.5163421630859375, 0.5317878723144531, 0.5472335815429688, 0.5626792907714844, 0.578125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 9.0, 28.0, 40.0, 72.0, 139.0, 226.0, 213.0, 138.0, 71.0, 40.0, 11.0, 6.0, 3.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.690418243408203, -2.540031909942627, -2.38964581489563, -2.2392594814300537, -2.0888731479644775, -1.938486933708191, -1.7881007194519043, -1.6377143859863281, -1.4873281717300415, -1.3369419574737549, -1.1865556240081787, -1.036169409751892, -0.8857831358909607, -0.7353968620300293, -0.5850106477737427, -0.4346243143081665, -0.2842381000518799, -0.13385184109210968, 0.016534417867660522, 0.16692066192626953, 0.3173069357872009, 0.4676932096481323, 0.618079423904419, 0.7684657573699951, 0.9188519716262817, 1.0692381858825684, 1.2196245193481445, 1.3700107336044312, 1.5203969478607178, 1.670783281326294, 1.8211694955825806, 1.9715558290481567, 2.1219420433044434, 2.2723283767700195, 2.4227144718170166, 2.5731008052825928, 2.723487138748169, 2.873873233795166, 3.024259567260742, 3.1746459007263184, 3.3250322341918945, 3.4754185676574707, 3.6258046627044678, 3.776190996170044, 3.92657732963562, 4.076963424682617, 4.227349758148193, 4.3777360916137695, 4.5281219482421875, 4.678508281707764, 4.82889461517334, 4.979280471801758, 5.129666805267334, 5.28005313873291, 5.430439472198486, 5.5808258056640625, 5.731212139129639, 5.881598472595215, 6.031984806060791, 6.182371139526367, 6.332756996154785, 6.483143329620361, 6.6335296630859375, 6.783915996551514, 6.93430233001709]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 13.0, 14.0, 16.0, 18.0, 17.0, 20.0, 17.0, 21.0, 39.0, 34.0, 35.0, 44.0, 50.0, 44.0, 40.0, 46.0, 47.0, 50.0, 37.0, 41.0, 50.0, 36.0, 35.0, 42.0, 37.0, 27.0, 22.0, 23.0, 19.0, 10.0, 7.0, 17.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4795427322387695, -1.4371159076690674, -1.3946890830993652, -1.352262258529663, -1.309835433959961, -1.2674086093902588, -1.2249817848205566, -1.1825549602508545, -1.1401281356811523, -1.0977013111114502, -1.055274486541748, -1.012847661972046, -0.9704208374023438, -0.9279940128326416, -0.8855672478675842, -0.8431404232978821, -0.8007136583328247, -0.7582868337631226, -0.7158600091934204, -0.6734331846237183, -0.6310063600540161, -0.588579535484314, -0.5461527705192566, -0.5037259459495544, -0.4612991213798523, -0.41887229681015015, -0.376445472240448, -0.33401867747306824, -0.2915918529033661, -0.24916502833366394, -0.20673823356628418, -0.16431140899658203, -0.12188446521759033, -0.07945764809846878, -0.03703083097934723, 0.005395978689193726, 0.047822803258895874, 0.09024962782859802, 0.13267642259597778, 0.17510324716567993, 0.21753007173538208, 0.25995689630508423, 0.3023837208747864, 0.34481051564216614, 0.3872373402118683, 0.42966416478157043, 0.4720909595489502, 0.5145177841186523, 0.5569446086883545, 0.5993714332580566, 0.6417982578277588, 0.6842250823974609, 0.7266519069671631, 0.7690787315368652, 0.8115054965019226, 0.8539323210716248, 0.8963591456413269, 0.938785970211029, 0.9812127947807312, 1.0236395597457886, 1.0660663843154907, 1.1084932088851929, 1.150920033454895, 1.1933468580245972, 1.2357736825942993]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 8.0, 8.0, 11.0, 14.0, 29.0, 34.0, 46.0, 68.0, 83.0, 193.0, 282.0, 471.0, 700.0, 1276.0, 2180.0, 3869.0, 6932.0, 13052.0, 24858.0, 49648.0, 98867.0, 189622.0, 263276.0, 189899.0, 98871.0, 49597.0, 25231.0, 13177.0, 6902.0, 3863.0, 2214.0, 1306.0, 727.0, 451.0, 269.0, 203.0, 117.0, 65.0, 43.0, 40.0, 20.0, 14.0, 8.0, 6.0, 6.0, 2.0, 3.0, 1.0, 2.0, 1.0], "bins": [-0.1580810546875, -0.15375041961669922, -0.14941978454589844, -0.14508914947509766, -0.14075851440429688, -0.1364278793334961, -0.1320972442626953, -0.12776660919189453, -0.12343597412109375, -0.11910533905029297, -0.11477470397949219, -0.1104440689086914, -0.10611343383789062, -0.10178279876708984, -0.09745216369628906, -0.09312152862548828, -0.0887908935546875, -0.08446025848388672, -0.08012962341308594, -0.07579898834228516, -0.07146835327148438, -0.0671377182006836, -0.06280708312988281, -0.05847644805908203, -0.05414581298828125, -0.04981517791748047, -0.04548454284667969, -0.041153907775878906, -0.036823272705078125, -0.032492637634277344, -0.028162002563476562, -0.02383136749267578, -0.019500732421875, -0.015170097351074219, -0.010839462280273438, -0.006508827209472656, -0.002178192138671875, 0.0021524429321289062, 0.0064830780029296875, 0.010813713073730469, 0.01514434814453125, 0.01947498321533203, 0.023805618286132812, 0.028136253356933594, 0.032466888427734375, 0.036797523498535156, 0.04112815856933594, 0.04545879364013672, 0.0497894287109375, 0.05412006378173828, 0.05845069885253906, 0.06278133392333984, 0.06711196899414062, 0.0714426040649414, 0.07577323913574219, 0.08010387420654297, 0.08443450927734375, 0.08876514434814453, 0.09309577941894531, 0.0974264144897461, 0.10175704956054688, 0.10608768463134766, 0.11041831970214844, 0.11474895477294922, 0.11907958984375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 9.0, 11.0, 13.0, 18.0, 24.0, 30.0, 37.0, 39.0, 47.0, 62.0, 59.0, 65.0, 71.0, 64.0, 77.0, 58.0, 56.0, 47.0, 53.0, 40.0, 25.0, 22.0, 19.0, 21.0, 12.0, 9.0, 3.0, 3.0, 5.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1859130859375, -0.1806354522705078, -0.17535781860351562, -0.17008018493652344, -0.16480255126953125, -0.15952491760253906, -0.15424728393554688, -0.1489696502685547, -0.1436920166015625, -0.1384143829345703, -0.13313674926757812, -0.12785911560058594, -0.12258148193359375, -0.11730384826660156, -0.11202621459960938, -0.10674858093261719, -0.101470947265625, -0.09619331359863281, -0.09091567993164062, -0.08563804626464844, -0.08036041259765625, -0.07508277893066406, -0.06980514526367188, -0.06452751159667969, -0.0592498779296875, -0.05397224426269531, -0.048694610595703125, -0.04341697692871094, -0.03813934326171875, -0.03286170959472656, -0.027584075927734375, -0.022306442260742188, -0.01702880859375, -0.011751174926757812, -0.006473541259765625, -0.0011959075927734375, 0.00408172607421875, 0.009359359741210938, 0.014636993408203125, 0.019914627075195312, 0.0251922607421875, 0.030469894409179688, 0.035747528076171875, 0.04102516174316406, 0.04630279541015625, 0.05158042907714844, 0.056858062744140625, 0.06213569641113281, 0.067413330078125, 0.07269096374511719, 0.07796859741210938, 0.08324623107910156, 0.08852386474609375, 0.09380149841308594, 0.09907913208007812, 0.10435676574707031, 0.1096343994140625, 0.11491203308105469, 0.12018966674804688, 0.12546730041503906, 0.13074493408203125, 0.13602256774902344, 0.14130020141601562, 0.1465778350830078, 0.15185546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 9.0, 9.0, 10.0, 13.0, 24.0, 31.0, 35.0, 49.0, 75.0, 112.0, 155.0, 263.0, 355.0, 752.0, 1612.0, 4151.0, 15140.0, 75759.0, 618386.0, 270161.0, 45269.0, 10079.0, 3193.0, 1228.0, 610.0, 376.0, 207.0, 141.0, 106.0, 64.0, 50.0, 30.0, 24.0, 21.0, 17.0, 7.0, 9.0, 5.0, 3.0, 7.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.344970703125, -0.332122802734375, -0.31927490234375, -0.306427001953125, -0.2935791015625, -0.280731201171875, -0.26788330078125, -0.255035400390625, -0.2421875, -0.229339599609375, -0.21649169921875, -0.203643798828125, -0.1907958984375, -0.177947998046875, -0.16510009765625, -0.152252197265625, -0.139404296875, -0.126556396484375, -0.11370849609375, -0.100860595703125, -0.0880126953125, -0.075164794921875, -0.06231689453125, -0.049468994140625, -0.03662109375, -0.023773193359375, -0.01092529296875, 0.001922607421875, 0.0147705078125, 0.027618408203125, 0.04046630859375, 0.053314208984375, 0.066162109375, 0.079010009765625, 0.09185791015625, 0.104705810546875, 0.1175537109375, 0.130401611328125, 0.14324951171875, 0.156097412109375, 0.1689453125, 0.181793212890625, 0.19464111328125, 0.207489013671875, 0.2203369140625, 0.233184814453125, 0.24603271484375, 0.258880615234375, 0.271728515625, 0.284576416015625, 0.29742431640625, 0.310272216796875, 0.3231201171875, 0.335968017578125, 0.34881591796875, 0.361663818359375, 0.37451171875, 0.387359619140625, 0.40020751953125, 0.413055419921875, 0.4259033203125, 0.438751220703125, 0.45159912109375, 0.464447021484375, 0.477294921875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 4.0, 6.0, 4.0, 2.0, 7.0, 5.0, 8.0, 10.0, 10.0, 22.0, 17.0, 27.0, 24.0, 29.0, 38.0, 34.0, 33.0, 50.0, 57.0, 60.0, 72.0, 58.0, 52.0, 67.0, 46.0, 39.0, 44.0, 37.0, 24.0, 20.0, 23.0, 17.0, 10.0, 11.0, 9.0, 6.0, 5.0, 6.0, 5.0, 3.0, 1.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.51806640625, -0.50152587890625, -0.4849853515625, -0.46844482421875, -0.451904296875, -0.43536376953125, -0.4188232421875, -0.40228271484375, -0.3857421875, -0.36920166015625, -0.3526611328125, -0.33612060546875, -0.319580078125, -0.30303955078125, -0.2864990234375, -0.26995849609375, -0.25341796875, -0.23687744140625, -0.2203369140625, -0.20379638671875, -0.187255859375, -0.17071533203125, -0.1541748046875, -0.13763427734375, -0.12109375, -0.10455322265625, -0.0880126953125, -0.07147216796875, -0.054931640625, -0.03839111328125, -0.0218505859375, -0.00531005859375, 0.01123046875, 0.02777099609375, 0.0443115234375, 0.06085205078125, 0.077392578125, 0.09393310546875, 0.1104736328125, 0.12701416015625, 0.1435546875, 0.16009521484375, 0.1766357421875, 0.19317626953125, 0.209716796875, 0.22625732421875, 0.2427978515625, 0.25933837890625, 0.27587890625, 0.29241943359375, 0.3089599609375, 0.32550048828125, 0.342041015625, 0.35858154296875, 0.3751220703125, 0.39166259765625, 0.408203125, 0.42474365234375, 0.4412841796875, 0.45782470703125, 0.474365234375, 0.49090576171875, 0.5074462890625, 0.52398681640625, 0.54052734375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 10.0, 2.0, 5.0, 4.0, 7.0, 10.0, 16.0, 15.0, 33.0, 38.0, 46.0, 77.0, 153.0, 205.0, 412.0, 810.0, 1554.0, 3419.0, 8491.0, 25140.0, 95172.0, 681063.0, 171488.0, 39051.0, 12304.0, 4642.0, 1985.0, 1021.0, 560.0, 293.0, 189.0, 123.0, 61.0, 45.0, 35.0, 21.0, 17.0, 11.0, 7.0, 8.0, 4.0, 3.0, 3.0, 1.0, 4.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2059326171875, -0.20016098022460938, -0.19438934326171875, -0.18861770629882812, -0.1828460693359375, -0.17707443237304688, -0.17130279541015625, -0.16553115844726562, -0.159759521484375, -0.15398788452148438, -0.14821624755859375, -0.14244461059570312, -0.1366729736328125, -0.13090133666992188, -0.12512969970703125, -0.11935806274414062, -0.11358642578125, -0.10781478881835938, -0.10204315185546875, -0.09627151489257812, -0.0904998779296875, -0.08472824096679688, -0.07895660400390625, -0.07318496704101562, -0.067413330078125, -0.061641693115234375, -0.05587005615234375, -0.050098419189453125, -0.0443267822265625, -0.038555145263671875, -0.03278350830078125, -0.027011871337890625, -0.021240234375, -0.015468597412109375, -0.00969696044921875, -0.003925323486328125, 0.0018463134765625, 0.007617950439453125, 0.01338958740234375, 0.019161224365234375, 0.024932861328125, 0.030704498291015625, 0.03647613525390625, 0.042247772216796875, 0.0480194091796875, 0.053791046142578125, 0.05956268310546875, 0.06533432006835938, 0.07110595703125, 0.07687759399414062, 0.08264923095703125, 0.08842086791992188, 0.0941925048828125, 0.09996414184570312, 0.10573577880859375, 0.11150741577148438, 0.117279052734375, 0.12305068969726562, 0.12882232666015625, 0.13459396362304688, 0.1403656005859375, 0.14613723754882812, 0.15190887451171875, 0.15768051147460938, 0.1634521484375]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 5.0, 8.0, 4.0, 4.0, 14.0, 15.0, 10.0, 14.0, 19.0, 35.0, 31.0, 45.0, 52.0, 104.0, 147.0, 135.0, 80.0, 66.0, 50.0, 36.0, 28.0, 17.0, 18.0, 10.0, 6.0, 8.0, 8.0, 7.0, 6.0, 6.0, 5.0, 1.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.396936416625977e-05, -7.179006934165955e-05, -6.961077451705933e-05, -6.74314796924591e-05, -6.525218486785889e-05, -6.307289004325867e-05, -6.089359521865845e-05, -5.871430039405823e-05, -5.653500556945801e-05, -5.435571074485779e-05, -5.217641592025757e-05, -4.999712109565735e-05, -4.781782627105713e-05, -4.563853144645691e-05, -4.345923662185669e-05, -4.127994179725647e-05, -3.910064697265625e-05, -3.692135214805603e-05, -3.474205732345581e-05, -3.256276249885559e-05, -3.038346767425537e-05, -2.820417284965515e-05, -2.602487802505493e-05, -2.3845583200454712e-05, -2.1666288375854492e-05, -1.9486993551254272e-05, -1.7307698726654053e-05, -1.5128403902053833e-05, -1.2949109077453613e-05, -1.0769814252853394e-05, -8.590519428253174e-06, -6.411224603652954e-06, -4.231929779052734e-06, -2.0526349544525146e-06, 1.2665987014770508e-07, 2.305954694747925e-06, 4.4852495193481445e-06, 6.664544343948364e-06, 8.843839168548584e-06, 1.1023133993148804e-05, 1.3202428817749023e-05, 1.5381723642349243e-05, 1.7561018466949463e-05, 1.9740313291549683e-05, 2.1919608116149902e-05, 2.4098902940750122e-05, 2.6278197765350342e-05, 2.845749258995056e-05, 3.063678741455078e-05, 3.2816082239151e-05, 3.499537706375122e-05, 3.717467188835144e-05, 3.935396671295166e-05, 4.153326153755188e-05, 4.37125563621521e-05, 4.589185118675232e-05, 4.807114601135254e-05, 5.025044083595276e-05, 5.242973566055298e-05, 5.46090304851532e-05, 5.678832530975342e-05, 5.896762013435364e-05, 6.114691495895386e-05, 6.332620978355408e-05, 6.55055046081543e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 3.0, 4.0, 4.0, 11.0, 13.0, 8.0, 17.0, 22.0, 48.0, 29.0, 60.0, 113.0, 179.0, 338.0, 639.0, 1392.0, 3597.0, 11229.0, 45735.0, 297129.0, 610290.0, 56599.0, 13628.0, 4244.0, 1571.0, 715.0, 390.0, 213.0, 114.0, 78.0, 39.0, 30.0, 29.0, 17.0, 12.0, 5.0, 5.0, 1.0, 3.0, 4.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.218994140625, -0.21216583251953125, -0.2053375244140625, -0.19850921630859375, -0.191680908203125, -0.18485260009765625, -0.1780242919921875, -0.17119598388671875, -0.16436767578125, -0.15753936767578125, -0.1507110595703125, -0.14388275146484375, -0.137054443359375, -0.13022613525390625, -0.1233978271484375, -0.11656951904296875, -0.1097412109375, -0.10291290283203125, -0.0960845947265625, -0.08925628662109375, -0.082427978515625, -0.07559967041015625, -0.0687713623046875, -0.06194305419921875, -0.05511474609375, -0.04828643798828125, -0.0414581298828125, -0.03462982177734375, -0.027801513671875, -0.02097320556640625, -0.0141448974609375, -0.00731658935546875, -0.00048828125, 0.00634002685546875, 0.0131683349609375, 0.01999664306640625, 0.026824951171875, 0.03365325927734375, 0.0404815673828125, 0.04730987548828125, 0.05413818359375, 0.06096649169921875, 0.0677947998046875, 0.07462310791015625, 0.081451416015625, 0.08827972412109375, 0.0951080322265625, 0.10193634033203125, 0.1087646484375, 0.11559295654296875, 0.1224212646484375, 0.12924957275390625, 0.136077880859375, 0.14290618896484375, 0.1497344970703125, 0.15656280517578125, 0.16339111328125, 0.17021942138671875, 0.1770477294921875, 0.18387603759765625, 0.190704345703125, 0.19753265380859375, 0.2043609619140625, 0.21118927001953125, 0.218017578125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 3.0, 5.0, 4.0, 5.0, 6.0, 7.0, 10.0, 14.0, 15.0, 27.0, 14.0, 22.0, 26.0, 31.0, 47.0, 50.0, 77.0, 67.0, 88.0, 87.0, 85.0, 50.0, 44.0, 40.0, 28.0, 20.0, 25.0, 18.0, 14.0, 17.0, 8.0, 4.0, 7.0, 4.0, 7.0, 6.0, 4.0, 5.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.140869140625, -0.13666915893554688, -0.13246917724609375, -0.12826919555664062, -0.1240692138671875, -0.11986923217773438, -0.11566925048828125, -0.11146926879882812, -0.107269287109375, -0.10306930541992188, -0.09886932373046875, -0.09466934204101562, -0.0904693603515625, -0.08626937866210938, -0.08206939697265625, -0.07786941528320312, -0.07366943359375, -0.06946945190429688, -0.06526947021484375, -0.061069488525390625, -0.0568695068359375, -0.052669525146484375, -0.04846954345703125, -0.044269561767578125, -0.040069580078125, -0.035869598388671875, -0.03166961669921875, -0.027469635009765625, -0.0232696533203125, -0.019069671630859375, -0.01486968994140625, -0.010669708251953125, -0.0064697265625, -0.002269744873046875, 0.00193023681640625, 0.006130218505859375, 0.0103302001953125, 0.014530181884765625, 0.01873016357421875, 0.022930145263671875, 0.027130126953125, 0.031330108642578125, 0.03553009033203125, 0.039730072021484375, 0.0439300537109375, 0.048130035400390625, 0.05233001708984375, 0.056529998779296875, 0.06072998046875, 0.06492996215820312, 0.06912994384765625, 0.07332992553710938, 0.0775299072265625, 0.08172988891601562, 0.08592987060546875, 0.09012985229492188, 0.094329833984375, 0.09852981567382812, 0.10272979736328125, 0.10692977905273438, 0.1111297607421875, 0.11532974243164062, 0.11952972412109375, 0.12372970581054688, 0.1279296875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 11.0, 17.0, 38.0, 80.0, 139.0, 364.0, 170.0, 109.0, 45.0, 18.0, 6.0, 4.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.640695095062256, -4.466111660003662, -4.29152774810791, -4.116944313049316, -3.9423604011535645, -3.7677769660949707, -3.593193292617798, -3.418609619140625, -3.244025945663452, -3.0694422721862793, -2.8948585987091064, -2.7202749252319336, -2.54569149017334, -2.371107578277588, -2.196524143218994, -2.0219404697418213, -1.8473567962646484, -1.6727731227874756, -1.4981894493103027, -1.3236058950424194, -1.1490222215652466, -0.9744385480880737, -0.7998549938201904, -0.6252713203430176, -0.4506876468658447, -0.27610400319099426, -0.1015203595161438, 0.07306325435638428, 0.24764692783355713, 0.42223060131073, 0.5968141555786133, 0.7713978290557861, 0.945981502532959, 1.1205651760101318, 1.2951488494873047, 1.469732403755188, 1.6443160772323608, 1.8188997507095337, 1.993483304977417, 2.16806697845459, 2.3426506519317627, 2.5172343254089355, 2.6918179988861084, 2.8664016723632812, 3.040985107421875, 3.215569019317627, 3.3901524543762207, 3.5647361278533936, 3.7393198013305664, 3.9139034748077393, 4.088487148284912, 4.263070583343506, 4.437654495239258, 4.612237930297852, 4.786821365356445, 4.961405277252197, 5.135989189147949, 5.310572624206543, 5.485156536102295, 5.659739971160889, 5.834323883056641, 6.008907318115234, 6.183490753173828, 6.35807466506958, 6.532658100128174]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 7.0, 11.0, 15.0, 11.0, 13.0, 18.0, 13.0, 19.0, 28.0, 26.0, 28.0, 43.0, 48.0, 39.0, 60.0, 118.0, 113.0, 59.0, 45.0, 36.0, 27.0, 33.0, 26.0, 25.0, 15.0, 16.0, 25.0, 17.0, 12.0, 9.0, 12.0, 7.0, 6.0, 8.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.0913805961608887, -2.0191664695739746, -1.94695246219635, -1.8747384548187256, -1.8025243282318115, -1.730310320854187, -1.6580963134765625, -1.5858821868896484, -1.513668179512024, -1.4414541721343994, -1.3692400455474854, -1.2970260381698608, -1.2248120307922363, -1.1525979042053223, -1.0803838968276978, -1.0081698894500732, -0.9359557628631592, -0.8637416958808899, -0.7915276288986206, -0.7193136215209961, -0.6470995545387268, -0.5748854875564575, -0.502671480178833, -0.4304574131965637, -0.35824334621429443, -0.28602927923202515, -0.21381524205207825, -0.14160118997097015, -0.06938713788986206, 0.0028269290924072266, 0.07504096627235413, 0.14725500345230103, 0.2194690704345703, 0.2916831374168396, 0.3638971745967865, 0.4361112117767334, 0.5083252787590027, 0.580539345741272, 0.6527533531188965, 0.7249674201011658, 0.7971814870834351, 0.8693955540657043, 0.9416096210479736, 1.0138236284255981, 1.0860376358032227, 1.1582517623901367, 1.2304657697677612, 1.3026797771453857, 1.3748939037322998, 1.4471079111099243, 1.5193220376968384, 1.591536045074463, 1.663750171661377, 1.7359641790390015, 1.808178186416626, 1.88039231300354, 1.9526063203811646, 2.024820327758789, 2.097034454345703, 2.169248580932617, 2.241462469100952, 2.313676595687866, 2.3858907222747803, 2.4581046104431152, 2.5303187370300293]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 2.0, 5.0, 8.0, 7.0, 11.0, 13.0, 24.0, 24.0, 43.0, 61.0, 74.0, 129.0, 195.0, 348.0, 630.0, 1063.0, 2056.0, 4109.0, 10045.0, 32062.0, 207316.0, 2305538.0, 1471904.0, 120520.0, 22715.0, 7693.0, 3458.0, 1725.0, 948.0, 550.0, 374.0, 184.0, 153.0, 92.0, 55.0, 39.0, 32.0, 21.0, 18.0, 9.0, 8.0, 13.0, 3.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2325439453125, -0.225250244140625, -0.21795654296875, -0.210662841796875, -0.203369140625, -0.196075439453125, -0.18878173828125, -0.181488037109375, -0.1741943359375, -0.166900634765625, -0.15960693359375, -0.152313232421875, -0.14501953125, -0.137725830078125, -0.13043212890625, -0.123138427734375, -0.1158447265625, -0.108551025390625, -0.10125732421875, -0.093963623046875, -0.086669921875, -0.079376220703125, -0.07208251953125, -0.064788818359375, -0.0574951171875, -0.050201416015625, -0.04290771484375, -0.035614013671875, -0.0283203125, -0.021026611328125, -0.01373291015625, -0.006439208984375, 0.0008544921875, 0.008148193359375, 0.01544189453125, 0.022735595703125, 0.030029296875, 0.037322998046875, 0.04461669921875, 0.051910400390625, 0.0592041015625, 0.066497802734375, 0.07379150390625, 0.081085205078125, 0.08837890625, 0.095672607421875, 0.10296630859375, 0.110260009765625, 0.1175537109375, 0.124847412109375, 0.13214111328125, 0.139434814453125, 0.146728515625, 0.154022216796875, 0.16131591796875, 0.168609619140625, 0.1759033203125, 0.183197021484375, 0.19049072265625, 0.197784423828125, 0.205078125, 0.212371826171875, 0.21966552734375, 0.226959228515625, 0.2342529296875]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 6.0, 1.0, 4.0, 7.0, 9.0, 17.0, 12.0, 12.0, 8.0, 24.0, 18.0, 17.0, 24.0, 26.0, 30.0, 28.0, 31.0, 31.0, 44.0, 36.0, 53.0, 43.0, 44.0, 37.0, 43.0, 41.0, 41.0, 43.0, 34.0, 30.0, 32.0, 39.0, 15.0, 25.0, 17.0, 15.0, 11.0, 12.0, 8.0, 7.0, 4.0, 7.0, 5.0, 2.0, 2.0, 2.0, 3.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.09619140625, -0.09303569793701172, -0.08987998962402344, -0.08672428131103516, -0.08356857299804688, -0.0804128646850586, -0.07725715637207031, -0.07410144805908203, -0.07094573974609375, -0.06779003143310547, -0.06463432312011719, -0.061478614807128906, -0.058322906494140625, -0.055167198181152344, -0.05201148986816406, -0.04885578155517578, -0.0457000732421875, -0.04254436492919922, -0.03938865661621094, -0.036232948303222656, -0.033077239990234375, -0.029921531677246094, -0.026765823364257812, -0.02361011505126953, -0.02045440673828125, -0.01729869842529297, -0.014142990112304688, -0.010987281799316406, -0.007831573486328125, -0.004675865173339844, -0.0015201568603515625, 0.0016355514526367188, 0.004791259765625, 0.007946968078613281, 0.011102676391601562, 0.014258384704589844, 0.017414093017578125, 0.020569801330566406, 0.023725509643554688, 0.02688121795654297, 0.03003692626953125, 0.03319263458251953, 0.03634834289550781, 0.039504051208496094, 0.042659759521484375, 0.045815467834472656, 0.04897117614746094, 0.05212688446044922, 0.0552825927734375, 0.05843830108642578, 0.06159400939941406, 0.06474971771240234, 0.06790542602539062, 0.0710611343383789, 0.07421684265136719, 0.07737255096435547, 0.08052825927734375, 0.08368396759033203, 0.08683967590332031, 0.0899953842163086, 0.09315109252929688, 0.09630680084228516, 0.09946250915527344, 0.10261821746826172, 0.10577392578125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 3.0, 8.0, 11.0, 30.0, 61.0, 115.0, 223.0, 503.0, 1257.0, 5312.0, 112352.0, 4045414.0, 24615.0, 2778.0, 859.0, 352.0, 187.0, 96.0, 47.0, 21.0, 17.0, 9.0, 7.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1259765625, -1.088836669921875, -1.05169677734375, -1.014556884765625, -0.9774169921875, -0.940277099609375, -0.90313720703125, -0.865997314453125, -0.828857421875, -0.791717529296875, -0.75457763671875, -0.717437744140625, -0.6802978515625, -0.643157958984375, -0.60601806640625, -0.568878173828125, -0.53173828125, -0.494598388671875, -0.45745849609375, -0.420318603515625, -0.3831787109375, -0.346038818359375, -0.30889892578125, -0.271759033203125, -0.234619140625, -0.197479248046875, -0.16033935546875, -0.123199462890625, -0.0860595703125, -0.048919677734375, -0.01177978515625, 0.025360107421875, 0.0625, 0.099639892578125, 0.13677978515625, 0.173919677734375, 0.2110595703125, 0.248199462890625, 0.28533935546875, 0.322479248046875, 0.359619140625, 0.396759033203125, 0.43389892578125, 0.471038818359375, 0.5081787109375, 0.545318603515625, 0.58245849609375, 0.619598388671875, 0.65673828125, 0.693878173828125, 0.73101806640625, 0.768157958984375, 0.8052978515625, 0.842437744140625, 0.87957763671875, 0.916717529296875, 0.953857421875, 0.990997314453125, 1.02813720703125, 1.065277099609375, 1.1024169921875, 1.139556884765625, 1.17669677734375, 1.213836669921875, 1.2509765625]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 4.0, 8.0, 8.0, 15.0, 24.0, 60.0, 113.0, 308.0, 1005.0, 1574.0, 601.0, 197.0, 68.0, 34.0, 19.0, 17.0, 12.0, 6.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.74560546875, -0.7209625244140625, -0.696319580078125, -0.6716766357421875, -0.64703369140625, -0.6223907470703125, -0.597747802734375, -0.5731048583984375, -0.5484619140625, -0.5238189697265625, -0.499176025390625, -0.4745330810546875, -0.44989013671875, -0.4252471923828125, -0.400604248046875, -0.3759613037109375, -0.351318359375, -0.3266754150390625, -0.302032470703125, -0.2773895263671875, -0.25274658203125, -0.2281036376953125, -0.203460693359375, -0.1788177490234375, -0.1541748046875, -0.1295318603515625, -0.104888916015625, -0.0802459716796875, -0.05560302734375, -0.0309600830078125, -0.006317138671875, 0.0183258056640625, 0.04296875, 0.0676116943359375, 0.092254638671875, 0.1168975830078125, 0.14154052734375, 0.1661834716796875, 0.190826416015625, 0.2154693603515625, 0.2401123046875, 0.2647552490234375, 0.289398193359375, 0.3140411376953125, 0.33868408203125, 0.3633270263671875, 0.387969970703125, 0.4126129150390625, 0.437255859375, 0.4618988037109375, 0.486541748046875, 0.5111846923828125, 0.53582763671875, 0.5604705810546875, 0.585113525390625, 0.6097564697265625, 0.6343994140625, 0.6590423583984375, 0.683685302734375, 0.7083282470703125, 0.73297119140625, 0.7576141357421875, 0.782257080078125, 0.8069000244140625, 0.83154296875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 6.0, 6.0, 7.0, 16.0, 33.0, 83.0, 160.0, 253.0, 200.0, 128.0, 64.0, 23.0, 17.0, 8.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3496012687683105, -7.156341552734375, -6.963081359863281, -6.769821643829346, -6.576561450958252, -6.383301734924316, -6.190041542053223, -5.996781826019287, -5.803522109985352, -5.610262393951416, -5.417002201080322, -5.223742485046387, -5.030482292175293, -4.837222576141357, -4.643962860107422, -4.450702667236328, -4.257442474365234, -4.064182758331299, -3.870922565460205, -3.6776628494262695, -3.484402894973755, -3.2911429405212402, -3.0978829860687256, -2.904623031616211, -2.7113633155822754, -2.5181033611297607, -2.324843406677246, -2.1315836906433105, -1.938323736190796, -1.7450637817382812, -1.5518038272857666, -1.3585439920425415, -1.1652841567993164, -0.9720242619514465, -0.7787643671035767, -0.585504412651062, -0.39224451780319214, -0.19898462295532227, -0.005724668502807617, 0.18753516674041748, 0.38079512119293213, 0.574055016040802, 0.7673149108886719, 0.9605748653411865, 1.1538348197937012, 1.3470946550369263, 1.540354609489441, 1.733614444732666, 1.9268743991851807, 2.1201343536376953, 2.31339430809021, 2.5066542625427246, 2.69991397857666, 2.893173933029175, 3.0864338874816895, 3.279693603515625, 3.4729537963867188, 3.6662137508392334, 3.859473705291748, 4.052733421325684, 4.245993614196777, 4.439253330230713, 4.632513046264648, 4.825773239135742, 5.019032955169678]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 1.0, 0.0, 4.0, 7.0, 3.0, 4.0, 8.0, 8.0, 16.0, 11.0, 13.0, 10.0, 13.0, 13.0, 20.0, 24.0, 19.0, 27.0, 20.0, 32.0, 35.0, 33.0, 44.0, 39.0, 47.0, 45.0, 46.0, 40.0, 42.0, 44.0, 44.0, 29.0, 35.0, 29.0, 27.0, 24.0, 16.0, 18.0, 17.0, 16.0, 13.0, 7.0, 13.0, 5.0, 12.0, 5.0, 5.0, 3.0, 1.0, 8.0, 7.0, 2.0, 4.0, 1.0, 3.0, 2.0, 1.0], "bins": [-1.4641828536987305, -1.419396996498108, -1.3746110200881958, -1.3298251628875732, -1.2850393056869507, -1.2402534484863281, -1.195467472076416, -1.1506816148757935, -1.105895757675171, -1.0611099004745483, -1.0163239240646362, -0.9715380668640137, -0.9267522096633911, -0.8819662928581238, -0.8371803760528564, -0.7923945188522339, -0.7476085424423218, -0.7028226256370544, -0.6580367684364319, -0.6132508516311646, -0.568464994430542, -0.5236790776252747, -0.4788931608200073, -0.4341072738170624, -0.38932138681411743, -0.3445354998111725, -0.29974961280822754, -0.2549636960029602, -0.21017780900001526, -0.1653919219970703, -0.12060600519180298, -0.07582011818885803, -0.031034231185913086, 0.013751663267612457, 0.058537557721138, 0.10332345962524414, 0.1481093466281891, 0.19289523363113403, 0.23768115043640137, 0.2824670374393463, 0.32725292444229126, 0.3720388114452362, 0.41682469844818115, 0.4616106152534485, 0.5063965320587158, 0.5511823892593384, 0.5959683060646057, 0.640754222869873, 0.6855400800704956, 0.7303259968757629, 0.7751118540763855, 0.8198977708816528, 0.8646836280822754, 0.9094695448875427, 0.9542554616928101, 0.9990413188934326, 1.0438272953033447, 1.0886131525039673, 1.1333991289138794, 1.178184986114502, 1.2229708433151245, 1.267756700515747, 1.3125426769256592, 1.3573285341262817, 1.4021143913269043]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 8.0, 13.0, 26.0, 36.0, 50.0, 82.0, 136.0, 211.0, 367.0, 672.0, 1231.0, 2241.0, 4528.0, 9234.0, 20865.0, 50579.0, 136766.0, 339584.0, 295948.0, 109882.0, 41981.0, 17651.0, 7951.0, 3942.0, 2015.0, 1046.0, 624.0, 344.0, 212.0, 113.0, 87.0, 49.0, 26.0, 23.0, 16.0, 9.0, 5.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.292236328125, -0.2836151123046875, -0.274993896484375, -0.2663726806640625, -0.25775146484375, -0.2491302490234375, -0.240509033203125, -0.2318878173828125, -0.2232666015625, -0.2146453857421875, -0.206024169921875, -0.1974029541015625, -0.18878173828125, -0.1801605224609375, -0.171539306640625, -0.1629180908203125, -0.154296875, -0.1456756591796875, -0.137054443359375, -0.1284332275390625, -0.11981201171875, -0.1111907958984375, -0.102569580078125, -0.0939483642578125, -0.0853271484375, -0.0767059326171875, -0.068084716796875, -0.0594635009765625, -0.05084228515625, -0.0422210693359375, -0.033599853515625, -0.0249786376953125, -0.016357421875, -0.0077362060546875, 0.000885009765625, 0.0095062255859375, 0.01812744140625, 0.0267486572265625, 0.035369873046875, 0.0439910888671875, 0.0526123046875, 0.0612335205078125, 0.069854736328125, 0.0784759521484375, 0.08709716796875, 0.0957183837890625, 0.104339599609375, 0.1129608154296875, 0.12158203125, 0.1302032470703125, 0.138824462890625, 0.1474456787109375, 0.15606689453125, 0.1646881103515625, 0.173309326171875, 0.1819305419921875, 0.1905517578125, 0.1991729736328125, 0.207794189453125, 0.2164154052734375, 0.22503662109375, 0.2336578369140625, 0.242279052734375, 0.2509002685546875, 0.259521484375]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 4.0, 5.0, 5.0, 4.0, 1.0, 8.0, 17.0, 18.0, 25.0, 16.0, 17.0, 25.0, 37.0, 37.0, 30.0, 56.0, 49.0, 46.0, 53.0, 58.0, 55.0, 64.0, 51.0, 49.0, 36.0, 33.0, 34.0, 33.0, 27.0, 21.0, 21.0, 22.0, 12.0, 9.0, 8.0, 3.0, 9.0, 6.0, 3.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.14111328125, -0.13640213012695312, -0.13169097900390625, -0.12697982788085938, -0.1222686767578125, -0.11755752563476562, -0.11284637451171875, -0.10813522338867188, -0.103424072265625, -0.09871292114257812, -0.09400177001953125, -0.08929061889648438, -0.0845794677734375, -0.07986831665039062, -0.07515716552734375, -0.07044601440429688, -0.06573486328125, -0.061023712158203125, -0.05631256103515625, -0.051601409912109375, -0.0468902587890625, -0.042179107666015625, -0.03746795654296875, -0.032756805419921875, -0.028045654296875, -0.023334503173828125, -0.01862335205078125, -0.013912200927734375, -0.0092010498046875, -0.004489898681640625, 0.00022125244140625, 0.004932403564453125, 0.0096435546875, 0.014354705810546875, 0.01906585693359375, 0.023777008056640625, 0.0284881591796875, 0.033199310302734375, 0.03791046142578125, 0.042621612548828125, 0.047332763671875, 0.052043914794921875, 0.05675506591796875, 0.061466217041015625, 0.0661773681640625, 0.07088851928710938, 0.07559967041015625, 0.08031082153320312, 0.08502197265625, 0.08973312377929688, 0.09444427490234375, 0.09915542602539062, 0.1038665771484375, 0.10857772827148438, 0.11328887939453125, 0.11800003051757812, 0.122711181640625, 0.12742233276367188, 0.13213348388671875, 0.13684463500976562, 0.1415557861328125, 0.14626693725585938, 0.15097808837890625, 0.15568923950195312, 0.160400390625]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 7.0, 20.0, 17.0, 18.0, 22.0, 31.0, 36.0, 75.0, 99.0, 127.0, 226.0, 365.0, 626.0, 1189.0, 2830.0, 9981.0, 59934.0, 733270.0, 205407.0, 24831.0, 5347.0, 1879.0, 871.0, 496.0, 297.0, 164.0, 106.0, 70.0, 44.0, 43.0, 30.0, 33.0, 18.0, 15.0, 8.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0], "bins": [-0.68994140625, -0.670654296875, -0.6513671875, -0.632080078125, -0.61279296875, -0.593505859375, -0.57421875, -0.554931640625, -0.53564453125, -0.516357421875, -0.4970703125, -0.477783203125, -0.45849609375, -0.439208984375, -0.419921875, -0.400634765625, -0.38134765625, -0.362060546875, -0.3427734375, -0.323486328125, -0.30419921875, -0.284912109375, -0.265625, -0.246337890625, -0.22705078125, -0.207763671875, -0.1884765625, -0.169189453125, -0.14990234375, -0.130615234375, -0.111328125, -0.092041015625, -0.07275390625, -0.053466796875, -0.0341796875, -0.014892578125, 0.00439453125, 0.023681640625, 0.04296875, 0.062255859375, 0.08154296875, 0.100830078125, 0.1201171875, 0.139404296875, 0.15869140625, 0.177978515625, 0.197265625, 0.216552734375, 0.23583984375, 0.255126953125, 0.2744140625, 0.293701171875, 0.31298828125, 0.332275390625, 0.3515625, 0.370849609375, 0.39013671875, 0.409423828125, 0.4287109375, 0.447998046875, 0.46728515625, 0.486572265625, 0.505859375, 0.525146484375, 0.54443359375]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 5.0, 3.0, 8.0, 8.0, 5.0, 8.0, 6.0, 9.0, 10.0, 12.0, 13.0, 25.0, 19.0, 36.0, 40.0, 41.0, 58.0, 46.0, 64.0, 61.0, 63.0, 47.0, 57.0, 57.0, 39.0, 45.0, 42.0, 34.0, 31.0, 17.0, 17.0, 19.0, 14.0, 11.0, 8.0, 6.0, 4.0, 6.0, 4.0, 5.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.61328125, -0.59442138671875, -0.5755615234375, -0.55670166015625, -0.537841796875, -0.51898193359375, -0.5001220703125, -0.48126220703125, -0.46240234375, -0.44354248046875, -0.4246826171875, -0.40582275390625, -0.386962890625, -0.36810302734375, -0.3492431640625, -0.33038330078125, -0.3115234375, -0.29266357421875, -0.2738037109375, -0.25494384765625, -0.236083984375, -0.21722412109375, -0.1983642578125, -0.17950439453125, -0.16064453125, -0.14178466796875, -0.1229248046875, -0.10406494140625, -0.085205078125, -0.06634521484375, -0.0474853515625, -0.02862548828125, -0.009765625, 0.00909423828125, 0.0279541015625, 0.04681396484375, 0.065673828125, 0.08453369140625, 0.1033935546875, 0.12225341796875, 0.14111328125, 0.15997314453125, 0.1788330078125, 0.19769287109375, 0.216552734375, 0.23541259765625, 0.2542724609375, 0.27313232421875, 0.2919921875, 0.31085205078125, 0.3297119140625, 0.34857177734375, 0.367431640625, 0.38629150390625, 0.4051513671875, 0.42401123046875, 0.44287109375, 0.46173095703125, 0.4805908203125, 0.49945068359375, 0.518310546875, 0.53717041015625, 0.5560302734375, 0.57489013671875, 0.59375]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 6.0, 13.0, 8.0, 3.0, 7.0, 12.0, 19.0, 19.0, 32.0, 48.0, 62.0, 112.0, 179.0, 305.0, 584.0, 1199.0, 2721.0, 7470.0, 27650.0, 190934.0, 743191.0, 54498.0, 12149.0, 3922.0, 1643.0, 754.0, 399.0, 233.0, 130.0, 68.0, 57.0, 34.0, 23.0, 21.0, 11.0, 6.0, 8.0, 7.0, 6.0, 5.0, 0.0, 2.0, 9.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.261474609375, -0.2538299560546875, -0.246185302734375, -0.2385406494140625, -0.23089599609375, -0.2232513427734375, -0.215606689453125, -0.2079620361328125, -0.2003173828125, -0.1926727294921875, -0.185028076171875, -0.1773834228515625, -0.16973876953125, -0.1620941162109375, -0.154449462890625, -0.1468048095703125, -0.13916015625, -0.1315155029296875, -0.123870849609375, -0.1162261962890625, -0.10858154296875, -0.1009368896484375, -0.093292236328125, -0.0856475830078125, -0.0780029296875, -0.0703582763671875, -0.062713623046875, -0.0550689697265625, -0.04742431640625, -0.0397796630859375, -0.032135009765625, -0.0244903564453125, -0.016845703125, -0.0092010498046875, -0.001556396484375, 0.0060882568359375, 0.01373291015625, 0.0213775634765625, 0.029022216796875, 0.0366668701171875, 0.0443115234375, 0.0519561767578125, 0.059600830078125, 0.0672454833984375, 0.07489013671875, 0.0825347900390625, 0.090179443359375, 0.0978240966796875, 0.10546875, 0.1131134033203125, 0.120758056640625, 0.1284027099609375, 0.13604736328125, 0.1436920166015625, 0.151336669921875, 0.1589813232421875, 0.1666259765625, 0.1742706298828125, 0.181915283203125, 0.1895599365234375, 0.19720458984375, 0.2048492431640625, 0.212493896484375, 0.2201385498046875, 0.227783203125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 2.0, 4.0, 3.0, 4.0, 6.0, 14.0, 14.0, 22.0, 37.0, 45.0, 65.0, 118.0, 182.0, 181.0, 89.0, 69.0, 59.0, 22.0, 12.0, 11.0, 13.0, 10.0, 3.0, 4.0, 1.0, 5.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001170039176940918, -0.00011310633271932602, -0.00010920874774456024, -0.00010531116276979446, -0.00010141357779502869, -9.751599282026291e-05, -9.361840784549713e-05, -8.972082287073135e-05, -8.582323789596558e-05, -8.19256529211998e-05, -7.802806794643402e-05, -7.413048297166824e-05, -7.023289799690247e-05, -6.633531302213669e-05, -6.243772804737091e-05, -5.854014307260513e-05, -5.4642558097839355e-05, -5.074497312307358e-05, -4.68473881483078e-05, -4.294980317354202e-05, -3.9052218198776245e-05, -3.515463322401047e-05, -3.125704824924469e-05, -2.7359463274478912e-05, -2.3461878299713135e-05, -1.9564293324947357e-05, -1.566670835018158e-05, -1.1769123375415802e-05, -7.871538400650024e-06, -3.973953425884247e-06, -7.636845111846924e-08, 3.821216523647308e-06, 7.718801498413086e-06, 1.1616386473178864e-05, 1.551397144794464e-05, 1.941155642271042e-05, 2.3309141397476196e-05, 2.7206726372241974e-05, 3.110431134700775e-05, 3.500189632177353e-05, 3.889948129653931e-05, 4.2797066271305084e-05, 4.669465124607086e-05, 5.059223622083664e-05, 5.448982119560242e-05, 5.8387406170368195e-05, 6.228499114513397e-05, 6.618257611989975e-05, 7.008016109466553e-05, 7.39777460694313e-05, 7.787533104419708e-05, 8.177291601896286e-05, 8.567050099372864e-05, 8.956808596849442e-05, 9.346567094326019e-05, 9.736325591802597e-05, 0.00010126084089279175, 0.00010515842586755753, 0.0001090560108423233, 0.00011295359581708908, 0.00011685118079185486, 0.00012074876576662064, 0.00012464635074138641, 0.0001285439357161522, 0.00013244152069091797]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 1.0, 4.0, 20.0, 9.0, 24.0, 17.0, 35.0, 41.0, 57.0, 72.0, 137.0, 195.0, 287.0, 550.0, 1057.0, 2181.0, 5928.0, 19642.0, 92924.0, 735335.0, 148680.0, 27916.0, 7786.0, 2826.0, 1188.0, 587.0, 340.0, 221.0, 170.0, 93.0, 65.0, 47.0, 29.0, 20.0, 17.0, 10.0, 11.0, 6.0, 6.0, 4.0, 6.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.177490234375, -0.17149925231933594, -0.16550827026367188, -0.1595172882080078, -0.15352630615234375, -0.1475353240966797, -0.14154434204101562, -0.13555335998535156, -0.1295623779296875, -0.12357139587402344, -0.11758041381835938, -0.11158943176269531, -0.10559844970703125, -0.09960746765136719, -0.09361648559570312, -0.08762550354003906, -0.081634521484375, -0.07564353942871094, -0.06965255737304688, -0.06366157531738281, -0.05767059326171875, -0.05167961120605469, -0.045688629150390625, -0.03969764709472656, -0.0337066650390625, -0.027715682983398438, -0.021724700927734375, -0.015733718872070312, -0.00974273681640625, -0.0037517547607421875, 0.002239227294921875, 0.008230209350585938, 0.01422119140625, 0.020212173461914062, 0.026203155517578125, 0.03219413757324219, 0.03818511962890625, 0.04417610168457031, 0.050167083740234375, 0.05615806579589844, 0.0621490478515625, 0.06814002990722656, 0.07413101196289062, 0.08012199401855469, 0.08611297607421875, 0.09210395812988281, 0.09809494018554688, 0.10408592224121094, 0.110076904296875, 0.11606788635253906, 0.12205886840820312, 0.1280498504638672, 0.13404083251953125, 0.1400318145751953, 0.14602279663085938, 0.15201377868652344, 0.1580047607421875, 0.16399574279785156, 0.16998672485351562, 0.1759777069091797, 0.18196868896484375, 0.1879596710205078, 0.19395065307617188, 0.19994163513183594, 0.2059326171875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 5.0, 9.0, 8.0, 12.0, 15.0, 14.0, 24.0, 29.0, 23.0, 32.0, 53.0, 56.0, 57.0, 81.0, 126.0, 96.0, 80.0, 56.0, 46.0, 39.0, 33.0, 18.0, 22.0, 21.0, 10.0, 15.0, 5.0, 4.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.192138671875, -0.18738651275634766, -0.1826343536376953, -0.17788219451904297, -0.17313003540039062, -0.16837787628173828, -0.16362571716308594, -0.1588735580444336, -0.15412139892578125, -0.1493692398071289, -0.14461708068847656, -0.13986492156982422, -0.13511276245117188, -0.13036060333251953, -0.1256084442138672, -0.12085628509521484, -0.1161041259765625, -0.11135196685791016, -0.10659980773925781, -0.10184764862060547, -0.09709548950195312, -0.09234333038330078, -0.08759117126464844, -0.0828390121459961, -0.07808685302734375, -0.0733346939086914, -0.06858253479003906, -0.06383037567138672, -0.059078216552734375, -0.05432605743408203, -0.04957389831542969, -0.044821739196777344, -0.040069580078125, -0.035317420959472656, -0.030565261840820312, -0.02581310272216797, -0.021060943603515625, -0.01630878448486328, -0.011556625366210938, -0.006804466247558594, -0.00205230712890625, 0.0026998519897460938, 0.0074520111083984375, 0.012204170227050781, 0.016956329345703125, 0.02170848846435547, 0.026460647583007812, 0.031212806701660156, 0.0359649658203125, 0.040717124938964844, 0.04546928405761719, 0.05022144317626953, 0.054973602294921875, 0.05972576141357422, 0.06447792053222656, 0.0692300796508789, 0.07398223876953125, 0.0787343978881836, 0.08348655700683594, 0.08823871612548828, 0.09299087524414062, 0.09774303436279297, 0.10249519348144531, 0.10724735260009766, 0.11199951171875]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 6.0, 9.0, 21.0, 29.0, 64.0, 90.0, 160.0, 364.0, 102.0, 80.0, 40.0, 21.0, 7.0, 3.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.355439186096191, -4.196050643920898, -4.0366621017456055, -3.8772735595703125, -3.7178850173950195, -3.5584964752197266, -3.3991081714630127, -3.2397196292877197, -3.0803310871124268, -2.920942544937134, -2.761554002761841, -2.602165460586548, -2.442777156829834, -2.283388614654541, -2.124000072479248, -1.964611530303955, -1.805222988128662, -1.6458344459533691, -1.4864459037780762, -1.3270574808120728, -1.1676689386367798, -1.0082803964614868, -0.8488919138908386, -0.6895034313201904, -0.5301148891448975, -0.3707263767719269, -0.2113378643989563, -0.05194935202598572, 0.10743916034698486, 0.26682770252227783, 0.426216185092926, 0.5856046676635742, 0.7449936866760254, 0.9043822288513184, 1.0637707710266113, 1.2231591939926147, 1.3825477361679077, 1.5419362783432007, 1.701324701309204, 1.860713243484497, 2.02010178565979, 2.179490327835083, 2.338878870010376, 2.498267412185669, 2.657655715942383, 2.817044258117676, 2.9764328002929688, 3.1358213424682617, 3.2952098846435547, 3.4545984268188477, 3.6139869689941406, 3.7733755111694336, 3.9327640533447266, 4.0921525955200195, 4.2515411376953125, 4.4109296798706055, 4.570318222045898, 4.729706764221191, 4.889095306396484, 5.048483848571777, 5.20787239074707, 5.367260932922363, 5.526649475097656, 5.686038017272949, 5.845426082611084]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 7.0, 1.0, 4.0, 2.0, 7.0, 15.0, 9.0, 13.0, 14.0, 19.0, 18.0, 26.0, 25.0, 19.0, 27.0, 39.0, 30.0, 47.0, 112.0, 171.0, 85.0, 40.0, 36.0, 24.0, 32.0, 27.0, 29.0, 27.0, 22.0, 14.0, 14.0, 9.0, 5.0, 9.0, 9.0, 5.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6030263900756836, -2.5252227783203125, -2.4474194049835205, -2.3696157932281494, -2.2918124198913574, -2.2140088081359863, -2.1362051963806152, -2.0584018230438232, -1.9805982112884521, -1.9027947187423706, -1.824991226196289, -1.747187614440918, -1.6693841218948364, -1.5915806293487549, -1.5137771368026733, -1.4359736442565918, -1.3581701517105103, -1.2803666591644287, -1.2025631666183472, -1.1247596740722656, -1.0469560623168945, -0.969152569770813, -0.8913490772247314, -0.8135455250740051, -0.7357420325279236, -0.657938539981842, -0.5801349878311157, -0.5023314952850342, -0.42452797293663025, -0.3467244505882263, -0.2689209580421448, -0.19111740589141846, -0.11331391334533691, -0.03551039844751358, 0.04229311645030975, 0.12009662389755249, 0.19790014624595642, 0.27570366859436035, 0.3535071611404419, 0.4313107132911682, 0.5091142058372498, 0.5869176983833313, 0.6647212505340576, 0.7425247430801392, 0.8203282356262207, 0.898131787776947, 0.9759352803230286, 1.0537388324737549, 1.1315423250198364, 1.209345817565918, 1.2871493101119995, 1.364952802658081, 1.4427564144134521, 1.5205599069595337, 1.5983633995056152, 1.6761670112609863, 1.7539703845977783, 1.8317738771438599, 1.9095773696899414, 1.9873809814453125, 2.0651843547821045, 2.1429879665374756, 2.2207913398742676, 2.2985949516296387, 2.3763985633850098]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 1.0, 6.0, 12.0, 12.0, 14.0, 18.0, 31.0, 57.0, 96.0, 135.0, 198.0, 381.0, 614.0, 1142.0, 2254.0, 4598.0, 10552.0, 27807.0, 98347.0, 615066.0, 2528292.0, 740429.0, 111409.0, 30973.0, 11646.0, 4887.0, 2444.0, 1189.0, 688.0, 381.0, 231.0, 125.0, 82.0, 62.0, 31.0, 31.0, 14.0, 9.0, 7.0, 8.0, 5.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.3232421875, -0.3138847351074219, -0.30452728271484375, -0.2951698303222656, -0.2858123779296875, -0.2764549255371094, -0.26709747314453125, -0.2577400207519531, -0.248382568359375, -0.23902511596679688, -0.22966766357421875, -0.22031021118164062, -0.2109527587890625, -0.20159530639648438, -0.19223785400390625, -0.18288040161132812, -0.17352294921875, -0.16416549682617188, -0.15480804443359375, -0.14545059204101562, -0.1360931396484375, -0.12673568725585938, -0.11737823486328125, -0.10802078247070312, -0.098663330078125, -0.08930587768554688, -0.07994842529296875, -0.07059097290039062, -0.0612335205078125, -0.051876068115234375, -0.04251861572265625, -0.033161163330078125, -0.0238037109375, -0.014446258544921875, -0.00508880615234375, 0.004268646240234375, 0.0136260986328125, 0.022983551025390625, 0.03234100341796875, 0.041698455810546875, 0.051055908203125, 0.060413360595703125, 0.06977081298828125, 0.07912826538085938, 0.0884857177734375, 0.09784317016601562, 0.10720062255859375, 0.11655807495117188, 0.12591552734375, 0.13527297973632812, 0.14463043212890625, 0.15398788452148438, 0.1633453369140625, 0.17270278930664062, 0.18206024169921875, 0.19141769409179688, 0.200775146484375, 0.21013259887695312, 0.21949005126953125, 0.22884750366210938, 0.2382049560546875, 0.24756240844726562, 0.25691986083984375, 0.2662773132324219, 0.275634765625]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 5.0, 10.0, 8.0, 6.0, 14.0, 12.0, 11.0, 9.0, 25.0, 15.0, 19.0, 28.0, 23.0, 29.0, 30.0, 51.0, 30.0, 33.0, 27.0, 42.0, 30.0, 46.0, 45.0, 33.0, 37.0, 50.0, 36.0, 38.0, 35.0, 32.0, 24.0, 20.0, 14.0, 19.0, 19.0, 13.0, 17.0, 15.0, 12.0, 5.0, 10.0, 4.0, 4.0, 2.0, 4.0, 1.0, 3.0, 6.0, 3.0, 2.0, 0.0, 3.0], "bins": [-0.1068115234375, -0.10364246368408203, -0.10047340393066406, -0.0973043441772461, -0.09413528442382812, -0.09096622467041016, -0.08779716491699219, -0.08462810516357422, -0.08145904541015625, -0.07828998565673828, -0.07512092590332031, -0.07195186614990234, -0.06878280639648438, -0.0656137466430664, -0.06244468688964844, -0.05927562713623047, -0.0561065673828125, -0.05293750762939453, -0.04976844787597656, -0.046599388122558594, -0.043430328369140625, -0.040261268615722656, -0.03709220886230469, -0.03392314910888672, -0.03075408935546875, -0.02758502960205078, -0.024415969848632812, -0.021246910095214844, -0.018077850341796875, -0.014908790588378906, -0.011739730834960938, -0.008570671081542969, -0.005401611328125, -0.0022325515747070312, 0.0009365081787109375, 0.004105567932128906, 0.007274627685546875, 0.010443687438964844, 0.013612747192382812, 0.01678180694580078, 0.01995086669921875, 0.02311992645263672, 0.026288986206054688, 0.029458045959472656, 0.032627105712890625, 0.035796165466308594, 0.03896522521972656, 0.04213428497314453, 0.0453033447265625, 0.04847240447998047, 0.05164146423339844, 0.054810523986816406, 0.057979583740234375, 0.061148643493652344, 0.06431770324707031, 0.06748676300048828, 0.07065582275390625, 0.07382488250732422, 0.07699394226074219, 0.08016300201416016, 0.08333206176757812, 0.0865011215209961, 0.08967018127441406, 0.09283924102783203, 0.09600830078125]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 12.0, 24.0, 44.0, 117.0, 312.0, 1327.0, 19745.0, 4163687.0, 7652.0, 917.0, 265.0, 88.0, 41.0, 23.0, 11.0, 5.0, 7.0, 7.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.06640625, -2.95843505859375, -2.8504638671875, -2.74249267578125, -2.634521484375, -2.52655029296875, -2.4185791015625, -2.31060791015625, -2.20263671875, -2.09466552734375, -1.9866943359375, -1.87872314453125, -1.770751953125, -1.66278076171875, -1.5548095703125, -1.44683837890625, -1.3388671875, -1.23089599609375, -1.1229248046875, -1.01495361328125, -0.906982421875, -0.79901123046875, -0.6910400390625, -0.58306884765625, -0.47509765625, -0.36712646484375, -0.2591552734375, -0.15118408203125, -0.043212890625, 0.06475830078125, 0.1727294921875, 0.28070068359375, 0.388671875, 0.49664306640625, 0.6046142578125, 0.71258544921875, 0.820556640625, 0.92852783203125, 1.0364990234375, 1.14447021484375, 1.25244140625, 1.36041259765625, 1.4683837890625, 1.57635498046875, 1.684326171875, 1.79229736328125, 1.9002685546875, 2.00823974609375, 2.1162109375, 2.22418212890625, 2.3321533203125, 2.44012451171875, 2.548095703125, 2.65606689453125, 2.7640380859375, 2.87200927734375, 2.97998046875, 3.08795166015625, 3.1959228515625, 3.30389404296875, 3.411865234375, 3.51983642578125, 3.6278076171875, 3.73577880859375, 3.84375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 10.0, 15.0, 39.0, 118.0, 283.0, 859.0, 1813.0, 666.0, 177.0, 63.0, 30.0, 8.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2783203125, -1.2210540771484375, -1.163787841796875, -1.1065216064453125, -1.04925537109375, -0.9919891357421875, -0.934722900390625, -0.8774566650390625, -0.8201904296875, -0.7629241943359375, -0.705657958984375, -0.6483917236328125, -0.59112548828125, -0.5338592529296875, -0.476593017578125, -0.4193267822265625, -0.362060546875, -0.3047943115234375, -0.247528076171875, -0.1902618408203125, -0.13299560546875, -0.0757293701171875, -0.018463134765625, 0.0388031005859375, 0.0960693359375, 0.1533355712890625, 0.210601806640625, 0.2678680419921875, 0.32513427734375, 0.3824005126953125, 0.439666748046875, 0.4969329833984375, 0.55419921875, 0.6114654541015625, 0.668731689453125, 0.7259979248046875, 0.78326416015625, 0.8405303955078125, 0.897796630859375, 0.9550628662109375, 1.0123291015625, 1.0695953369140625, 1.126861572265625, 1.1841278076171875, 1.24139404296875, 1.2986602783203125, 1.355926513671875, 1.4131927490234375, 1.470458984375, 1.5277252197265625, 1.584991455078125, 1.6422576904296875, 1.69952392578125, 1.7567901611328125, 1.814056396484375, 1.8713226318359375, 1.9285888671875, 1.9858551025390625, 2.043121337890625, 2.1003875732421875, 2.15765380859375, 2.2149200439453125, 2.272186279296875, 2.3294525146484375, 2.38671875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 1.0, 5.0, 5.0, 9.0, 8.0, 14.0, 23.0, 42.0, 81.0, 126.0, 175.0, 184.0, 135.0, 84.0, 47.0, 24.0, 15.0, 7.0, 4.0, 3.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.781458854675293, -9.523962020874023, -9.266465187072754, -9.008968353271484, -8.751472473144531, -8.493975639343262, -8.236478805541992, -7.978981971740723, -7.721485137939453, -7.463988304138184, -7.206491470336914, -6.948995113372803, -6.691498279571533, -6.434001445770264, -6.176505088806152, -5.919008255004883, -5.661511421203613, -5.404014587402344, -5.146517753601074, -4.889021396636963, -4.631524562835693, -4.374027729034424, -4.1165313720703125, -3.859034538269043, -3.6015377044677734, -3.344040870666504, -3.0865442752838135, -2.829047679901123, -2.5715508460998535, -2.314054012298584, -2.0565574169158936, -1.7990607023239136, -1.5415635108947754, -1.2840667963027954, -1.0265700817108154, -0.7690733671188354, -0.5115766525268555, -0.2540799379348755, 0.003416776657104492, 0.2609134912490845, 0.5184102058410645, 0.7759069204330444, 1.0334036350250244, 1.2909003496170044, 1.5483970642089844, 1.8058937788009644, 2.0633904933929443, 2.3208870887756348, 2.5783839225769043, 2.835880756378174, 3.0933773517608643, 3.3508739471435547, 3.608370780944824, 3.8658676147460938, 4.123364448547363, 4.380860805511475, 4.638357639312744, 4.895854473114014, 5.153350830078125, 5.4108476638793945, 5.668344497680664, 5.925841331481934, 6.183338165283203, 6.4408345222473145, 6.698331356048584]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 5.0, 4.0, 4.0, 12.0, 11.0, 10.0, 19.0, 22.0, 31.0, 29.0, 33.0, 53.0, 48.0, 56.0, 59.0, 73.0, 87.0, 71.0, 61.0, 51.0, 49.0, 32.0, 37.0, 33.0, 24.0, 16.0, 21.0, 18.0, 14.0, 5.0, 4.0, 7.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.0072526931762695, -4.854102611541748, -4.700952529907227, -4.547802448272705, -4.394652366638184, -4.24150276184082, -4.088352203369141, -3.9352025985717773, -3.782052516937256, -3.6289024353027344, -3.475752353668213, -3.3226022720336914, -3.169452428817749, -3.0163023471832275, -2.863152265548706, -2.7100024223327637, -2.556852102279663, -2.4037020206451416, -2.25055193901062, -2.0974020957946777, -1.9442520141601562, -1.7911019325256348, -1.6379518508911133, -1.4848018884658813, -1.3316518068313599, -1.1785017251968384, -1.0253517627716064, -0.872201681137085, -0.7190516591072083, -0.5659016370773315, -0.41275155544281006, -0.2596015930175781, -0.10645151138305664, 0.04669852554798126, 0.19984856247901917, 0.35299861431121826, 0.506148636341095, 0.6592986583709717, 0.8124487400054932, 0.9655987024307251, 1.1187487840652466, 1.271898865699768, 1.425048828125, 1.5781989097595215, 1.731348991394043, 1.884498953819275, 2.037649154663086, 2.1907989978790283, 2.34394907951355, 2.4970991611480713, 2.6502492427825928, 2.803399085998535, 2.9565491676330566, 3.109699249267578, 3.2628493309020996, 3.415999412536621, 3.5691494941711426, 3.722299575805664, 3.8754496574401855, 4.028599739074707, 4.1817498207092285, 4.33489990234375, 4.488049507141113, 4.641199588775635, 4.794349670410156]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 3.0, 5.0, 6.0, 11.0, 15.0, 28.0, 43.0, 56.0, 115.0, 207.0, 449.0, 966.0, 2338.0, 7037.0, 27288.0, 185052.0, 715903.0, 85254.0, 15992.0, 4703.0, 1595.0, 706.0, 369.0, 179.0, 87.0, 61.0, 33.0, 24.0, 16.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.71923828125, -0.6999664306640625, -0.680694580078125, -0.6614227294921875, -0.64215087890625, -0.6228790283203125, -0.603607177734375, -0.5843353271484375, -0.5650634765625, -0.5457916259765625, -0.526519775390625, -0.5072479248046875, -0.48797607421875, -0.4687042236328125, -0.449432373046875, -0.4301605224609375, -0.410888671875, -0.3916168212890625, -0.372344970703125, -0.3530731201171875, -0.33380126953125, -0.3145294189453125, -0.295257568359375, -0.2759857177734375, -0.2567138671875, -0.2374420166015625, -0.218170166015625, -0.1988983154296875, -0.17962646484375, -0.1603546142578125, -0.141082763671875, -0.1218109130859375, -0.1025390625, -0.0832672119140625, -0.063995361328125, -0.0447235107421875, -0.02545166015625, -0.0061798095703125, 0.013092041015625, 0.0323638916015625, 0.0516357421875, 0.0709075927734375, 0.090179443359375, 0.1094512939453125, 0.12872314453125, 0.1479949951171875, 0.167266845703125, 0.1865386962890625, 0.205810546875, 0.2250823974609375, 0.244354248046875, 0.2636260986328125, 0.28289794921875, 0.3021697998046875, 0.321441650390625, 0.3407135009765625, 0.3599853515625, 0.3792572021484375, 0.398529052734375, 0.4178009033203125, 0.43707275390625, 0.4563446044921875, 0.475616455078125, 0.4948883056640625, 0.51416015625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 5.0, 8.0, 8.0, 5.0, 7.0, 9.0, 12.0, 16.0, 22.0, 21.0, 33.0, 34.0, 43.0, 58.0, 44.0, 69.0, 54.0, 63.0, 57.0, 70.0, 48.0, 55.0, 51.0, 49.0, 24.0, 24.0, 14.0, 23.0, 14.0, 23.0, 11.0, 10.0, 8.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.24462890625, -0.2373371124267578, -0.23004531860351562, -0.22275352478027344, -0.21546173095703125, -0.20816993713378906, -0.20087814331054688, -0.1935863494873047, -0.1862945556640625, -0.1790027618408203, -0.17171096801757812, -0.16441917419433594, -0.15712738037109375, -0.14983558654785156, -0.14254379272460938, -0.1352519989013672, -0.127960205078125, -0.12066841125488281, -0.11337661743164062, -0.10608482360839844, -0.09879302978515625, -0.09150123596191406, -0.08420944213867188, -0.07691764831542969, -0.0696258544921875, -0.06233406066894531, -0.055042266845703125, -0.04775047302246094, -0.04045867919921875, -0.03316688537597656, -0.025875091552734375, -0.018583297729492188, -0.01129150390625, -0.0039997100830078125, 0.003292083740234375, 0.010583877563476562, 0.01787567138671875, 0.025167465209960938, 0.032459259033203125, 0.03975105285644531, 0.0470428466796875, 0.05433464050292969, 0.061626434326171875, 0.06891822814941406, 0.07621002197265625, 0.08350181579589844, 0.09079360961914062, 0.09808540344238281, 0.105377197265625, 0.11266899108886719, 0.11996078491210938, 0.12725257873535156, 0.13454437255859375, 0.14183616638183594, 0.14912796020507812, 0.1564197540283203, 0.1637115478515625, 0.1710033416748047, 0.17829513549804688, 0.18558692932128906, 0.19287872314453125, 0.20017051696777344, 0.20746231079101562, 0.2147541046142578, 0.2220458984375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 3.0, 5.0, 6.0, 5.0, 10.0, 9.0, 22.0, 27.0, 32.0, 52.0, 80.0, 104.0, 175.0, 282.0, 528.0, 1259.0, 3739.0, 21424.0, 815017.0, 186566.0, 14250.0, 2880.0, 1009.0, 419.0, 254.0, 112.0, 92.0, 74.0, 31.0, 20.0, 16.0, 10.0, 13.0, 8.0, 6.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.818359375, -0.795562744140625, -0.77276611328125, -0.749969482421875, -0.7271728515625, -0.704376220703125, -0.68157958984375, -0.658782958984375, -0.635986328125, -0.613189697265625, -0.59039306640625, -0.567596435546875, -0.5447998046875, -0.522003173828125, -0.49920654296875, -0.476409912109375, -0.45361328125, -0.430816650390625, -0.40802001953125, -0.385223388671875, -0.3624267578125, -0.339630126953125, -0.31683349609375, -0.294036865234375, -0.271240234375, -0.248443603515625, -0.22564697265625, -0.202850341796875, -0.1800537109375, -0.157257080078125, -0.13446044921875, -0.111663818359375, -0.0888671875, -0.066070556640625, -0.04327392578125, -0.020477294921875, 0.0023193359375, 0.025115966796875, 0.04791259765625, 0.070709228515625, 0.093505859375, 0.116302490234375, 0.13909912109375, 0.161895751953125, 0.1846923828125, 0.207489013671875, 0.23028564453125, 0.253082275390625, 0.27587890625, 0.298675537109375, 0.32147216796875, 0.344268798828125, 0.3670654296875, 0.389862060546875, 0.41265869140625, 0.435455322265625, 0.458251953125, 0.481048583984375, 0.50384521484375, 0.526641845703125, 0.5494384765625, 0.572235107421875, 0.59503173828125, 0.617828369140625, 0.640625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 4.0, 3.0, 8.0, 2.0, 11.0, 13.0, 10.0, 13.0, 21.0, 19.0, 17.0, 38.0, 46.0, 41.0, 48.0, 69.0, 90.0, 93.0, 89.0, 78.0, 64.0, 54.0, 34.0, 19.0, 19.0, 15.0, 17.0, 13.0, 9.0, 11.0, 12.0, 3.0, 4.0, 5.0, 6.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0751953125, -1.0439910888671875, -1.012786865234375, -0.9815826416015625, -0.95037841796875, -0.9191741943359375, -0.887969970703125, -0.8567657470703125, -0.8255615234375, -0.7943572998046875, -0.763153076171875, -0.7319488525390625, -0.70074462890625, -0.6695404052734375, -0.638336181640625, -0.6071319580078125, -0.575927734375, -0.5447235107421875, -0.513519287109375, -0.4823150634765625, -0.45111083984375, -0.4199066162109375, -0.388702392578125, -0.3574981689453125, -0.3262939453125, -0.2950897216796875, -0.263885498046875, -0.2326812744140625, -0.20147705078125, -0.1702728271484375, -0.139068603515625, -0.1078643798828125, -0.07666015625, -0.0454559326171875, -0.014251708984375, 0.0169525146484375, 0.04815673828125, 0.0793609619140625, 0.110565185546875, 0.1417694091796875, 0.1729736328125, 0.2041778564453125, 0.235382080078125, 0.2665863037109375, 0.29779052734375, 0.3289947509765625, 0.360198974609375, 0.3914031982421875, 0.422607421875, 0.4538116455078125, 0.485015869140625, 0.5162200927734375, 0.54742431640625, 0.5786285400390625, 0.609832763671875, 0.6410369873046875, 0.6722412109375, 0.7034454345703125, 0.734649658203125, 0.7658538818359375, 0.79705810546875, 0.8282623291015625, 0.859466552734375, 0.8906707763671875, 0.921875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 4.0, 8.0, 6.0, 10.0, 13.0, 21.0, 21.0, 45.0, 82.0, 125.0, 204.0, 385.0, 786.0, 1892.0, 5684.0, 21513.0, 198849.0, 778709.0, 28845.0, 7033.0, 2365.0, 898.0, 439.0, 246.0, 117.0, 88.0, 53.0, 52.0, 24.0, 8.0, 5.0, 6.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12359619140625, -0.11934757232666016, -0.11509895324707031, -0.11085033416748047, -0.10660171508789062, -0.10235309600830078, -0.09810447692871094, -0.0938558578491211, -0.08960723876953125, -0.0853586196899414, -0.08111000061035156, -0.07686138153076172, -0.07261276245117188, -0.06836414337158203, -0.06411552429199219, -0.059866905212402344, -0.0556182861328125, -0.051369667053222656, -0.04712104797363281, -0.04287242889404297, -0.038623809814453125, -0.03437519073486328, -0.030126571655273438, -0.025877952575683594, -0.02162933349609375, -0.017380714416503906, -0.013132095336914062, -0.008883476257324219, -0.004634857177734375, -0.00038623809814453125, 0.0038623809814453125, 0.008111000061035156, 0.012359619140625, 0.016608238220214844, 0.020856857299804688, 0.02510547637939453, 0.029354095458984375, 0.03360271453857422, 0.03785133361816406, 0.042099952697753906, 0.04634857177734375, 0.050597190856933594, 0.05484580993652344, 0.05909442901611328, 0.06334304809570312, 0.06759166717529297, 0.07184028625488281, 0.07608890533447266, 0.0803375244140625, 0.08458614349365234, 0.08883476257324219, 0.09308338165283203, 0.09733200073242188, 0.10158061981201172, 0.10582923889160156, 0.1100778579711914, 0.11432647705078125, 0.1185750961303711, 0.12282371520996094, 0.12707233428955078, 0.13132095336914062, 0.13556957244873047, 0.1398181915283203, 0.14406681060791016, 0.1483154296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 5.0, 10.0, 10.0, 22.0, 25.0, 30.0, 31.0, 25.0, 64.0, 114.0, 149.0, 151.0, 118.0, 58.0, 44.0, 28.0, 22.0, 24.0, 8.0, 7.0, 7.0, 4.0, 9.0, 4.0, 4.0, 3.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.68899917602539e-05, -7.448438555002213e-05, -7.207877933979034e-05, -6.967317312955856e-05, -6.726756691932678e-05, -6.4861960709095e-05, -6.245635449886322e-05, -6.005074828863144e-05, -5.764514207839966e-05, -5.523953586816788e-05, -5.2833929657936096e-05, -5.0428323447704315e-05, -4.8022717237472534e-05, -4.561711102724075e-05, -4.321150481700897e-05, -4.080589860677719e-05, -3.840029239654541e-05, -3.599468618631363e-05, -3.358907997608185e-05, -3.118347376585007e-05, -2.8777867555618286e-05, -2.6372261345386505e-05, -2.3966655135154724e-05, -2.1561048924922943e-05, -1.9155442714691162e-05, -1.674983650445938e-05, -1.43442302942276e-05, -1.1938624083995819e-05, -9.533017873764038e-06, -7.127411663532257e-06, -4.721805453300476e-06, -2.316199243068695e-06, 8.940696716308594e-08, 2.495013177394867e-06, 4.900619387626648e-06, 7.306225597858429e-06, 9.71183180809021e-06, 1.2117438018321991e-05, 1.4523044228553772e-05, 1.6928650438785553e-05, 1.9334256649017334e-05, 2.1739862859249115e-05, 2.4145469069480896e-05, 2.6551075279712677e-05, 2.8956681489944458e-05, 3.136228770017624e-05, 3.376789391040802e-05, 3.61735001206398e-05, 3.857910633087158e-05, 4.098471254110336e-05, 4.3390318751335144e-05, 4.5795924961566925e-05, 4.8201531171798706e-05, 5.060713738203049e-05, 5.301274359226227e-05, 5.541834980249405e-05, 5.782395601272583e-05, 6.022956222295761e-05, 6.263516843318939e-05, 6.504077464342117e-05, 6.744638085365295e-05, 6.985198706388474e-05, 7.225759327411652e-05, 7.46631994843483e-05, 7.706880569458008e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 5.0, 9.0, 25.0, 30.0, 49.0, 59.0, 116.0, 207.0, 301.0, 501.0, 842.0, 1583.0, 3277.0, 7732.0, 21188.0, 84714.0, 793304.0, 96343.0, 22645.0, 8196.0, 3464.0, 1694.0, 913.0, 501.0, 314.0, 186.0, 125.0, 71.0, 48.0, 37.0, 27.0, 15.0, 11.0, 5.0, 4.0, 3.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08087158203125, -0.07803726196289062, -0.07520294189453125, -0.07236862182617188, -0.0695343017578125, -0.06669998168945312, -0.06386566162109375, -0.061031341552734375, -0.058197021484375, -0.055362701416015625, -0.05252838134765625, -0.049694061279296875, -0.0468597412109375, -0.044025421142578125, -0.04119110107421875, -0.038356781005859375, -0.0355224609375, -0.032688140869140625, -0.02985382080078125, -0.027019500732421875, -0.0241851806640625, -0.021350860595703125, -0.01851654052734375, -0.015682220458984375, -0.012847900390625, -0.010013580322265625, -0.00717926025390625, -0.004344940185546875, -0.0015106201171875, 0.001323699951171875, 0.00415802001953125, 0.006992340087890625, 0.00982666015625, 0.012660980224609375, 0.01549530029296875, 0.018329620361328125, 0.0211639404296875, 0.023998260498046875, 0.02683258056640625, 0.029666900634765625, 0.032501220703125, 0.035335540771484375, 0.03816986083984375, 0.041004180908203125, 0.0438385009765625, 0.046672821044921875, 0.04950714111328125, 0.052341461181640625, 0.05517578125, 0.058010101318359375, 0.06084442138671875, 0.06367874145507812, 0.0665130615234375, 0.06934738159179688, 0.07218170166015625, 0.07501602172851562, 0.077850341796875, 0.08068466186523438, 0.08351898193359375, 0.08635330200195312, 0.0891876220703125, 0.09202194213867188, 0.09485626220703125, 0.09769058227539062, 0.10052490234375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 5.0, 7.0, 10.0, 16.0, 9.0, 18.0, 17.0, 23.0, 47.0, 61.0, 82.0, 90.0, 85.0, 99.0, 70.0, 80.0, 73.0, 50.0, 28.0, 30.0, 21.0, 15.0, 11.0, 11.0, 6.0, 11.0, 4.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.10302734375, -0.10017967224121094, -0.09733200073242188, -0.09448432922363281, -0.09163665771484375, -0.08878898620605469, -0.08594131469726562, -0.08309364318847656, -0.0802459716796875, -0.07739830017089844, -0.07455062866210938, -0.07170295715332031, -0.06885528564453125, -0.06600761413574219, -0.06315994262695312, -0.06031227111816406, -0.057464599609375, -0.05461692810058594, -0.051769256591796875, -0.04892158508300781, -0.04607391357421875, -0.04322624206542969, -0.040378570556640625, -0.03753089904785156, -0.0346832275390625, -0.03183555603027344, -0.028987884521484375, -0.026140213012695312, -0.02329254150390625, -0.020444869995117188, -0.017597198486328125, -0.014749526977539062, -0.01190185546875, -0.009054183959960938, -0.006206512451171875, -0.0033588409423828125, -0.00051116943359375, 0.0023365020751953125, 0.005184173583984375, 0.008031845092773438, 0.0108795166015625, 0.013727188110351562, 0.016574859619140625, 0.019422531127929688, 0.02227020263671875, 0.025117874145507812, 0.027965545654296875, 0.030813217163085938, 0.033660888671875, 0.03650856018066406, 0.039356231689453125, 0.04220390319824219, 0.04505157470703125, 0.04789924621582031, 0.050746917724609375, 0.05359458923339844, 0.0564422607421875, 0.05928993225097656, 0.062137603759765625, 0.06498527526855469, 0.06783294677734375, 0.07068061828613281, 0.07352828979492188, 0.07637596130371094, 0.0792236328125]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 6.0, 4.0, 6.0, 19.0, 22.0, 51.0, 56.0, 133.0, 468.0, 81.0, 56.0, 38.0, 21.0, 13.0, 7.0, 5.0, 7.0, 8.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.427844524383545, -3.3147034645080566, -3.2015626430511475, -3.088421583175659, -2.97528076171875, -2.8621397018432617, -2.7489986419677734, -2.6358578205108643, -2.522716999053955, -2.409575939178467, -2.2964351177215576, -2.1832940578460693, -2.07015323638916, -1.9570121765136719, -1.8438712358474731, -1.7307302951812744, -1.6175892353057861, -1.5044482946395874, -1.3913073539733887, -1.2781662940979004, -1.1650254726409912, -1.051884412765503, -0.9387434720993042, -0.8256025314331055, -0.7124615907669067, -0.599320650100708, -0.4861796796321869, -0.37303870916366577, -0.25989776849746704, -0.1467568278312683, -0.033615827560424805, 0.07952511310577393, 0.19266629219055176, 0.3058072328567505, 0.4189482033252716, 0.5320891737937927, 0.6452301144599915, 0.7583710551261902, 0.8715120553970337, 0.9846529960632324, 1.0977939367294312, 1.2109348773956299, 1.3240758180618286, 1.4372167587280273, 1.5503578186035156, 1.6634986400604248, 1.776639699935913, 1.8897806406021118, 2.0029215812683105, 2.116062641143799, 2.229203462600708, 2.3423445224761963, 2.4554853439331055, 2.5686264038085938, 2.681767463684082, 2.794908285140991, 2.9080491065979004, 3.0211901664733887, 3.134330987930298, 3.247472047805786, 3.3606128692626953, 3.4737539291381836, 3.586894989013672, 3.700035810470581, 3.8131768703460693]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 5.0, 3.0, 6.0, 7.0, 10.0, 3.0, 9.0, 16.0, 12.0, 18.0, 20.0, 30.0, 27.0, 24.0, 30.0, 88.0, 318.0, 120.0, 31.0, 26.0, 29.0, 28.0, 23.0, 25.0, 20.0, 14.0, 13.0, 12.0, 5.0, 5.0, 6.0, 5.0, 5.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9623823165893555, -2.876814365386963, -2.7912464141845703, -2.7056784629821777, -2.620110511779785, -2.5345425605773926, -2.448974609375, -2.3634066581726074, -2.277838706970215, -2.1922707557678223, -2.1067028045654297, -2.021134853363037, -1.9355669021606445, -1.849998950958252, -1.764431118965149, -1.6788631677627563, -1.5932953357696533, -1.5077273845672607, -1.4221594333648682, -1.3365914821624756, -1.251023530960083, -1.1654555797576904, -1.0798877477645874, -0.9943197965621948, -0.9087518453598022, -0.8231838941574097, -0.7376159429550171, -0.6520480513572693, -0.5664801001548767, -0.48091214895248413, -0.39534425735473633, -0.30977630615234375, -0.22420811653137207, -0.13864018023014069, -0.0530722439289093, 0.03249567747116089, 0.11806362867355347, 0.20363157987594604, 0.28919947147369385, 0.3747674226760864, 0.460335373878479, 0.5459033250808716, 0.6314712762832642, 0.717039167881012, 0.8026071190834045, 0.8881750702857971, 0.9737429618835449, 1.0593109130859375, 1.14487886428833, 1.2304468154907227, 1.3160147666931152, 1.4015827178955078, 1.4871506690979004, 1.572718620300293, 1.658286452293396, 1.7438544034957886, 1.8294223546981812, 1.9149903059005737, 2.0005581378936768, 2.0861260890960693, 2.171694040298462, 2.2572619915008545, 2.342829942703247, 2.4283978939056396, 2.5139658451080322]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 2.0, 6.0, 2.0, 6.0, 11.0, 3.0, 10.0, 7.0, 10.0, 13.0, 13.0, 21.0, 25.0, 23.0, 38.0, 28.0, 53.0, 150.0, 219.0, 79.0, 44.0, 39.0, 26.0, 36.0, 27.0, 15.0, 23.0, 12.0, 9.0, 15.0, 10.0, 7.0, 5.0, 3.0, 3.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.224365234375, -0.2174091339111328, -0.21045303344726562, -0.20349693298339844, -0.19654083251953125, -0.18958473205566406, -0.18262863159179688, -0.1756725311279297, -0.1687164306640625, -0.1617603302001953, -0.15480422973632812, -0.14784812927246094, -0.14089202880859375, -0.13393592834472656, -0.12697982788085938, -0.12002372741699219, -0.113067626953125, -0.10611152648925781, -0.09915542602539062, -0.09219932556152344, -0.08524322509765625, -0.07828712463378906, -0.07133102416992188, -0.06437492370605469, -0.0574188232421875, -0.05046272277832031, -0.043506622314453125, -0.03655052185058594, -0.02959442138671875, -0.022638320922851562, -0.015682220458984375, -0.008726119995117188, -0.00177001953125, 0.0051860809326171875, 0.012142181396484375, 0.019098281860351562, 0.02605438232421875, 0.03301048278808594, 0.039966583251953125, 0.04692268371582031, 0.0538787841796875, 0.06083488464355469, 0.06779098510742188, 0.07474708557128906, 0.08170318603515625, 0.08865928649902344, 0.09561538696289062, 0.10257148742675781, 0.109527587890625, 0.11648368835449219, 0.12343978881835938, 0.13039588928222656, 0.13735198974609375, 0.14430809020996094, 0.15126419067382812, 0.1582202911376953, 0.1651763916015625, 0.1721324920654297, 0.17908859252929688, 0.18604469299316406, 0.19300079345703125, 0.19995689392089844, 0.20691299438476562, 0.2138690948486328, 0.2208251953125]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 2.0, 4.0, 3.0, 8.0, 13.0, 6.0, 14.0, 13.0, 19.0, 38.0, 51.0, 62.0, 95.0, 156.0, 229.0, 487.0, 990.0, 2279.0, 7571.0, 102447.0, 8256723.0, 11752.0, 3067.0, 1188.0, 562.0, 280.0, 157.0, 103.0, 79.0, 44.0, 30.0, 16.0, 29.0, 15.0, 8.0, 5.0, 4.0, 4.0, 9.0, 10.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0], "bins": [-1.8863255977630615, -1.8310967683792114, -1.7758679389953613, -1.7206391096115112, -1.6654102802276611, -1.6101815700531006, -1.554952621459961, -1.4997239112854004, -1.4444950819015503, -1.3892662525177002, -1.33403742313385, -1.27880859375, -1.22357976436615, -1.1683509349822998, -1.1131222248077393, -1.0578933954238892, -1.002664566040039, -0.947435736656189, -0.8922069072723389, -0.8369780778884888, -0.7817493081092834, -0.7265204787254333, -0.6712916493415833, -0.6160628795623779, -0.5608339309692383, -0.5056051015853882, -0.4503763020038605, -0.3951474726200104, -0.33991867303848267, -0.28468984365463257, -0.22946101427078247, -0.17423221468925476, -0.11900341510772705, -0.06377460062503815, -0.008545778691768646, 0.046683043241500854, 0.10191185772418976, 0.15714067220687866, 0.21236950159072876, 0.26759830117225647, 0.32282713055610657, 0.37805595993995667, 0.4332847595214844, 0.4885135889053345, 0.5437424182891846, 0.5989712476730347, 0.6542000770568848, 0.7094288468360901, 0.7646576762199402, 0.8198865056037903, 0.8751153349876404, 0.9303441047668457, 0.9855729341506958, 1.040801763534546, 1.096030592918396, 1.151259422302246, 1.2064882516860962, 1.2617170810699463, 1.3169459104537964, 1.3721747398376465, 1.4274035692214966, 1.4826323986053467, 1.5378611087799072, 1.5930899381637573, 1.6483187675476074]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 4.0, 2.0, 2.0, 2.0, 5.0, 2.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 4.0, 7.0, 4.0, 6.0, 9.0, 3.0, 3.0, 4.0, 3.0, 2.0, 4.0, 4.0, 4.0, 0.0, 2.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7297557592391968, -1.672987461090088, -1.6162190437316895, -1.559450626373291, -1.5026823282241821, -1.4459140300750732, -1.3891456127166748, -1.3323771953582764, -1.2756088972091675, -1.2188405990600586, -1.1620721817016602, -1.1053037643432617, -1.0485354661941528, -0.9917671084403992, -0.9349987506866455, -0.8782303929328918, -0.8214620351791382, -0.7646936774253845, -0.7079253196716309, -0.6511569619178772, -0.5943886041641235, -0.5376202464103699, -0.4808518886566162, -0.42408353090286255, -0.3673151731491089, -0.3105468153953552, -0.25377845764160156, -0.1970100998878479, -0.14024174213409424, -0.08347338438034058, -0.026705026626586914, 0.030063331127166748, 0.08683180809020996, 0.14360016584396362, 0.20036852359771729, 0.25713688135147095, 0.3139052391052246, 0.37067359685897827, 0.42744195461273193, 0.4842103123664856, 0.5409786701202393, 0.5977470278739929, 0.6545153856277466, 0.7112837433815002, 0.7680521011352539, 0.8248204588890076, 0.8815888166427612, 0.9383571743965149, 0.9951255321502686, 1.051893949508667, 1.1086622476577759, 1.1654305458068848, 1.2221989631652832, 1.2789673805236816, 1.3357356786727905, 1.3925039768218994, 1.4492723941802979, 1.5060408115386963, 1.5628091096878052, 1.619577407836914, 1.6763458251953125, 1.733114242553711, 1.7898825407028198, 1.8466508388519287, 1.9034192562103271]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 5.0, 3.0, 4.0, 7.0, 12.0, 8.0, 18.0, 28.0, 37.0, 46.0, 81.0, 98.0, 177.0, 362.0, 726.0, 1458.0, 3770.0, 10955.0, 45263.0, 217580.0, 190140.0, 37934.0, 9495.0, 3268.0, 1384.0, 568.0, 330.0, 196.0, 123.0, 60.0, 45.0, 26.0, 18.0, 15.0, 15.0, 6.0, 4.0, 3.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.162109375, -3.0765380859375, -2.990966796875, -2.9053955078125, -2.81982421875, -2.7342529296875, -2.648681640625, -2.5631103515625, -2.4775390625, -2.3919677734375, -2.306396484375, -2.2208251953125, -2.13525390625, -2.0496826171875, -1.964111328125, -1.8785400390625, -1.79296875, -1.7073974609375, -1.621826171875, -1.5362548828125, -1.45068359375, -1.3651123046875, -1.279541015625, -1.1939697265625, -1.1083984375, -1.0228271484375, -0.937255859375, -0.8516845703125, -0.76611328125, -0.6805419921875, -0.594970703125, -0.5093994140625, -0.423828125, -0.3382568359375, -0.252685546875, -0.1671142578125, -0.08154296875, 0.0040283203125, 0.089599609375, 0.1751708984375, 0.2607421875, 0.3463134765625, 0.431884765625, 0.5174560546875, 0.60302734375, 0.6885986328125, 0.774169921875, 0.8597412109375, 0.9453125, 1.0308837890625, 1.116455078125, 1.2020263671875, 1.28759765625, 1.3731689453125, 1.458740234375, 1.5443115234375, 1.6298828125, 1.7154541015625, 1.801025390625, 1.8865966796875, 1.97216796875, 2.0577392578125, 2.143310546875, 2.2288818359375, 2.314453125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 7.0, 6.0, 13.0, 13.0, 15.0, 29.0, 18.0, 31.0, 42.0, 44.0, 53.0, 53.0, 69.0, 68.0, 71.0, 78.0, 71.0, 49.0, 55.0, 35.0, 36.0, 32.0, 20.0, 18.0, 12.0, 13.0, 9.0, 7.0, 5.0, 7.0, 2.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2352294921875, -0.2275829315185547, -0.21993637084960938, -0.21228981018066406, -0.20464324951171875, -0.19699668884277344, -0.18935012817382812, -0.1817035675048828, -0.1740570068359375, -0.1664104461669922, -0.15876388549804688, -0.15111732482910156, -0.14347076416015625, -0.13582420349121094, -0.12817764282226562, -0.12053108215332031, -0.112884521484375, -0.10523796081542969, -0.09759140014648438, -0.08994483947753906, -0.08229827880859375, -0.07465171813964844, -0.06700515747070312, -0.05935859680175781, -0.0517120361328125, -0.04406547546386719, -0.036418914794921875, -0.028772354125976562, -0.02112579345703125, -0.013479232788085938, -0.005832672119140625, 0.0018138885498046875, 0.00946044921875, 0.017107009887695312, 0.024753570556640625, 0.03240013122558594, 0.04004669189453125, 0.04769325256347656, 0.055339813232421875, 0.06298637390136719, 0.0706329345703125, 0.07827949523925781, 0.08592605590820312, 0.09357261657714844, 0.10121917724609375, 0.10886573791503906, 0.11651229858398438, 0.12415885925292969, 0.131805419921875, 0.1394519805908203, 0.14709854125976562, 0.15474510192871094, 0.16239166259765625, 0.17003822326660156, 0.17768478393554688, 0.1853313446044922, 0.1929779052734375, 0.2006244659423828, 0.20827102661132812, 0.21591758728027344, 0.22356414794921875, 0.23121070861816406, 0.23885726928710938, 0.2465038299560547, 0.254150390625]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 8.0, 0.0, 7.0, 17.0, 33.0, 37.0, 75.0, 94.0, 82.0, 56.0, 22.0, 14.0, 10.0, 12.0, 4.0, 4.0, 3.0, 3.0, 5.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6260509490966797, -2.540443181991577, -2.4548354148864746, -2.369227409362793, -2.2836196422576904, -2.198011875152588, -2.1124041080474854, -2.026796340942383, -1.9411884546279907, -1.8555806875228882, -1.769972801208496, -1.6843650341033936, -1.598757266998291, -1.513149380683899, -1.4275416135787964, -1.3419337272644043, -1.2563259601593018, -1.1707181930541992, -1.0851103067398071, -0.9995025396347046, -0.9138947129249573, -0.82828688621521, -0.7426791191101074, -0.6570712924003601, -0.5714634656906128, -0.4858556389808655, -0.40024784207344055, -0.3146400451660156, -0.2290322184562683, -0.143424391746521, -0.05781662464141846, 0.027791202068328857, 0.11339879035949707, 0.1990066021680832, 0.2846144139766693, 0.37022221088409424, 0.45583003759384155, 0.5414378643035889, 0.6270456314086914, 0.7126534581184387, 0.798261284828186, 0.8838691115379333, 0.9694769382476807, 1.0550847053527832, 1.1406924724578857, 1.2263003587722778, 1.3119081258773804, 1.3975160121917725, 1.483123779296875, 1.5687315464019775, 1.6543394327163696, 1.7399471998214722, 1.8255550861358643, 1.9111628532409668, 1.9967706203460693, 2.082378387451172, 2.1679863929748535, 2.253594160079956, 2.3392019271850586, 2.4248099327087402, 2.5104176998138428, 2.5960254669189453, 2.681633234024048, 2.7672410011291504, 2.852848768234253]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 1.0, 4.0, 7.0, 14.0, 39.0, 90.0, 113.0, 96.0, 37.0, 13.0, 6.0, 8.0, 7.0, 7.0, 5.0, 0.0, 4.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5219764709472656, -1.4723279476165771, -1.4226793050765991, -1.3730307817459106, -1.3233821392059326, -1.2737336158752441, -1.2240850925445557, -1.1744364500045776, -1.1247878074645996, -1.0751392841339111, -1.025490641593933, -0.9758421182632446, -0.9261934757232666, -0.8765449523925781, -0.8268963694572449, -0.7772477865219116, -0.7275992631912231, -0.6779506802558899, -0.6283020973205566, -0.5786535739898682, -0.5290049314498901, -0.4793563783168793, -0.4297078251838684, -0.38005924224853516, -0.3304106593132019, -0.28076207637786865, -0.2311135083436966, -0.18146494030952454, -0.13181635737419128, -0.08216777443885803, -0.03251922130584717, 0.017129361629486084, 0.06677794456481934, 0.11642652004957199, 0.16607509553432465, 0.2157236635684967, 0.26537224650382996, 0.3150208294391632, 0.3646693825721741, 0.4143179655075073, 0.4639665484428406, 0.5136151313781738, 0.5632637143135071, 0.6129122972488403, 0.6625608205795288, 0.7122094631195068, 0.7618579864501953, 0.8115065693855286, 0.8611551523208618, 0.9108037352561951, 0.9604523181915283, 1.0101008415222168, 1.0597494840621948, 1.1093980073928833, 1.1590466499328613, 1.2086951732635498, 1.2583436965942383, 1.3079922199249268, 1.3576408624649048, 1.4072893857955933, 1.4569380283355713, 1.5065865516662598, 1.5562350749969482, 1.6058837175369263, 1.6555323600769043]}, "_wandb": {"runtime": 3709}}