{"train/loss": 3.8865, "train/learning_rate": 2.2959183673469388e-07, "train/epoch": 1.0, "train/global_step": 892, "_runtime": 7663, "_timestamp": 1646115992, "_step": 894, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 80.0, 811.0, 124.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-18.14687728881836, -11.145160675048828, -4.143444061279297, 2.8582725524902344, 9.859989166259766, 16.861705780029297, 23.863422393798828, 30.86513900756836, 37.86685562133789, 44.86857223510742, 51.87028884887695, 58.872005462646484, 65.87371826171875, 72.87544250488281, 79.87715148925781, 86.87887573242188, 93.88058471679688, 100.8823013305664, 107.88401794433594, 114.88573455810547, 121.887451171875, 128.88916015625, 135.89088439941406, 142.89260864257812, 149.89431762695312, 156.89602661132812, 163.8977508544922, 170.89947509765625, 177.90118408203125, 184.90289306640625, 191.9046173095703, 198.90634155273438, 205.90805053710938, 212.90975952148438, 219.91148376464844, 226.9132080078125, 233.9149169921875, 240.9166259765625, 247.91835021972656, 254.92007446289062, 261.9217834472656, 268.9234924316406, 275.92523193359375, 282.92694091796875, 289.92864990234375, 296.93035888671875, 303.93206787109375, 310.9338073730469, 317.9355163574219, 324.9372253417969, 331.93896484375, 338.940673828125, 345.9423828125, 352.944091796875, 359.94580078125, 366.9475402832031, 373.9492492675781, 380.9509582519531, 387.95269775390625, 394.95440673828125, 401.95611572265625, 408.95782470703125, 415.95953369140625, 422.9612731933594, 429.9629821777344]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 7.0, 3.0, 2.0, 7.0, 13.0, 10.0, 9.0, 13.0, 18.0, 16.0, 27.0, 34.0, 34.0, 24.0, 37.0, 40.0, 36.0, 39.0, 48.0, 42.0, 52.0, 48.0, 58.0, 36.0, 42.0, 42.0, 25.0, 38.0, 50.0, 24.0, 34.0, 22.0, 13.0, 17.0, 16.0, 11.0, 6.0, 6.0, 4.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.12158966064453, -41.808921813964844, -40.496253967285156, -39.18358612060547, -37.87091827392578, -36.55824661254883, -35.24557876586914, -33.93291091918945, -32.620243072509766, -31.307575225830078, -29.99490737915039, -28.68223762512207, -27.369569778442383, -26.056901931762695, -24.744232177734375, -23.431564331054688, -22.118896484375, -20.806228637695312, -19.493560791015625, -18.180891036987305, -16.868223190307617, -15.55555534362793, -14.242886543273926, -12.930217742919922, -11.617549896240234, -10.304882049560547, -8.992213249206543, -7.679544925689697, -6.366876602172852, -5.054208278656006, -3.74153995513916, -2.4288711547851562, -1.1162033081054688, 0.19646501541137695, 1.5091333389282227, 2.8218016624450684, 4.134469985961914, 5.44713830947876, 6.7598066329956055, 8.07247543334961, 9.385143280029297, 10.697811126708984, 12.010479927062988, 13.323148727416992, 14.63581657409668, 15.948484420776367, 17.261154174804688, 18.573822021484375, 19.886489868164062, 21.19915771484375, 22.511825561523438, 23.824495315551758, 25.137163162231445, 26.449831008911133, 27.762500762939453, 29.07516860961914, 30.387836456298828, 31.700504302978516, 33.0131721496582, 34.32583999633789, 35.638511657714844, 36.95117950439453, 38.26384735107422, 39.576515197753906, 40.889183044433594]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 2.0, 5.0, 5.0, 8.0, 7.0, 6.0, 13.0, 20.0, 12.0, 23.0, 20.0, 24.0, 24.0, 26.0, 37.0, 25.0, 31.0, 43.0, 29.0, 49.0, 49.0, 37.0, 45.0, 54.0, 34.0, 43.0, 32.0, 34.0, 44.0, 26.0, 29.0, 30.0, 30.0, 22.0, 16.0, 20.0, 16.0, 11.0, 6.0, 3.0, 2.0, 5.0, 5.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-2.474609375, -2.4059295654296875, -2.337249755859375, -2.2685699462890625, -2.19989013671875, -2.1312103271484375, -2.062530517578125, -1.9938507080078125, -1.9251708984375, -1.8564910888671875, -1.787811279296875, -1.7191314697265625, -1.65045166015625, -1.5817718505859375, -1.513092041015625, -1.4444122314453125, -1.375732421875, -1.3070526123046875, -1.238372802734375, -1.1696929931640625, -1.10101318359375, -1.0323333740234375, -0.963653564453125, -0.8949737548828125, -0.8262939453125, -0.7576141357421875, -0.688934326171875, -0.6202545166015625, -0.55157470703125, -0.4828948974609375, -0.414215087890625, -0.3455352783203125, -0.27685546875, -0.2081756591796875, -0.139495849609375, -0.0708160400390625, -0.00213623046875, 0.0665435791015625, 0.135223388671875, 0.2039031982421875, 0.2725830078125, 0.3412628173828125, 0.409942626953125, 0.4786224365234375, 0.54730224609375, 0.6159820556640625, 0.684661865234375, 0.7533416748046875, 0.822021484375, 0.8907012939453125, 0.959381103515625, 1.0280609130859375, 1.09674072265625, 1.1654205322265625, 1.234100341796875, 1.3027801513671875, 1.3714599609375, 1.4401397705078125, 1.508819580078125, 1.5774993896484375, 1.64617919921875, 1.7148590087890625, 1.783538818359375, 1.8522186279296875, 1.9208984375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 5.0, 3.0, 10.0, 17.0, 24.0, 20.0, 48.0, 59.0, 79.0, 127.0, 212.0, 395.0, 604.0, 1050.0, 1945.0, 4043.0, 8696.0, 21775.0, 66183.0, 348540.0, 2509631.0, 1040575.0, 131209.0, 35512.0, 12686.0, 5310.0, 2636.0, 1221.0, 669.0, 357.0, 226.0, 141.0, 92.0, 64.0, 45.0, 21.0, 11.0, 15.0, 7.0, 8.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.85546875, -7.6356201171875, -7.415771484375, -7.1959228515625, -6.97607421875, -6.7562255859375, -6.536376953125, -6.3165283203125, -6.0966796875, -5.8768310546875, -5.656982421875, -5.4371337890625, -5.21728515625, -4.9974365234375, -4.777587890625, -4.5577392578125, -4.337890625, -4.1180419921875, -3.898193359375, -3.6783447265625, -3.45849609375, -3.2386474609375, -3.018798828125, -2.7989501953125, -2.5791015625, -2.3592529296875, -2.139404296875, -1.9195556640625, -1.69970703125, -1.4798583984375, -1.260009765625, -1.0401611328125, -0.8203125, -0.6004638671875, -0.380615234375, -0.1607666015625, 0.05908203125, 0.2789306640625, 0.498779296875, 0.7186279296875, 0.9384765625, 1.1583251953125, 1.378173828125, 1.5980224609375, 1.81787109375, 2.0377197265625, 2.257568359375, 2.4774169921875, 2.697265625, 2.9171142578125, 3.136962890625, 3.3568115234375, 3.57666015625, 3.7965087890625, 4.016357421875, 4.2362060546875, 4.4560546875, 4.6759033203125, 4.895751953125, 5.1156005859375, 5.33544921875, 5.5552978515625, 5.775146484375, 5.9949951171875, 6.21484375]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 6.0, 11.0, 30.0, 35.0, 48.0, 86.0, 126.0, 224.0, 454.0, 778.0, 847.0, 588.0, 331.0, 180.0, 144.0, 66.0, 47.0, 33.0, 11.0, 10.0, 10.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3515625, -9.9036865234375, -9.455810546875, -9.0079345703125, -8.56005859375, -8.1121826171875, -7.664306640625, -7.2164306640625, -6.7685546875, -6.3206787109375, -5.872802734375, -5.4249267578125, -4.97705078125, -4.5291748046875, -4.081298828125, -3.6334228515625, -3.185546875, -2.7376708984375, -2.289794921875, -1.8419189453125, -1.39404296875, -0.9461669921875, -0.498291015625, -0.0504150390625, 0.3974609375, 0.8453369140625, 1.293212890625, 1.7410888671875, 2.18896484375, 2.6368408203125, 3.084716796875, 3.5325927734375, 3.98046875, 4.4283447265625, 4.876220703125, 5.3240966796875, 5.77197265625, 6.2198486328125, 6.667724609375, 7.1156005859375, 7.5634765625, 8.0113525390625, 8.459228515625, 8.9071044921875, 9.35498046875, 9.8028564453125, 10.250732421875, 10.6986083984375, 11.146484375, 11.5943603515625, 12.042236328125, 12.4901123046875, 12.93798828125, 13.3858642578125, 13.833740234375, 14.2816162109375, 14.7294921875, 15.1773681640625, 15.625244140625, 16.0731201171875, 16.52099609375, 16.9688720703125, 17.416748046875, 17.8646240234375, 18.3125]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 3.0, 1.0, 4.0, 5.0, 4.0, 8.0, 11.0, 28.0, 62.0, 118.0, 198.0, 392.0, 870.0, 4744.0, 739368.0, 3437093.0, 9067.0, 1240.0, 540.0, 237.0, 146.0, 66.0, 29.0, 21.0, 14.0, 6.0, 5.0, 1.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.9375, -48.27880859375, -46.6201171875, -44.96142578125, -43.302734375, -41.64404296875, -39.9853515625, -38.32666015625, -36.66796875, -35.00927734375, -33.3505859375, -31.69189453125, -30.033203125, -28.37451171875, -26.7158203125, -25.05712890625, -23.3984375, -21.73974609375, -20.0810546875, -18.42236328125, -16.763671875, -15.10498046875, -13.4462890625, -11.78759765625, -10.12890625, -8.47021484375, -6.8115234375, -5.15283203125, -3.494140625, -1.83544921875, -0.1767578125, 1.48193359375, 3.140625, 4.79931640625, 6.4580078125, 8.11669921875, 9.775390625, 11.43408203125, 13.0927734375, 14.75146484375, 16.41015625, 18.06884765625, 19.7275390625, 21.38623046875, 23.044921875, 24.70361328125, 26.3623046875, 28.02099609375, 29.6796875, 31.33837890625, 32.9970703125, 34.65576171875, 36.314453125, 37.97314453125, 39.6318359375, 41.29052734375, 42.94921875, 44.60791015625, 46.2666015625, 47.92529296875, 49.583984375, 51.24267578125, 52.9013671875, 54.56005859375, 56.21875]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 36.0, 639.0, 329.0, 8.0, 3.0], "bins": [-439.3196105957031, -432.0898742675781, -424.860107421875, -417.63037109375, -410.400634765625, -403.1708984375, -395.9411315917969, -388.7113952636719, -381.4816589355469, -374.2519226074219, -367.02215576171875, -359.79241943359375, -352.56268310546875, -345.33294677734375, -338.1031799316406, -330.8734436035156, -323.6437072753906, -316.4139709472656, -309.1842041015625, -301.9544677734375, -294.7247314453125, -287.4949951171875, -280.2652282714844, -273.0354919433594, -265.8057556152344, -258.5760192871094, -251.3462677001953, -244.11651611328125, -236.88677978515625, -229.6570281982422, -222.4272918701172, -215.19754028320312, -207.96778869628906, -200.738037109375, -193.50830078125, -186.27854919433594, -179.04881286621094, -171.81906127929688, -164.58932495117188, -157.3595733642578, -150.12982177734375, -142.9000701904297, -135.6703338623047, -128.44058227539062, -121.21084594726562, -113.98109436035156, -106.75135803222656, -99.5216064453125, -92.2918701171875, -85.06212615966797, -77.83238220214844, -70.6026382446289, -63.372894287109375, -56.14314651489258, -48.91340255737305, -41.683658599853516, -34.45391845703125, -27.22417449951172, -19.994430541992188, -12.764684677124023, -5.534940719604492, 1.6948051452636719, 8.924549102783203, 16.154293060302734, 23.3840389251709]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 3.0, 2.0, 6.0, 9.0, 5.0, 11.0, 7.0, 17.0, 19.0, 12.0, 16.0, 21.0, 31.0, 34.0, 25.0, 27.0, 24.0, 31.0, 42.0, 32.0, 49.0, 39.0, 42.0, 36.0, 30.0, 44.0, 44.0, 41.0, 47.0, 36.0, 31.0, 33.0, 23.0, 23.0, 17.0, 16.0, 8.0, 15.0, 14.0, 7.0, 6.0, 6.0, 7.0, 5.0, 5.0, 2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-34.06159591674805, -33.06204605102539, -32.062496185302734, -31.06294822692871, -30.063400268554688, -29.06385040283203, -28.064300537109375, -27.06475257873535, -26.065204620361328, -25.065654754638672, -24.06610679626465, -23.066556930541992, -22.06700897216797, -21.067459106445312, -20.067909240722656, -19.068361282348633, -18.068811416625977, -17.06926155090332, -16.069713592529297, -15.07016372680664, -14.070615768432617, -13.071065902709961, -12.071516990661621, -11.071968078613281, -10.072419166564941, -9.072870254516602, -8.073321342468262, -7.073771953582764, -6.074223041534424, -5.074674129486084, -4.075124740600586, -3.075575828552246, -2.0760269165039062, -1.0764778852462769, -0.07692885398864746, 0.9226202964782715, 1.9221692085266113, 2.921718120574951, 3.921267509460449, 4.920816421508789, 5.920365333557129, 6.919914245605469, 7.919463157653809, 8.919012069702148, 9.918561935424805, 10.918109893798828, 11.917659759521484, 12.917208671569824, 13.916757583618164, 14.916306495666504, 15.915855407714844, 16.9154052734375, 17.914953231811523, 18.91450309753418, 19.914051055908203, 20.91360092163086, 21.913150787353516, 22.912700653076172, 23.912248611450195, 24.91179847717285, 25.911346435546875, 26.91089630126953, 27.910446166992188, 28.90999412536621, 29.909542083740234]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 11.0, 9.0, 7.0, 8.0, 4.0, 14.0, 15.0, 17.0, 27.0, 26.0, 29.0, 24.0, 29.0, 35.0, 32.0, 28.0, 40.0, 42.0, 41.0, 37.0, 56.0, 46.0, 34.0, 25.0, 39.0, 39.0, 23.0, 31.0, 41.0, 31.0, 35.0, 22.0, 21.0, 16.0, 16.0, 14.0, 9.0, 4.0, 12.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.119140625, -2.049224853515625, -1.97930908203125, -1.909393310546875, -1.8394775390625, -1.769561767578125, -1.69964599609375, -1.629730224609375, -1.559814453125, -1.489898681640625, -1.41998291015625, -1.350067138671875, -1.2801513671875, -1.210235595703125, -1.14031982421875, -1.070404052734375, -1.00048828125, -0.930572509765625, -0.86065673828125, -0.790740966796875, -0.7208251953125, -0.650909423828125, -0.58099365234375, -0.511077880859375, -0.441162109375, -0.371246337890625, -0.30133056640625, -0.231414794921875, -0.1614990234375, -0.091583251953125, -0.02166748046875, 0.048248291015625, 0.1181640625, 0.188079833984375, 0.25799560546875, 0.327911376953125, 0.3978271484375, 0.467742919921875, 0.53765869140625, 0.607574462890625, 0.677490234375, 0.747406005859375, 0.81732177734375, 0.887237548828125, 0.9571533203125, 1.027069091796875, 1.09698486328125, 1.166900634765625, 1.23681640625, 1.306732177734375, 1.37664794921875, 1.446563720703125, 1.5164794921875, 1.586395263671875, 1.65631103515625, 1.726226806640625, 1.796142578125, 1.866058349609375, 1.93597412109375, 2.005889892578125, 2.0758056640625, 2.145721435546875, 2.21563720703125, 2.285552978515625, 2.35546875]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 2.0, 7.0, 9.0, 19.0, 18.0, 37.0, 52.0, 64.0, 108.0, 169.0, 269.0, 427.0, 688.0, 1175.0, 1912.0, 3253.0, 5510.0, 9558.0, 16713.0, 30342.0, 58561.0, 119883.0, 257755.0, 274944.0, 129951.0, 62384.0, 32435.0, 17835.0, 10010.0, 5913.0, 3373.0, 1961.0, 1225.0, 737.0, 432.0, 289.0, 186.0, 108.0, 74.0, 49.0, 37.0, 29.0, 11.0, 13.0, 6.0, 7.0, 5.0, 7.0, 3.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.307373046875, -0.29807281494140625, -0.2887725830078125, -0.27947235107421875, -0.270172119140625, -0.26087188720703125, -0.2515716552734375, -0.24227142333984375, -0.23297119140625, -0.22367095947265625, -0.2143707275390625, -0.20507049560546875, -0.195770263671875, -0.18647003173828125, -0.1771697998046875, -0.16786956787109375, -0.1585693359375, -0.14926910400390625, -0.1399688720703125, -0.13066864013671875, -0.121368408203125, -0.11206817626953125, -0.1027679443359375, -0.09346771240234375, -0.08416748046875, -0.07486724853515625, -0.0655670166015625, -0.05626678466796875, -0.046966552734375, -0.03766632080078125, -0.0283660888671875, -0.01906585693359375, -0.009765625, -0.00046539306640625, 0.0088348388671875, 0.01813507080078125, 0.027435302734375, 0.03673553466796875, 0.0460357666015625, 0.05533599853515625, 0.06463623046875, 0.07393646240234375, 0.0832366943359375, 0.09253692626953125, 0.101837158203125, 0.11113739013671875, 0.1204376220703125, 0.12973785400390625, 0.1390380859375, 0.14833831787109375, 0.1576385498046875, 0.16693878173828125, 0.176239013671875, 0.18553924560546875, 0.1948394775390625, 0.20413970947265625, 0.21343994140625, 0.22274017333984375, 0.2320404052734375, 0.24134063720703125, 0.250640869140625, 0.25994110107421875, 0.2692413330078125, 0.27854156494140625, 0.287841796875]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 7.0, 8.0, 7.0, 10.0, 10.0, 18.0, 17.0, 23.0, 27.0, 25.0, 36.0, 26.0, 21.0, 26.0, 31.0, 39.0, 37.0, 49.0, 43.0, 42.0, 1063.0, 31.0, 35.0, 51.0, 35.0, 29.0, 33.0, 35.0, 30.0, 26.0, 27.0, 15.0, 21.0, 15.0, 12.0, 16.0, 10.0, 7.0, 10.0, 8.0, 5.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-1.40234375, -1.35894775390625, -1.3155517578125, -1.27215576171875, -1.228759765625, -1.18536376953125, -1.1419677734375, -1.09857177734375, -1.05517578125, -1.01177978515625, -0.9683837890625, -0.92498779296875, -0.881591796875, -0.83819580078125, -0.7947998046875, -0.75140380859375, -0.7080078125, -0.66461181640625, -0.6212158203125, -0.57781982421875, -0.534423828125, -0.49102783203125, -0.4476318359375, -0.40423583984375, -0.36083984375, -0.31744384765625, -0.2740478515625, -0.23065185546875, -0.187255859375, -0.14385986328125, -0.1004638671875, -0.05706787109375, -0.013671875, 0.02972412109375, 0.0731201171875, 0.11651611328125, 0.159912109375, 0.20330810546875, 0.2467041015625, 0.29010009765625, 0.33349609375, 0.37689208984375, 0.4202880859375, 0.46368408203125, 0.507080078125, 0.55047607421875, 0.5938720703125, 0.63726806640625, 0.6806640625, 0.72406005859375, 0.7674560546875, 0.81085205078125, 0.854248046875, 0.89764404296875, 0.9410400390625, 0.98443603515625, 1.02783203125, 1.07122802734375, 1.1146240234375, 1.15802001953125, 1.201416015625, 1.24481201171875, 1.2882080078125, 1.33160400390625, 1.375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 5.0, 3.0, 6.0, 9.0, 12.0, 15.0, 25.0, 34.0, 54.0, 77.0, 102.0, 155.0, 199.0, 291.0, 460.0, 596.0, 879.0, 1364.0, 1924.0, 2820.0, 4186.0, 6235.0, 9334.0, 14100.0, 21499.0, 33157.0, 53094.0, 88695.0, 147402.0, 1250915.0, 175700.0, 106024.0, 63665.0, 39496.0, 25234.0, 16456.0, 10709.0, 7107.0, 4764.0, 3202.0, 2177.0, 1511.0, 1057.0, 735.0, 492.0, 364.0, 245.0, 176.0, 122.0, 87.0, 46.0, 43.0, 34.0, 18.0, 10.0, 10.0, 9.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.154541015625, -0.1495037078857422, -0.14446640014648438, -0.13942909240722656, -0.13439178466796875, -0.12935447692871094, -0.12431716918945312, -0.11927986145019531, -0.1142425537109375, -0.10920524597167969, -0.10416793823242188, -0.09913063049316406, -0.09409332275390625, -0.08905601501464844, -0.08401870727539062, -0.07898139953613281, -0.073944091796875, -0.06890678405761719, -0.06386947631835938, -0.05883216857910156, -0.05379486083984375, -0.04875755310058594, -0.043720245361328125, -0.03868293762207031, -0.0336456298828125, -0.028608322143554688, -0.023571014404296875, -0.018533706665039062, -0.01349639892578125, -0.008459091186523438, -0.003421783447265625, 0.0016155242919921875, 0.00665283203125, 0.011690139770507812, 0.016727447509765625, 0.021764755249023438, 0.02680206298828125, 0.03183937072753906, 0.036876678466796875, 0.04191398620605469, 0.0469512939453125, 0.05198860168457031, 0.057025909423828125, 0.06206321716308594, 0.06710052490234375, 0.07213783264160156, 0.07717514038085938, 0.08221244812011719, 0.087249755859375, 0.09228706359863281, 0.09732437133789062, 0.10236167907714844, 0.10739898681640625, 0.11243629455566406, 0.11747360229492188, 0.12251091003417969, 0.1275482177734375, 0.1325855255126953, 0.13762283325195312, 0.14266014099121094, 0.14769744873046875, 0.15273475646972656, 0.15777206420898438, 0.1628093719482422, 0.1678466796875]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 2.0, 8.0, 4.0, 7.0, 6.0, 14.0, 16.0, 15.0, 15.0, 14.0, 25.0, 27.0, 24.0, 35.0, 54.0, 49.0, 66.0, 85.0, 75.0, 71.0, 64.0, 56.0, 52.0, 33.0, 40.0, 23.0, 26.0, 14.0, 13.0, 15.0, 13.0, 9.0, 6.0, 7.0, 2.0, 5.0, 4.0, 2.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0016546249389648438, -0.0016033649444580078, -0.0015521049499511719, -0.001500844955444336, -0.0014495849609375, -0.001398324966430664, -0.0013470649719238281, -0.0012958049774169922, -0.0012445449829101562, -0.0011932849884033203, -0.0011420249938964844, -0.0010907649993896484, -0.0010395050048828125, -0.0009882450103759766, -0.0009369850158691406, -0.0008857250213623047, -0.0008344650268554688, -0.0007832050323486328, -0.0007319450378417969, -0.0006806850433349609, -0.000629425048828125, -0.0005781650543212891, -0.0005269050598144531, -0.0004756450653076172, -0.00042438507080078125, -0.0003731250762939453, -0.0003218650817871094, -0.00027060508728027344, -0.0002193450927734375, -0.00016808509826660156, -0.00011682510375976562, -6.556510925292969e-05, -1.430511474609375e-05, 3.695487976074219e-05, 8.821487426757812e-05, 0.00013947486877441406, 0.00019073486328125, 0.00024199485778808594, 0.0002932548522949219, 0.0003445148468017578, 0.00039577484130859375, 0.0004470348358154297, 0.0004982948303222656, 0.0005495548248291016, 0.0006008148193359375, 0.0006520748138427734, 0.0007033348083496094, 0.0007545948028564453, 0.0008058547973632812, 0.0008571147918701172, 0.0009083747863769531, 0.0009596347808837891, 0.001010894775390625, 0.001062154769897461, 0.0011134147644042969, 0.0011646747589111328, 0.0012159347534179688, 0.0012671947479248047, 0.0013184547424316406, 0.0013697147369384766, 0.0014209747314453125, 0.0014722347259521484, 0.0015234947204589844, 0.0015747547149658203, 0.0016260147094726562]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 3.0, 3.0, 6.0, 10.0, 15.0, 17.0, 19.0, 21.0, 37.0, 51.0, 38.0, 47.0, 60.0, 63.0, 104.0, 101.0, 191.0, 243.0, 462.0, 2576.0, 1014105.0, 28453.0, 693.0, 312.0, 210.0, 127.0, 120.0, 97.0, 53.0, 56.0, 51.0, 46.0, 35.0, 23.0, 24.0, 14.0, 8.0, 6.0, 6.0, 8.0, 10.0, 6.0, 6.0, 5.0, 5.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.0311431884765625, -0.030219078063964844, -0.029294967651367188, -0.02837085723876953, -0.027446746826171875, -0.02652263641357422, -0.025598526000976562, -0.024674415588378906, -0.02375030517578125, -0.022826194763183594, -0.021902084350585938, -0.02097797393798828, -0.020053863525390625, -0.01912975311279297, -0.018205642700195312, -0.017281532287597656, -0.016357421875, -0.015433311462402344, -0.014509201049804688, -0.013585090637207031, -0.012660980224609375, -0.011736869812011719, -0.010812759399414062, -0.009888648986816406, -0.00896453857421875, -0.008040428161621094, -0.0071163177490234375, -0.006192207336425781, -0.005268096923828125, -0.004343986511230469, -0.0034198760986328125, -0.0024957656860351562, -0.0015716552734375, -0.0006475448608398438, 0.0002765655517578125, 0.0012006759643554688, 0.002124786376953125, 0.0030488967895507812, 0.0039730072021484375, 0.004897117614746094, 0.00582122802734375, 0.006745338439941406, 0.0076694488525390625, 0.008593559265136719, 0.009517669677734375, 0.010441780090332031, 0.011365890502929688, 0.012290000915527344, 0.013214111328125, 0.014138221740722656, 0.015062332153320312, 0.01598644256591797, 0.016910552978515625, 0.01783466339111328, 0.018758773803710938, 0.019682884216308594, 0.02060699462890625, 0.021531105041503906, 0.022455215454101562, 0.02337932586669922, 0.024303436279296875, 0.02522754669189453, 0.026151657104492188, 0.027075767517089844, 0.0279998779296875]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 8.0, 585.0, 418.0, 6.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.012455353513360023, -0.012240350246429443, -0.012025347910821438, -0.011810344643890858, -0.011595341376960278, -0.011380338110029697, -0.011165335774421692, -0.010950332507491112, -0.010735329240560532, -0.010520325973629951, -0.010305323638021946, -0.010090320371091366, -0.009875317104160786, -0.009660313837230206, -0.0094453115016222, -0.00923030823469162, -0.00901530496776104, -0.00880030170083046, -0.008585299365222454, -0.008370296098291874, -0.008155292831361294, -0.007940289564430714, -0.007725287228822708, -0.007510283961892128, -0.0072952816262841225, -0.00708027882501483, -0.0068652755580842495, -0.006650272756814957, -0.0064352694898843765, -0.006220266688615084, -0.006005263887345791, -0.005790260620415211, -0.005575257353484631, -0.005360254552215338, -0.005145251285284758, -0.004930248484015465, -0.004715245217084885, -0.004500242415815592, -0.004285239614546299, -0.004070236347615719, -0.0038552330806851387, -0.0036402300465852022, -0.0034252270124852657, -0.003210224211215973, -0.0029952209442853928, -0.0027802181430161, -0.0025652151089161634, -0.002350212074816227, -0.002135209273546934, -0.0019202062394469976, -0.0017052032053470612, -0.0014902002876624465, -0.00127519725356251, -0.0010601942194625735, -0.0008451913017779589, -0.0006301882676780224, -0.00041518511716276407, -0.00020018211216665804, 1.4820892829447985e-05, 0.00022982386872172356, 0.00044482690282166004, 0.0006598299369215965, 0.0008748328546062112, 0.0010898358887061477, 0.0013048389228060842]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 2.0, 10.0, 13.0, 20.0, 9.0, 15.0, 19.0, 16.0, 23.0, 23.0, 26.0, 40.0, 32.0, 31.0, 42.0, 50.0, 37.0, 45.0, 42.0, 39.0, 37.0, 49.0, 46.0, 47.0, 24.0, 40.0, 36.0, 31.0, 31.0, 19.0, 21.0, 14.0, 9.0, 16.0, 10.0, 10.0, 5.0, 6.0, 2.0, 7.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.0008935332298278809, -0.000865500420331955, -0.000837467610836029, -0.0008094348013401031, -0.0007814019918441772, -0.0007533691823482513, -0.0007253363728523254, -0.0006973035633563995, -0.0006692707538604736, -0.0006412379443645477, -0.0006132051348686218, -0.0005851723253726959, -0.00055713951587677, -0.0005291067063808441, -0.0005010738968849182, -0.0004730410873889923, -0.0004450082778930664, -0.0004169754683971405, -0.0003889426589012146, -0.0003609098494052887, -0.0003328770399093628, -0.0003048442304134369, -0.000276811420917511, -0.0002487786114215851, -0.00022074580192565918, -0.00019271299242973328, -0.00016468018293380737, -0.00013664737343788147, -0.00010861456394195557, -8.058175444602966e-05, -5.254894495010376e-05, -2.4516135454177856e-05, 3.516674041748047e-06, 3.154948353767395e-05, 5.9582293033599854e-05, 8.761510252952576e-05, 0.00011564791202545166, 0.00014368072152137756, 0.00017171353101730347, 0.00019974634051322937, 0.00022777915000915527, 0.0002558119595050812, 0.0002838447690010071, 0.000311877578496933, 0.0003399103879928589, 0.0003679431974887848, 0.0003959760069847107, 0.0004240088164806366, 0.0004520416259765625, 0.0004800744354724884, 0.0005081072449684143, 0.0005361400544643402, 0.0005641728639602661, 0.000592205673456192, 0.0006202384829521179, 0.0006482712924480438, 0.0006763041019439697, 0.0007043369114398956, 0.0007323697209358215, 0.0007604025304317474, 0.0007884353399276733, 0.0008164681494235992, 0.0008445009589195251, 0.000872533768415451, 0.000900566577911377]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 5.0, 11.0, 9.0, 7.0, 8.0, 4.0, 14.0, 15.0, 17.0, 27.0, 26.0, 29.0, 24.0, 29.0, 35.0, 32.0, 28.0, 40.0, 42.0, 41.0, 37.0, 56.0, 46.0, 34.0, 25.0, 39.0, 39.0, 23.0, 31.0, 41.0, 31.0, 35.0, 22.0, 21.0, 16.0, 16.0, 14.0, 9.0, 4.0, 12.0, 7.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.119140625, -2.049224853515625, -1.97930908203125, -1.909393310546875, -1.8394775390625, -1.769561767578125, -1.69964599609375, -1.629730224609375, -1.559814453125, -1.489898681640625, -1.41998291015625, -1.350067138671875, -1.2801513671875, -1.210235595703125, -1.14031982421875, -1.070404052734375, -1.00048828125, -0.930572509765625, -0.86065673828125, -0.790740966796875, -0.7208251953125, -0.650909423828125, -0.58099365234375, -0.511077880859375, -0.441162109375, -0.371246337890625, -0.30133056640625, -0.231414794921875, -0.1614990234375, -0.091583251953125, -0.02166748046875, 0.048248291015625, 0.1181640625, 0.188079833984375, 0.25799560546875, 0.327911376953125, 0.3978271484375, 0.467742919921875, 0.53765869140625, 0.607574462890625, 0.677490234375, 0.747406005859375, 0.81732177734375, 0.887237548828125, 0.9571533203125, 1.027069091796875, 1.09698486328125, 1.166900634765625, 1.23681640625, 1.306732177734375, 1.37664794921875, 1.446563720703125, 1.5164794921875, 1.586395263671875, 1.65631103515625, 1.726226806640625, 1.796142578125, 1.866058349609375, 1.93597412109375, 2.005889892578125, 2.0758056640625, 2.145721435546875, 2.21563720703125, 2.285552978515625, 2.35546875]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 3.0, 8.0, 11.0, 16.0, 17.0, 24.0, 36.0, 55.0, 56.0, 96.0, 120.0, 142.0, 213.0, 315.0, 409.0, 601.0, 850.0, 1021.0, 1493.0, 2177.0, 3042.0, 4664.0, 6745.0, 11056.0, 19261.0, 43367.0, 139239.0, 427692.0, 250754.0, 68470.0, 26538.0, 13839.0, 8307.0, 5374.0, 3609.0, 2532.0, 1848.0, 1240.0, 887.0, 646.0, 484.0, 358.0, 230.0, 209.0, 143.0, 113.0, 75.0, 48.0, 35.0, 26.0, 26.0, 19.0, 12.0, 3.0, 2.0, 5.0, 1.0, 2.0, 3.0, 5.0], "bins": [-4.625, -4.47918701171875, -4.3333740234375, -4.18756103515625, -4.041748046875, -3.89593505859375, -3.7501220703125, -3.60430908203125, -3.45849609375, -3.31268310546875, -3.1668701171875, -3.02105712890625, -2.875244140625, -2.72943115234375, -2.5836181640625, -2.43780517578125, -2.2919921875, -2.14617919921875, -2.0003662109375, -1.85455322265625, -1.708740234375, -1.56292724609375, -1.4171142578125, -1.27130126953125, -1.12548828125, -0.97967529296875, -0.8338623046875, -0.68804931640625, -0.542236328125, -0.39642333984375, -0.2506103515625, -0.10479736328125, 0.041015625, 0.18682861328125, 0.3326416015625, 0.47845458984375, 0.624267578125, 0.77008056640625, 0.9158935546875, 1.06170654296875, 1.20751953125, 1.35333251953125, 1.4991455078125, 1.64495849609375, 1.790771484375, 1.93658447265625, 2.0823974609375, 2.22821044921875, 2.3740234375, 2.51983642578125, 2.6656494140625, 2.81146240234375, 2.957275390625, 3.10308837890625, 3.2489013671875, 3.39471435546875, 3.54052734375, 3.68634033203125, 3.8321533203125, 3.97796630859375, 4.123779296875, 4.26959228515625, 4.4154052734375, 4.56121826171875, 4.70703125]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 5.0, 8.0, 15.0, 7.0, 12.0, 16.0, 14.0, 31.0, 30.0, 33.0, 36.0, 38.0, 59.0, 56.0, 62.0, 122.0, 304.0, 1500.0, 184.0, 109.0, 54.0, 58.0, 48.0, 36.0, 44.0, 27.0, 29.0, 22.0, 14.0, 15.0, 19.0, 9.0, 8.0, 4.0, 6.0, 5.0, 9.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.84375, -7.5667724609375, -7.289794921875, -7.0128173828125, -6.73583984375, -6.4588623046875, -6.181884765625, -5.9049072265625, -5.6279296875, -5.3509521484375, -5.073974609375, -4.7969970703125, -4.52001953125, -4.2430419921875, -3.966064453125, -3.6890869140625, -3.412109375, -3.1351318359375, -2.858154296875, -2.5811767578125, -2.30419921875, -2.0272216796875, -1.750244140625, -1.4732666015625, -1.1962890625, -0.9193115234375, -0.642333984375, -0.3653564453125, -0.08837890625, 0.1885986328125, 0.465576171875, 0.7425537109375, 1.01953125, 1.2965087890625, 1.573486328125, 1.8504638671875, 2.12744140625, 2.4044189453125, 2.681396484375, 2.9583740234375, 3.2353515625, 3.5123291015625, 3.789306640625, 4.0662841796875, 4.34326171875, 4.6202392578125, 4.897216796875, 5.1741943359375, 5.451171875, 5.7281494140625, 6.005126953125, 6.2821044921875, 6.55908203125, 6.8360595703125, 7.113037109375, 7.3900146484375, 7.6669921875, 7.9439697265625, 8.220947265625, 8.4979248046875, 8.77490234375, 9.0518798828125, 9.328857421875, 9.6058349609375, 9.8828125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 3.0, 2.0, 7.0, 14.0, 13.0, 18.0, 10.0, 18.0, 18.0, 25.0, 21.0, 36.0, 36.0, 61.0, 78.0, 147.0, 364.0, 1596.0, 243237.0, 2895905.0, 3050.0, 480.0, 175.0, 102.0, 59.0, 41.0, 34.0, 28.0, 24.0, 30.0, 14.0, 13.0, 13.0, 6.0, 7.0, 7.0, 6.0, 4.0, 2.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0], "bins": [-42.9375, -41.8115234375, -40.685546875, -39.5595703125, -38.43359375, -37.3076171875, -36.181640625, -35.0556640625, -33.9296875, -32.8037109375, -31.677734375, -30.5517578125, -29.42578125, -28.2998046875, -27.173828125, -26.0478515625, -24.921875, -23.7958984375, -22.669921875, -21.5439453125, -20.41796875, -19.2919921875, -18.166015625, -17.0400390625, -15.9140625, -14.7880859375, -13.662109375, -12.5361328125, -11.41015625, -10.2841796875, -9.158203125, -8.0322265625, -6.90625, -5.7802734375, -4.654296875, -3.5283203125, -2.40234375, -1.2763671875, -0.150390625, 0.9755859375, 2.1015625, 3.2275390625, 4.353515625, 5.4794921875, 6.60546875, 7.7314453125, 8.857421875, 9.9833984375, 11.109375, 12.2353515625, 13.361328125, 14.4873046875, 15.61328125, 16.7392578125, 17.865234375, 18.9912109375, 20.1171875, 21.2431640625, 22.369140625, 23.4951171875, 24.62109375, 25.7470703125, 26.873046875, 27.9990234375, 29.125]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 6.0, 288.0, 709.0, 17.0], "bins": [-214.11477661132812, -210.6689453125, -207.22312927246094, -203.7772979736328, -200.33148193359375, -196.88565063476562, -193.43983459472656, -189.99400329589844, -186.54818725585938, -183.10235595703125, -179.6565399169922, -176.21070861816406, -172.764892578125, -169.31906127929688, -165.8732452392578, -162.4274139404297, -158.98159790039062, -155.5357666015625, -152.08995056152344, -148.6441192626953, -145.19830322265625, -141.75247192382812, -138.30665588378906, -134.86082458496094, -131.4149932861328, -127.96916961669922, -124.52334594726562, -121.07752227783203, -117.63169860839844, -114.18587493896484, -110.74005126953125, -107.29421997070312, -103.84840393066406, -100.40258026123047, -96.95675659179688, -93.51093292236328, -90.06510925292969, -86.6192855834961, -83.1734619140625, -79.72763061523438, -76.28180694580078, -72.83598327636719, -69.3901596069336, -65.9443359375, -62.498512268066406, -59.05268859863281, -55.60686111450195, -52.16103744506836, -48.715213775634766, -45.26939010620117, -41.82356643676758, -38.37773895263672, -34.931915283203125, -31.486093521118164, -28.040267944335938, -24.594444274902344, -21.14862060546875, -17.702796936035156, -14.256972312927246, -10.811147689819336, -7.365324020385742, -3.9195003509521484, -0.4736747741699219, 2.972148895263672, 6.417971611022949]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 2.0, 3.0, 4.0, 4.0, 3.0, 7.0, 10.0, 12.0, 9.0, 14.0, 6.0, 21.0, 19.0, 22.0, 11.0, 12.0, 22.0, 25.0, 37.0, 18.0, 22.0, 31.0, 35.0, 29.0, 30.0, 22.0, 27.0, 34.0, 31.0, 41.0, 30.0, 38.0, 35.0, 32.0, 33.0, 27.0, 22.0, 24.0, 28.0, 30.0, 26.0, 18.0, 11.0, 10.0, 13.0, 10.0, 15.0, 9.0, 12.0, 7.0, 2.0, 7.0, 2.0, 4.0, 1.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-18.270374298095703, -17.621904373168945, -16.973434448242188, -16.324962615966797, -15.676493644714355, -15.028022766113281, -14.379552841186523, -13.731082916259766, -13.082612991333008, -12.43414306640625, -11.785672187805176, -11.137202262878418, -10.48873233795166, -9.840261459350586, -9.191791534423828, -8.54332160949707, -7.894850730895996, -7.24638032913208, -6.597910404205322, -5.949440002441406, -5.300970077514648, -4.652499675750732, -4.004029273986816, -3.3555593490600586, -2.7070889472961426, -2.0586187839508057, -1.4101485013961792, -0.7616782188415527, -0.11320805549621582, 0.5352621078491211, 1.183732509613037, 1.832202434539795, 2.480672836303711, 3.129142999649048, 3.7776131629943848, 4.426083564758301, 5.074553489685059, 5.723023891448975, 6.371494293212891, 7.019964218139648, 7.6684346199035645, 8.31690502166748, 8.965374946594238, 9.613845825195312, 10.26231575012207, 10.910785675048828, 11.559255599975586, 12.207725524902344, 12.856196403503418, 13.504666328430176, 14.15313720703125, 14.801607131958008, 15.450077056884766, 16.098546981811523, 16.74701690673828, 17.395488739013672, 18.04395866394043, 18.692428588867188, 19.340898513793945, 19.989368438720703, 20.637840270996094, 21.28631019592285, 21.93478012084961, 22.583250045776367, 23.231719970703125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 5.0, 14.0, 4.0, 2.0, 7.0, 10.0, 14.0, 14.0, 14.0, 16.0, 29.0, 27.0, 27.0, 29.0, 31.0, 36.0, 37.0, 37.0, 29.0, 36.0, 45.0, 46.0, 49.0, 38.0, 38.0, 34.0, 34.0, 37.0, 27.0, 22.0, 40.0, 31.0, 40.0, 18.0, 17.0, 16.0, 15.0, 12.0, 14.0, 5.0, 4.0, 4.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.201171875, -2.124755859375, -2.04833984375, -1.971923828125, -1.8955078125, -1.819091796875, -1.74267578125, -1.666259765625, -1.58984375, -1.513427734375, -1.43701171875, -1.360595703125, -1.2841796875, -1.207763671875, -1.13134765625, -1.054931640625, -0.978515625, -0.902099609375, -0.82568359375, -0.749267578125, -0.6728515625, -0.596435546875, -0.52001953125, -0.443603515625, -0.3671875, -0.290771484375, -0.21435546875, -0.137939453125, -0.0615234375, 0.014892578125, 0.09130859375, 0.167724609375, 0.244140625, 0.320556640625, 0.39697265625, 0.473388671875, 0.5498046875, 0.626220703125, 0.70263671875, 0.779052734375, 0.85546875, 0.931884765625, 1.00830078125, 1.084716796875, 1.1611328125, 1.237548828125, 1.31396484375, 1.390380859375, 1.466796875, 1.543212890625, 1.61962890625, 1.696044921875, 1.7724609375, 1.848876953125, 1.92529296875, 2.001708984375, 2.078125, 2.154541015625, 2.23095703125, 2.307373046875, 2.3837890625, 2.460205078125, 2.53662109375, 2.613037109375, 2.689453125]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 7.0, 4.0, 2.0, 10.0, 19.0, 13.0, 17.0, 31.0, 33.0, 39.0, 54.0, 72.0, 79.0, 107.0, 155.0, 264.0, 433.0, 918.0, 2064.0, 5335.0, 15304.0, 55146.0, 334903.0, 2920697.0, 740116.0, 85440.0, 21371.0, 6708.0, 2437.0, 1034.0, 474.0, 255.0, 200.0, 136.0, 102.0, 79.0, 60.0, 41.0, 33.0, 24.0, 16.0, 20.0, 10.0, 7.0, 5.0, 6.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.9140625, -8.6231689453125, -8.332275390625, -8.0413818359375, -7.75048828125, -7.4595947265625, -7.168701171875, -6.8778076171875, -6.5869140625, -6.2960205078125, -6.005126953125, -5.7142333984375, -5.42333984375, -5.1324462890625, -4.841552734375, -4.5506591796875, -4.259765625, -3.9688720703125, -3.677978515625, -3.3870849609375, -3.09619140625, -2.8052978515625, -2.514404296875, -2.2235107421875, -1.9326171875, -1.6417236328125, -1.350830078125, -1.0599365234375, -0.76904296875, -0.4781494140625, -0.187255859375, 0.1036376953125, 0.39453125, 0.6854248046875, 0.976318359375, 1.2672119140625, 1.55810546875, 1.8489990234375, 2.139892578125, 2.4307861328125, 2.7216796875, 3.0125732421875, 3.303466796875, 3.5943603515625, 3.88525390625, 4.1761474609375, 4.467041015625, 4.7579345703125, 5.048828125, 5.3397216796875, 5.630615234375, 5.9215087890625, 6.21240234375, 6.5032958984375, 6.794189453125, 7.0850830078125, 7.3759765625, 7.6668701171875, 7.957763671875, 8.2486572265625, 8.53955078125, 8.8304443359375, 9.121337890625, 9.4122314453125, 9.703125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 6.0, 13.0, 9.0, 24.0, 28.0, 24.0, 58.0, 53.0, 95.0, 123.0, 186.0, 324.0, 455.0, 564.0, 573.0, 453.0, 333.0, 224.0, 149.0, 109.0, 84.0, 72.0, 39.0, 17.0, 21.0, 16.0, 6.0, 7.0, 1.0, 6.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.25390625, -6.95379638671875, -6.6536865234375, -6.35357666015625, -6.053466796875, -5.75335693359375, -5.4532470703125, -5.15313720703125, -4.85302734375, -4.55291748046875, -4.2528076171875, -3.95269775390625, -3.652587890625, -3.35247802734375, -3.0523681640625, -2.75225830078125, -2.4521484375, -2.15203857421875, -1.8519287109375, -1.55181884765625, -1.251708984375, -0.95159912109375, -0.6514892578125, -0.35137939453125, -0.05126953125, 0.24884033203125, 0.5489501953125, 0.84906005859375, 1.149169921875, 1.44927978515625, 1.7493896484375, 2.04949951171875, 2.349609375, 2.64971923828125, 2.9498291015625, 3.24993896484375, 3.550048828125, 3.85015869140625, 4.1502685546875, 4.45037841796875, 4.75048828125, 5.05059814453125, 5.3507080078125, 5.65081787109375, 5.950927734375, 6.25103759765625, 6.5511474609375, 6.85125732421875, 7.1513671875, 7.45147705078125, 7.7515869140625, 8.05169677734375, 8.351806640625, 8.65191650390625, 8.9520263671875, 9.25213623046875, 9.55224609375, 9.85235595703125, 10.1524658203125, 10.45257568359375, 10.752685546875, 11.05279541015625, 11.3529052734375, 11.65301513671875, 11.953125]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 4.0, 6.0, 13.0, 12.0, 17.0, 47.0, 70.0, 149.0, 415.0, 1562.0, 8881.0, 82928.0, 3079377.0, 974924.0, 39301.0, 4975.0, 1024.0, 297.0, 117.0, 62.0, 42.0, 18.0, 14.0, 11.0, 7.0, 4.0, 5.0, 5.0, 3.0], "bins": [-40.0625, -39.2252197265625, -38.387939453125, -37.5506591796875, -36.71337890625, -35.8760986328125, -35.038818359375, -34.2015380859375, -33.3642578125, -32.5269775390625, -31.689697265625, -30.8524169921875, -30.01513671875, -29.1778564453125, -28.340576171875, -27.5032958984375, -26.666015625, -25.8287353515625, -24.991455078125, -24.1541748046875, -23.31689453125, -22.4796142578125, -21.642333984375, -20.8050537109375, -19.9677734375, -19.1304931640625, -18.293212890625, -17.4559326171875, -16.61865234375, -15.7813720703125, -14.944091796875, -14.1068115234375, -13.26953125, -12.4322509765625, -11.594970703125, -10.7576904296875, -9.92041015625, -9.0831298828125, -8.245849609375, -7.4085693359375, -6.5712890625, -5.7340087890625, -4.896728515625, -4.0594482421875, -3.22216796875, -2.3848876953125, -1.547607421875, -0.7103271484375, 0.126953125, 0.9642333984375, 1.801513671875, 2.6387939453125, 3.47607421875, 4.3133544921875, 5.150634765625, 5.9879150390625, 6.8251953125, 7.6624755859375, 8.499755859375, 9.3370361328125, 10.17431640625, 11.0115966796875, 11.848876953125, 12.6861572265625, 13.5234375]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 27.0, 104.0, 347.0, 396.0, 125.0, 13.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.57048797607422, -50.687374114990234, -46.80426025390625, -42.921142578125, -39.03803253173828, -35.15491485595703, -31.271800994873047, -27.388687133789062, -23.505573272705078, -19.622459411621094, -15.739344596862793, -11.856229782104492, -7.973115921020508, -4.090002059936523, -0.20688629150390625, 3.676227569580078, 7.5593414306640625, 11.442455291748047, 15.325570106506348, 19.20868492126465, 23.091798782348633, 26.974912643432617, 30.858028411865234, 34.74114227294922, 38.6242561340332, 42.50736999511719, 46.39048385620117, 50.273597717285156, 54.156715393066406, 58.039825439453125, 61.922943115234375, 65.80606079101562, 69.68917846679688, 73.57229614257812, 77.45540618896484, 81.3385238647461, 85.22163391113281, 89.10475158691406, 92.98786926269531, 96.87097930908203, 100.75408935546875, 104.63720703125, 108.52031707763672, 112.40343475341797, 116.28654479980469, 120.16966247558594, 124.05278015136719, 127.9358901977539, 131.81900024414062, 135.70211791992188, 139.58523559570312, 143.4683380126953, 147.35145568847656, 151.2345733642578, 155.11769104003906, 159.00079345703125, 162.88392639160156, 166.7670440673828, 170.65016174316406, 174.53326416015625, 178.4163818359375, 182.29949951171875, 186.1826171875, 190.06573486328125, 193.94883728027344]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 11.0, 9.0, 10.0, 14.0, 18.0, 16.0, 20.0, 28.0, 24.0, 26.0, 27.0, 38.0, 50.0, 54.0, 49.0, 36.0, 48.0, 39.0, 46.0, 47.0, 34.0, 48.0, 35.0, 28.0, 31.0, 36.0, 24.0, 26.0, 14.0, 21.0, 12.0, 12.0, 8.0, 12.0, 4.0, 11.0, 9.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-33.08485412597656, -32.14472579956055, -31.204601287841797, -30.26447296142578, -29.3243465423584, -28.384220123291016, -27.444093704223633, -26.50396728515625, -25.563838958740234, -24.62371253967285, -23.68358612060547, -22.743457794189453, -21.80333137512207, -20.863204956054688, -19.923078536987305, -18.982952117919922, -18.04282569885254, -17.102699279785156, -16.162572860717773, -15.222445487976074, -14.282318115234375, -13.342191696166992, -12.40206527709961, -11.461938858032227, -10.521811485290527, -9.581685066223145, -8.641557693481445, -7.7014312744140625, -6.7613043785095215, -5.8211774826049805, -4.881051063537598, -3.9409241676330566, -3.0007991790771484, -2.0606722831726074, -1.1205456256866455, -0.1804189682006836, 0.7597079277038574, 1.6998348236083984, 2.6399612426757812, 3.5800881385803223, 4.520215034484863, 5.460341930389404, 6.400468826293945, 7.340595245361328, 8.280721664428711, 9.22084903717041, 10.160975456237793, 11.101102828979492, 12.041229248046875, 12.981355667114258, 13.921483039855957, 14.86160945892334, 15.801736831665039, 16.741863250732422, 17.681989669799805, 18.622116088867188, 19.562244415283203, 20.502370834350586, 21.44249725341797, 22.382625579833984, 23.322751998901367, 24.26287841796875, 25.203004837036133, 26.143131256103516, 27.0832576751709]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 3.0, 7.0, 11.0, 13.0, 16.0, 18.0, 26.0, 22.0, 20.0, 24.0, 33.0, 27.0, 40.0, 31.0, 32.0, 41.0, 39.0, 38.0, 40.0, 45.0, 38.0, 37.0, 27.0, 33.0, 26.0, 42.0, 31.0, 25.0, 39.0, 24.0, 15.0, 16.0, 20.0, 23.0, 18.0, 10.0, 9.0, 10.0, 8.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.349609375, -2.273834228515625, -2.19805908203125, -2.122283935546875, -2.0465087890625, -1.970733642578125, -1.89495849609375, -1.819183349609375, -1.743408203125, -1.667633056640625, -1.59185791015625, -1.516082763671875, -1.4403076171875, -1.364532470703125, -1.28875732421875, -1.212982177734375, -1.13720703125, -1.061431884765625, -0.98565673828125, -0.909881591796875, -0.8341064453125, -0.758331298828125, -0.68255615234375, -0.606781005859375, -0.531005859375, -0.455230712890625, -0.37945556640625, -0.303680419921875, -0.2279052734375, -0.152130126953125, -0.07635498046875, -0.000579833984375, 0.0751953125, 0.150970458984375, 0.22674560546875, 0.302520751953125, 0.3782958984375, 0.454071044921875, 0.52984619140625, 0.605621337890625, 0.681396484375, 0.757171630859375, 0.83294677734375, 0.908721923828125, 0.9844970703125, 1.060272216796875, 1.13604736328125, 1.211822509765625, 1.28759765625, 1.363372802734375, 1.43914794921875, 1.514923095703125, 1.5906982421875, 1.666473388671875, 1.74224853515625, 1.818023681640625, 1.893798828125, 1.969573974609375, 2.04534912109375, 2.121124267578125, 2.1968994140625, 2.272674560546875, 2.34844970703125, 2.424224853515625, 2.5]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 2.0, 6.0, 7.0, 10.0, 13.0, 23.0, 22.0, 31.0, 37.0, 69.0, 130.0, 153.0, 240.0, 359.0, 595.0, 878.0, 1377.0, 2264.0, 3643.0, 5677.0, 9110.0, 14894.0, 25566.0, 45515.0, 87254.0, 176757.0, 278830.0, 186683.0, 92144.0, 48040.0, 26888.0, 15976.0, 9325.0, 5908.0, 3677.0, 2298.0, 1457.0, 927.0, 601.0, 380.0, 263.0, 157.0, 123.0, 85.0, 58.0, 38.0, 25.0, 20.0, 5.0, 8.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.348388671875, -0.3383026123046875, -0.328216552734375, -0.3181304931640625, -0.30804443359375, -0.2979583740234375, -0.287872314453125, -0.2777862548828125, -0.2677001953125, -0.2576141357421875, -0.247528076171875, -0.2374420166015625, -0.22735595703125, -0.2172698974609375, -0.207183837890625, -0.1970977783203125, -0.18701171875, -0.1769256591796875, -0.166839599609375, -0.1567535400390625, -0.14666748046875, -0.1365814208984375, -0.126495361328125, -0.1164093017578125, -0.1063232421875, -0.0962371826171875, -0.086151123046875, -0.0760650634765625, -0.06597900390625, -0.0558929443359375, -0.045806884765625, -0.0357208251953125, -0.025634765625, -0.0155487060546875, -0.005462646484375, 0.0046234130859375, 0.01470947265625, 0.0247955322265625, 0.034881591796875, 0.0449676513671875, 0.0550537109375, 0.0651397705078125, 0.075225830078125, 0.0853118896484375, 0.09539794921875, 0.1054840087890625, 0.115570068359375, 0.1256561279296875, 0.1357421875, 0.1458282470703125, 0.155914306640625, 0.1660003662109375, 0.17608642578125, 0.1861724853515625, 0.196258544921875, 0.2063446044921875, 0.2164306640625, 0.2265167236328125, 0.236602783203125, 0.2466888427734375, 0.25677490234375, 0.2668609619140625, 0.276947021484375, 0.2870330810546875, 0.297119140625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 2.0, 6.0, 6.0, 4.0, 5.0, 7.0, 20.0, 10.0, 14.0, 18.0, 21.0, 21.0, 29.0, 21.0, 45.0, 24.0, 31.0, 41.0, 34.0, 37.0, 39.0, 41.0, 1072.0, 39.0, 34.0, 35.0, 40.0, 29.0, 32.0, 33.0, 35.0, 33.0, 23.0, 26.0, 26.0, 19.0, 21.0, 13.0, 11.0, 6.0, 7.0, 4.0, 6.0, 3.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-1.84765625, -1.79632568359375, -1.7449951171875, -1.69366455078125, -1.642333984375, -1.59100341796875, -1.5396728515625, -1.48834228515625, -1.43701171875, -1.38568115234375, -1.3343505859375, -1.28302001953125, -1.231689453125, -1.18035888671875, -1.1290283203125, -1.07769775390625, -1.0263671875, -0.97503662109375, -0.9237060546875, -0.87237548828125, -0.821044921875, -0.76971435546875, -0.7183837890625, -0.66705322265625, -0.61572265625, -0.56439208984375, -0.5130615234375, -0.46173095703125, -0.410400390625, -0.35906982421875, -0.3077392578125, -0.25640869140625, -0.205078125, -0.15374755859375, -0.1024169921875, -0.05108642578125, 0.000244140625, 0.05157470703125, 0.1029052734375, 0.15423583984375, 0.20556640625, 0.25689697265625, 0.3082275390625, 0.35955810546875, 0.410888671875, 0.46221923828125, 0.5135498046875, 0.56488037109375, 0.6162109375, 0.66754150390625, 0.7188720703125, 0.77020263671875, 0.821533203125, 0.87286376953125, 0.9241943359375, 0.97552490234375, 1.02685546875, 1.07818603515625, 1.1295166015625, 1.18084716796875, 1.232177734375, 1.28350830078125, 1.3348388671875, 1.38616943359375, 1.4375]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 5.0, 3.0, 11.0, 7.0, 14.0, 21.0, 36.0, 39.0, 63.0, 100.0, 160.0, 216.0, 355.0, 547.0, 764.0, 1140.0, 1590.0, 2337.0, 3463.0, 5059.0, 7529.0, 10881.0, 16783.0, 25824.0, 40759.0, 65301.0, 107008.0, 168674.0, 1244917.0, 145207.0, 90569.0, 55766.0, 35161.0, 22673.0, 14451.0, 9451.0, 6608.0, 4283.0, 2964.0, 2043.0, 1388.0, 941.0, 670.0, 415.0, 315.0, 214.0, 131.0, 101.0, 62.0, 55.0, 31.0, 15.0, 5.0, 7.0, 7.0, 5.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.1851806640625, -0.1790752410888672, -0.17296981811523438, -0.16686439514160156, -0.16075897216796875, -0.15465354919433594, -0.14854812622070312, -0.1424427032470703, -0.1363372802734375, -0.1302318572998047, -0.12412643432617188, -0.11802101135253906, -0.11191558837890625, -0.10581016540527344, -0.09970474243164062, -0.09359931945800781, -0.087493896484375, -0.08138847351074219, -0.07528305053710938, -0.06917762756347656, -0.06307220458984375, -0.05696678161621094, -0.050861358642578125, -0.04475593566894531, -0.0386505126953125, -0.03254508972167969, -0.026439666748046875, -0.020334243774414062, -0.01422882080078125, -0.008123397827148438, -0.002017974853515625, 0.0040874481201171875, 0.01019287109375, 0.016298294067382812, 0.022403717041015625, 0.028509140014648438, 0.03461456298828125, 0.04071998596191406, 0.046825408935546875, 0.05293083190917969, 0.0590362548828125, 0.06514167785644531, 0.07124710083007812, 0.07735252380371094, 0.08345794677734375, 0.08956336975097656, 0.09566879272460938, 0.10177421569824219, 0.107879638671875, 0.11398506164550781, 0.12009048461914062, 0.12619590759277344, 0.13230133056640625, 0.13840675354003906, 0.14451217651367188, 0.1506175994873047, 0.1567230224609375, 0.1628284454345703, 0.16893386840820312, 0.17503929138183594, 0.18114471435546875, 0.18725013732910156, 0.19335556030273438, 0.1994609832763672, 0.20556640625]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 5.0, 3.0, 10.0, 5.0, 16.0, 23.0, 18.0, 29.0, 54.0, 58.0, 83.0, 116.0, 134.0, 99.0, 88.0, 60.0, 54.0, 39.0, 22.0, 25.0, 15.0, 18.0, 11.0, 4.0, 3.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023593902587890625, -0.0022822022438049316, -0.0022050142288208008, -0.00212782621383667, -0.002050638198852539, -0.001973450183868408, -0.0018962621688842773, -0.0018190741539001465, -0.0017418861389160156, -0.0016646981239318848, -0.001587510108947754, -0.001510322093963623, -0.0014331340789794922, -0.0013559460639953613, -0.0012787580490112305, -0.0012015700340270996, -0.0011243820190429688, -0.0010471940040588379, -0.000970005989074707, -0.0008928179740905762, -0.0008156299591064453, -0.0007384419441223145, -0.0006612539291381836, -0.0005840659141540527, -0.0005068778991699219, -0.000429689884185791, -0.00035250186920166016, -0.0002753138542175293, -0.00019812583923339844, -0.00012093782424926758, -4.374980926513672e-05, 3.343820571899414e-05, 0.000110626220703125, 0.00018781423568725586, 0.0002650022506713867, 0.0003421902656555176, 0.00041937828063964844, 0.0004965662956237793, 0.0005737543106079102, 0.000650942325592041, 0.0007281303405761719, 0.0008053183555603027, 0.0008825063705444336, 0.0009596943855285645, 0.0010368824005126953, 0.0011140704154968262, 0.001191258430480957, 0.0012684464454650879, 0.0013456344604492188, 0.0014228224754333496, 0.0015000104904174805, 0.0015771985054016113, 0.0016543865203857422, 0.001731574535369873, 0.001808762550354004, 0.0018859505653381348, 0.0019631385803222656, 0.0020403265953063965, 0.0021175146102905273, 0.002194702625274658, 0.002271890640258789, 0.00234907865524292, 0.0024262666702270508, 0.0025034546852111816, 0.0025806427001953125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 1.0, 2.0, 9.0, 15.0, 11.0, 13.0, 20.0, 23.0, 41.0, 63.0, 79.0, 131.0, 208.0, 388.0, 975.0, 715407.0, 329354.0, 885.0, 334.0, 194.0, 125.0, 73.0, 68.0, 39.0, 30.0, 18.0, 11.0, 12.0, 12.0, 8.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04132080078125, -0.03994178771972656, -0.038562774658203125, -0.03718376159667969, -0.03580474853515625, -0.03442573547363281, -0.033046722412109375, -0.03166770935058594, -0.0302886962890625, -0.028909683227539062, -0.027530670166015625, -0.026151657104492188, -0.02477264404296875, -0.023393630981445312, -0.022014617919921875, -0.020635604858398438, -0.019256591796875, -0.017877578735351562, -0.016498565673828125, -0.015119552612304688, -0.01374053955078125, -0.012361526489257812, -0.010982513427734375, -0.009603500366210938, -0.0082244873046875, -0.0068454742431640625, -0.005466461181640625, -0.0040874481201171875, -0.00270843505859375, -0.0013294219970703125, 4.9591064453125e-05, 0.0014286041259765625, 0.0028076171875, 0.0041866302490234375, 0.005565643310546875, 0.0069446563720703125, 0.00832366943359375, 0.009702682495117188, 0.011081695556640625, 0.012460708618164062, 0.0138397216796875, 0.015218734741210938, 0.016597747802734375, 0.017976760864257812, 0.01935577392578125, 0.020734786987304688, 0.022113800048828125, 0.023492813110351562, 0.024871826171875, 0.026250839233398438, 0.027629852294921875, 0.029008865356445312, 0.03038787841796875, 0.03176689147949219, 0.033145904541015625, 0.03452491760253906, 0.0359039306640625, 0.03728294372558594, 0.038661956787109375, 0.04004096984863281, 0.04141998291015625, 0.04279899597167969, 0.044178009033203125, 0.04555702209472656, 0.04693603515625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 2.0, 9.0, 10.0, 14.0, 11.0, 20.0, 38.0, 37.0, 54.0, 81.0, 102.0, 107.0, 122.0, 93.0, 81.0, 66.0, 41.0, 34.0, 26.0, 13.0, 13.0, 7.0, 7.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006987580563873053, -0.0006756514776498079, -0.0006525448989123106, -0.0006294383201748133, -0.0006063317414373159, -0.0005832251626998186, -0.0005601185839623213, -0.0005370120634324849, -0.0005139054846949875, -0.0004907989059574902, -0.0004676923272199929, -0.00044458574848249555, -0.0004214791988488287, -0.00039837262011133134, -0.000375266041373834, -0.00035215949174016714, -0.00032905288389883935, -0.000305946305161342, -0.0002828397264238447, -0.0002597331767901778, -0.0002366265980526805, -0.00021352001931518316, -0.00019041344057768583, -0.00016730687639210373, -0.0001442002976546064, -0.00012109372619306669, -9.798715473152697e-05, -7.488057599402964e-05, -5.1774004532489926e-05, -2.866743307095021e-05, -5.56085433345288e-06, 1.754570985212922e-05, 4.065228858962655e-05, 6.375886005116627e-05, 8.686543151270598e-05, 0.00010997201025020331, 0.0001330785744357854, 0.00015618515317328274, 0.00017929173191078007, 0.00020239829609636217, 0.0002255048748338595, 0.0002486114390194416, 0.00027171801775693893, 0.00029482459649443626, 0.0003179311752319336, 0.0003410377539694309, 0.00036414433270692825, 0.0003872508823405951, 0.00041035746107809246, 0.0004334640398155898, 0.0004565706185530871, 0.000479677168186754, 0.0005027837469242513, 0.0005258903256617486, 0.000548996904399246, 0.0005721034831367433, 0.0005952100618742406, 0.000618316640611738, 0.0006414232193492353, 0.0006645297980867326, 0.00068763637682423, 0.0007107428973540664, 0.0007338494760915637, 0.000756956054829061, 0.0007800626335665584]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 6.0, 1.0, 4.0, 1.0, 0.0, 6.0, 5.0, 7.0, 5.0, 14.0, 17.0, 12.0, 18.0, 18.0, 19.0, 24.0, 20.0, 36.0, 26.0, 38.0, 35.0, 34.0, 36.0, 45.0, 50.0, 42.0, 44.0, 39.0, 42.0, 40.0, 45.0, 39.0, 30.0, 32.0, 24.0, 24.0, 19.0, 18.0, 16.0, 20.0, 5.0, 7.0, 10.0, 5.0, 15.0, 5.0, 6.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.000858604907989502, -0.0008321870118379593, -0.0008057691156864166, -0.000779351219534874, -0.0007529333233833313, -0.0007265154272317886, -0.000700097531080246, -0.0006736796349287033, -0.0006472617387771606, -0.000620843842625618, -0.0005944259464740753, -0.0005680080503225327, -0.00054159015417099, -0.0005151722580194473, -0.0004887543618679047, -0.000462336465716362, -0.00043591856956481934, -0.00040950067341327667, -0.000383082777261734, -0.00035666488111019135, -0.0003302469849586487, -0.000303829088807106, -0.00027741119265556335, -0.0002509932965040207, -0.00022457540035247803, -0.00019815750420093536, -0.0001717396080493927, -0.00014532171189785004, -0.00011890381574630737, -9.248591959476471e-05, -6.606802344322205e-05, -3.965012729167938e-05, -1.3232231140136719e-05, 1.3185665011405945e-05, 3.960356116294861e-05, 6.602145731449127e-05, 9.243935346603394e-05, 0.0001188572496175766, 0.00014527514576911926, 0.00017169304192066193, 0.0001981109380722046, 0.00022452883422374725, 0.0002509467303752899, 0.0002773646265268326, 0.00030378252267837524, 0.0003302004188299179, 0.00035661831498146057, 0.00038303621113300323, 0.0004094541072845459, 0.00043587200343608856, 0.0004622898995876312, 0.0004887077957391739, 0.0005151256918907166, 0.0005415435880422592, 0.0005679614841938019, 0.0005943793803453445, 0.0006207972764968872, 0.0006472151726484299, 0.0006736330687999725, 0.0007000509649515152, 0.0007264688611030579, 0.0007528867572546005, 0.0007793046534061432, 0.0008057225495576859, 0.0008321404457092285]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 3.0, 7.0, 11.0, 13.0, 16.0, 18.0, 26.0, 22.0, 20.0, 24.0, 33.0, 27.0, 40.0, 31.0, 32.0, 41.0, 39.0, 38.0, 40.0, 45.0, 38.0, 37.0, 27.0, 33.0, 26.0, 42.0, 31.0, 26.0, 38.0, 24.0, 15.0, 16.0, 20.0, 23.0, 18.0, 10.0, 9.0, 10.0, 8.0, 3.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-2.349609375, -2.273834228515625, -2.19805908203125, -2.122283935546875, -2.0465087890625, -1.970733642578125, -1.89495849609375, -1.819183349609375, -1.743408203125, -1.667633056640625, -1.59185791015625, -1.516082763671875, -1.4403076171875, -1.364532470703125, -1.28875732421875, -1.212982177734375, -1.13720703125, -1.061431884765625, -0.98565673828125, -0.909881591796875, -0.8341064453125, -0.758331298828125, -0.68255615234375, -0.606781005859375, -0.531005859375, -0.455230712890625, -0.37945556640625, -0.303680419921875, -0.2279052734375, -0.152130126953125, -0.07635498046875, -0.000579833984375, 0.0751953125, 0.150970458984375, 0.22674560546875, 0.302520751953125, 0.3782958984375, 0.454071044921875, 0.52984619140625, 0.605621337890625, 0.681396484375, 0.757171630859375, 0.83294677734375, 0.908721923828125, 0.9844970703125, 1.060272216796875, 1.13604736328125, 1.211822509765625, 1.28759765625, 1.363372802734375, 1.43914794921875, 1.514923095703125, 1.5906982421875, 1.666473388671875, 1.74224853515625, 1.818023681640625, 1.893798828125, 1.969573974609375, 2.04534912109375, 2.121124267578125, 2.1968994140625, 2.272674560546875, 2.34844970703125, 2.424224853515625, 2.5]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [5.0, 1.0, 4.0, 7.0, 5.0, 13.0, 13.0, 13.0, 20.0, 26.0, 22.0, 32.0, 44.0, 64.0, 89.0, 127.0, 216.0, 308.0, 554.0, 837.0, 1390.0, 2479.0, 5205.0, 14969.0, 76324.0, 468078.0, 394029.0, 60259.0, 12902.0, 4643.0, 2331.0, 1278.0, 815.0, 469.0, 308.0, 210.0, 132.0, 95.0, 75.0, 53.0, 30.0, 20.0, 20.0, 16.0, 11.0, 10.0, 5.0, 9.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.66015625, -3.51904296875, -3.3779296875, -3.23681640625, -3.095703125, -2.95458984375, -2.8134765625, -2.67236328125, -2.53125, -2.39013671875, -2.2490234375, -2.10791015625, -1.966796875, -1.82568359375, -1.6845703125, -1.54345703125, -1.40234375, -1.26123046875, -1.1201171875, -0.97900390625, -0.837890625, -0.69677734375, -0.5556640625, -0.41455078125, -0.2734375, -0.13232421875, 0.0087890625, 0.14990234375, 0.291015625, 0.43212890625, 0.5732421875, 0.71435546875, 0.85546875, 0.99658203125, 1.1376953125, 1.27880859375, 1.419921875, 1.56103515625, 1.7021484375, 1.84326171875, 1.984375, 2.12548828125, 2.2666015625, 2.40771484375, 2.548828125, 2.68994140625, 2.8310546875, 2.97216796875, 3.11328125, 3.25439453125, 3.3955078125, 3.53662109375, 3.677734375, 3.81884765625, 3.9599609375, 4.10107421875, 4.2421875, 4.38330078125, 4.5244140625, 4.66552734375, 4.806640625, 4.94775390625, 5.0888671875, 5.22998046875, 5.37109375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 2.0, 3.0, 4.0, 6.0, 6.0, 6.0, 13.0, 10.0, 15.0, 9.0, 18.0, 24.0, 20.0, 23.0, 24.0, 31.0, 33.0, 56.0, 39.0, 52.0, 48.0, 66.0, 166.0, 1658.0, 225.0, 78.0, 54.0, 52.0, 28.0, 35.0, 37.0, 29.0, 19.0, 13.0, 24.0, 19.0, 21.0, 19.0, 10.0, 15.0, 9.0, 11.0, 8.0, 3.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0], "bins": [-8.9921875, -8.6981201171875, -8.404052734375, -8.1099853515625, -7.81591796875, -7.5218505859375, -7.227783203125, -6.9337158203125, -6.6396484375, -6.3455810546875, -6.051513671875, -5.7574462890625, -5.46337890625, -5.1693115234375, -4.875244140625, -4.5811767578125, -4.287109375, -3.9930419921875, -3.698974609375, -3.4049072265625, -3.11083984375, -2.8167724609375, -2.522705078125, -2.2286376953125, -1.9345703125, -1.6405029296875, -1.346435546875, -1.0523681640625, -0.75830078125, -0.4642333984375, -0.170166015625, 0.1239013671875, 0.41796875, 0.7120361328125, 1.006103515625, 1.3001708984375, 1.59423828125, 1.8883056640625, 2.182373046875, 2.4764404296875, 2.7705078125, 3.0645751953125, 3.358642578125, 3.6527099609375, 3.94677734375, 4.2408447265625, 4.534912109375, 4.8289794921875, 5.123046875, 5.4171142578125, 5.711181640625, 6.0052490234375, 6.29931640625, 6.5933837890625, 6.887451171875, 7.1815185546875, 7.4755859375, 7.7696533203125, 8.063720703125, 8.3577880859375, 8.65185546875, 8.9459228515625, 9.239990234375, 9.5340576171875, 9.828125]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 2.0, 2.0, 7.0, 6.0, 15.0, 9.0, 13.0, 23.0, 15.0, 22.0, 21.0, 18.0, 25.0, 41.0, 44.0, 75.0, 122.0, 179.0, 386.0, 1431.0, 9880.0, 2965010.0, 162862.0, 3837.0, 797.0, 269.0, 150.0, 93.0, 72.0, 59.0, 39.0, 33.0, 18.0, 22.0, 21.0, 16.0, 15.0, 9.0, 13.0, 8.0, 7.0, 5.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.546875, -21.879638671875, -21.21240234375, -20.545166015625, -19.8779296875, -19.210693359375, -18.54345703125, -17.876220703125, -17.208984375, -16.541748046875, -15.87451171875, -15.207275390625, -14.5400390625, -13.872802734375, -13.20556640625, -12.538330078125, -11.87109375, -11.203857421875, -10.53662109375, -9.869384765625, -9.2021484375, -8.534912109375, -7.86767578125, -7.200439453125, -6.533203125, -5.865966796875, -5.19873046875, -4.531494140625, -3.8642578125, -3.197021484375, -2.52978515625, -1.862548828125, -1.1953125, -0.528076171875, 0.13916015625, 0.806396484375, 1.4736328125, 2.140869140625, 2.80810546875, 3.475341796875, 4.142578125, 4.809814453125, 5.47705078125, 6.144287109375, 6.8115234375, 7.478759765625, 8.14599609375, 8.813232421875, 9.48046875, 10.147705078125, 10.81494140625, 11.482177734375, 12.1494140625, 12.816650390625, 13.48388671875, 14.151123046875, 14.818359375, 15.485595703125, 16.15283203125, 16.820068359375, 17.4873046875, 18.154541015625, 18.82177734375, 19.489013671875, 20.15625]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 12.0, 74.0, 173.0, 282.0, 283.0, 114.0, 47.0, 14.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.117015838623047, -28.435546875, -27.754079818725586, -27.07261085510254, -26.391141891479492, -25.709674835205078, -25.02820587158203, -24.346736907958984, -23.665267944335938, -22.98379898071289, -22.302331924438477, -21.62086296081543, -20.939393997192383, -20.25792694091797, -19.576457977294922, -18.894989013671875, -18.21352195739746, -17.532052993774414, -16.8505859375, -16.169116973876953, -15.487648010253906, -14.806180000305176, -14.124711990356445, -13.443243026733398, -12.761775016784668, -12.080307006835938, -11.39883804321289, -10.71737003326416, -10.03590202331543, -9.354433059692383, -8.672965049743652, -7.991496562957764, -7.310026168823242, -6.6285576820373535, -5.947089195251465, -5.265621185302734, -4.584152698516846, -3.902684211730957, -3.2212162017822266, -2.539747714996338, -1.8582792282104492, -1.17681086063385, -0.495342493057251, 0.1861257553100586, 0.8675942420959473, 1.549062728881836, 2.2305307388305664, 2.911999225616455, 3.5934677124023438, 4.274936199188232, 4.956404685974121, 5.637872695922852, 6.31934118270874, 7.000809669494629, 7.682277679443359, 8.363746643066406, 9.045214653015137, 9.726682662963867, 10.408151626586914, 11.089619636535645, 11.771087646484375, 12.452556610107422, 13.134024620056152, 13.815492630004883, 14.49696159362793]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 6.0, 3.0, 4.0, 4.0, 2.0, 6.0, 8.0, 3.0, 4.0, 15.0, 12.0, 13.0, 11.0, 17.0, 27.0, 19.0, 27.0, 27.0, 24.0, 35.0, 30.0, 41.0, 34.0, 43.0, 30.0, 40.0, 40.0, 32.0, 30.0, 31.0, 32.0, 45.0, 43.0, 30.0, 33.0, 22.0, 25.0, 18.0, 15.0, 14.0, 26.0, 17.0, 16.0, 10.0, 4.0, 10.0, 6.0, 8.0, 6.0, 3.0, 7.0, 1.0, 2.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.708343505859375, -23.843759536743164, -22.979175567626953, -22.114591598510742, -21.25000762939453, -20.38542366027832, -19.52083969116211, -18.65625762939453, -17.791671752929688, -16.927087783813477, -16.062503814697266, -15.197919845581055, -14.333335876464844, -13.468751907348633, -12.604168891906738, -11.739584922790527, -10.875001907348633, -10.010417938232422, -9.145833969116211, -8.28125, -7.416666507720947, -6.552082538604736, -5.687499046325684, -4.822915077209473, -3.9583311080932617, -3.093747138977051, -2.229163408279419, -1.364579677581787, -0.49999570846557617, 0.36458826065063477, 1.2291717529296875, 2.0937557220458984, 2.9583396911621094, 3.8229236602783203, 4.687507629394531, 5.552091121673584, 6.416675090789795, 7.281259059906006, 8.145842552185059, 9.01042652130127, 9.87501049041748, 10.739594459533691, 11.604178428649902, 12.468761444091797, 13.333345413208008, 14.197929382324219, 15.06251335144043, 15.92709732055664, 16.79168128967285, 17.656265258789062, 18.520849227905273, 19.385433197021484, 20.250017166137695, 21.114601135253906, 21.979183197021484, 22.843769073486328, 23.708351135253906, 24.572935104370117, 25.437519073486328, 26.30210304260254, 27.16668701171875, 28.03127098083496, 28.895854949951172, 29.76043701171875, 30.625022888183594]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 9.0, 6.0, 8.0, 9.0, 15.0, 20.0, 15.0, 22.0, 20.0, 30.0, 31.0, 24.0, 35.0, 30.0, 39.0, 39.0, 48.0, 35.0, 39.0, 42.0, 41.0, 28.0, 47.0, 22.0, 34.0, 26.0, 36.0, 31.0, 36.0, 21.0, 22.0, 22.0, 24.0, 20.0, 18.0, 11.0, 8.0, 11.0, 7.0, 2.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-2.56640625, -2.487274169921875, -2.40814208984375, -2.329010009765625, -2.2498779296875, -2.170745849609375, -2.09161376953125, -2.012481689453125, -1.933349609375, -1.854217529296875, -1.77508544921875, -1.695953369140625, -1.6168212890625, -1.537689208984375, -1.45855712890625, -1.379425048828125, -1.30029296875, -1.221160888671875, -1.14202880859375, -1.062896728515625, -0.9837646484375, -0.904632568359375, -0.82550048828125, -0.746368408203125, -0.667236328125, -0.588104248046875, -0.50897216796875, -0.429840087890625, -0.3507080078125, -0.271575927734375, -0.19244384765625, -0.113311767578125, -0.0341796875, 0.044952392578125, 0.12408447265625, 0.203216552734375, 0.2823486328125, 0.361480712890625, 0.44061279296875, 0.519744873046875, 0.598876953125, 0.678009033203125, 0.75714111328125, 0.836273193359375, 0.9154052734375, 0.994537353515625, 1.07366943359375, 1.152801513671875, 1.23193359375, 1.311065673828125, 1.39019775390625, 1.469329833984375, 1.5484619140625, 1.627593994140625, 1.70672607421875, 1.785858154296875, 1.864990234375, 1.944122314453125, 2.02325439453125, 2.102386474609375, 2.1815185546875, 2.260650634765625, 2.33978271484375, 2.418914794921875, 2.498046875]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 7.0, 10.0, 7.0, 9.0, 5.0, 16.0, 18.0, 24.0, 24.0, 31.0, 43.0, 58.0, 92.0, 138.0, 317.0, 766.0, 1862.0, 4808.0, 13799.0, 50967.0, 474368.0, 3183410.0, 394846.0, 48280.0, 12980.0, 4371.0, 1534.0, 672.0, 306.0, 136.0, 98.0, 66.0, 47.0, 38.0, 37.0, 29.0, 16.0, 14.0, 7.0, 9.0, 5.0, 4.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7421875, -9.4326171875, -9.123046875, -8.8134765625, -8.50390625, -8.1943359375, -7.884765625, -7.5751953125, -7.265625, -6.9560546875, -6.646484375, -6.3369140625, -6.02734375, -5.7177734375, -5.408203125, -5.0986328125, -4.7890625, -4.4794921875, -4.169921875, -3.8603515625, -3.55078125, -3.2412109375, -2.931640625, -2.6220703125, -2.3125, -2.0029296875, -1.693359375, -1.3837890625, -1.07421875, -0.7646484375, -0.455078125, -0.1455078125, 0.1640625, 0.4736328125, 0.783203125, 1.0927734375, 1.40234375, 1.7119140625, 2.021484375, 2.3310546875, 2.640625, 2.9501953125, 3.259765625, 3.5693359375, 3.87890625, 4.1884765625, 4.498046875, 4.8076171875, 5.1171875, 5.4267578125, 5.736328125, 6.0458984375, 6.35546875, 6.6650390625, 6.974609375, 7.2841796875, 7.59375, 7.9033203125, 8.212890625, 8.5224609375, 8.83203125, 9.1416015625, 9.451171875, 9.7607421875, 10.0703125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 8.0, 8.0, 10.0, 7.0, 15.0, 20.0, 35.0, 49.0, 59.0, 80.0, 110.0, 168.0, 216.0, 314.0, 464.0, 562.0, 533.0, 435.0, 271.0, 208.0, 158.0, 104.0, 83.0, 39.0, 30.0, 21.0, 16.0, 16.0, 13.0, 12.0, 6.0, 2.0, 3.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5078125, -8.2232666015625, -7.938720703125, -7.6541748046875, -7.36962890625, -7.0850830078125, -6.800537109375, -6.5159912109375, -6.2314453125, -5.9468994140625, -5.662353515625, -5.3778076171875, -5.09326171875, -4.8087158203125, -4.524169921875, -4.2396240234375, -3.955078125, -3.6705322265625, -3.385986328125, -3.1014404296875, -2.81689453125, -2.5323486328125, -2.247802734375, -1.9632568359375, -1.6787109375, -1.3941650390625, -1.109619140625, -0.8250732421875, -0.54052734375, -0.2559814453125, 0.028564453125, 0.3131103515625, 0.59765625, 0.8822021484375, 1.166748046875, 1.4512939453125, 1.73583984375, 2.0203857421875, 2.304931640625, 2.5894775390625, 2.8740234375, 3.1585693359375, 3.443115234375, 3.7276611328125, 4.01220703125, 4.2967529296875, 4.581298828125, 4.8658447265625, 5.150390625, 5.4349365234375, 5.719482421875, 6.0040283203125, 6.28857421875, 6.5731201171875, 6.857666015625, 7.1422119140625, 7.4267578125, 7.7113037109375, 7.995849609375, 8.2803955078125, 8.56494140625, 8.8494873046875, 9.134033203125, 9.4185791015625, 9.703125]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 11.0, 20.0, 26.0, 32.0, 72.0, 122.0, 203.0, 363.0, 732.0, 1450.0, 3095.0, 7425.0, 21594.0, 75994.0, 468569.0, 2912055.0, 577542.0, 86547.0, 23584.0, 8232.0, 3347.0, 1548.0, 791.0, 423.0, 226.0, 122.0, 62.0, 34.0, 22.0, 14.0, 5.0, 8.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-16.109375, -15.6802978515625, -15.251220703125, -14.8221435546875, -14.39306640625, -13.9639892578125, -13.534912109375, -13.1058349609375, -12.6767578125, -12.2476806640625, -11.818603515625, -11.3895263671875, -10.96044921875, -10.5313720703125, -10.102294921875, -9.6732177734375, -9.244140625, -8.8150634765625, -8.385986328125, -7.9569091796875, -7.52783203125, -7.0987548828125, -6.669677734375, -6.2406005859375, -5.8115234375, -5.3824462890625, -4.953369140625, -4.5242919921875, -4.09521484375, -3.6661376953125, -3.237060546875, -2.8079833984375, -2.37890625, -1.9498291015625, -1.520751953125, -1.0916748046875, -0.66259765625, -0.2335205078125, 0.195556640625, 0.6246337890625, 1.0537109375, 1.4827880859375, 1.911865234375, 2.3409423828125, 2.77001953125, 3.1990966796875, 3.628173828125, 4.0572509765625, 4.486328125, 4.9154052734375, 5.344482421875, 5.7735595703125, 6.20263671875, 6.6317138671875, 7.060791015625, 7.4898681640625, 7.9189453125, 8.3480224609375, 8.777099609375, 9.2061767578125, 9.63525390625, 10.0643310546875, 10.493408203125, 10.9224853515625, 11.3515625]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 4.0, 17.0, 27.0, 61.0, 75.0, 99.0, 134.0, 143.0, 151.0, 118.0, 69.0, 36.0, 25.0, 20.0, 14.0, 9.0, 3.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.562381744384766, -37.11699676513672, -35.67161178588867, -34.226226806640625, -32.78084182739258, -31.33545684814453, -29.890071868896484, -28.444686889648438, -26.99930191040039, -25.553916931152344, -24.108531951904297, -22.66314697265625, -21.217761993408203, -19.772377014160156, -18.32699203491211, -16.881607055664062, -15.436220169067383, -13.990835189819336, -12.545450210571289, -11.100065231323242, -9.654680252075195, -8.209295272827148, -6.763909339904785, -5.318524360656738, -3.8731393814086914, -2.4277544021606445, -0.9823691844940186, 0.4630160331726074, 1.9084010124206543, 3.353785991668701, 4.799171447753906, 6.244556427001953, 7.68994140625, 9.135326385498047, 10.580711364746094, 12.02609634399414, 13.471481323242188, 14.916866302490234, 16.36225128173828, 17.807636260986328, 19.253021240234375, 20.698406219482422, 22.14379119873047, 23.589176177978516, 25.034561157226562, 26.47994613647461, 27.925331115722656, 29.370716094970703, 30.816102981567383, 32.26148986816406, 33.70687484741211, 35.152259826660156, 36.5976448059082, 38.04302978515625, 39.4884147644043, 40.933799743652344, 42.37918472290039, 43.82456970214844, 45.269954681396484, 46.71533966064453, 48.16072463989258, 49.606109619140625, 51.05149459838867, 52.49687957763672, 53.942264556884766]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 2.0, 1.0, 6.0, 5.0, 11.0, 15.0, 15.0, 16.0, 16.0, 15.0, 21.0, 34.0, 35.0, 35.0, 34.0, 34.0, 37.0, 42.0, 57.0, 47.0, 49.0, 50.0, 40.0, 49.0, 43.0, 32.0, 40.0, 24.0, 25.0, 28.0, 21.0, 24.0, 17.0, 13.0, 14.0, 17.0, 12.0, 8.0, 8.0, 3.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.12009620666504, -28.23073387145996, -27.34136962890625, -26.452007293701172, -25.562644958496094, -24.673282623291016, -23.783918380737305, -22.894556045532227, -22.005191802978516, -21.115829467773438, -20.226465225219727, -19.33710289001465, -18.44774055480957, -17.55837631225586, -16.66901397705078, -15.779651641845703, -14.890289306640625, -14.00092601776123, -13.111563682556152, -12.222200393676758, -11.33283805847168, -10.443474769592285, -9.55411148071289, -8.664749145507812, -7.775385856628418, -6.886023044586182, -5.996660232543945, -5.107296943664551, -4.2179341316223145, -3.328571319580078, -2.4392080307006836, -1.5498452186584473, -0.6604843139648438, 0.22887861728668213, 1.118241548538208, 2.0076045989990234, 2.8969674110412598, 3.786330223083496, 4.675693511962891, 5.565056324005127, 6.454419136047363, 7.3437819480896, 8.233144760131836, 9.12250804901123, 10.011871337890625, 10.901233673095703, 11.790596961975098, 12.679960250854492, 13.56932258605957, 14.458685874938965, 15.348048210144043, 16.237411499023438, 17.126773834228516, 18.016136169433594, 18.905500411987305, 19.794862747192383, 20.684226989746094, 21.573589324951172, 22.462953567504883, 23.35231590270996, 24.24167823791504, 25.13104248046875, 26.020404815673828, 26.909767150878906, 27.799129486083984]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 9.0, 8.0, 5.0, 12.0, 12.0, 18.0, 15.0, 20.0, 22.0, 29.0, 36.0, 32.0, 36.0, 28.0, 42.0, 42.0, 47.0, 41.0, 44.0, 49.0, 40.0, 43.0, 28.0, 36.0, 37.0, 40.0, 27.0, 26.0, 24.0, 21.0, 17.0, 22.0, 18.0, 25.0, 16.0, 9.0, 8.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.767578125, -2.680694580078125, -2.59381103515625, -2.506927490234375, -2.4200439453125, -2.333160400390625, -2.24627685546875, -2.159393310546875, -2.072509765625, -1.985626220703125, -1.89874267578125, -1.811859130859375, -1.7249755859375, -1.638092041015625, -1.55120849609375, -1.464324951171875, -1.37744140625, -1.290557861328125, -1.20367431640625, -1.116790771484375, -1.0299072265625, -0.943023681640625, -0.85614013671875, -0.769256591796875, -0.682373046875, -0.595489501953125, -0.50860595703125, -0.421722412109375, -0.3348388671875, -0.247955322265625, -0.16107177734375, -0.074188232421875, 0.0126953125, 0.099578857421875, 0.18646240234375, 0.273345947265625, 0.3602294921875, 0.447113037109375, 0.53399658203125, 0.620880126953125, 0.707763671875, 0.794647216796875, 0.88153076171875, 0.968414306640625, 1.0552978515625, 1.142181396484375, 1.22906494140625, 1.315948486328125, 1.40283203125, 1.489715576171875, 1.57659912109375, 1.663482666015625, 1.7503662109375, 1.837249755859375, 1.92413330078125, 2.011016845703125, 2.097900390625, 2.184783935546875, 2.27166748046875, 2.358551025390625, 2.4454345703125, 2.532318115234375, 2.61920166015625, 2.706085205078125, 2.79296875]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 12.0, 9.0, 15.0, 14.0, 19.0, 35.0, 62.0, 92.0, 156.0, 217.0, 328.0, 471.0, 762.0, 1292.0, 1994.0, 3230.0, 5464.0, 9087.0, 15266.0, 25836.0, 46041.0, 86829.0, 175201.0, 280227.0, 186440.0, 92853.0, 48853.0, 27299.0, 15894.0, 9656.0, 5726.0, 3459.0, 2074.0, 1301.0, 824.0, 532.0, 358.0, 174.0, 150.0, 106.0, 65.0, 41.0, 35.0, 18.0, 18.0, 8.0, 5.0, 6.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.35986328125, -0.3491363525390625, -0.338409423828125, -0.3276824951171875, -0.31695556640625, -0.3062286376953125, -0.295501708984375, -0.2847747802734375, -0.2740478515625, -0.2633209228515625, -0.252593994140625, -0.2418670654296875, -0.23114013671875, -0.2204132080078125, -0.209686279296875, -0.1989593505859375, -0.188232421875, -0.1775054931640625, -0.166778564453125, -0.1560516357421875, -0.14532470703125, -0.1345977783203125, -0.123870849609375, -0.1131439208984375, -0.1024169921875, -0.0916900634765625, -0.080963134765625, -0.0702362060546875, -0.05950927734375, -0.0487823486328125, -0.038055419921875, -0.0273284912109375, -0.0166015625, -0.0058746337890625, 0.004852294921875, 0.0155792236328125, 0.02630615234375, 0.0370330810546875, 0.047760009765625, 0.0584869384765625, 0.0692138671875, 0.0799407958984375, 0.090667724609375, 0.1013946533203125, 0.11212158203125, 0.1228485107421875, 0.133575439453125, 0.1443023681640625, 0.155029296875, 0.1657562255859375, 0.176483154296875, 0.1872100830078125, 0.19793701171875, 0.2086639404296875, 0.219390869140625, 0.2301177978515625, 0.2408447265625, 0.2515716552734375, 0.262298583984375, 0.2730255126953125, 0.28375244140625, 0.2944793701171875, 0.305206298828125, 0.3159332275390625, 0.32666015625]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 4.0, 2.0, 2.0, 8.0, 4.0, 3.0, 8.0, 13.0, 9.0, 14.0, 17.0, 19.0, 18.0, 20.0, 30.0, 19.0, 16.0, 27.0, 32.0, 42.0, 44.0, 41.0, 34.0, 29.0, 1059.0, 41.0, 43.0, 46.0, 51.0, 46.0, 34.0, 30.0, 29.0, 23.0, 33.0, 21.0, 18.0, 17.0, 14.0, 13.0, 9.0, 6.0, 12.0, 8.0, 9.0, 8.0, 1.0, 4.0, 5.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.5654296875, -1.5145263671875, -1.463623046875, -1.4127197265625, -1.36181640625, -1.3109130859375, -1.260009765625, -1.2091064453125, -1.158203125, -1.1072998046875, -1.056396484375, -1.0054931640625, -0.95458984375, -0.9036865234375, -0.852783203125, -0.8018798828125, -0.7509765625, -0.7000732421875, -0.649169921875, -0.5982666015625, -0.54736328125, -0.4964599609375, -0.445556640625, -0.3946533203125, -0.34375, -0.2928466796875, -0.241943359375, -0.1910400390625, -0.14013671875, -0.0892333984375, -0.038330078125, 0.0125732421875, 0.0634765625, 0.1143798828125, 0.165283203125, 0.2161865234375, 0.26708984375, 0.3179931640625, 0.368896484375, 0.4197998046875, 0.470703125, 0.5216064453125, 0.572509765625, 0.6234130859375, 0.67431640625, 0.7252197265625, 0.776123046875, 0.8270263671875, 0.8779296875, 0.9288330078125, 0.979736328125, 1.0306396484375, 1.08154296875, 1.1324462890625, 1.183349609375, 1.2342529296875, 1.28515625, 1.3360595703125, 1.386962890625, 1.4378662109375, 1.48876953125, 1.5396728515625, 1.590576171875, 1.6414794921875, 1.6923828125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 6.0, 6.0, 8.0, 18.0, 20.0, 27.0, 36.0, 71.0, 102.0, 112.0, 218.0, 266.0, 418.0, 601.0, 934.0, 1240.0, 1904.0, 2733.0, 4145.0, 6261.0, 9519.0, 14477.0, 22559.0, 35804.0, 57502.0, 97094.0, 160481.0, 1259162.0, 163151.0, 98158.0, 58272.0, 36002.0, 22740.0, 14461.0, 9434.0, 6143.0, 4271.0, 2777.0, 1884.0, 1259.0, 881.0, 608.0, 410.0, 334.0, 199.0, 129.0, 101.0, 58.0, 52.0, 23.0, 29.0, 17.0, 11.0, 7.0, 3.0, 4.0, 1.0, 1.0, 1.0], "bins": [-0.2197265625, -0.2129688262939453, -0.20621109008789062, -0.19945335388183594, -0.19269561767578125, -0.18593788146972656, -0.17918014526367188, -0.1724224090576172, -0.1656646728515625, -0.1589069366455078, -0.15214920043945312, -0.14539146423339844, -0.13863372802734375, -0.13187599182128906, -0.12511825561523438, -0.11836051940917969, -0.111602783203125, -0.10484504699707031, -0.09808731079101562, -0.09132957458496094, -0.08457183837890625, -0.07781410217285156, -0.07105636596679688, -0.06429862976074219, -0.0575408935546875, -0.05078315734863281, -0.044025421142578125, -0.03726768493652344, -0.03050994873046875, -0.023752212524414062, -0.016994476318359375, -0.010236740112304688, -0.00347900390625, 0.0032787322998046875, 0.010036468505859375, 0.016794204711914062, 0.02355194091796875, 0.030309677124023438, 0.037067413330078125, 0.04382514953613281, 0.0505828857421875, 0.05734062194824219, 0.06409835815429688, 0.07085609436035156, 0.07761383056640625, 0.08437156677246094, 0.09112930297851562, 0.09788703918457031, 0.104644775390625, 0.11140251159667969, 0.11816024780273438, 0.12491798400878906, 0.13167572021484375, 0.13843345642089844, 0.14519119262695312, 0.1519489288330078, 0.1587066650390625, 0.1654644012451172, 0.17222213745117188, 0.17897987365722656, 0.18573760986328125, 0.19249534606933594, 0.19925308227539062, 0.2060108184814453, 0.2127685546875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 2.0, 3.0, 8.0, 8.0, 10.0, 7.0, 14.0, 19.0, 10.0, 10.0, 18.0, 21.0, 23.0, 35.0, 50.0, 53.0, 46.0, 77.0, 65.0, 59.0, 54.0, 63.0, 68.0, 42.0, 40.0, 31.0, 21.0, 23.0, 22.0, 26.0, 8.0, 14.0, 7.0, 8.0, 5.0, 8.0, 7.0, 2.0, 5.0, 5.0, 1.0, 4.0, 0.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0015077590942382812, -0.001458480954170227, -0.0014092028141021729, -0.0013599246740341187, -0.0013106465339660645, -0.0012613683938980103, -0.001212090253829956, -0.0011628121137619019, -0.0011135339736938477, -0.0010642558336257935, -0.0010149776935577393, -0.0009656995534896851, -0.0009164214134216309, -0.0008671432733535767, -0.0008178651332855225, -0.0007685869932174683, -0.0007193088531494141, -0.0006700307130813599, -0.0006207525730133057, -0.0005714744329452515, -0.0005221962928771973, -0.00047291815280914307, -0.00042364001274108887, -0.00037436187267303467, -0.00032508373260498047, -0.00027580559253692627, -0.00022652745246887207, -0.00017724931240081787, -0.00012797117233276367, -7.869303226470947e-05, -2.9414892196655273e-05, 1.9863247871398926e-05, 6.914138793945312e-05, 0.00011841952800750732, 0.00016769766807556152, 0.00021697580814361572, 0.0002662539482116699, 0.0003155320882797241, 0.0003648102283477783, 0.0004140883684158325, 0.0004633665084838867, 0.0005126446485519409, 0.0005619227886199951, 0.0006112009286880493, 0.0006604790687561035, 0.0007097572088241577, 0.0007590353488922119, 0.0008083134889602661, 0.0008575916290283203, 0.0009068697690963745, 0.0009561479091644287, 0.001005426049232483, 0.0010547041893005371, 0.0011039823293685913, 0.0011532604694366455, 0.0012025386095046997, 0.001251816749572754, 0.001301094889640808, 0.0013503730297088623, 0.0013996511697769165, 0.0014489293098449707, 0.001498207449913025, 0.001547485589981079, 0.0015967637300491333, 0.0016460418701171875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 4.0, 3.0, 6.0, 8.0, 8.0, 10.0, 8.0, 10.0, 21.0, 20.0, 28.0, 32.0, 57.0, 63.0, 60.0, 100.0, 175.0, 269.0, 512.0, 2782.0, 290018.0, 748101.0, 4750.0, 571.0, 317.0, 169.0, 91.0, 79.0, 54.0, 51.0, 38.0, 28.0, 23.0, 15.0, 21.0, 12.0, 13.0, 6.0, 6.0, 3.0, 3.0, 4.0, 1.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0312042236328125, -0.030231475830078125, -0.02925872802734375, -0.028285980224609375, -0.027313232421875, -0.026340484619140625, -0.02536773681640625, -0.024394989013671875, -0.0234222412109375, -0.022449493408203125, -0.02147674560546875, -0.020503997802734375, -0.01953125, -0.018558502197265625, -0.01758575439453125, -0.016613006591796875, -0.0156402587890625, -0.014667510986328125, -0.01369476318359375, -0.012722015380859375, -0.011749267578125, -0.010776519775390625, -0.00980377197265625, -0.008831024169921875, -0.0078582763671875, -0.006885528564453125, -0.00591278076171875, -0.004940032958984375, -0.00396728515625, -0.002994537353515625, -0.00202178955078125, -0.001049041748046875, -7.62939453125e-05, 0.000896453857421875, 0.00186920166015625, 0.002841949462890625, 0.003814697265625, 0.004787445068359375, 0.00576019287109375, 0.006732940673828125, 0.0077056884765625, 0.008678436279296875, 0.00965118408203125, 0.010623931884765625, 0.0115966796875, 0.012569427490234375, 0.01354217529296875, 0.014514923095703125, 0.0154876708984375, 0.016460418701171875, 0.01743316650390625, 0.018405914306640625, 0.019378662109375, 0.020351409912109375, 0.02132415771484375, 0.022296905517578125, 0.0232696533203125, 0.024242401123046875, 0.02521514892578125, 0.026187896728515625, 0.02716064453125, 0.028133392333984375, 0.02910614013671875, 0.030078887939453125, 0.0310516357421875]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 310.0, 707.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004895445425063372, -0.004290470387786627, -0.0036854955833405256, -0.0030805207788944244, -0.0024755457416176796, -0.0018705707043409348, -0.0012655958998948336, -0.0006606210954487324, -5.5646058171987534e-05, 0.0005493288626894355, 0.0011543037835508585, 0.0017592787044122815, 0.0023642536252737045, 0.0029692286625504494, 0.0035742034669965506, 0.004179178271442652, 0.004784153308719397, 0.0053891283459961414, 0.005994102917611599, 0.006599077954888344, 0.007204052992165089, 0.0078090280294418335, 0.008414003066718578, 0.009018978103995323, 0.009623952209949493, 0.010228927247226238, 0.010833902284502983, 0.011438877321779728, 0.012043852359056473, 0.012648826465010643, 0.013253801502287388, 0.013858776539564133, 0.014463752508163452, 0.015068727545440197, 0.015673702582716942, 0.016278676688671112, 0.01688365265727043, 0.017488626763224602, 0.01809360273182392, 0.01869857683777809, 0.01930355280637741, 0.01990852691233158, 0.0205135028809309, 0.02111847698688507, 0.02172345295548439, 0.02232842706143856, 0.02293340303003788, 0.02353837713599205, 0.02414335124194622, 0.02474832534790039, 0.02535330131649971, 0.02595827542245388, 0.0265632513910532, 0.02716822549700737, 0.02777320146560669, 0.02837817557156086, 0.02898314967751503, 0.0295881237834692, 0.03019309975206852, 0.03079807385802269, 0.03140304982662201, 0.03200802579522133, 0.03261299803853035, 0.03321797400712967, 0.03382294997572899]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 5.0, 4.0, 8.0, 10.0, 7.0, 11.0, 8.0, 23.0, 35.0, 35.0, 36.0, 30.0, 43.0, 39.0, 44.0, 60.0, 46.0, 58.0, 51.0, 48.0, 54.0, 49.0, 45.0, 45.0, 47.0, 38.0, 25.0, 28.0, 16.0, 16.0, 8.0, 14.0, 8.0, 4.0, 4.0, 4.0, 3.0, 1.0, 5.0], "bins": [-0.0015347599983215332, -0.0014993250370025635, -0.0014638900756835938, -0.001428455114364624, -0.0013930201530456543, -0.0013575851917266846, -0.0013221502304077148, -0.0012867152690887451, -0.0012512803077697754, -0.0012158453464508057, -0.001180410385131836, -0.0011449754238128662, -0.0011095404624938965, -0.0010741055011749268, -0.001038670539855957, -0.0010032355785369873, -0.0009678006172180176, -0.0009323656558990479, -0.0008969306945800781, -0.0008614957332611084, -0.0008260607719421387, -0.0007906258106231689, -0.0007551908493041992, -0.0007197558879852295, -0.0006843209266662598, -0.00064888596534729, -0.0006134510040283203, -0.0005780160427093506, -0.0005425810813903809, -0.0005071461200714111, -0.0004717111587524414, -0.0004362761974334717, -0.00040084123611450195, -0.0003654062747955322, -0.0003299713134765625, -0.0002945363521575928, -0.00025910139083862305, -0.00022366642951965332, -0.0001882314682006836, -0.00015279650688171387, -0.00011736154556274414, -8.192658424377441e-05, -4.649162292480469e-05, -1.1056661605834961e-05, 2.4378299713134766e-05, 5.981326103210449e-05, 9.524822235107422e-05, 0.00013068318367004395, 0.00016611814498901367, 0.0002015531063079834, 0.00023698806762695312, 0.00027242302894592285, 0.0003078579902648926, 0.0003432929515838623, 0.00037872791290283203, 0.00041416287422180176, 0.0004495978355407715, 0.0004850327968597412, 0.0005204677581787109, 0.0005559027194976807, 0.0005913376808166504, 0.0006267726421356201, 0.0006622076034545898, 0.0006976425647735596, 0.0007330775260925293]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 9.0, 8.0, 6.0, 11.0, 12.0, 18.0, 15.0, 20.0, 22.0, 29.0, 36.0, 32.0, 36.0, 28.0, 42.0, 42.0, 47.0, 41.0, 44.0, 49.0, 40.0, 43.0, 28.0, 36.0, 37.0, 40.0, 28.0, 25.0, 24.0, 21.0, 17.0, 22.0, 18.0, 25.0, 16.0, 9.0, 8.0, 4.0, 5.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.767578125, -2.680694580078125, -2.59381103515625, -2.506927490234375, -2.4200439453125, -2.333160400390625, -2.24627685546875, -2.159393310546875, -2.072509765625, -1.985626220703125, -1.89874267578125, -1.811859130859375, -1.7249755859375, -1.638092041015625, -1.55120849609375, -1.464324951171875, -1.37744140625, -1.290557861328125, -1.20367431640625, -1.116790771484375, -1.0299072265625, -0.943023681640625, -0.85614013671875, -0.769256591796875, -0.682373046875, -0.595489501953125, -0.50860595703125, -0.421722412109375, -0.3348388671875, -0.247955322265625, -0.16107177734375, -0.074188232421875, 0.0126953125, 0.099578857421875, 0.18646240234375, 0.273345947265625, 0.3602294921875, 0.447113037109375, 0.53399658203125, 0.620880126953125, 0.707763671875, 0.794647216796875, 0.88153076171875, 0.968414306640625, 1.0552978515625, 1.142181396484375, 1.22906494140625, 1.315948486328125, 1.40283203125, 1.489715576171875, 1.57659912109375, 1.663482666015625, 1.7503662109375, 1.837249755859375, 1.92413330078125, 2.011016845703125, 2.097900390625, 2.184783935546875, 2.27166748046875, 2.358551025390625, 2.4454345703125, 2.532318115234375, 2.61920166015625, 2.706085205078125, 2.79296875]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 1.0, 4.0, 4.0, 9.0, 13.0, 12.0, 19.0, 36.0, 49.0, 69.0, 111.0, 134.0, 186.0, 257.0, 355.0, 507.0, 724.0, 959.0, 1316.0, 1834.0, 2762.0, 4376.0, 7467.0, 15714.0, 41407.0, 138020.0, 424506.0, 276000.0, 77764.0, 25845.0, 10918.0, 5663.0, 3541.0, 2295.0, 1624.0, 1132.0, 822.0, 574.0, 422.0, 312.0, 227.0, 168.0, 111.0, 92.0, 63.0, 39.0, 34.0, 23.0, 10.0, 5.0, 10.0, 7.0, 1.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0], "bins": [-2.58203125, -2.500762939453125, -2.41949462890625, -2.338226318359375, -2.2569580078125, -2.175689697265625, -2.09442138671875, -2.013153076171875, -1.931884765625, -1.850616455078125, -1.76934814453125, -1.688079833984375, -1.6068115234375, -1.525543212890625, -1.44427490234375, -1.363006591796875, -1.28173828125, -1.200469970703125, -1.11920166015625, -1.037933349609375, -0.9566650390625, -0.875396728515625, -0.79412841796875, -0.712860107421875, -0.631591796875, -0.550323486328125, -0.46905517578125, -0.387786865234375, -0.3065185546875, -0.225250244140625, -0.14398193359375, -0.062713623046875, 0.0185546875, 0.099822998046875, 0.18109130859375, 0.262359619140625, 0.3436279296875, 0.424896240234375, 0.50616455078125, 0.587432861328125, 0.668701171875, 0.749969482421875, 0.83123779296875, 0.912506103515625, 0.9937744140625, 1.075042724609375, 1.15631103515625, 1.237579345703125, 1.31884765625, 1.400115966796875, 1.48138427734375, 1.562652587890625, 1.6439208984375, 1.725189208984375, 1.80645751953125, 1.887725830078125, 1.968994140625, 2.050262451171875, 2.13153076171875, 2.212799072265625, 2.2940673828125, 2.375335693359375, 2.45660400390625, 2.537872314453125, 2.619140625]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 6.0, 2.0, 6.0, 5.0, 10.0, 9.0, 16.0, 31.0, 27.0, 25.0, 25.0, 29.0, 34.0, 30.0, 27.0, 31.0, 46.0, 51.0, 61.0, 188.0, 1760.0, 164.0, 66.0, 37.0, 52.0, 43.0, 39.0, 28.0, 34.0, 18.0, 23.0, 26.0, 13.0, 15.0, 18.0, 15.0, 11.0, 6.0, 5.0, 6.0, 4.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.578125, -10.26220703125, -9.9462890625, -9.63037109375, -9.314453125, -8.99853515625, -8.6826171875, -8.36669921875, -8.05078125, -7.73486328125, -7.4189453125, -7.10302734375, -6.787109375, -6.47119140625, -6.1552734375, -5.83935546875, -5.5234375, -5.20751953125, -4.8916015625, -4.57568359375, -4.259765625, -3.94384765625, -3.6279296875, -3.31201171875, -2.99609375, -2.68017578125, -2.3642578125, -2.04833984375, -1.732421875, -1.41650390625, -1.1005859375, -0.78466796875, -0.46875, -0.15283203125, 0.1630859375, 0.47900390625, 0.794921875, 1.11083984375, 1.4267578125, 1.74267578125, 2.05859375, 2.37451171875, 2.6904296875, 3.00634765625, 3.322265625, 3.63818359375, 3.9541015625, 4.27001953125, 4.5859375, 4.90185546875, 5.2177734375, 5.53369140625, 5.849609375, 6.16552734375, 6.4814453125, 6.79736328125, 7.11328125, 7.42919921875, 7.7451171875, 8.06103515625, 8.376953125, 8.69287109375, 9.0087890625, 9.32470703125, 9.640625]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 7.0, 2.0, 8.0, 11.0, 14.0, 17.0, 19.0, 22.0, 25.0, 26.0, 29.0, 38.0, 51.0, 88.0, 145.0, 252.0, 516.0, 1606.0, 12097.0, 2321106.0, 798052.0, 8970.0, 1353.0, 486.0, 231.0, 120.0, 87.0, 66.0, 48.0, 41.0, 25.0, 28.0, 31.0, 25.0, 16.0, 8.0, 6.0, 8.0, 8.0, 5.0, 5.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.96875, -15.45263671875, -14.9365234375, -14.42041015625, -13.904296875, -13.38818359375, -12.8720703125, -12.35595703125, -11.83984375, -11.32373046875, -10.8076171875, -10.29150390625, -9.775390625, -9.25927734375, -8.7431640625, -8.22705078125, -7.7109375, -7.19482421875, -6.6787109375, -6.16259765625, -5.646484375, -5.13037109375, -4.6142578125, -4.09814453125, -3.58203125, -3.06591796875, -2.5498046875, -2.03369140625, -1.517578125, -1.00146484375, -0.4853515625, 0.03076171875, 0.546875, 1.06298828125, 1.5791015625, 2.09521484375, 2.611328125, 3.12744140625, 3.6435546875, 4.15966796875, 4.67578125, 5.19189453125, 5.7080078125, 6.22412109375, 6.740234375, 7.25634765625, 7.7724609375, 8.28857421875, 8.8046875, 9.32080078125, 9.8369140625, 10.35302734375, 10.869140625, 11.38525390625, 11.9013671875, 12.41748046875, 12.93359375, 13.44970703125, 13.9658203125, 14.48193359375, 14.998046875, 15.51416015625, 16.0302734375, 16.54638671875, 17.0625]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 27.0, 329.0, 516.0, 123.0, 16.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.863299369812012, -14.313407897949219, -12.763516426086426, -11.213624954223633, -9.663732528686523, -8.113842010498047, -6.5639495849609375, -5.0140581130981445, -3.4641666412353516, -1.914275050163269, -0.3643834590911865, 1.1855082511901855, 2.7353997230529785, 4.2852911949157715, 5.835183143615723, 7.385074615478516, 8.934966087341309, 10.484857559204102, 12.034749031066895, 13.584640502929688, 15.134532928466797, 16.684423446655273, 18.234315872192383, 19.78420639038086, 21.33409881591797, 22.883991241455078, 24.433881759643555, 25.983774185180664, 27.53366470336914, 29.08355712890625, 30.63344955444336, 32.18334197998047, 33.73323440551758, 35.28312683105469, 36.8330192565918, 38.38290786743164, 39.93280029296875, 41.48269271850586, 43.03258514404297, 44.58247375488281, 46.13236618041992, 47.68225860595703, 49.23215103149414, 50.782039642333984, 52.331932067871094, 53.8818244934082, 55.43171691894531, 56.981605529785156, 58.53150177001953, 60.08139419555664, 61.63128662109375, 63.181175231933594, 64.73107147216797, 66.28096008300781, 67.83084869384766, 69.38074493408203, 70.93063354492188, 72.48052215576172, 74.0304183959961, 75.58030700683594, 77.13020324707031, 78.68009185791016, 80.22998046875, 81.77987670898438, 83.32976531982422]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 3.0, 6.0, 7.0, 5.0, 13.0, 11.0, 17.0, 8.0, 22.0, 19.0, 20.0, 26.0, 23.0, 30.0, 26.0, 28.0, 33.0, 36.0, 35.0, 48.0, 43.0, 36.0, 56.0, 40.0, 34.0, 39.0, 43.0, 25.0, 36.0, 24.0, 20.0, 16.0, 35.0, 23.0, 18.0, 13.0, 16.0, 9.0, 11.0, 9.0, 7.0, 6.0, 5.0, 3.0, 3.0, 3.0, 5.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.4873046875, -28.522008895874023, -27.55671501159668, -26.591419219970703, -25.62612533569336, -24.660829544067383, -23.695533752441406, -22.730239868164062, -21.764944076538086, -20.79964828491211, -19.834354400634766, -18.86905860900879, -17.903764724731445, -16.93846893310547, -15.973174095153809, -15.007879257202148, -14.042584419250488, -13.077289581298828, -12.111994743347168, -11.146699905395508, -10.181404113769531, -9.216109275817871, -8.250814437866211, -7.285519123077393, -6.320224285125732, -5.354929447174072, -4.389634132385254, -3.4243392944335938, -2.4590442180633545, -1.4937491416931152, -0.5284543037414551, 0.4368410110473633, 1.4021358489990234, 2.3674309253692627, 3.332726001739502, 4.298020839691162, 5.2633161544799805, 6.228610992431641, 7.193905830383301, 8.159200668334961, 9.124496459960938, 10.089791297912598, 11.055086135864258, 12.020381927490234, 12.985676765441895, 13.950971603393555, 14.916266441345215, 15.881561279296875, 16.84685516357422, 17.812150955200195, 18.77744483947754, 19.742740631103516, 20.70803451538086, 21.673330307006836, 22.638626098632812, 23.603919982910156, 24.569215774536133, 25.53451156616211, 26.499805450439453, 27.46510124206543, 28.430395126342773, 29.39569091796875, 30.360984802246094, 31.32628059387207, 32.29157638549805]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 5.0, 15.0, 5.0, 7.0, 12.0, 18.0, 21.0, 10.0, 23.0, 38.0, 31.0, 33.0, 31.0, 35.0, 31.0, 43.0, 44.0, 49.0, 36.0, 47.0, 44.0, 42.0, 31.0, 45.0, 35.0, 44.0, 30.0, 22.0, 17.0, 21.0, 19.0, 26.0, 22.0, 19.0, 11.0, 15.0, 9.0, 6.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.921875, -2.830902099609375, -2.73992919921875, -2.648956298828125, -2.5579833984375, -2.467010498046875, -2.37603759765625, -2.285064697265625, -2.194091796875, -2.103118896484375, -2.01214599609375, -1.921173095703125, -1.8302001953125, -1.739227294921875, -1.64825439453125, -1.557281494140625, -1.46630859375, -1.375335693359375, -1.28436279296875, -1.193389892578125, -1.1024169921875, -1.011444091796875, -0.92047119140625, -0.829498291015625, -0.738525390625, -0.647552490234375, -0.55657958984375, -0.465606689453125, -0.3746337890625, -0.283660888671875, -0.19268798828125, -0.101715087890625, -0.0107421875, 0.080230712890625, 0.17120361328125, 0.262176513671875, 0.3531494140625, 0.444122314453125, 0.53509521484375, 0.626068115234375, 0.717041015625, 0.808013916015625, 0.89898681640625, 0.989959716796875, 1.0809326171875, 1.171905517578125, 1.26287841796875, 1.353851318359375, 1.44482421875, 1.535797119140625, 1.62677001953125, 1.717742919921875, 1.8087158203125, 1.899688720703125, 1.99066162109375, 2.081634521484375, 2.172607421875, 2.263580322265625, 2.35455322265625, 2.445526123046875, 2.5364990234375, 2.627471923828125, 2.71844482421875, 2.809417724609375, 2.900390625]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 4.0, 1.0, 4.0, 5.0, 9.0, 8.0, 14.0, 9.0, 10.0, 14.0, 24.0, 30.0, 28.0, 42.0, 63.0, 119.0, 291.0, 639.0, 1892.0, 6520.0, 26945.0, 204860.0, 3177086.0, 710930.0, 49734.0, 10274.0, 2892.0, 956.0, 375.0, 177.0, 71.0, 58.0, 42.0, 27.0, 28.0, 26.0, 18.0, 11.0, 8.0, 8.0, 4.0, 10.0, 7.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.9296875, -10.573486328125, -10.21728515625, -9.861083984375, -9.5048828125, -9.148681640625, -8.79248046875, -8.436279296875, -8.080078125, -7.723876953125, -7.36767578125, -7.011474609375, -6.6552734375, -6.299072265625, -5.94287109375, -5.586669921875, -5.23046875, -4.874267578125, -4.51806640625, -4.161865234375, -3.8056640625, -3.449462890625, -3.09326171875, -2.737060546875, -2.380859375, -2.024658203125, -1.66845703125, -1.312255859375, -0.9560546875, -0.599853515625, -0.24365234375, 0.112548828125, 0.46875, 0.824951171875, 1.18115234375, 1.537353515625, 1.8935546875, 2.249755859375, 2.60595703125, 2.962158203125, 3.318359375, 3.674560546875, 4.03076171875, 4.386962890625, 4.7431640625, 5.099365234375, 5.45556640625, 5.811767578125, 6.16796875, 6.524169921875, 6.88037109375, 7.236572265625, 7.5927734375, 7.948974609375, 8.30517578125, 8.661376953125, 9.017578125, 9.373779296875, 9.72998046875, 10.086181640625, 10.4423828125, 10.798583984375, 11.15478515625, 11.510986328125, 11.8671875]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 8.0, 4.0, 7.0, 9.0, 19.0, 29.0, 44.0, 62.0, 94.0, 147.0, 229.0, 409.0, 587.0, 748.0, 580.0, 399.0, 249.0, 167.0, 97.0, 68.0, 45.0, 28.0, 21.0, 15.0, 5.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5625, -14.21185302734375, -13.8612060546875, -13.51055908203125, -13.159912109375, -12.80926513671875, -12.4586181640625, -12.10797119140625, -11.75732421875, -11.40667724609375, -11.0560302734375, -10.70538330078125, -10.354736328125, -10.00408935546875, -9.6534423828125, -9.30279541015625, -8.9521484375, -8.60150146484375, -8.2508544921875, -7.90020751953125, -7.549560546875, -7.19891357421875, -6.8482666015625, -6.49761962890625, -6.14697265625, -5.79632568359375, -5.4456787109375, -5.09503173828125, -4.744384765625, -4.39373779296875, -4.0430908203125, -3.69244384765625, -3.341796875, -2.99114990234375, -2.6405029296875, -2.28985595703125, -1.939208984375, -1.58856201171875, -1.2379150390625, -0.88726806640625, -0.53662109375, -0.18597412109375, 0.1646728515625, 0.51531982421875, 0.865966796875, 1.21661376953125, 1.5672607421875, 1.91790771484375, 2.2685546875, 2.61920166015625, 2.9698486328125, 3.32049560546875, 3.671142578125, 4.02178955078125, 4.3724365234375, 4.72308349609375, 5.07373046875, 5.42437744140625, 5.7750244140625, 6.12567138671875, 6.476318359375, 6.82696533203125, 7.1776123046875, 7.52825927734375, 7.87890625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 6.0, 7.0, 18.0, 29.0, 27.0, 69.0, 108.0, 255.0, 690.0, 2183.0, 10234.0, 74936.0, 2218954.0, 1809075.0, 65171.0, 9311.0, 2102.0, 598.0, 252.0, 112.0, 56.0, 37.0, 16.0, 13.0, 19.0, 4.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.125, -14.40380859375, -13.6826171875, -12.96142578125, -12.240234375, -11.51904296875, -10.7978515625, -10.07666015625, -9.35546875, -8.63427734375, -7.9130859375, -7.19189453125, -6.470703125, -5.74951171875, -5.0283203125, -4.30712890625, -3.5859375, -2.86474609375, -2.1435546875, -1.42236328125, -0.701171875, 0.02001953125, 0.7412109375, 1.46240234375, 2.18359375, 2.90478515625, 3.6259765625, 4.34716796875, 5.068359375, 5.78955078125, 6.5107421875, 7.23193359375, 7.953125, 8.67431640625, 9.3955078125, 10.11669921875, 10.837890625, 11.55908203125, 12.2802734375, 13.00146484375, 13.72265625, 14.44384765625, 15.1650390625, 15.88623046875, 16.607421875, 17.32861328125, 18.0498046875, 18.77099609375, 19.4921875, 20.21337890625, 20.9345703125, 21.65576171875, 22.376953125, 23.09814453125, 23.8193359375, 24.54052734375, 25.26171875, 25.98291015625, 26.7041015625, 27.42529296875, 28.146484375, 28.86767578125, 29.5888671875, 30.31005859375, 31.03125]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 18.0, 18.0, 39.0, 58.0, 105.0, 143.0, 155.0, 172.0, 133.0, 79.0, 41.0, 27.0, 13.0, 7.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.5103759765625, -65.72295379638672, -63.935523986816406, -62.148101806640625, -60.36067581176758, -58.57324981689453, -56.785823822021484, -54.99839782714844, -53.210975646972656, -51.42354965209961, -49.63612365722656, -47.84870147705078, -46.061275482177734, -44.27384948730469, -42.48642349243164, -40.698997497558594, -38.91157531738281, -37.124149322509766, -35.33672332763672, -33.54930114746094, -31.76187515258789, -29.974449157714844, -28.187023162841797, -26.399599075317383, -24.612171173095703, -22.824745178222656, -21.037321090698242, -19.249895095825195, -17.46247100830078, -15.675045013427734, -13.887619972229004, -12.100194931030273, -10.31277084350586, -8.525345802307129, -6.737920761108398, -4.95049524307251, -3.1630702018737793, -1.3756446838378906, 0.41178035736083984, 2.1992053985595703, 3.986630439758301, 5.774055480957031, 7.561480522155762, 9.348905563354492, 11.136331558227539, 12.92375659942627, 14.711181640625, 16.498607635498047, 18.28603172302246, 20.073457717895508, 21.860881805419922, 23.64830780029297, 25.435731887817383, 27.22315788269043, 29.010581970214844, 30.79800796508789, 32.58543395996094, 34.372859954833984, 36.16028594970703, 37.94770812988281, 39.73513412475586, 41.522560119628906, 43.30998611450195, 45.097412109375, 46.88483428955078]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 5.0, 3.0, 9.0, 6.0, 12.0, 11.0, 20.0, 12.0, 18.0, 18.0, 24.0, 21.0, 37.0, 34.0, 25.0, 29.0, 36.0, 27.0, 47.0, 36.0, 43.0, 41.0, 51.0, 35.0, 36.0, 43.0, 33.0, 34.0, 30.0, 33.0, 34.0, 33.0, 18.0, 19.0, 12.0, 10.0, 17.0, 15.0, 11.0, 10.0, 4.0, 6.0, 3.0, 0.0, 4.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.465505599975586, -20.68788719177246, -19.910266876220703, -19.132648468017578, -18.355030059814453, -17.577409744262695, -16.79979133605957, -16.022171020507812, -15.244552612304688, -14.466933250427246, -13.689313888549805, -12.91169548034668, -12.134076118469238, -11.356456756591797, -10.578838348388672, -9.80121898651123, -9.023599624633789, -8.245980262756348, -7.4683613777160645, -6.690742492675781, -5.91312313079834, -5.135503768920898, -4.357884883880615, -3.580265998840332, -2.8026466369628906, -2.0250275135040283, -1.247408390045166, -0.4697892665863037, 0.3078298568725586, 1.085448980331421, 1.8630681037902832, 2.6406869888305664, 3.4183082580566406, 4.195927619934082, 4.973546504974365, 5.751165390014648, 6.52878475189209, 7.306404113769531, 8.084022521972656, 8.861641883850098, 9.639261245727539, 10.41688060760498, 11.194499969482422, 11.972118377685547, 12.749737739562988, 13.52735710144043, 14.304975509643555, 15.082594871520996, 15.860214233398438, 16.637832641601562, 17.41545295715332, 18.193071365356445, 18.970691680908203, 19.748310089111328, 20.525928497314453, 21.303546905517578, 22.081167221069336, 22.85878562927246, 23.63640594482422, 24.414024353027344, 25.19164276123047, 25.969263076782227, 26.74688148498535, 27.52450180053711, 28.302120208740234]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 0.0, 1.0, 0.0, 8.0, 7.0, 6.0, 11.0, 8.0, 8.0, 18.0, 21.0, 22.0, 26.0, 26.0, 31.0, 31.0, 32.0, 42.0, 31.0, 39.0, 45.0, 38.0, 36.0, 42.0, 43.0, 50.0, 32.0, 38.0, 34.0, 30.0, 32.0, 29.0, 32.0, 24.0, 22.0, 23.0, 15.0, 19.0, 17.0, 12.0, 7.0, 10.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.794921875, -2.702606201171875, -2.61029052734375, -2.517974853515625, -2.4256591796875, -2.333343505859375, -2.24102783203125, -2.148712158203125, -2.056396484375, -1.964080810546875, -1.87176513671875, -1.779449462890625, -1.6871337890625, -1.594818115234375, -1.50250244140625, -1.410186767578125, -1.31787109375, -1.225555419921875, -1.13323974609375, -1.040924072265625, -0.9486083984375, -0.856292724609375, -0.76397705078125, -0.671661376953125, -0.579345703125, -0.487030029296875, -0.39471435546875, -0.302398681640625, -0.2100830078125, -0.117767333984375, -0.02545166015625, 0.066864013671875, 0.1591796875, 0.251495361328125, 0.34381103515625, 0.436126708984375, 0.5284423828125, 0.620758056640625, 0.71307373046875, 0.805389404296875, 0.897705078125, 0.990020751953125, 1.08233642578125, 1.174652099609375, 1.2669677734375, 1.359283447265625, 1.45159912109375, 1.543914794921875, 1.63623046875, 1.728546142578125, 1.82086181640625, 1.913177490234375, 2.0054931640625, 2.097808837890625, 2.19012451171875, 2.282440185546875, 2.374755859375, 2.467071533203125, 2.55938720703125, 2.651702880859375, 2.7440185546875, 2.836334228515625, 2.92864990234375, 3.020965576171875, 3.11328125]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 11.0, 11.0, 12.0, 26.0, 37.0, 47.0, 84.0, 103.0, 137.0, 212.0, 312.0, 431.0, 605.0, 838.0, 1273.0, 1950.0, 2768.0, 4182.0, 6226.0, 9716.0, 14795.0, 23865.0, 39027.0, 64946.0, 114766.0, 194248.0, 221823.0, 140662.0, 79937.0, 46128.0, 28243.0, 17618.0, 11065.0, 7376.0, 4823.0, 3269.0, 2150.0, 1451.0, 1011.0, 730.0, 509.0, 335.0, 255.0, 166.0, 129.0, 94.0, 48.0, 38.0, 20.0, 26.0, 9.0, 9.0, 1.0, 3.0, 3.0, 4.0, 0.0, 1.0], "bins": [-0.30712890625, -0.29758453369140625, -0.2880401611328125, -0.27849578857421875, -0.268951416015625, -0.25940704345703125, -0.2498626708984375, -0.24031829833984375, -0.23077392578125, -0.22122955322265625, -0.2116851806640625, -0.20214080810546875, -0.192596435546875, -0.18305206298828125, -0.1735076904296875, -0.16396331787109375, -0.1544189453125, -0.14487457275390625, -0.1353302001953125, -0.12578582763671875, -0.116241455078125, -0.10669708251953125, -0.0971527099609375, -0.08760833740234375, -0.07806396484375, -0.06851959228515625, -0.0589752197265625, -0.04943084716796875, -0.039886474609375, -0.03034210205078125, -0.0207977294921875, -0.01125335693359375, -0.001708984375, 0.00783538818359375, 0.0173797607421875, 0.02692413330078125, 0.036468505859375, 0.04601287841796875, 0.0555572509765625, 0.06510162353515625, 0.07464599609375, 0.08419036865234375, 0.0937347412109375, 0.10327911376953125, 0.112823486328125, 0.12236785888671875, 0.1319122314453125, 0.14145660400390625, 0.1510009765625, 0.16054534912109375, 0.1700897216796875, 0.17963409423828125, 0.189178466796875, 0.19872283935546875, 0.2082672119140625, 0.21781158447265625, 0.22735595703125, 0.23690032958984375, 0.2464447021484375, 0.25598907470703125, 0.265533447265625, 0.27507781982421875, 0.2846221923828125, 0.29416656494140625, 0.3037109375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 5.0, 8.0, 12.0, 10.0, 15.0, 17.0, 8.0, 23.0, 27.0, 33.0, 27.0, 34.0, 32.0, 34.0, 43.0, 48.0, 41.0, 35.0, 1058.0, 42.0, 54.0, 47.0, 44.0, 51.0, 37.0, 37.0, 33.0, 33.0, 19.0, 21.0, 23.0, 14.0, 14.0, 10.0, 7.0, 5.0, 5.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-2.0546875, -1.9929656982421875, -1.931243896484375, -1.8695220947265625, -1.80780029296875, -1.7460784912109375, -1.684356689453125, -1.6226348876953125, -1.5609130859375, -1.4991912841796875, -1.437469482421875, -1.3757476806640625, -1.31402587890625, -1.2523040771484375, -1.190582275390625, -1.1288604736328125, -1.067138671875, -1.0054168701171875, -0.943695068359375, -0.8819732666015625, -0.82025146484375, -0.7585296630859375, -0.696807861328125, -0.6350860595703125, -0.5733642578125, -0.5116424560546875, -0.449920654296875, -0.3881988525390625, -0.32647705078125, -0.2647552490234375, -0.203033447265625, -0.1413116455078125, -0.07958984375, -0.0178680419921875, 0.043853759765625, 0.1055755615234375, 0.16729736328125, 0.2290191650390625, 0.290740966796875, 0.3524627685546875, 0.4141845703125, 0.4759063720703125, 0.537628173828125, 0.5993499755859375, 0.66107177734375, 0.7227935791015625, 0.784515380859375, 0.8462371826171875, 0.907958984375, 0.9696807861328125, 1.031402587890625, 1.0931243896484375, 1.15484619140625, 1.2165679931640625, 1.278289794921875, 1.3400115966796875, 1.4017333984375, 1.4634552001953125, 1.525177001953125, 1.5868988037109375, 1.64862060546875, 1.7103424072265625, 1.772064208984375, 1.8337860107421875, 1.8955078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 2.0, 3.0, 6.0, 7.0, 12.0, 15.0, 16.0, 31.0, 51.0, 76.0, 125.0, 159.0, 237.0, 348.0, 469.0, 724.0, 1043.0, 1544.0, 2238.0, 3353.0, 5032.0, 7591.0, 11376.0, 17360.0, 26245.0, 41238.0, 65104.0, 107175.0, 172762.0, 1246381.0, 143914.0, 88272.0, 54091.0, 34051.0, 22216.0, 14624.0, 9571.0, 6360.0, 4286.0, 2862.0, 1954.0, 1348.0, 856.0, 598.0, 441.0, 289.0, 213.0, 155.0, 82.0, 57.0, 69.0, 33.0, 22.0, 19.0, 14.0, 8.0, 4.0, 4.0, 4.0, 1.0, 2.0], "bins": [-0.2198486328125, -0.213043212890625, -0.20623779296875, -0.199432373046875, -0.192626953125, -0.185821533203125, -0.17901611328125, -0.172210693359375, -0.1654052734375, -0.158599853515625, -0.15179443359375, -0.144989013671875, -0.13818359375, -0.131378173828125, -0.12457275390625, -0.117767333984375, -0.1109619140625, -0.104156494140625, -0.09735107421875, -0.090545654296875, -0.083740234375, -0.076934814453125, -0.07012939453125, -0.063323974609375, -0.0565185546875, -0.049713134765625, -0.04290771484375, -0.036102294921875, -0.029296875, -0.022491455078125, -0.01568603515625, -0.008880615234375, -0.0020751953125, 0.004730224609375, 0.01153564453125, 0.018341064453125, 0.025146484375, 0.031951904296875, 0.03875732421875, 0.045562744140625, 0.0523681640625, 0.059173583984375, 0.06597900390625, 0.072784423828125, 0.07958984375, 0.086395263671875, 0.09320068359375, 0.100006103515625, 0.1068115234375, 0.113616943359375, 0.12042236328125, 0.127227783203125, 0.134033203125, 0.140838623046875, 0.14764404296875, 0.154449462890625, 0.1612548828125, 0.168060302734375, 0.17486572265625, 0.181671142578125, 0.1884765625, 0.195281982421875, 0.20208740234375, 0.208892822265625, 0.2156982421875]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 0.0, 5.0, 3.0, 2.0, 3.0, 3.0, 5.0, 13.0, 3.0, 11.0, 15.0, 11.0, 29.0, 26.0, 21.0, 34.0, 44.0, 64.0, 59.0, 105.0, 114.0, 97.0, 80.0, 57.0, 36.0, 33.0, 22.0, 17.0, 19.0, 14.0, 16.0, 9.0, 7.0, 11.0, 6.0, 6.0, 4.0, 0.0, 2.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0028934478759765625, -0.002811640501022339, -0.0027298331260681152, -0.0026480257511138916, -0.002566218376159668, -0.0024844110012054443, -0.0024026036262512207, -0.002320796251296997, -0.0022389888763427734, -0.00215718150138855, -0.002075374126434326, -0.0019935667514801025, -0.001911759376525879, -0.0018299520015716553, -0.0017481446266174316, -0.001666337251663208, -0.0015845298767089844, -0.0015027225017547607, -0.0014209151268005371, -0.0013391077518463135, -0.0012573003768920898, -0.0011754930019378662, -0.0010936856269836426, -0.001011878252029419, -0.0009300708770751953, -0.0008482635021209717, -0.000766456127166748, -0.0006846487522125244, -0.0006028413772583008, -0.0005210340023040771, -0.0004392266273498535, -0.0003574192523956299, -0.00027561187744140625, -0.00019380450248718262, -0.00011199712753295898, -3.018975257873535e-05, 5.161762237548828e-05, 0.00013342499732971191, 0.00021523237228393555, 0.0002970397472381592, 0.0003788471221923828, 0.00046065449714660645, 0.0005424618721008301, 0.0006242692470550537, 0.0007060766220092773, 0.000787883996963501, 0.0008696913719177246, 0.0009514987468719482, 0.0010333061218261719, 0.0011151134967803955, 0.0011969208717346191, 0.0012787282466888428, 0.0013605356216430664, 0.00144234299659729, 0.0015241503715515137, 0.0016059577465057373, 0.001687765121459961, 0.0017695724964141846, 0.0018513798713684082, 0.0019331872463226318, 0.0020149946212768555, 0.002096801996231079, 0.0021786093711853027, 0.0022604167461395264, 0.00234222412109375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 5.0, 7.0, 9.0, 9.0, 12.0, 19.0, 14.0, 27.0, 40.0, 54.0, 61.0, 69.0, 131.0, 156.0, 226.0, 410.0, 1165.0, 45555.0, 988757.0, 9951.0, 748.0, 331.0, 227.0, 143.0, 116.0, 73.0, 65.0, 43.0, 30.0, 34.0, 20.0, 15.0, 8.0, 10.0, 7.0, 1.0, 5.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.04180908203125, -0.040555477142333984, -0.03930187225341797, -0.03804826736450195, -0.03679466247558594, -0.03554105758666992, -0.034287452697753906, -0.03303384780883789, -0.031780242919921875, -0.03052663803100586, -0.029273033142089844, -0.028019428253173828, -0.026765823364257812, -0.025512218475341797, -0.02425861358642578, -0.023005008697509766, -0.02175140380859375, -0.020497798919677734, -0.01924419403076172, -0.017990589141845703, -0.016736984252929688, -0.015483379364013672, -0.014229774475097656, -0.01297616958618164, -0.011722564697265625, -0.01046895980834961, -0.009215354919433594, -0.007961750030517578, -0.0067081451416015625, -0.005454540252685547, -0.004200935363769531, -0.0029473304748535156, -0.0016937255859375, -0.0004401206970214844, 0.0008134841918945312, 0.002067089080810547, 0.0033206939697265625, 0.004574298858642578, 0.005827903747558594, 0.007081508636474609, 0.008335113525390625, 0.00958871841430664, 0.010842323303222656, 0.012095928192138672, 0.013349533081054688, 0.014603137969970703, 0.01585674285888672, 0.017110347747802734, 0.01836395263671875, 0.019617557525634766, 0.02087116241455078, 0.022124767303466797, 0.023378372192382812, 0.024631977081298828, 0.025885581970214844, 0.02713918685913086, 0.028392791748046875, 0.02964639663696289, 0.030900001525878906, 0.03215360641479492, 0.03340721130371094, 0.03466081619262695, 0.03591442108154297, 0.037168025970458984, 0.038421630859375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 12.0, 51.0, 234.0, 413.0, 209.0, 78.0, 13.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008838488720357418, -0.0007239182596094906, -0.0005639876471832395, -0.0004040570347569883, -0.00024412642233073711, -8.419580990448594e-05, 7.573480252176523e-05, 0.0002356653567403555, 0.0003955960273742676, 0.0005555266398005188, 0.0007154572522267699, 0.0008753878646530211, 0.0010353184770792723, 0.0011952491477131844, 0.0013551797019317746, 0.0015151102561503649, 0.001675040926784277, 0.001834971597418189, 0.001994902268052101, 0.0021548327058553696, 0.0023147633764892817, 0.0024746940471231937, 0.002634624484926462, 0.0027945551555603743, 0.0029544858261942863, 0.0031144164968281984, 0.0032743471674621105, 0.003434277605265379, 0.003594208275899291, 0.003754138946533203, 0.0039140693843364716, 0.00407399982213974, 0.004233930259943008, 0.004393860697746277, 0.004553791601210833, 0.004713722039014101, 0.004873652942478657, 0.005033583380281925, 0.005193513818085194, 0.005353444255888462, 0.005513375159353018, 0.005673305597156286, 0.005833236500620842, 0.00599316693842411, 0.006153097376227379, 0.006313028279691935, 0.006472958717495203, 0.006632889620959759, 0.006792820058763027, 0.006952750496566296, 0.007112681400030851, 0.00727261183783412, 0.0074325427412986755, 0.007592473179101944, 0.007752403616905212, 0.00791233405470848, 0.00807226449251175, 0.008232194930315018, 0.008392125368118286, 0.00855205673724413, 0.008711987175047398, 0.008871917612850666, 0.009031848050653934, 0.009191778488457203, 0.009351709857583046]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 1.0, 2.0, 6.0, 6.0, 4.0, 9.0, 11.0, 13.0, 13.0, 19.0, 14.0, 25.0, 29.0, 24.0, 33.0, 23.0, 27.0, 32.0, 29.0, 26.0, 30.0, 38.0, 37.0, 46.0, 45.0, 42.0, 42.0, 34.0, 33.0, 26.0, 26.0, 23.0, 43.0, 20.0, 24.0, 22.0, 22.0, 14.0, 18.0, 13.0, 14.0, 9.0, 8.0, 4.0, 4.0, 4.0, 7.0, 3.0, 6.0, 5.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0011235475540161133, -0.0010907845571637154, -0.0010580215603113174, -0.0010252585634589195, -0.0009924955666065216, -0.0009597325697541237, -0.0009269695729017258, -0.0008942065760493279, -0.0008614435791969299, -0.000828680582344532, -0.0007959175854921341, -0.0007631545886397362, -0.0007303915917873383, -0.0006976285949349403, -0.0006648655980825424, -0.0006321026012301445, -0.0005993396043777466, -0.0005665766075253487, -0.0005338136106729507, -0.0005010506138205528, -0.0004682876169681549, -0.000435524620115757, -0.00040276162326335907, -0.00036999862641096115, -0.00033723562955856323, -0.0003044726327061653, -0.0002717096358537674, -0.00023894663900136948, -0.00020618364214897156, -0.00017342064529657364, -0.00014065764844417572, -0.0001078946515917778, -7.513165473937988e-05, -4.2368657886981964e-05, -9.605661034584045e-06, 2.3157335817813873e-05, 5.592033267021179e-05, 8.868332952260971e-05, 0.00012144632637500763, 0.00015420932322740555, 0.00018697232007980347, 0.00021973531693220139, 0.0002524983137845993, 0.0002852613106369972, 0.00031802430748939514, 0.00035078730434179306, 0.000383550301194191, 0.0004163132980465889, 0.0004490762948989868, 0.00048183929175138474, 0.0005146022886037827, 0.0005473652854561806, 0.0005801282823085785, 0.0006128912791609764, 0.0006456542760133743, 0.0006784172728657722, 0.0007111802697181702, 0.0007439432665705681, 0.000776706263422966, 0.0008094692602753639, 0.0008422322571277618, 0.0008749952539801598, 0.0009077582508325577, 0.0009405212476849556, 0.0009732842445373535]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 4.0, 0.0, 1.0, 0.0, 8.0, 7.0, 6.0, 11.0, 8.0, 8.0, 18.0, 21.0, 22.0, 26.0, 26.0, 31.0, 31.0, 32.0, 42.0, 31.0, 39.0, 45.0, 38.0, 36.0, 42.0, 43.0, 50.0, 32.0, 38.0, 34.0, 30.0, 32.0, 29.0, 32.0, 24.0, 22.0, 23.0, 15.0, 19.0, 17.0, 12.0, 7.0, 10.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.794921875, -2.702606201171875, -2.61029052734375, -2.517974853515625, -2.4256591796875, -2.333343505859375, -2.24102783203125, -2.148712158203125, -2.056396484375, -1.964080810546875, -1.87176513671875, -1.779449462890625, -1.6871337890625, -1.594818115234375, -1.50250244140625, -1.410186767578125, -1.31787109375, -1.225555419921875, -1.13323974609375, -1.040924072265625, -0.9486083984375, -0.856292724609375, -0.76397705078125, -0.671661376953125, -0.579345703125, -0.487030029296875, -0.39471435546875, -0.302398681640625, -0.2100830078125, -0.117767333984375, -0.02545166015625, 0.066864013671875, 0.1591796875, 0.251495361328125, 0.34381103515625, 0.436126708984375, 0.5284423828125, 0.620758056640625, 0.71307373046875, 0.805389404296875, 0.897705078125, 0.990020751953125, 1.08233642578125, 1.174652099609375, 1.2669677734375, 1.359283447265625, 1.45159912109375, 1.543914794921875, 1.63623046875, 1.728546142578125, 1.82086181640625, 1.913177490234375, 2.0054931640625, 2.097808837890625, 2.19012451171875, 2.282440185546875, 2.374755859375, 2.467071533203125, 2.55938720703125, 2.651702880859375, 2.7440185546875, 2.836334228515625, 2.92864990234375, 3.020965576171875, 3.11328125]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 3.0, 6.0, 5.0, 13.0, 10.0, 11.0, 10.0, 28.0, 19.0, 39.0, 51.0, 73.0, 112.0, 97.0, 161.0, 240.0, 368.0, 632.0, 1024.0, 1718.0, 2958.0, 6104.0, 15786.0, 57440.0, 275577.0, 501105.0, 134590.0, 30178.0, 9782.0, 4326.0, 2306.0, 1350.0, 831.0, 499.0, 351.0, 208.0, 114.0, 98.0, 99.0, 50.0, 50.0, 35.0, 14.0, 26.0, 18.0, 13.0, 10.0, 7.0, 3.0, 6.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0], "bins": [-2.984375, -2.888946533203125, -2.79351806640625, -2.698089599609375, -2.6026611328125, -2.507232666015625, -2.41180419921875, -2.316375732421875, -2.220947265625, -2.125518798828125, -2.03009033203125, -1.934661865234375, -1.8392333984375, -1.743804931640625, -1.64837646484375, -1.552947998046875, -1.45751953125, -1.362091064453125, -1.26666259765625, -1.171234130859375, -1.0758056640625, -0.980377197265625, -0.88494873046875, -0.789520263671875, -0.694091796875, -0.598663330078125, -0.50323486328125, -0.407806396484375, -0.3123779296875, -0.216949462890625, -0.12152099609375, -0.026092529296875, 0.0693359375, 0.164764404296875, 0.26019287109375, 0.355621337890625, 0.4510498046875, 0.546478271484375, 0.64190673828125, 0.737335205078125, 0.832763671875, 0.928192138671875, 1.02362060546875, 1.119049072265625, 1.2144775390625, 1.309906005859375, 1.40533447265625, 1.500762939453125, 1.59619140625, 1.691619873046875, 1.78704833984375, 1.882476806640625, 1.9779052734375, 2.073333740234375, 2.16876220703125, 2.264190673828125, 2.359619140625, 2.455047607421875, 2.55047607421875, 2.645904541015625, 2.7413330078125, 2.836761474609375, 2.93218994140625, 3.027618408203125, 3.123046875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 3.0, 9.0, 3.0, 8.0, 5.0, 27.0, 15.0, 24.0, 16.0, 23.0, 41.0, 41.0, 43.0, 50.0, 51.0, 63.0, 109.0, 1711.0, 341.0, 59.0, 54.0, 46.0, 40.0, 54.0, 33.0, 35.0, 33.0, 24.0, 18.0, 19.0, 12.0, 6.0, 11.0, 9.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.3515625, -11.9510498046875, -11.550537109375, -11.1500244140625, -10.74951171875, -10.3489990234375, -9.948486328125, -9.5479736328125, -9.1474609375, -8.7469482421875, -8.346435546875, -7.9459228515625, -7.54541015625, -7.1448974609375, -6.744384765625, -6.3438720703125, -5.943359375, -5.5428466796875, -5.142333984375, -4.7418212890625, -4.34130859375, -3.9407958984375, -3.540283203125, -3.1397705078125, -2.7392578125, -2.3387451171875, -1.938232421875, -1.5377197265625, -1.13720703125, -0.7366943359375, -0.336181640625, 0.0643310546875, 0.46484375, 0.8653564453125, 1.265869140625, 1.6663818359375, 2.06689453125, 2.4674072265625, 2.867919921875, 3.2684326171875, 3.6689453125, 4.0694580078125, 4.469970703125, 4.8704833984375, 5.27099609375, 5.6715087890625, 6.072021484375, 6.4725341796875, 6.873046875, 7.2735595703125, 7.674072265625, 8.0745849609375, 8.47509765625, 8.8756103515625, 9.276123046875, 9.6766357421875, 10.0771484375, 10.4776611328125, 10.878173828125, 11.2786865234375, 11.67919921875, 12.0797119140625, 12.480224609375, 12.8807373046875, 13.28125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 6.0, 3.0, 10.0, 8.0, 6.0, 10.0, 20.0, 19.0, 18.0, 19.0, 40.0, 50.0, 47.0, 105.0, 149.0, 222.0, 499.0, 2018.0, 47398.0, 3075162.0, 17480.0, 1332.0, 458.0, 194.0, 114.0, 86.0, 56.0, 45.0, 23.0, 18.0, 17.0, 22.0, 15.0, 11.0, 6.0, 6.0, 8.0, 3.0, 1.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-20.015625, -19.397705078125, -18.77978515625, -18.161865234375, -17.5439453125, -16.926025390625, -16.30810546875, -15.690185546875, -15.072265625, -14.454345703125, -13.83642578125, -13.218505859375, -12.6005859375, -11.982666015625, -11.36474609375, -10.746826171875, -10.12890625, -9.510986328125, -8.89306640625, -8.275146484375, -7.6572265625, -7.039306640625, -6.42138671875, -5.803466796875, -5.185546875, -4.567626953125, -3.94970703125, -3.331787109375, -2.7138671875, -2.095947265625, -1.47802734375, -0.860107421875, -0.2421875, 0.375732421875, 0.99365234375, 1.611572265625, 2.2294921875, 2.847412109375, 3.46533203125, 4.083251953125, 4.701171875, 5.319091796875, 5.93701171875, 6.554931640625, 7.1728515625, 7.790771484375, 8.40869140625, 9.026611328125, 9.64453125, 10.262451171875, 10.88037109375, 11.498291015625, 12.1162109375, 12.734130859375, 13.35205078125, 13.969970703125, 14.587890625, 15.205810546875, 15.82373046875, 16.441650390625, 17.0595703125, 17.677490234375, 18.29541015625, 18.913330078125, 19.53125]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [3.0, 99.0, 756.0, 159.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.281250476837158, -3.845566749572754, -1.4098830223083496, 1.0258007049560547, 3.461484432220459, 5.8971686363220215, 8.33285140991211, 10.768535614013672, 13.204219818115234, 15.639904022216797, 18.07558822631836, 20.51127052307129, 22.94695472717285, 25.382638931274414, 27.818321228027344, 30.254005432128906, 32.68968963623047, 35.12537384033203, 37.561058044433594, 39.996742248535156, 42.43242645263672, 44.86811065673828, 47.30379104614258, 49.73947525024414, 52.1751594543457, 54.610843658447266, 57.04652786254883, 59.48221206665039, 61.91789245605469, 64.35357666015625, 66.78926086425781, 69.22494506835938, 71.66062927246094, 74.0963134765625, 76.53199768066406, 78.96768188476562, 81.40336608886719, 83.83905029296875, 86.27473449707031, 88.71041870117188, 91.14610290527344, 93.581787109375, 96.01747131347656, 98.45315551757812, 100.88883972167969, 103.32452392578125, 105.76020812988281, 108.19589233398438, 110.6315689086914, 113.06725311279297, 115.50293731689453, 117.9386215209961, 120.37430572509766, 122.80998992919922, 125.24567413330078, 127.68135070800781, 130.11703491210938, 132.55271911621094, 134.9884033203125, 137.42408752441406, 139.85977172851562, 142.2954559326172, 144.73114013671875, 147.1668243408203, 149.60250854492188]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 6.0, 7.0, 6.0, 10.0, 11.0, 18.0, 17.0, 20.0, 20.0, 25.0, 26.0, 26.0, 25.0, 31.0, 32.0, 51.0, 40.0, 44.0, 37.0, 36.0, 40.0, 40.0, 53.0, 49.0, 49.0, 40.0, 24.0, 34.0, 29.0, 35.0, 26.0, 24.0, 15.0, 15.0, 10.0, 12.0, 4.0, 4.0, 8.0, 2.0, 5.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.935293197631836, -28.760990142822266, -27.586687088012695, -26.412384033203125, -25.238080978393555, -24.063777923583984, -22.88947296142578, -21.715171813964844, -20.54086685180664, -19.36656379699707, -18.1922607421875, -17.01795768737793, -15.84365463256836, -14.669351577758789, -13.495047569274902, -12.320744514465332, -11.146442413330078, -9.972139358520508, -8.797836303710938, -7.623532772064209, -6.449229717254639, -5.274926662445068, -4.10062313079834, -2.9263200759887695, -1.7520170211791992, -0.5777138471603394, 0.5965893268585205, 1.77089262008667, 2.9451956748962402, 4.1194987297058105, 5.293802261352539, 6.468105316162109, 7.642406463623047, 8.816709518432617, 9.991012573242188, 11.165315628051758, 12.339618682861328, 13.513921737670898, 14.688225746154785, 15.862528800964355, 17.03683090209961, 18.21113395690918, 19.38543701171875, 20.55974006652832, 21.73404312133789, 22.90834617614746, 24.08264923095703, 25.256954193115234, 26.431257247924805, 27.605560302734375, 28.779863357543945, 29.954166412353516, 31.128469467163086, 32.302772521972656, 33.47707748413086, 34.6513786315918, 35.82568359375, 36.9999885559082, 38.17428970336914, 39.348594665527344, 40.52289581298828, 41.697200775146484, 42.87150192260742, 44.045806884765625, 45.22010803222656]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 3.0, 2.0, 5.0, 4.0, 4.0, 9.0, 11.0, 4.0, 19.0, 7.0, 28.0, 21.0, 17.0, 24.0, 28.0, 30.0, 31.0, 45.0, 30.0, 38.0, 44.0, 39.0, 34.0, 40.0, 48.0, 36.0, 37.0, 43.0, 31.0, 36.0, 29.0, 30.0, 33.0, 29.0, 25.0, 19.0, 18.0, 10.0, 21.0, 14.0, 17.0, 3.0, 9.0, 4.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.83203125, -2.739501953125, -2.64697265625, -2.554443359375, -2.4619140625, -2.369384765625, -2.27685546875, -2.184326171875, -2.091796875, -1.999267578125, -1.90673828125, -1.814208984375, -1.7216796875, -1.629150390625, -1.53662109375, -1.444091796875, -1.3515625, -1.259033203125, -1.16650390625, -1.073974609375, -0.9814453125, -0.888916015625, -0.79638671875, -0.703857421875, -0.611328125, -0.518798828125, -0.42626953125, -0.333740234375, -0.2412109375, -0.148681640625, -0.05615234375, 0.036376953125, 0.12890625, 0.221435546875, 0.31396484375, 0.406494140625, 0.4990234375, 0.591552734375, 0.68408203125, 0.776611328125, 0.869140625, 0.961669921875, 1.05419921875, 1.146728515625, 1.2392578125, 1.331787109375, 1.42431640625, 1.516845703125, 1.609375, 1.701904296875, 1.79443359375, 1.886962890625, 1.9794921875, 2.072021484375, 2.16455078125, 2.257080078125, 2.349609375, 2.442138671875, 2.53466796875, 2.627197265625, 2.7197265625, 2.812255859375, 2.90478515625, 2.997314453125, 3.08984375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 3.0, 0.0, 4.0, 8.0, 7.0, 5.0, 10.0, 23.0, 27.0, 44.0, 67.0, 99.0, 180.0, 275.0, 414.0, 725.0, 1185.0, 2025.0, 3499.0, 6198.0, 11822.0, 25418.0, 68779.0, 293204.0, 1549641.0, 1728399.0, 366576.0, 78965.0, 28370.0, 12708.0, 6710.0, 3652.0, 2074.0, 1262.0, 700.0, 442.0, 248.0, 185.0, 107.0, 76.0, 55.0, 34.0, 22.0, 17.0, 7.0, 6.0, 3.0, 4.0, 4.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-5.5, -5.32843017578125, -5.1568603515625, -4.98529052734375, -4.813720703125, -4.64215087890625, -4.4705810546875, -4.29901123046875, -4.12744140625, -3.95587158203125, -3.7843017578125, -3.61273193359375, -3.441162109375, -3.26959228515625, -3.0980224609375, -2.92645263671875, -2.7548828125, -2.58331298828125, -2.4117431640625, -2.24017333984375, -2.068603515625, -1.89703369140625, -1.7254638671875, -1.55389404296875, -1.38232421875, -1.21075439453125, -1.0391845703125, -0.86761474609375, -0.696044921875, -0.52447509765625, -0.3529052734375, -0.18133544921875, -0.009765625, 0.16180419921875, 0.3333740234375, 0.50494384765625, 0.676513671875, 0.84808349609375, 1.0196533203125, 1.19122314453125, 1.36279296875, 1.53436279296875, 1.7059326171875, 1.87750244140625, 2.049072265625, 2.22064208984375, 2.3922119140625, 2.56378173828125, 2.7353515625, 2.90692138671875, 3.0784912109375, 3.25006103515625, 3.421630859375, 3.59320068359375, 3.7647705078125, 3.93634033203125, 4.10791015625, 4.27947998046875, 4.4510498046875, 4.62261962890625, 4.794189453125, 4.96575927734375, 5.1373291015625, 5.30889892578125, 5.48046875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 5.0, 4.0, 3.0, 12.0, 21.0, 25.0, 45.0, 53.0, 93.0, 128.0, 215.0, 376.0, 556.0, 750.0, 668.0, 434.0, 243.0, 168.0, 77.0, 74.0, 46.0, 29.0, 19.0, 19.0, 11.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-15.546875, -15.1824951171875, -14.818115234375, -14.4537353515625, -14.08935546875, -13.7249755859375, -13.360595703125, -12.9962158203125, -12.6318359375, -12.2674560546875, -11.903076171875, -11.5386962890625, -11.17431640625, -10.8099365234375, -10.445556640625, -10.0811767578125, -9.716796875, -9.3524169921875, -8.988037109375, -8.6236572265625, -8.25927734375, -7.8948974609375, -7.530517578125, -7.1661376953125, -6.8017578125, -6.4373779296875, -6.072998046875, -5.7086181640625, -5.34423828125, -4.9798583984375, -4.615478515625, -4.2510986328125, -3.88671875, -3.5223388671875, -3.157958984375, -2.7935791015625, -2.42919921875, -2.0648193359375, -1.700439453125, -1.3360595703125, -0.9716796875, -0.6072998046875, -0.242919921875, 0.1214599609375, 0.48583984375, 0.8502197265625, 1.214599609375, 1.5789794921875, 1.943359375, 2.3077392578125, 2.672119140625, 3.0364990234375, 3.40087890625, 3.7652587890625, 4.129638671875, 4.4940185546875, 4.8583984375, 5.2227783203125, 5.587158203125, 5.9515380859375, 6.31591796875, 6.6802978515625, 7.044677734375, 7.4090576171875, 7.7734375]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 8.0, 6.0, 16.0, 16.0, 36.0, 57.0, 103.0, 226.0, 580.0, 1761.0, 6440.0, 31177.0, 255929.0, 3335108.0, 503577.0, 46627.0, 8963.0, 2355.0, 733.0, 290.0, 118.0, 59.0, 32.0, 24.0, 16.0, 12.0, 5.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.5234375, -12.9254150390625, -12.327392578125, -11.7293701171875, -11.13134765625, -10.5333251953125, -9.935302734375, -9.3372802734375, -8.7392578125, -8.1412353515625, -7.543212890625, -6.9451904296875, -6.34716796875, -5.7491455078125, -5.151123046875, -4.5531005859375, -3.955078125, -3.3570556640625, -2.759033203125, -2.1610107421875, -1.56298828125, -0.9649658203125, -0.366943359375, 0.2310791015625, 0.8291015625, 1.4271240234375, 2.025146484375, 2.6231689453125, 3.22119140625, 3.8192138671875, 4.417236328125, 5.0152587890625, 5.61328125, 6.2113037109375, 6.809326171875, 7.4073486328125, 8.00537109375, 8.6033935546875, 9.201416015625, 9.7994384765625, 10.3974609375, 10.9954833984375, 11.593505859375, 12.1915283203125, 12.78955078125, 13.3875732421875, 13.985595703125, 14.5836181640625, 15.181640625, 15.7796630859375, 16.377685546875, 16.9757080078125, 17.57373046875, 18.1717529296875, 18.769775390625, 19.3677978515625, 19.9658203125, 20.5638427734375, 21.161865234375, 21.7598876953125, 22.35791015625, 22.9559326171875, 23.553955078125, 24.1519775390625, 24.75]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 4.0, 5.0, 9.0, 17.0, 31.0, 58.0, 88.0, 160.0, 194.0, 166.0, 143.0, 75.0, 34.0, 15.0, 9.0, 8.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.582496643066406, -50.53564453125, -48.488792419433594, -46.44194030761719, -44.39508819580078, -42.348236083984375, -40.3013801574707, -38.2545280456543, -36.20767593383789, -34.160823822021484, -32.11397171020508, -30.06711769104004, -28.020265579223633, -25.973413467407227, -23.926559448242188, -21.87970733642578, -19.832855224609375, -17.78600311279297, -15.739150047302246, -13.692296981811523, -11.645444869995117, -9.598592758178711, -7.551739692687988, -5.504886627197266, -3.4580345153808594, -1.411181926727295, 0.6356706619262695, 2.682523250579834, 4.729375839233398, 6.776227951049805, 8.823081016540527, 10.86993408203125, 12.916786193847656, 14.963638305664062, 17.01049041748047, 19.057344436645508, 21.104196548461914, 23.15104866027832, 25.19790267944336, 27.244754791259766, 29.291606903076172, 31.338459014892578, 33.385311126708984, 35.43216323852539, 37.47901916503906, 39.52587127685547, 41.572723388671875, 43.61957550048828, 45.66642761230469, 47.713279724121094, 49.7601318359375, 51.806983947753906, 53.85383605957031, 55.90068817138672, 57.94754409790039, 59.9943962097168, 62.0412483215332, 64.08810424804688, 66.13495635986328, 68.18180847167969, 70.2286605834961, 72.2755126953125, 74.3223648071289, 76.36921691894531, 78.41606903076172]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 9.0, 19.0, 8.0, 7.0, 14.0, 14.0, 18.0, 18.0, 23.0, 23.0, 19.0, 34.0, 26.0, 28.0, 34.0, 39.0, 42.0, 43.0, 45.0, 34.0, 27.0, 32.0, 36.0, 40.0, 41.0, 33.0, 34.0, 29.0, 25.0, 35.0, 23.0, 21.0, 11.0, 14.0, 18.0, 10.0, 6.0, 13.0, 10.0, 9.0, 5.0, 4.0, 6.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.3787899017334, -21.671953201293945, -20.965116500854492, -20.25827980041504, -19.551441192626953, -18.8446044921875, -18.137767791748047, -17.430931091308594, -16.72409439086914, -16.017257690429688, -15.310420989990234, -14.603583335876465, -13.896746635437012, -13.189909934997559, -12.483072280883789, -11.776235580444336, -11.069398880004883, -10.36256217956543, -9.655725479125977, -8.948887825012207, -8.242051124572754, -7.535214424133301, -6.8283772468566895, -6.121540069580078, -5.414703369140625, -4.707866668701172, -4.0010294914245605, -3.2941925525665283, -2.587355613708496, -1.8805186748504639, -1.1736817359924316, -0.4668445587158203, 0.239990234375, 0.9468271732330322, 1.6536641120910645, 2.3605010509490967, 3.067337989807129, 3.774174928665161, 4.481011867523193, 5.187849044799805, 5.894685745239258, 6.601522445678711, 7.308359622955322, 8.015196800231934, 8.722033500671387, 9.42887020111084, 10.13570785522461, 10.842544555664062, 11.549381256103516, 12.256217956542969, 12.963054656982422, 13.669892311096191, 14.376729011535645, 15.083565711975098, 15.790403366088867, 16.49724006652832, 17.204076766967773, 17.910913467407227, 18.61775016784668, 19.324586868286133, 20.03142547607422, 20.738262176513672, 21.445098876953125, 22.151935577392578, 22.85877227783203]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 3.0, 1.0, 4.0, 10.0, 10.0, 16.0, 13.0, 15.0, 10.0, 22.0, 25.0, 32.0, 28.0, 33.0, 36.0, 41.0, 43.0, 45.0, 46.0, 37.0, 40.0, 41.0, 36.0, 40.0, 42.0, 39.0, 33.0, 42.0, 32.0, 28.0, 31.0, 18.0, 22.0, 23.0, 20.0, 14.0, 17.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.15625, -3.05645751953125, -2.9566650390625, -2.85687255859375, -2.757080078125, -2.65728759765625, -2.5574951171875, -2.45770263671875, -2.35791015625, -2.25811767578125, -2.1583251953125, -2.05853271484375, -1.958740234375, -1.85894775390625, -1.7591552734375, -1.65936279296875, -1.5595703125, -1.45977783203125, -1.3599853515625, -1.26019287109375, -1.160400390625, -1.06060791015625, -0.9608154296875, -0.86102294921875, -0.76123046875, -0.66143798828125, -0.5616455078125, -0.46185302734375, -0.362060546875, -0.26226806640625, -0.1624755859375, -0.06268310546875, 0.037109375, 0.13690185546875, 0.2366943359375, 0.33648681640625, 0.436279296875, 0.53607177734375, 0.6358642578125, 0.73565673828125, 0.83544921875, 0.93524169921875, 1.0350341796875, 1.13482666015625, 1.234619140625, 1.33441162109375, 1.4342041015625, 1.53399658203125, 1.6337890625, 1.73358154296875, 1.8333740234375, 1.93316650390625, 2.032958984375, 2.13275146484375, 2.2325439453125, 2.33233642578125, 2.43212890625, 2.53192138671875, 2.6317138671875, 2.73150634765625, 2.831298828125, 2.93109130859375, 3.0308837890625, 3.13067626953125, 3.23046875]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 9.0, 7.0, 12.0, 19.0, 26.0, 40.0, 75.0, 90.0, 145.0, 216.0, 320.0, 423.0, 612.0, 961.0, 1329.0, 2092.0, 3098.0, 4616.0, 7083.0, 11114.0, 17546.0, 28859.0, 48353.0, 82596.0, 141621.0, 225566.0, 191542.0, 111572.0, 65455.0, 38650.0, 23214.0, 14538.0, 9113.0, 5893.0, 3833.0, 2555.0, 1724.0, 1189.0, 801.0, 504.0, 375.0, 235.0, 188.0, 98.0, 77.0, 58.0, 39.0, 25.0, 20.0, 15.0, 8.0, 6.0, 6.0, 0.0, 0.0, 2.0], "bins": [-0.34228515625, -0.3321533203125, -0.322021484375, -0.3118896484375, -0.3017578125, -0.2916259765625, -0.281494140625, -0.2713623046875, -0.26123046875, -0.2510986328125, -0.240966796875, -0.2308349609375, -0.220703125, -0.2105712890625, -0.200439453125, -0.1903076171875, -0.18017578125, -0.1700439453125, -0.159912109375, -0.1497802734375, -0.1396484375, -0.1295166015625, -0.119384765625, -0.1092529296875, -0.09912109375, -0.0889892578125, -0.078857421875, -0.0687255859375, -0.05859375, -0.0484619140625, -0.038330078125, -0.0281982421875, -0.01806640625, -0.0079345703125, 0.002197265625, 0.0123291015625, 0.0224609375, 0.0325927734375, 0.042724609375, 0.0528564453125, 0.06298828125, 0.0731201171875, 0.083251953125, 0.0933837890625, 0.103515625, 0.1136474609375, 0.123779296875, 0.1339111328125, 0.14404296875, 0.1541748046875, 0.164306640625, 0.1744384765625, 0.1845703125, 0.1947021484375, 0.204833984375, 0.2149658203125, 0.22509765625, 0.2352294921875, 0.245361328125, 0.2554931640625, 0.265625, 0.2757568359375, 0.285888671875, 0.2960205078125, 0.30615234375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 2.0, 3.0, 4.0, 4.0, 8.0, 7.0, 5.0, 10.0, 16.0, 11.0, 12.0, 15.0, 24.0, 12.0, 20.0, 36.0, 37.0, 43.0, 36.0, 42.0, 37.0, 43.0, 48.0, 51.0, 1057.0, 52.0, 40.0, 43.0, 40.0, 26.0, 30.0, 32.0, 23.0, 31.0, 18.0, 24.0, 14.0, 16.0, 13.0, 9.0, 11.0, 6.0, 4.0, 5.0, 4.0, 2.0, 4.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.857421875, -1.795654296875, -1.73388671875, -1.672119140625, -1.6103515625, -1.548583984375, -1.48681640625, -1.425048828125, -1.36328125, -1.301513671875, -1.23974609375, -1.177978515625, -1.1162109375, -1.054443359375, -0.99267578125, -0.930908203125, -0.869140625, -0.807373046875, -0.74560546875, -0.683837890625, -0.6220703125, -0.560302734375, -0.49853515625, -0.436767578125, -0.375, -0.313232421875, -0.25146484375, -0.189697265625, -0.1279296875, -0.066162109375, -0.00439453125, 0.057373046875, 0.119140625, 0.180908203125, 0.24267578125, 0.304443359375, 0.3662109375, 0.427978515625, 0.48974609375, 0.551513671875, 0.61328125, 0.675048828125, 0.73681640625, 0.798583984375, 0.8603515625, 0.922119140625, 0.98388671875, 1.045654296875, 1.107421875, 1.169189453125, 1.23095703125, 1.292724609375, 1.3544921875, 1.416259765625, 1.47802734375, 1.539794921875, 1.6015625, 1.663330078125, 1.72509765625, 1.786865234375, 1.8486328125, 1.910400390625, 1.97216796875, 2.033935546875, 2.095703125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 8.0, 9.0, 11.0, 23.0, 28.0, 40.0, 57.0, 74.0, 122.0, 177.0, 258.0, 370.0, 544.0, 783.0, 1252.0, 1923.0, 3056.0, 4660.0, 7361.0, 11817.0, 19015.0, 30774.0, 50788.0, 88437.0, 154403.0, 1270899.0, 183986.0, 108008.0, 61355.0, 36793.0, 22326.0, 14067.0, 8472.0, 5476.0, 3420.0, 2177.0, 1391.0, 868.0, 631.0, 410.0, 275.0, 184.0, 131.0, 85.0, 59.0, 42.0, 22.0, 25.0, 17.0, 12.0, 3.0, 5.0, 9.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.26611328125, -0.2579689025878906, -0.24982452392578125, -0.24168014526367188, -0.2335357666015625, -0.22539138793945312, -0.21724700927734375, -0.20910263061523438, -0.200958251953125, -0.19281387329101562, -0.18466949462890625, -0.17652511596679688, -0.1683807373046875, -0.16023635864257812, -0.15209197998046875, -0.14394760131835938, -0.13580322265625, -0.12765884399414062, -0.11951446533203125, -0.11137008666992188, -0.1032257080078125, -0.09508132934570312, -0.08693695068359375, -0.07879257202148438, -0.070648193359375, -0.06250381469726562, -0.05435943603515625, -0.046215057373046875, -0.0380706787109375, -0.029926300048828125, -0.02178192138671875, -0.013637542724609375, -0.0054931640625, 0.002651214599609375, 0.01079559326171875, 0.018939971923828125, 0.0270843505859375, 0.035228729248046875, 0.04337310791015625, 0.051517486572265625, 0.059661865234375, 0.06780624389648438, 0.07595062255859375, 0.08409500122070312, 0.0922393798828125, 0.10038375854492188, 0.10852813720703125, 0.11667251586914062, 0.12481689453125, 0.13296127319335938, 0.14110565185546875, 0.14925003051757812, 0.1573944091796875, 0.16553878784179688, 0.17368316650390625, 0.18182754516601562, 0.189971923828125, 0.19811630249023438, 0.20626068115234375, 0.21440505981445312, 0.2225494384765625, 0.23069381713867188, 0.23883819580078125, 0.24698257446289062, 0.255126953125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 5.0, 6.0, 5.0, 11.0, 7.0, 9.0, 23.0, 12.0, 21.0, 17.0, 35.0, 25.0, 30.0, 33.0, 51.0, 67.0, 80.0, 82.0, 89.0, 76.0, 51.0, 44.0, 34.0, 46.0, 25.0, 24.0, 13.0, 17.0, 16.0, 11.0, 10.0, 6.0, 7.0, 6.0, 4.0, 4.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.002323150634765625, -0.0022628754377365112, -0.0022026002407073975, -0.0021423250436782837, -0.00208204984664917, -0.002021774649620056, -0.0019614994525909424, -0.0019012242555618286, -0.0018409490585327148, -0.001780673861503601, -0.0017203986644744873, -0.0016601234674453735, -0.0015998482704162598, -0.001539573073387146, -0.0014792978763580322, -0.0014190226793289185, -0.0013587474822998047, -0.001298472285270691, -0.0012381970882415771, -0.0011779218912124634, -0.0011176466941833496, -0.0010573714971542358, -0.000997096300125122, -0.0009368211030960083, -0.0008765459060668945, -0.0008162707090377808, -0.000755995512008667, -0.0006957203149795532, -0.0006354451179504395, -0.0005751699209213257, -0.0005148947238922119, -0.00045461952686309814, -0.0003943443298339844, -0.0003340691328048706, -0.00027379393577575684, -0.00021351873874664307, -0.0001532435417175293, -9.296834468841553e-05, -3.269314765930176e-05, 2.7582049369812012e-05, 8.785724639892578e-05, 0.00014813244342803955, 0.00020840764045715332, 0.0002686828374862671, 0.00032895803451538086, 0.00038923323154449463, 0.0004495084285736084, 0.0005097836256027222, 0.0005700588226318359, 0.0006303340196609497, 0.0006906092166900635, 0.0007508844137191772, 0.000811159610748291, 0.0008714348077774048, 0.0009317100048065186, 0.0009919852018356323, 0.001052260398864746, 0.0011125355958938599, 0.0011728107929229736, 0.0012330859899520874, 0.0012933611869812012, 0.001353636384010315, 0.0014139115810394287, 0.0014741867780685425, 0.0015344619750976562]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 3.0, 8.0, 3.0, 11.0, 20.0, 16.0, 23.0, 18.0, 23.0, 38.0, 61.0, 77.0, 95.0, 137.0, 188.0, 302.0, 645.0, 3281.0, 129103.0, 894134.0, 17883.0, 1199.0, 455.0, 242.0, 137.0, 92.0, 85.0, 55.0, 57.0, 36.0, 32.0, 31.0, 10.0, 6.0, 11.0, 13.0, 8.0, 6.0, 6.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0268096923828125, -0.025861024856567383, -0.024912357330322266, -0.02396368980407715, -0.02301502227783203, -0.022066354751586914, -0.021117687225341797, -0.02016901969909668, -0.019220352172851562, -0.018271684646606445, -0.017323017120361328, -0.01637434959411621, -0.015425682067871094, -0.014477014541625977, -0.01352834701538086, -0.012579679489135742, -0.011631011962890625, -0.010682344436645508, -0.00973367691040039, -0.008785009384155273, -0.007836341857910156, -0.006887674331665039, -0.005939006805419922, -0.004990339279174805, -0.0040416717529296875, -0.0030930042266845703, -0.002144336700439453, -0.001195669174194336, -0.00024700164794921875, 0.0007016658782958984, 0.0016503334045410156, 0.002599000930786133, 0.00354766845703125, 0.004496335983276367, 0.005445003509521484, 0.0063936710357666016, 0.007342338562011719, 0.008291006088256836, 0.009239673614501953, 0.01018834114074707, 0.011137008666992188, 0.012085676193237305, 0.013034343719482422, 0.013983011245727539, 0.014931678771972656, 0.015880346298217773, 0.01682901382446289, 0.017777681350708008, 0.018726348876953125, 0.019675016403198242, 0.02062368392944336, 0.021572351455688477, 0.022521018981933594, 0.02346968650817871, 0.024418354034423828, 0.025367021560668945, 0.026315689086914062, 0.02726435661315918, 0.028213024139404297, 0.029161691665649414, 0.03011035919189453, 0.03105902671813965, 0.032007694244384766, 0.03295636177062988, 0.033905029296875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 30.0, 190.0, 478.0, 264.0, 43.0, 8.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.01151297427713871, -0.011309492401778698, -0.011106010526418686, -0.010902529582381248, -0.010699047707021236, -0.010495565831661224, -0.010292083956301212, -0.010088603012263775, -0.009885121136903763, -0.00968163926154375, -0.009478157386183739, -0.009274676442146301, -0.00907119456678629, -0.008867712691426277, -0.008664230816066265, -0.008460749872028828, -0.008257267996668816, -0.008053786121308804, -0.007850304245948792, -0.007646822836250067, -0.007443341426551342, -0.00723985955119133, -0.007036378141492605, -0.006832896266132593, -0.006629414390772581, -0.006425932515412569, -0.006222451105713844, -0.006018969230353832, -0.0058154878206551075, -0.0056120059452950954, -0.005408524535596371, -0.005205042660236359, -0.005001561250537634, -0.004798079375177622, -0.004594597965478897, -0.004391116090118885, -0.00418763468042016, -0.003984152805060148, -0.0037806713953614235, -0.0035771895200014114, -0.0033737081103026867, -0.0031702264677733183, -0.00296674482524395, -0.0027632631827145815, -0.002559781540185213, -0.002356299664825201, -0.0021528182551264763, -0.001949336496181786, -0.0017458548536524177, -0.0015423732111230493, -0.0013388915685936809, -0.0011354098096489906, -0.0009319282253272831, -0.0007284465245902538, -0.0005249648820608854, -0.00032148323953151703, -0.00011800159700214863, 8.5480060079135e-05, 0.00028896171716041863, 0.0004924433887936175, 0.0006959250313229859, 0.0008994067320600152, 0.0011028883745893836, 0.001306370017118752, 0.0015098516596481204]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 3.0, 1.0, 8.0, 8.0, 8.0, 5.0, 9.0, 5.0, 15.0, 17.0, 22.0, 12.0, 12.0, 22.0, 20.0, 23.0, 29.0, 23.0, 33.0, 19.0, 34.0, 30.0, 36.0, 42.0, 38.0, 26.0, 46.0, 35.0, 45.0, 39.0, 32.0, 27.0, 33.0, 37.0, 19.0, 28.0, 17.0, 17.0, 19.0, 17.0, 16.0, 14.0, 16.0, 10.0, 7.0, 10.0, 4.0, 13.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.0007399916648864746, -0.0007141800597310066, -0.0006883684545755386, -0.0006625568494200706, -0.0006367452442646027, -0.0006109336391091347, -0.0005851220339536667, -0.0005593104287981987, -0.0005334988236427307, -0.0005076872184872627, -0.00048187561333179474, -0.00045606400817632675, -0.00043025240302085876, -0.0004044407978653908, -0.0003786291927099228, -0.0003528175875544548, -0.0003270059823989868, -0.00030119437724351883, -0.00027538277208805084, -0.00024957116693258286, -0.00022375956177711487, -0.00019794795662164688, -0.0001721363514661789, -0.0001463247463107109, -0.00012051314115524292, -9.470153599977493e-05, -6.888993084430695e-05, -4.307832568883896e-05, -1.726672053337097e-05, 8.544884622097015e-06, 3.4356489777565e-05, 6.016809493303299e-05, 8.597970008850098e-05, 0.00011179130524396896, 0.00013760291039943695, 0.00016341451555490494, 0.00018922612071037292, 0.0002150377258658409, 0.0002408493310213089, 0.0002666609361767769, 0.0002924725413322449, 0.00031828414648771286, 0.00034409575164318085, 0.00036990735679864883, 0.0003957189619541168, 0.0004215305671095848, 0.0004473421722650528, 0.0004731537774205208, 0.0004989653825759888, 0.0005247769877314568, 0.0005505885928869247, 0.0005764001980423927, 0.0006022118031978607, 0.0006280234083533287, 0.0006538350135087967, 0.0006796466186642647, 0.0007054582238197327, 0.0007312698289752007, 0.0007570814341306686, 0.0007828930392861366, 0.0008087046444416046, 0.0008345162495970726, 0.0008603278547525406, 0.0008861394599080086, 0.0009119510650634766]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 5.0, 3.0, 1.0, 4.0, 10.0, 10.0, 16.0, 13.0, 15.0, 10.0, 22.0, 25.0, 32.0, 28.0, 33.0, 36.0, 41.0, 43.0, 45.0, 46.0, 37.0, 40.0, 41.0, 36.0, 40.0, 42.0, 39.0, 33.0, 42.0, 32.0, 28.0, 31.0, 18.0, 22.0, 23.0, 20.0, 14.0, 17.0, 1.0, 2.0, 3.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.15625, -3.05645751953125, -2.9566650390625, -2.85687255859375, -2.757080078125, -2.65728759765625, -2.5574951171875, -2.45770263671875, -2.35791015625, -2.25811767578125, -2.1583251953125, -2.05853271484375, -1.958740234375, -1.85894775390625, -1.7591552734375, -1.65936279296875, -1.5595703125, -1.45977783203125, -1.3599853515625, -1.26019287109375, -1.160400390625, -1.06060791015625, -0.9608154296875, -0.86102294921875, -0.76123046875, -0.66143798828125, -0.5616455078125, -0.46185302734375, -0.362060546875, -0.26226806640625, -0.1624755859375, -0.06268310546875, 0.037109375, 0.13690185546875, 0.2366943359375, 0.33648681640625, 0.436279296875, 0.53607177734375, 0.6358642578125, 0.73565673828125, 0.83544921875, 0.93524169921875, 1.0350341796875, 1.13482666015625, 1.234619140625, 1.33441162109375, 1.4342041015625, 1.53399658203125, 1.6337890625, 1.73358154296875, 1.8333740234375, 1.93316650390625, 2.032958984375, 2.13275146484375, 2.2325439453125, 2.33233642578125, 2.43212890625, 2.53192138671875, 2.6317138671875, 2.73150634765625, 2.831298828125, 2.93109130859375, 3.0308837890625, 3.13067626953125, 3.23046875]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 8.0, 6.0, 22.0, 26.0, 39.0, 40.0, 66.0, 83.0, 136.0, 174.0, 233.0, 374.0, 496.0, 639.0, 911.0, 1252.0, 1952.0, 3124.0, 5805.0, 12585.0, 33614.0, 102331.0, 284972.0, 361312.0, 152133.0, 50003.0, 17516.0, 7407.0, 3821.0, 2269.0, 1509.0, 1005.0, 733.0, 543.0, 393.0, 311.0, 192.0, 160.0, 102.0, 80.0, 59.0, 34.0, 22.0, 28.0, 16.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-2.283203125, -2.207550048828125, -2.13189697265625, -2.056243896484375, -1.9805908203125, -1.904937744140625, -1.82928466796875, -1.753631591796875, -1.677978515625, -1.602325439453125, -1.52667236328125, -1.451019287109375, -1.3753662109375, -1.299713134765625, -1.22406005859375, -1.148406982421875, -1.07275390625, -0.997100830078125, -0.92144775390625, -0.845794677734375, -0.7701416015625, -0.694488525390625, -0.61883544921875, -0.543182373046875, -0.467529296875, -0.391876220703125, -0.31622314453125, -0.240570068359375, -0.1649169921875, -0.089263916015625, -0.01361083984375, 0.062042236328125, 0.1376953125, 0.213348388671875, 0.28900146484375, 0.364654541015625, 0.4403076171875, 0.515960693359375, 0.59161376953125, 0.667266845703125, 0.742919921875, 0.818572998046875, 0.89422607421875, 0.969879150390625, 1.0455322265625, 1.121185302734375, 1.19683837890625, 1.272491455078125, 1.34814453125, 1.423797607421875, 1.49945068359375, 1.575103759765625, 1.6507568359375, 1.726409912109375, 1.80206298828125, 1.877716064453125, 1.953369140625, 2.029022216796875, 2.10467529296875, 2.180328369140625, 2.2559814453125, 2.331634521484375, 2.40728759765625, 2.482940673828125, 2.55859375]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 5.0, 5.0, 5.0, 6.0, 9.0, 10.0, 15.0, 9.0, 17.0, 18.0, 26.0, 13.0, 16.0, 25.0, 32.0, 38.0, 25.0, 31.0, 40.0, 47.0, 54.0, 107.0, 341.0, 1505.0, 158.0, 69.0, 46.0, 47.0, 34.0, 28.0, 27.0, 34.0, 32.0, 29.0, 16.0, 14.0, 18.0, 14.0, 9.0, 13.0, 11.0, 14.0, 6.0, 4.0, 7.0, 2.0, 6.0, 5.0, 2.0, 2.0, 1.0, 1.0, 2.0], "bins": [-10.5625, -10.25390625, -9.9453125, -9.63671875, -9.328125, -9.01953125, -8.7109375, -8.40234375, -8.09375, -7.78515625, -7.4765625, -7.16796875, -6.859375, -6.55078125, -6.2421875, -5.93359375, -5.625, -5.31640625, -5.0078125, -4.69921875, -4.390625, -4.08203125, -3.7734375, -3.46484375, -3.15625, -2.84765625, -2.5390625, -2.23046875, -1.921875, -1.61328125, -1.3046875, -0.99609375, -0.6875, -0.37890625, -0.0703125, 0.23828125, 0.546875, 0.85546875, 1.1640625, 1.47265625, 1.78125, 2.08984375, 2.3984375, 2.70703125, 3.015625, 3.32421875, 3.6328125, 3.94140625, 4.25, 4.55859375, 4.8671875, 5.17578125, 5.484375, 5.79296875, 6.1015625, 6.41015625, 6.71875, 7.02734375, 7.3359375, 7.64453125, 7.953125, 8.26171875, 8.5703125, 8.87890625, 9.1875]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 1.0, 11.0, 10.0, 23.0, 29.0, 34.0, 69.0, 137.0, 335.0, 1004.0, 6039.0, 3059236.0, 75497.0, 2225.0, 568.0, 233.0, 94.0, 53.0, 41.0, 24.0, 21.0, 15.0, 7.0, 2.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.0, -32.77587890625, -31.5517578125, -30.32763671875, -29.103515625, -27.87939453125, -26.6552734375, -25.43115234375, -24.20703125, -22.98291015625, -21.7587890625, -20.53466796875, -19.310546875, -18.08642578125, -16.8623046875, -15.63818359375, -14.4140625, -13.18994140625, -11.9658203125, -10.74169921875, -9.517578125, -8.29345703125, -7.0693359375, -5.84521484375, -4.62109375, -3.39697265625, -2.1728515625, -0.94873046875, 0.275390625, 1.49951171875, 2.7236328125, 3.94775390625, 5.171875, 6.39599609375, 7.6201171875, 8.84423828125, 10.068359375, 11.29248046875, 12.5166015625, 13.74072265625, 14.96484375, 16.18896484375, 17.4130859375, 18.63720703125, 19.861328125, 21.08544921875, 22.3095703125, 23.53369140625, 24.7578125, 25.98193359375, 27.2060546875, 28.43017578125, 29.654296875, 30.87841796875, 32.1025390625, 33.32666015625, 34.55078125, 35.77490234375, 36.9990234375, 38.22314453125, 39.447265625, 40.67138671875, 41.8955078125, 43.11962890625, 44.34375]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 110.0, 804.0, 96.0, 4.0, 2.0, 1.0], "bins": [-277.0393371582031, -272.3788146972656, -267.7182922363281, -263.0577697753906, -258.3972473144531, -253.7367401123047, -249.0762176513672, -244.41571044921875, -239.75518798828125, -235.09466552734375, -230.43414306640625, -225.7736358642578, -221.1131134033203, -216.4525909423828, -211.7920684814453, -207.13156127929688, -202.47103881835938, -197.81051635742188, -193.14999389648438, -188.48948669433594, -183.82896423339844, -179.16844177246094, -174.50791931152344, -169.847412109375, -165.18687438964844, -160.52635192871094, -155.86582946777344, -151.205322265625, -146.5447998046875, -141.88427734375, -137.2237548828125, -132.563232421875, -127.9027099609375, -123.2421875, -118.58167266845703, -113.92115020751953, -109.26063537597656, -104.60011291503906, -99.93959045410156, -95.2790756225586, -90.61856079101562, -85.95803833007812, -81.29752349853516, -76.63700103759766, -71.97648620605469, -67.31596374511719, -62.65544509887695, -57.99492645263672, -53.33440399169922, -48.673885345458984, -44.01336669921875, -39.35284423828125, -34.69232940673828, -30.031808853149414, -25.371288299560547, -20.710769653320312, -16.05025291442871, -11.389734268188477, -6.729214668273926, -2.068695068359375, 2.5918235778808594, 7.252342224121094, 11.912862777709961, 16.573381423950195, 21.23390007019043]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 1.0, 5.0, 6.0, 6.0, 7.0, 6.0, 13.0, 10.0, 14.0, 7.0, 19.0, 21.0, 17.0, 19.0, 25.0, 33.0, 38.0, 41.0, 39.0, 32.0, 41.0, 39.0, 34.0, 40.0, 31.0, 40.0, 39.0, 35.0, 38.0, 38.0, 36.0, 27.0, 19.0, 15.0, 26.0, 31.0, 18.0, 14.0, 17.0, 16.0, 6.0, 10.0, 4.0, 6.0, 2.0, 6.0, 3.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-32.61052322387695, -31.530698776245117, -30.45087432861328, -29.371047973632812, -28.291223526000977, -27.21139907836914, -26.131572723388672, -25.051748275756836, -23.971923828125, -22.892099380493164, -21.812274932861328, -20.73244857788086, -19.652624130249023, -18.572799682617188, -17.49297332763672, -16.413148880004883, -15.333324432373047, -14.253499984741211, -13.173674583435059, -12.093849182128906, -11.01402473449707, -9.934200286865234, -8.854374885559082, -7.774549961090088, -6.694725036621094, -5.6149001121521, -4.5350751876831055, -3.4552502632141113, -2.375425338745117, -1.295600414276123, -0.2157754898071289, 0.8640494346618652, 1.943878173828125, 3.023703098297119, 4.103528022766113, 5.183352947235107, 6.263177871704102, 7.343002796173096, 8.42282772064209, 9.502653121948242, 10.582477569580078, 11.662302017211914, 12.742127418518066, 13.821952819824219, 14.901777267456055, 15.98160171508789, 17.06142807006836, 18.141252517700195, 19.22107696533203, 20.300901412963867, 21.380725860595703, 22.460552215576172, 23.540376663208008, 24.620201110839844, 25.700027465820312, 26.77985191345215, 27.859676361083984, 28.93950080871582, 30.019325256347656, 31.099151611328125, 32.178977966308594, 33.2588005065918, 34.338626861572266, 35.41844940185547, 36.49827575683594]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 5.0, 2.0, 7.0, 5.0, 13.0, 15.0, 8.0, 21.0, 13.0, 23.0, 24.0, 33.0, 37.0, 36.0, 40.0, 40.0, 47.0, 44.0, 58.0, 43.0, 39.0, 44.0, 38.0, 43.0, 44.0, 32.0, 35.0, 36.0, 27.0, 33.0, 38.0, 24.0, 13.0, 15.0, 12.0, 9.0, 1.0, 4.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.66015625, -3.54852294921875, -3.4368896484375, -3.32525634765625, -3.213623046875, -3.10198974609375, -2.9903564453125, -2.87872314453125, -2.76708984375, -2.65545654296875, -2.5438232421875, -2.43218994140625, -2.320556640625, -2.20892333984375, -2.0972900390625, -1.98565673828125, -1.8740234375, -1.76239013671875, -1.6507568359375, -1.53912353515625, -1.427490234375, -1.31585693359375, -1.2042236328125, -1.09259033203125, -0.98095703125, -0.86932373046875, -0.7576904296875, -0.64605712890625, -0.534423828125, -0.42279052734375, -0.3111572265625, -0.19952392578125, -0.087890625, 0.02374267578125, 0.1353759765625, 0.24700927734375, 0.358642578125, 0.47027587890625, 0.5819091796875, 0.69354248046875, 0.80517578125, 0.91680908203125, 1.0284423828125, 1.14007568359375, 1.251708984375, 1.36334228515625, 1.4749755859375, 1.58660888671875, 1.6982421875, 1.80987548828125, 1.9215087890625, 2.03314208984375, 2.144775390625, 2.25640869140625, 2.3680419921875, 2.47967529296875, 2.59130859375, 2.70294189453125, 2.8145751953125, 2.92620849609375, 3.037841796875, 3.14947509765625, 3.2611083984375, 3.37274169921875, 3.484375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 4.0, 4.0, 2.0, 3.0, 8.0, 4.0, 6.0, 9.0, 7.0, 7.0, 11.0, 18.0, 23.0, 38.0, 53.0, 73.0, 164.0, 253.0, 455.0, 792.0, 1454.0, 2671.0, 5566.0, 12474.0, 34079.0, 129748.0, 929773.0, 2349907.0, 588318.0, 91753.0, 26695.0, 10305.0, 4646.0, 2204.0, 1208.0, 630.0, 353.0, 199.0, 118.0, 90.0, 51.0, 35.0, 15.0, 14.0, 13.0, 13.0, 11.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-6.43359375, -6.22186279296875, -6.0101318359375, -5.79840087890625, -5.586669921875, -5.37493896484375, -5.1632080078125, -4.95147705078125, -4.73974609375, -4.52801513671875, -4.3162841796875, -4.10455322265625, -3.892822265625, -3.68109130859375, -3.4693603515625, -3.25762939453125, -3.0458984375, -2.83416748046875, -2.6224365234375, -2.41070556640625, -2.198974609375, -1.98724365234375, -1.7755126953125, -1.56378173828125, -1.35205078125, -1.14031982421875, -0.9285888671875, -0.71685791015625, -0.505126953125, -0.29339599609375, -0.0816650390625, 0.13006591796875, 0.341796875, 0.55352783203125, 0.7652587890625, 0.97698974609375, 1.188720703125, 1.40045166015625, 1.6121826171875, 1.82391357421875, 2.03564453125, 2.24737548828125, 2.4591064453125, 2.67083740234375, 2.882568359375, 3.09429931640625, 3.3060302734375, 3.51776123046875, 3.7294921875, 3.94122314453125, 4.1529541015625, 4.36468505859375, 4.576416015625, 4.78814697265625, 4.9998779296875, 5.21160888671875, 5.42333984375, 5.63507080078125, 5.8468017578125, 6.05853271484375, 6.270263671875, 6.48199462890625, 6.6937255859375, 6.90545654296875, 7.1171875]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 17.0, 15.0, 24.0, 28.0, 53.0, 59.0, 88.0, 119.0, 222.0, 305.0, 445.0, 636.0, 647.0, 476.0, 323.0, 207.0, 134.0, 90.0, 62.0, 37.0, 33.0, 13.0, 6.0, 11.0, 5.0, 7.0, 4.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.9921875, -9.65966796875, -9.3271484375, -8.99462890625, -8.662109375, -8.32958984375, -7.9970703125, -7.66455078125, -7.33203125, -6.99951171875, -6.6669921875, -6.33447265625, -6.001953125, -5.66943359375, -5.3369140625, -5.00439453125, -4.671875, -4.33935546875, -4.0068359375, -3.67431640625, -3.341796875, -3.00927734375, -2.6767578125, -2.34423828125, -2.01171875, -1.67919921875, -1.3466796875, -1.01416015625, -0.681640625, -0.34912109375, -0.0166015625, 0.31591796875, 0.6484375, 0.98095703125, 1.3134765625, 1.64599609375, 1.978515625, 2.31103515625, 2.6435546875, 2.97607421875, 3.30859375, 3.64111328125, 3.9736328125, 4.30615234375, 4.638671875, 4.97119140625, 5.3037109375, 5.63623046875, 5.96875, 6.30126953125, 6.6337890625, 6.96630859375, 7.298828125, 7.63134765625, 7.9638671875, 8.29638671875, 8.62890625, 8.96142578125, 9.2939453125, 9.62646484375, 9.958984375, 10.29150390625, 10.6240234375, 10.95654296875, 11.2890625]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 6.0, 10.0, 14.0, 23.0, 27.0, 54.0, 82.0, 142.0, 254.0, 546.0, 1257.0, 3421.0, 10706.0, 41511.0, 272756.0, 2860162.0, 887979.0, 87783.0, 18737.0, 5349.0, 1931.0, 716.0, 322.0, 192.0, 101.0, 68.0, 41.0, 30.0, 16.0, 24.0, 4.0, 7.0, 5.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.6796875, -14.201904296875, -13.72412109375, -13.246337890625, -12.7685546875, -12.290771484375, -11.81298828125, -11.335205078125, -10.857421875, -10.379638671875, -9.90185546875, -9.424072265625, -8.9462890625, -8.468505859375, -7.99072265625, -7.512939453125, -7.03515625, -6.557373046875, -6.07958984375, -5.601806640625, -5.1240234375, -4.646240234375, -4.16845703125, -3.690673828125, -3.212890625, -2.735107421875, -2.25732421875, -1.779541015625, -1.3017578125, -0.823974609375, -0.34619140625, 0.131591796875, 0.609375, 1.087158203125, 1.56494140625, 2.042724609375, 2.5205078125, 2.998291015625, 3.47607421875, 3.953857421875, 4.431640625, 4.909423828125, 5.38720703125, 5.864990234375, 6.3427734375, 6.820556640625, 7.29833984375, 7.776123046875, 8.25390625, 8.731689453125, 9.20947265625, 9.687255859375, 10.1650390625, 10.642822265625, 11.12060546875, 11.598388671875, 12.076171875, 12.553955078125, 13.03173828125, 13.509521484375, 13.9873046875, 14.465087890625, 14.94287109375, 15.420654296875, 15.8984375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 6.0, 4.0, 10.0, 12.0, 19.0, 21.0, 29.0, 29.0, 58.0, 67.0, 81.0, 83.0, 89.0, 91.0, 92.0, 57.0, 56.0, 62.0, 42.0, 30.0, 25.0, 13.0, 7.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-33.387962341308594, -32.34501266479492, -31.30206298828125, -30.259113311767578, -29.216163635253906, -28.173213958740234, -27.130264282226562, -26.08731460571289, -25.04436492919922, -24.001415252685547, -22.958465576171875, -21.915515899658203, -20.87256622314453, -19.82961654663086, -18.786666870117188, -17.743717193603516, -16.70076560974121, -15.657815933227539, -14.614866256713867, -13.571916580200195, -12.528966903686523, -11.486017227172852, -10.443066596984863, -9.400116920471191, -8.35716724395752, -7.314217567443848, -6.271267890930176, -5.228317737579346, -4.185368061065674, -3.142418384552002, -2.099468231201172, -1.0565185546875, -0.013568878173828125, 1.0293809175491333, 2.0723307132720947, 3.1152806282043457, 4.158230304718018, 5.2011799812316895, 6.2441301345825195, 7.287079811096191, 8.330029487609863, 9.372979164123535, 10.415928840637207, 11.458879470825195, 12.501829147338867, 13.544778823852539, 14.587728500366211, 15.630678176879883, 16.673627853393555, 17.716577529907227, 18.7595272064209, 19.80247688293457, 20.845426559448242, 21.888376235961914, 22.93132781982422, 23.97427749633789, 25.017227172851562, 26.060176849365234, 27.103126525878906, 28.146076202392578, 29.18902587890625, 30.231975555419922, 31.274925231933594, 32.317874908447266, 33.36082458496094]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 8.0, 5.0, 6.0, 13.0, 15.0, 19.0, 28.0, 19.0, 28.0, 30.0, 26.0, 26.0, 30.0, 44.0, 41.0, 49.0, 47.0, 48.0, 52.0, 46.0, 45.0, 39.0, 38.0, 44.0, 36.0, 27.0, 36.0, 26.0, 20.0, 15.0, 21.0, 22.0, 14.0, 11.0, 10.0, 9.0, 1.0, 2.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.460285186767578, -29.486406326293945, -28.51252555847168, -27.538646697998047, -26.56476593017578, -25.59088706970215, -24.617008209228516, -23.64312744140625, -22.669248580932617, -21.695369720458984, -20.72148895263672, -19.747610092163086, -18.77372932434082, -17.799850463867188, -16.825969696044922, -15.852090835571289, -14.87821102142334, -13.90433120727539, -12.930451393127441, -11.956571578979492, -10.98269271850586, -10.00881290435791, -9.034933090209961, -8.061054229736328, -7.087173938751221, -6.1132941246032715, -5.1394147872924805, -4.165534973144531, -3.191655397415161, -2.217775821685791, -1.2438960075378418, -0.2700166702270508, 0.7038631439208984, 1.6777427196502686, 2.6516222953796387, 3.625502109527588, 4.599381446838379, 5.573261260986328, 6.547141075134277, 7.521020412445068, 8.49489974975586, 9.468779563903809, 10.442659378051758, 11.41653823852539, 12.39041805267334, 13.364297866821289, 14.338177680969238, 15.312057495117188, 16.285938262939453, 17.259817123413086, 18.23369789123535, 19.207576751708984, 20.18145751953125, 21.155336380004883, 22.129215240478516, 23.10309600830078, 24.076974868774414, 25.050853729248047, 26.024734497070312, 26.998613357543945, 27.97249412536621, 28.946372985839844, 29.92025375366211, 30.894132614135742, 31.868011474609375]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 2.0, 7.0, 5.0, 10.0, 10.0, 18.0, 8.0, 15.0, 16.0, 15.0, 25.0, 36.0, 34.0, 35.0, 28.0, 41.0, 39.0, 42.0, 49.0, 42.0, 50.0, 46.0, 41.0, 44.0, 45.0, 29.0, 34.0, 22.0, 33.0, 33.0, 27.0, 20.0, 25.0, 16.0, 17.0, 14.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.697265625, -3.58966064453125, -3.4820556640625, -3.37445068359375, -3.266845703125, -3.15924072265625, -3.0516357421875, -2.94403076171875, -2.83642578125, -2.72882080078125, -2.6212158203125, -2.51361083984375, -2.406005859375, -2.29840087890625, -2.1907958984375, -2.08319091796875, -1.9755859375, -1.86798095703125, -1.7603759765625, -1.65277099609375, -1.545166015625, -1.43756103515625, -1.3299560546875, -1.22235107421875, -1.11474609375, -1.00714111328125, -0.8995361328125, -0.79193115234375, -0.684326171875, -0.57672119140625, -0.4691162109375, -0.36151123046875, -0.25390625, -0.14630126953125, -0.0386962890625, 0.06890869140625, 0.176513671875, 0.28411865234375, 0.3917236328125, 0.49932861328125, 0.60693359375, 0.71453857421875, 0.8221435546875, 0.92974853515625, 1.037353515625, 1.14495849609375, 1.2525634765625, 1.36016845703125, 1.4677734375, 1.57537841796875, 1.6829833984375, 1.79058837890625, 1.898193359375, 2.00579833984375, 2.1134033203125, 2.22100830078125, 2.32861328125, 2.43621826171875, 2.5438232421875, 2.65142822265625, 2.759033203125, 2.86663818359375, 2.9742431640625, 3.08184814453125, 3.189453125]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 4.0, 9.0, 9.0, 11.0, 29.0, 40.0, 49.0, 75.0, 98.0, 160.0, 252.0, 355.0, 614.0, 893.0, 1313.0, 2203.0, 3339.0, 5551.0, 9088.0, 15188.0, 26338.0, 47871.0, 91096.0, 173770.0, 269657.0, 183733.0, 97287.0, 50644.0, 27900.0, 15912.0, 9319.0, 5681.0, 3571.0, 2291.0, 1438.0, 910.0, 608.0, 431.0, 256.0, 170.0, 135.0, 80.0, 53.0, 42.0, 29.0, 17.0, 13.0, 9.0, 7.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-0.392822265625, -0.3799629211425781, -0.36710357666015625, -0.3542442321777344, -0.3413848876953125, -0.3285255432128906, -0.31566619873046875, -0.3028068542480469, -0.289947509765625, -0.2770881652832031, -0.26422882080078125, -0.2513694763183594, -0.2385101318359375, -0.22565078735351562, -0.21279144287109375, -0.19993209838867188, -0.18707275390625, -0.17421340942382812, -0.16135406494140625, -0.14849472045898438, -0.1356353759765625, -0.12277603149414062, -0.10991668701171875, -0.09705734252929688, -0.084197998046875, -0.07133865356445312, -0.05847930908203125, -0.045619964599609375, -0.0327606201171875, -0.019901275634765625, -0.00704193115234375, 0.005817413330078125, 0.0186767578125, 0.031536102294921875, 0.04439544677734375, 0.057254791259765625, 0.0701141357421875, 0.08297348022460938, 0.09583282470703125, 0.10869216918945312, 0.121551513671875, 0.13441085815429688, 0.14727020263671875, 0.16012954711914062, 0.1729888916015625, 0.18584823608398438, 0.19870758056640625, 0.21156692504882812, 0.22442626953125, 0.23728561401367188, 0.25014495849609375, 0.2630043029785156, 0.2758636474609375, 0.2887229919433594, 0.30158233642578125, 0.3144416809082031, 0.327301025390625, 0.3401603698730469, 0.35301971435546875, 0.3658790588378906, 0.3787384033203125, 0.3915977478027344, 0.40445709228515625, 0.4173164367675781, 0.43017578125]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 1.0, 5.0, 5.0, 5.0, 9.0, 7.0, 13.0, 10.0, 14.0, 29.0, 14.0, 21.0, 24.0, 26.0, 37.0, 40.0, 31.0, 47.0, 37.0, 45.0, 31.0, 1069.0, 41.0, 51.0, 46.0, 41.0, 36.0, 35.0, 28.0, 33.0, 41.0, 27.0, 22.0, 20.0, 18.0, 20.0, 11.0, 9.0, 6.0, 4.0, 7.0, 7.0, 3.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.31640625, -2.246551513671875, -2.17669677734375, -2.106842041015625, -2.0369873046875, -1.967132568359375, -1.89727783203125, -1.827423095703125, -1.757568359375, -1.687713623046875, -1.61785888671875, -1.548004150390625, -1.4781494140625, -1.408294677734375, -1.33843994140625, -1.268585205078125, -1.19873046875, -1.128875732421875, -1.05902099609375, -0.989166259765625, -0.9193115234375, -0.849456787109375, -0.77960205078125, -0.709747314453125, -0.639892578125, -0.570037841796875, -0.50018310546875, -0.430328369140625, -0.3604736328125, -0.290618896484375, -0.22076416015625, -0.150909423828125, -0.0810546875, -0.011199951171875, 0.05865478515625, 0.128509521484375, 0.1983642578125, 0.268218994140625, 0.33807373046875, 0.407928466796875, 0.477783203125, 0.547637939453125, 0.61749267578125, 0.687347412109375, 0.7572021484375, 0.827056884765625, 0.89691162109375, 0.966766357421875, 1.03662109375, 1.106475830078125, 1.17633056640625, 1.246185302734375, 1.3160400390625, 1.385894775390625, 1.45574951171875, 1.525604248046875, 1.595458984375, 1.665313720703125, 1.73516845703125, 1.805023193359375, 1.8748779296875, 1.944732666015625, 2.01458740234375, 2.084442138671875, 2.154296875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 12.0, 16.0, 16.0, 29.0, 41.0, 75.0, 102.0, 167.0, 249.0, 398.0, 605.0, 1035.0, 1725.0, 2840.0, 4802.0, 8145.0, 14278.0, 24605.0, 43268.0, 78892.0, 149709.0, 1293938.0, 214291.0, 114580.0, 61325.0, 34089.0, 19551.0, 11529.0, 6696.0, 4059.0, 2367.0, 1397.0, 893.0, 497.0, 322.0, 204.0, 143.0, 92.0, 44.0, 28.0, 25.0, 17.0, 8.0, 10.0, 6.0, 2.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.314453125, -0.3042411804199219, -0.29402923583984375, -0.2838172912597656, -0.2736053466796875, -0.2633934020996094, -0.25318145751953125, -0.24296951293945312, -0.232757568359375, -0.22254562377929688, -0.21233367919921875, -0.20212173461914062, -0.1919097900390625, -0.18169784545898438, -0.17148590087890625, -0.16127395629882812, -0.15106201171875, -0.14085006713867188, -0.13063812255859375, -0.12042617797851562, -0.1102142333984375, -0.10000228881835938, -0.08979034423828125, -0.07957839965820312, -0.069366455078125, -0.059154510498046875, -0.04894256591796875, -0.038730621337890625, -0.0285186767578125, -0.018306732177734375, -0.00809478759765625, 0.002117156982421875, 0.0123291015625, 0.022541046142578125, 0.03275299072265625, 0.042964935302734375, 0.0531768798828125, 0.06338882446289062, 0.07360076904296875, 0.08381271362304688, 0.094024658203125, 0.10423660278320312, 0.11444854736328125, 0.12466049194335938, 0.1348724365234375, 0.14508438110351562, 0.15529632568359375, 0.16550827026367188, 0.17572021484375, 0.18593215942382812, 0.19614410400390625, 0.20635604858398438, 0.2165679931640625, 0.22677993774414062, 0.23699188232421875, 0.24720382690429688, 0.257415771484375, 0.2676277160644531, 0.27783966064453125, 0.2880516052246094, 0.2982635498046875, 0.3084754943847656, 0.31868743896484375, 0.3288993835449219, 0.339111328125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 5.0, 4.0, 2.0, 9.0, 11.0, 11.0, 14.0, 20.0, 13.0, 42.0, 40.0, 43.0, 57.0, 56.0, 79.0, 96.0, 90.0, 87.0, 62.0, 47.0, 52.0, 21.0, 29.0, 19.0, 17.0, 9.0, 6.0, 12.0, 5.0, 9.0, 6.0, 1.0, 3.0, 3.0, 4.0, 2.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002574920654296875, -0.0025003254413604736, -0.0024257302284240723, -0.002351135015487671, -0.0022765398025512695, -0.002201944589614868, -0.002127349376678467, -0.0020527541637420654, -0.001978158950805664, -0.0019035637378692627, -0.0018289685249328613, -0.00175437331199646, -0.0016797780990600586, -0.0016051828861236572, -0.0015305876731872559, -0.0014559924602508545, -0.0013813972473144531, -0.0013068020343780518, -0.0012322068214416504, -0.001157611608505249, -0.0010830163955688477, -0.0010084211826324463, -0.0009338259696960449, -0.0008592307567596436, -0.0007846355438232422, -0.0007100403308868408, -0.0006354451179504395, -0.0005608499050140381, -0.0004862546920776367, -0.00041165947914123535, -0.000337064266204834, -0.0002624690532684326, -0.00018787384033203125, -0.00011327862739562988, -3.8683414459228516e-05, 3.591179847717285e-05, 0.00011050701141357422, 0.00018510222434997559, 0.00025969743728637695, 0.0003342926502227783, 0.0004088878631591797, 0.00048348307609558105, 0.0005580782890319824, 0.0006326735019683838, 0.0007072687149047852, 0.0007818639278411865, 0.0008564591407775879, 0.0009310543537139893, 0.0010056495666503906, 0.001080244779586792, 0.0011548399925231934, 0.0012294352054595947, 0.001304030418395996, 0.0013786256313323975, 0.0014532208442687988, 0.0015278160572052002, 0.0016024112701416016, 0.001677006483078003, 0.0017516016960144043, 0.0018261969089508057, 0.001900792121887207, 0.0019753873348236084, 0.0020499825477600098, 0.002124577760696411, 0.0021991729736328125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 5.0, 5.0, 2.0, 5.0, 7.0, 5.0, 10.0, 10.0, 10.0, 16.0, 14.0, 22.0, 29.0, 39.0, 55.0, 63.0, 86.0, 110.0, 155.0, 272.0, 567.0, 2550.0, 49738.0, 953243.0, 37940.0, 2175.0, 522.0, 254.0, 179.0, 100.0, 94.0, 71.0, 53.0, 32.0, 23.0, 25.0, 14.0, 16.0, 12.0, 11.0, 9.0, 3.0, 4.0, 1.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.0306854248046875, -0.0295259952545166, -0.028366565704345703, -0.027207136154174805, -0.026047706604003906, -0.024888277053833008, -0.02372884750366211, -0.02256941795349121, -0.021409988403320312, -0.020250558853149414, -0.019091129302978516, -0.017931699752807617, -0.01677227020263672, -0.01561284065246582, -0.014453411102294922, -0.013293981552124023, -0.012134552001953125, -0.010975122451782227, -0.009815692901611328, -0.00865626335144043, -0.007496833801269531, -0.006337404251098633, -0.005177974700927734, -0.004018545150756836, -0.0028591156005859375, -0.001699686050415039, -0.0005402565002441406, 0.0006191730499267578, 0.0017786026000976562, 0.0029380321502685547, 0.004097461700439453, 0.0052568912506103516, 0.00641632080078125, 0.0075757503509521484, 0.008735179901123047, 0.009894609451293945, 0.011054039001464844, 0.012213468551635742, 0.01337289810180664, 0.014532327651977539, 0.015691757202148438, 0.016851186752319336, 0.018010616302490234, 0.019170045852661133, 0.02032947540283203, 0.02148890495300293, 0.022648334503173828, 0.023807764053344727, 0.024967193603515625, 0.026126623153686523, 0.027286052703857422, 0.02844548225402832, 0.02960491180419922, 0.030764341354370117, 0.031923770904541016, 0.033083200454711914, 0.03424263000488281, 0.03540205955505371, 0.03656148910522461, 0.03772091865539551, 0.038880348205566406, 0.040039777755737305, 0.0411992073059082, 0.0423586368560791, 0.04351806640625]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 49.0, 611.0, 339.0, 19.0, 2.0], "bins": [-0.029197389259934425, -0.02871725521981716, -0.028237121179699898, -0.027756987139582634, -0.02727685309946537, -0.026796719059348106, -0.026316583156585693, -0.02583644911646843, -0.025356315076351166, -0.024876181036233902, -0.024396046996116638, -0.023915912955999374, -0.02343577891588211, -0.022955644875764847, -0.022475510835647583, -0.02199537679553032, -0.021515242755413055, -0.02103510871529579, -0.020554974675178528, -0.020074840635061264, -0.019594706594944, -0.019114572554826736, -0.018634438514709473, -0.01815430447459221, -0.017674168571829796, -0.017194034531712532, -0.016713900491595268, -0.016233766451478004, -0.01575363241136074, -0.015273497439920902, -0.014793363399803638, -0.014313229359686375, -0.013833094388246536, -0.013352960348129272, -0.012872826308012009, -0.012392692267894745, -0.011912557296454906, -0.011432423256337643, -0.010952289216220379, -0.010472155176103115, -0.009992021135985851, -0.009511887095868587, -0.009031753055751324, -0.008551618084311485, -0.008071484044194221, -0.007591350004076958, -0.007111215963959694, -0.00663108192384243, -0.006150947883725166, -0.0056708138436079025, -0.005190679337829351, -0.004710545297712088, -0.004230411257594824, -0.0037502769846469164, -0.003270142711699009, -0.002790008671581745, -0.0023098743986338377, -0.001829740242101252, -0.0013496060855686665, -0.000869471812620759, -0.0003893376560881734, 9.079650044441223e-05, 0.0005709307733923197, 0.0010510648135095835, 0.001531199086457491]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 7.0, 2.0, 5.0, 2.0, 4.0, 8.0, 7.0, 20.0, 17.0, 22.0, 30.0, 35.0, 31.0, 28.0, 37.0, 41.0, 37.0, 48.0, 50.0, 40.0, 57.0, 59.0, 37.0, 43.0, 35.0, 46.0, 32.0, 44.0, 29.0, 28.0, 25.0, 16.0, 24.0, 12.0, 16.0, 12.0, 4.0, 6.0, 9.0, 3.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0009323954582214355, -0.0008912673220038414, -0.0008501391857862473, -0.0008090110495686531, -0.000767882913351059, -0.0007267547771334648, -0.0006856266409158707, -0.0006444985046982765, -0.0006033703684806824, -0.0005622422322630882, -0.0005211140960454941, -0.00047998595982789993, -0.0004388578236103058, -0.00039772968739271164, -0.0003566015511751175, -0.00031547341495752335, -0.0002743452787399292, -0.00023321714252233505, -0.0001920890063047409, -0.00015096087008714676, -0.00010983273386955261, -6.870459765195847e-05, -2.757646143436432e-05, 1.3551674783229828e-05, 5.4679811000823975e-05, 9.580794721841812e-05, 0.00013693608343601227, 0.00017806421965360641, 0.00021919235587120056, 0.0002603204920887947, 0.00030144862830638885, 0.000342576764523983, 0.00038370490074157715, 0.0004248330369591713, 0.00046596117317676544, 0.0005070893093943596, 0.0005482174456119537, 0.0005893455818295479, 0.000630473718047142, 0.0006716018542647362, 0.0007127299904823303, 0.0007538581266999245, 0.0007949862629175186, 0.0008361143991351128, 0.0008772425353527069, 0.0009183706715703011, 0.0009594988077878952, 0.0010006269440054893, 0.0010417550802230835, 0.0010828832164406776, 0.0011240113526582718, 0.001165139488875866, 0.00120626762509346, 0.0012473957613110542, 0.0012885238975286484, 0.0013296520337462425, 0.0013707801699638367, 0.0014119083061814308, 0.001453036442399025, 0.0014941645786166191, 0.0015352927148342133, 0.0015764208510518074, 0.0016175489872694016, 0.0016586771234869957, 0.0016998052597045898]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 7.0, 2.0, 7.0, 5.0, 10.0, 10.0, 18.0, 8.0, 15.0, 16.0, 15.0, 25.0, 36.0, 34.0, 35.0, 28.0, 41.0, 39.0, 42.0, 49.0, 42.0, 50.0, 46.0, 41.0, 44.0, 45.0, 30.0, 33.0, 22.0, 33.0, 33.0, 28.0, 19.0, 25.0, 16.0, 17.0, 14.0, 10.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.697265625, -3.58966064453125, -3.4820556640625, -3.37445068359375, -3.266845703125, -3.15924072265625, -3.0516357421875, -2.94403076171875, -2.83642578125, -2.72882080078125, -2.6212158203125, -2.51361083984375, -2.406005859375, -2.29840087890625, -2.1907958984375, -2.08319091796875, -1.9755859375, -1.86798095703125, -1.7603759765625, -1.65277099609375, -1.545166015625, -1.43756103515625, -1.3299560546875, -1.22235107421875, -1.11474609375, -1.00714111328125, -0.8995361328125, -0.79193115234375, -0.684326171875, -0.57672119140625, -0.4691162109375, -0.36151123046875, -0.25390625, -0.14630126953125, -0.0386962890625, 0.06890869140625, 0.176513671875, 0.28411865234375, 0.3917236328125, 0.49932861328125, 0.60693359375, 0.71453857421875, 0.8221435546875, 0.92974853515625, 1.037353515625, 1.14495849609375, 1.2525634765625, 1.36016845703125, 1.4677734375, 1.57537841796875, 1.6829833984375, 1.79058837890625, 1.898193359375, 2.00579833984375, 2.1134033203125, 2.22100830078125, 2.32861328125, 2.43621826171875, 2.5438232421875, 2.65142822265625, 2.759033203125, 2.86663818359375, 2.9742431640625, 3.08184814453125, 3.189453125]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 1.0, 8.0, 7.0, 11.0, 22.0, 19.0, 22.0, 58.0, 71.0, 115.0, 185.0, 252.0, 434.0, 681.0, 1161.0, 1707.0, 2967.0, 4880.0, 8649.0, 17488.0, 44577.0, 156761.0, 548064.0, 172272.0, 47602.0, 18279.0, 9381.0, 4988.0, 2986.0, 1796.0, 1135.0, 688.0, 427.0, 313.0, 196.0, 122.0, 88.0, 45.0, 34.0, 25.0, 15.0, 6.0, 10.0, 6.0, 8.0, 4.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.767578125, -3.625579833984375, -3.48358154296875, -3.341583251953125, -3.1995849609375, -3.057586669921875, -2.91558837890625, -2.773590087890625, -2.631591796875, -2.489593505859375, -2.34759521484375, -2.205596923828125, -2.0635986328125, -1.921600341796875, -1.77960205078125, -1.637603759765625, -1.49560546875, -1.353607177734375, -1.21160888671875, -1.069610595703125, -0.9276123046875, -0.785614013671875, -0.64361572265625, -0.501617431640625, -0.359619140625, -0.217620849609375, -0.07562255859375, 0.066375732421875, 0.2083740234375, 0.350372314453125, 0.49237060546875, 0.634368896484375, 0.7763671875, 0.918365478515625, 1.06036376953125, 1.202362060546875, 1.3443603515625, 1.486358642578125, 1.62835693359375, 1.770355224609375, 1.912353515625, 2.054351806640625, 2.19635009765625, 2.338348388671875, 2.4803466796875, 2.622344970703125, 2.76434326171875, 2.906341552734375, 3.04833984375, 3.190338134765625, 3.33233642578125, 3.474334716796875, 3.6163330078125, 3.758331298828125, 3.90032958984375, 4.042327880859375, 4.184326171875, 4.326324462890625, 4.46832275390625, 4.610321044921875, 4.7523193359375, 4.894317626953125, 5.03631591796875, 5.178314208984375, 5.3203125]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 3.0, 1.0, 3.0, 7.0, 5.0, 7.0, 4.0, 13.0, 16.0, 13.0, 15.0, 19.0, 23.0, 28.0, 21.0, 24.0, 27.0, 44.0, 51.0, 52.0, 53.0, 85.0, 146.0, 1504.0, 293.0, 113.0, 57.0, 53.0, 48.0, 45.0, 31.0, 38.0, 28.0, 31.0, 29.0, 22.0, 17.0, 16.0, 17.0, 6.0, 15.0, 9.0, 4.0, 4.0, 3.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-10.953125, -10.619384765625, -10.28564453125, -9.951904296875, -9.6181640625, -9.284423828125, -8.95068359375, -8.616943359375, -8.283203125, -7.949462890625, -7.61572265625, -7.281982421875, -6.9482421875, -6.614501953125, -6.28076171875, -5.947021484375, -5.61328125, -5.279541015625, -4.94580078125, -4.612060546875, -4.2783203125, -3.944580078125, -3.61083984375, -3.277099609375, -2.943359375, -2.609619140625, -2.27587890625, -1.942138671875, -1.6083984375, -1.274658203125, -0.94091796875, -0.607177734375, -0.2734375, 0.060302734375, 0.39404296875, 0.727783203125, 1.0615234375, 1.395263671875, 1.72900390625, 2.062744140625, 2.396484375, 2.730224609375, 3.06396484375, 3.397705078125, 3.7314453125, 4.065185546875, 4.39892578125, 4.732666015625, 5.06640625, 5.400146484375, 5.73388671875, 6.067626953125, 6.4013671875, 6.735107421875, 7.06884765625, 7.402587890625, 7.736328125, 8.070068359375, 8.40380859375, 8.737548828125, 9.0712890625, 9.405029296875, 9.73876953125, 10.072509765625, 10.40625]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 4.0, 5.0, 5.0, 8.0, 11.0, 11.0, 30.0, 40.0, 23.0, 43.0, 73.0, 94.0, 135.0, 265.0, 563.0, 2463.0, 44890.0, 3055724.0, 37801.0, 2219.0, 525.0, 285.0, 136.0, 80.0, 75.0, 52.0, 41.0, 25.0, 18.0, 17.0, 13.0, 6.0, 8.0, 3.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.9375, -26.95654296875, -25.9755859375, -24.99462890625, -24.013671875, -23.03271484375, -22.0517578125, -21.07080078125, -20.08984375, -19.10888671875, -18.1279296875, -17.14697265625, -16.166015625, -15.18505859375, -14.2041015625, -13.22314453125, -12.2421875, -11.26123046875, -10.2802734375, -9.29931640625, -8.318359375, -7.33740234375, -6.3564453125, -5.37548828125, -4.39453125, -3.41357421875, -2.4326171875, -1.45166015625, -0.470703125, 0.51025390625, 1.4912109375, 2.47216796875, 3.453125, 4.43408203125, 5.4150390625, 6.39599609375, 7.376953125, 8.35791015625, 9.3388671875, 10.31982421875, 11.30078125, 12.28173828125, 13.2626953125, 14.24365234375, 15.224609375, 16.20556640625, 17.1865234375, 18.16748046875, 19.1484375, 20.12939453125, 21.1103515625, 22.09130859375, 23.072265625, 24.05322265625, 25.0341796875, 26.01513671875, 26.99609375, 27.97705078125, 28.9580078125, 29.93896484375, 30.919921875, 31.90087890625, 32.8818359375, 33.86279296875, 34.84375]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 49.0, 411.0, 470.0, 75.0, 9.0, 2.0, 0.0, 1.0], "bins": [-164.82701110839844, -161.98956298828125, -159.152099609375, -156.3146514892578, -153.47720336914062, -150.63975524902344, -147.8022918701172, -144.96484375, -142.1273956298828, -139.28994750976562, -136.45248413085938, -133.6150360107422, -130.777587890625, -127.94013214111328, -125.10267639160156, -122.26522827148438, -119.42777252197266, -116.59031677246094, -113.75286865234375, -110.91541290283203, -108.07796478271484, -105.24050903320312, -102.40306091308594, -99.56560516357422, -96.7281494140625, -93.89069366455078, -91.0532455444336, -88.21578979492188, -85.37834167480469, -82.54088592529297, -79.70343017578125, -76.86598205566406, -74.02853393554688, -71.19107818603516, -68.35363006591797, -65.51617431640625, -62.67872619628906, -59.841270446777344, -57.00381851196289, -54.16636657714844, -51.32891082763672, -48.491458892822266, -45.65400695800781, -42.816551208496094, -39.979103088378906, -37.14164733886719, -34.304195404052734, -31.46674346923828, -28.62929344177246, -25.791841506958008, -22.954387664794922, -20.11693572998047, -17.279483795166016, -14.442031860351562, -11.604578018188477, -8.767126083374023, -5.92967414855957, -3.092221736907959, -0.25476932525634766, 2.582683563232422, 5.420135498046875, 8.257587432861328, 11.095041275024414, 13.932493209838867, 16.76994514465332]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 3.0, 5.0, 2.0, 8.0, 5.0, 8.0, 7.0, 8.0, 8.0, 14.0, 14.0, 17.0, 24.0, 28.0, 17.0, 27.0, 32.0, 37.0, 46.0, 46.0, 39.0, 39.0, 37.0, 39.0, 48.0, 40.0, 34.0, 43.0, 46.0, 36.0, 31.0, 30.0, 29.0, 26.0, 27.0, 17.0, 24.0, 19.0, 10.0, 13.0, 7.0, 3.0, 11.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0], "bins": [-37.04316711425781, -36.027320861816406, -35.011474609375, -33.995628356933594, -32.97978210449219, -31.96393585205078, -30.948089599609375, -29.93224334716797, -28.916397094726562, -27.900550842285156, -26.88470458984375, -25.868858337402344, -24.853012084960938, -23.83716583251953, -22.821319580078125, -21.80547332763672, -20.78962516784668, -19.773778915405273, -18.757932662963867, -17.74208641052246, -16.726240158081055, -15.710393905639648, -14.694546699523926, -13.67870044708252, -12.662854194641113, -11.647007942199707, -10.6311616897583, -9.615314483642578, -8.599468231201172, -7.583622455596924, -6.567775726318359, -5.551929473876953, -4.536083221435547, -3.5202369689941406, -2.5043904781341553, -1.48854398727417, -0.47269773483276367, 0.5431485176086426, 1.558995246887207, 2.5748414993286133, 3.5906877517700195, 4.606534004211426, 5.622380256652832, 6.6382269859313965, 7.654073238372803, 8.669919967651367, 9.685766220092773, 10.70161247253418, 11.717458724975586, 12.733304977416992, 13.749151229858398, 14.764997482299805, 15.780843734741211, 16.796689987182617, 17.812538146972656, 18.828384399414062, 19.84423065185547, 20.860076904296875, 21.87592315673828, 22.891769409179688, 23.907615661621094, 24.9234619140625, 25.939308166503906, 26.955154418945312, 27.97100067138672]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 2.0, 5.0, 3.0, 8.0, 14.0, 10.0, 15.0, 15.0, 19.0, 16.0, 21.0, 27.0, 32.0, 35.0, 38.0, 29.0, 42.0, 34.0, 43.0, 48.0, 50.0, 39.0, 37.0, 58.0, 31.0, 39.0, 33.0, 24.0, 32.0, 32.0, 32.0, 23.0, 26.0, 14.0, 14.0, 20.0, 7.0, 11.0, 8.0, 9.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0], "bins": [-3.80078125, -3.691802978515625, -3.58282470703125, -3.473846435546875, -3.3648681640625, -3.255889892578125, -3.14691162109375, -3.037933349609375, -2.928955078125, -2.819976806640625, -2.71099853515625, -2.602020263671875, -2.4930419921875, -2.384063720703125, -2.27508544921875, -2.166107177734375, -2.05712890625, -1.948150634765625, -1.83917236328125, -1.730194091796875, -1.6212158203125, -1.512237548828125, -1.40325927734375, -1.294281005859375, -1.185302734375, -1.076324462890625, -0.96734619140625, -0.858367919921875, -0.7493896484375, -0.640411376953125, -0.53143310546875, -0.422454833984375, -0.3134765625, -0.204498291015625, -0.09552001953125, 0.013458251953125, 0.1224365234375, 0.231414794921875, 0.34039306640625, 0.449371337890625, 0.558349609375, 0.667327880859375, 0.77630615234375, 0.885284423828125, 0.9942626953125, 1.103240966796875, 1.21221923828125, 1.321197509765625, 1.43017578125, 1.539154052734375, 1.64813232421875, 1.757110595703125, 1.8660888671875, 1.975067138671875, 2.08404541015625, 2.193023681640625, 2.302001953125, 2.410980224609375, 2.51995849609375, 2.628936767578125, 2.7379150390625, 2.846893310546875, 2.95587158203125, 3.064849853515625, 3.173828125]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 8.0, 22.0, 21.0, 48.0, 52.0, 84.0, 130.0, 205.0, 346.0, 529.0, 915.0, 1630.0, 2855.0, 5130.0, 9966.0, 21823.0, 61187.0, 263438.0, 1312327.0, 1845509.0, 508169.0, 100672.0, 31620.0, 13289.0, 6421.0, 3312.0, 1883.0, 1074.0, 606.0, 359.0, 208.0, 154.0, 96.0, 59.0, 42.0, 33.0, 14.0, 12.0, 8.0, 7.0, 7.0, 0.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25, -5.07012939453125, -4.8902587890625, -4.71038818359375, -4.530517578125, -4.35064697265625, -4.1707763671875, -3.99090576171875, -3.81103515625, -3.63116455078125, -3.4512939453125, -3.27142333984375, -3.091552734375, -2.91168212890625, -2.7318115234375, -2.55194091796875, -2.3720703125, -2.19219970703125, -2.0123291015625, -1.83245849609375, -1.652587890625, -1.47271728515625, -1.2928466796875, -1.11297607421875, -0.93310546875, -0.75323486328125, -0.5733642578125, -0.39349365234375, -0.213623046875, -0.03375244140625, 0.1461181640625, 0.32598876953125, 0.505859375, 0.68572998046875, 0.8656005859375, 1.04547119140625, 1.225341796875, 1.40521240234375, 1.5850830078125, 1.76495361328125, 1.94482421875, 2.12469482421875, 2.3045654296875, 2.48443603515625, 2.664306640625, 2.84417724609375, 3.0240478515625, 3.20391845703125, 3.3837890625, 3.56365966796875, 3.7435302734375, 3.92340087890625, 4.103271484375, 4.28314208984375, 4.4630126953125, 4.64288330078125, 4.82275390625, 5.00262451171875, 5.1824951171875, 5.36236572265625, 5.542236328125, 5.72210693359375, 5.9019775390625, 6.08184814453125, 6.26171875]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 6.0, 11.0, 10.0, 14.0, 21.0, 25.0, 31.0, 44.0, 82.0, 75.0, 142.0, 207.0, 289.0, 361.0, 475.0, 491.0, 445.0, 370.0, 289.0, 197.0, 145.0, 84.0, 65.0, 49.0, 46.0, 26.0, 14.0, 11.0, 13.0, 8.0, 7.0, 3.0, 7.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0], "bins": [-10.671875, -10.4019775390625, -10.132080078125, -9.8621826171875, -9.59228515625, -9.3223876953125, -9.052490234375, -8.7825927734375, -8.5126953125, -8.2427978515625, -7.972900390625, -7.7030029296875, -7.43310546875, -7.1632080078125, -6.893310546875, -6.6234130859375, -6.353515625, -6.0836181640625, -5.813720703125, -5.5438232421875, -5.27392578125, -5.0040283203125, -4.734130859375, -4.4642333984375, -4.1943359375, -3.9244384765625, -3.654541015625, -3.3846435546875, -3.11474609375, -2.8448486328125, -2.574951171875, -2.3050537109375, -2.03515625, -1.7652587890625, -1.495361328125, -1.2254638671875, -0.95556640625, -0.6856689453125, -0.415771484375, -0.1458740234375, 0.1240234375, 0.3939208984375, 0.663818359375, 0.9337158203125, 1.20361328125, 1.4735107421875, 1.743408203125, 2.0133056640625, 2.283203125, 2.5531005859375, 2.822998046875, 3.0928955078125, 3.36279296875, 3.6326904296875, 3.902587890625, 4.1724853515625, 4.4423828125, 4.7122802734375, 4.982177734375, 5.2520751953125, 5.52197265625, 5.7918701171875, 6.061767578125, 6.3316650390625, 6.6015625]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 4.0, 1.0, 3.0, 5.0, 10.0, 11.0, 23.0, 25.0, 37.0, 63.0, 97.0, 168.0, 309.0, 583.0, 1393.0, 3363.0, 9516.0, 33607.0, 174610.0, 1791583.0, 1937647.0, 189764.0, 35316.0, 9938.0, 3403.0, 1410.0, 613.0, 307.0, 179.0, 98.0, 63.0, 34.0, 27.0, 19.0, 20.0, 5.0, 7.0, 11.0, 5.0, 5.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-11.0625, -10.653076171875, -10.24365234375, -9.834228515625, -9.4248046875, -9.015380859375, -8.60595703125, -8.196533203125, -7.787109375, -7.377685546875, -6.96826171875, -6.558837890625, -6.1494140625, -5.739990234375, -5.33056640625, -4.921142578125, -4.51171875, -4.102294921875, -3.69287109375, -3.283447265625, -2.8740234375, -2.464599609375, -2.05517578125, -1.645751953125, -1.236328125, -0.826904296875, -0.41748046875, -0.008056640625, 0.4013671875, 0.810791015625, 1.22021484375, 1.629638671875, 2.0390625, 2.448486328125, 2.85791015625, 3.267333984375, 3.6767578125, 4.086181640625, 4.49560546875, 4.905029296875, 5.314453125, 5.723876953125, 6.13330078125, 6.542724609375, 6.9521484375, 7.361572265625, 7.77099609375, 8.180419921875, 8.58984375, 8.999267578125, 9.40869140625, 9.818115234375, 10.2275390625, 10.636962890625, 11.04638671875, 11.455810546875, 11.865234375, 12.274658203125, 12.68408203125, 13.093505859375, 13.5029296875, 13.912353515625, 14.32177734375, 14.731201171875, 15.140625]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 5.0, 7.0, 16.0, 21.0, 27.0, 40.0, 67.0, 114.0, 120.0, 127.0, 109.0, 116.0, 78.0, 47.0, 43.0, 23.0, 21.0, 10.0, 4.0, 2.0, 2.0, 5.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-50.32038497924805, -48.87887954711914, -47.4373779296875, -45.995872497558594, -44.55436706542969, -43.11286544799805, -41.67136001586914, -40.2298583984375, -38.788352966308594, -37.34684753417969, -35.90534591674805, -34.46384048461914, -33.0223388671875, -31.580833435058594, -30.139328002929688, -28.697824478149414, -27.25632095336914, -25.814817428588867, -24.373313903808594, -22.931808471679688, -21.490304946899414, -20.04880142211914, -18.607295989990234, -17.16579246520996, -15.724288940429688, -14.282785415649414, -12.841280937194824, -11.399776458740234, -9.958272933959961, -8.516769409179688, -7.075264930725098, -5.633760452270508, -4.192253112792969, -2.750749111175537, -1.3092451095581055, 0.13225889205932617, 1.5737628936767578, 3.0152668952941895, 4.456770896911621, 5.898275375366211, 7.339778900146484, 8.781282424926758, 10.222786903381348, 11.664291381835938, 13.105794906616211, 14.547298431396484, 15.988802909851074, 17.430307388305664, 18.871810913085938, 20.31331443786621, 21.754817962646484, 23.19632339477539, 24.637826919555664, 26.079330444335938, 27.520835876464844, 28.962339401245117, 30.40384292602539, 31.845346450805664, 33.28684997558594, 34.728355407714844, 36.16986083984375, 37.61136245727539, 39.0528678894043, 40.49436950683594, 41.935874938964844]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 3.0, 3.0, 7.0, 1.0, 5.0, 9.0, 6.0, 11.0, 7.0, 17.0, 20.0, 18.0, 15.0, 12.0, 30.0, 28.0, 29.0, 37.0, 35.0, 46.0, 43.0, 45.0, 53.0, 37.0, 50.0, 46.0, 29.0, 33.0, 33.0, 41.0, 32.0, 36.0, 23.0, 22.0, 32.0, 14.0, 20.0, 21.0, 12.0, 8.0, 10.0, 9.0, 5.0, 7.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-29.854324340820312, -28.95223045349121, -28.050138473510742, -27.14804458618164, -26.245952606201172, -25.34385871887207, -24.44176483154297, -23.5396728515625, -22.6375789642334, -21.735485076904297, -20.833393096923828, -19.931299209594727, -19.029205322265625, -18.127113342285156, -17.225019454956055, -16.322925567626953, -15.420833587646484, -14.5187406539917, -13.616647720336914, -12.714553833007812, -11.812460899353027, -10.910367965698242, -10.00827407836914, -9.106181144714355, -8.20408821105957, -7.301995277404785, -6.399901866912842, -5.497808456420898, -4.595715522766113, -3.693622589111328, -2.7915291786193848, -1.8894357681274414, -0.9873428344726562, -0.08524966239929199, 0.8168435096740723, 1.7189366817474365, 2.621029853820801, 3.523122787475586, 4.425216197967529, 5.327309608459473, 6.229402542114258, 7.131495475769043, 8.033588409423828, 8.93568229675293, 9.837775230407715, 10.7398681640625, 11.641962051391602, 12.544054985046387, 13.446147918701172, 14.348240852355957, 15.250333786010742, 16.152427673339844, 17.054519653320312, 17.956613540649414, 18.858707427978516, 19.760799407958984, 20.662893295288086, 21.564987182617188, 22.467079162597656, 23.369173049926758, 24.27126693725586, 25.173358917236328, 26.07545280456543, 26.97754669189453, 27.879638671875]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 14.0, 7.0, 8.0, 19.0, 14.0, 16.0, 17.0, 24.0, 25.0, 29.0, 41.0, 37.0, 37.0, 36.0, 39.0, 58.0, 41.0, 43.0, 38.0, 61.0, 45.0, 43.0, 37.0, 25.0, 32.0, 37.0, 25.0, 25.0, 21.0, 15.0, 17.0, 21.0, 10.0, 10.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.0390625, -3.924896240234375, -3.81072998046875, -3.696563720703125, -3.5823974609375, -3.468231201171875, -3.35406494140625, -3.239898681640625, -3.125732421875, -3.011566162109375, -2.89739990234375, -2.783233642578125, -2.6690673828125, -2.554901123046875, -2.44073486328125, -2.326568603515625, -2.21240234375, -2.098236083984375, -1.98406982421875, -1.869903564453125, -1.7557373046875, -1.641571044921875, -1.52740478515625, -1.413238525390625, -1.299072265625, -1.184906005859375, -1.07073974609375, -0.956573486328125, -0.8424072265625, -0.728240966796875, -0.61407470703125, -0.499908447265625, -0.3857421875, -0.271575927734375, -0.15740966796875, -0.043243408203125, 0.0709228515625, 0.185089111328125, 0.29925537109375, 0.413421630859375, 0.527587890625, 0.641754150390625, 0.75592041015625, 0.870086669921875, 0.9842529296875, 1.098419189453125, 1.21258544921875, 1.326751708984375, 1.44091796875, 1.555084228515625, 1.66925048828125, 1.783416748046875, 1.8975830078125, 2.011749267578125, 2.12591552734375, 2.240081787109375, 2.354248046875, 2.468414306640625, 2.58258056640625, 2.696746826171875, 2.8109130859375, 2.925079345703125, 3.03924560546875, 3.153411865234375, 3.267578125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 2.0, 6.0, 4.0, 9.0, 15.0, 18.0, 40.0, 40.0, 63.0, 83.0, 110.0, 188.0, 243.0, 384.0, 589.0, 846.0, 1338.0, 1983.0, 3114.0, 4704.0, 7410.0, 11876.0, 19550.0, 33604.0, 59599.0, 113743.0, 212124.0, 248408.0, 146561.0, 76324.0, 41540.0, 24234.0, 14416.0, 9029.0, 5701.0, 3696.0, 2292.0, 1518.0, 1016.0, 723.0, 464.0, 319.0, 205.0, 123.0, 107.0, 70.0, 34.0, 29.0, 19.0, 12.0, 8.0, 13.0, 6.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.40869140625, -0.3951568603515625, -0.381622314453125, -0.3680877685546875, -0.35455322265625, -0.3410186767578125, -0.327484130859375, -0.3139495849609375, -0.3004150390625, -0.2868804931640625, -0.273345947265625, -0.2598114013671875, -0.24627685546875, -0.2327423095703125, -0.219207763671875, -0.2056732177734375, -0.192138671875, -0.1786041259765625, -0.165069580078125, -0.1515350341796875, -0.13800048828125, -0.1244659423828125, -0.110931396484375, -0.0973968505859375, -0.0838623046875, -0.0703277587890625, -0.056793212890625, -0.0432586669921875, -0.02972412109375, -0.0161895751953125, -0.002655029296875, 0.0108795166015625, 0.0244140625, 0.0379486083984375, 0.051483154296875, 0.0650177001953125, 0.07855224609375, 0.0920867919921875, 0.105621337890625, 0.1191558837890625, 0.1326904296875, 0.1462249755859375, 0.159759521484375, 0.1732940673828125, 0.18682861328125, 0.2003631591796875, 0.213897705078125, 0.2274322509765625, 0.240966796875, 0.2545013427734375, 0.268035888671875, 0.2815704345703125, 0.29510498046875, 0.3086395263671875, 0.322174072265625, 0.3357086181640625, 0.3492431640625, 0.3627777099609375, 0.376312255859375, 0.3898468017578125, 0.40338134765625, 0.4169158935546875, 0.430450439453125, 0.4439849853515625, 0.45751953125]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 9.0, 8.0, 13.0, 13.0, 15.0, 18.0, 19.0, 20.0, 27.0, 29.0, 24.0, 37.0, 41.0, 44.0, 34.0, 42.0, 53.0, 1075.0, 55.0, 42.0, 46.0, 47.0, 40.0, 35.0, 37.0, 34.0, 23.0, 29.0, 20.0, 17.0, 25.0, 11.0, 9.0, 7.0, 9.0, 2.0, 7.0, 2.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.14453125, -2.069671630859375, -1.99481201171875, -1.919952392578125, -1.8450927734375, -1.770233154296875, -1.69537353515625, -1.620513916015625, -1.545654296875, -1.470794677734375, -1.39593505859375, -1.321075439453125, -1.2462158203125, -1.171356201171875, -1.09649658203125, -1.021636962890625, -0.94677734375, -0.871917724609375, -0.79705810546875, -0.722198486328125, -0.6473388671875, -0.572479248046875, -0.49761962890625, -0.422760009765625, -0.347900390625, -0.273040771484375, -0.19818115234375, -0.123321533203125, -0.0484619140625, 0.026397705078125, 0.10125732421875, 0.176116943359375, 0.2509765625, 0.325836181640625, 0.40069580078125, 0.475555419921875, 0.5504150390625, 0.625274658203125, 0.70013427734375, 0.774993896484375, 0.849853515625, 0.924713134765625, 0.99957275390625, 1.074432373046875, 1.1492919921875, 1.224151611328125, 1.29901123046875, 1.373870849609375, 1.44873046875, 1.523590087890625, 1.59844970703125, 1.673309326171875, 1.7481689453125, 1.823028564453125, 1.89788818359375, 1.972747802734375, 2.047607421875, 2.122467041015625, 2.19732666015625, 2.272186279296875, 2.3470458984375, 2.421905517578125, 2.49676513671875, 2.571624755859375, 2.646484375]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 6.0, 14.0, 17.0, 22.0, 42.0, 65.0, 88.0, 149.0, 213.0, 265.0, 395.0, 557.0, 857.0, 1260.0, 1791.0, 2740.0, 3882.0, 5617.0, 8175.0, 12245.0, 17819.0, 27014.0, 41437.0, 67221.0, 114094.0, 188176.0, 1241374.0, 136550.0, 80739.0, 49119.0, 31170.0, 20561.0, 13934.0, 9403.0, 6243.0, 4394.0, 2961.0, 2062.0, 1370.0, 971.0, 632.0, 486.0, 332.0, 228.0, 147.0, 97.0, 60.0, 35.0, 33.0, 25.0, 16.0, 9.0, 8.0, 6.0, 4.0, 1.0, 3.0], "bins": [-0.292724609375, -0.2839012145996094, -0.27507781982421875, -0.2662544250488281, -0.2574310302734375, -0.24860763549804688, -0.23978424072265625, -0.23096084594726562, -0.222137451171875, -0.21331405639648438, -0.20449066162109375, -0.19566726684570312, -0.1868438720703125, -0.17802047729492188, -0.16919708251953125, -0.16037368774414062, -0.15155029296875, -0.14272689819335938, -0.13390350341796875, -0.12508010864257812, -0.1162567138671875, -0.10743331909179688, -0.09860992431640625, -0.08978652954101562, -0.080963134765625, -0.07213973999023438, -0.06331634521484375, -0.054492950439453125, -0.0456695556640625, -0.036846160888671875, -0.02802276611328125, -0.019199371337890625, -0.0103759765625, -0.001552581787109375, 0.00727081298828125, 0.016094207763671875, 0.0249176025390625, 0.033740997314453125, 0.04256439208984375, 0.051387786865234375, 0.060211181640625, 0.06903457641601562, 0.07785797119140625, 0.08668136596679688, 0.0955047607421875, 0.10432815551757812, 0.11315155029296875, 0.12197494506835938, 0.13079833984375, 0.13962173461914062, 0.14844512939453125, 0.15726852416992188, 0.1660919189453125, 0.17491531372070312, 0.18373870849609375, 0.19256210327148438, 0.201385498046875, 0.21020889282226562, 0.21903228759765625, 0.22785568237304688, 0.2366790771484375, 0.24550247192382812, 0.25432586669921875, 0.2631492614746094, 0.27197265625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 2.0, 6.0, 2.0, 9.0, 12.0, 12.0, 13.0, 15.0, 26.0, 20.0, 35.0, 29.0, 40.0, 40.0, 48.0, 69.0, 79.0, 64.0, 66.0, 67.0, 51.0, 50.0, 42.0, 25.0, 28.0, 24.0, 29.0, 24.0, 13.0, 13.0, 9.0, 5.0, 4.0, 5.0, 4.0, 6.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0018301010131835938, -0.0017698854207992554, -0.001709669828414917, -0.0016494542360305786, -0.0015892386436462402, -0.0015290230512619019, -0.0014688074588775635, -0.001408591866493225, -0.0013483762741088867, -0.0012881606817245483, -0.00122794508934021, -0.0011677294969558716, -0.0011075139045715332, -0.0010472983121871948, -0.0009870827198028564, -0.0009268671274185181, -0.0008666515350341797, -0.0008064359426498413, -0.0007462203502655029, -0.0006860047578811646, -0.0006257891654968262, -0.0005655735731124878, -0.0005053579807281494, -0.00044514238834381104, -0.00038492679595947266, -0.0003247112035751343, -0.0002644956111907959, -0.00020428001880645752, -0.00014406442642211914, -8.384883403778076e-05, -2.3633241653442383e-05, 3.6582350730895996e-05, 9.679794311523438e-05, 0.00015701353549957275, 0.00021722912788391113, 0.0002774447202682495, 0.0003376603126525879, 0.00039787590503692627, 0.00045809149742126465, 0.000518307089805603, 0.0005785226821899414, 0.0006387382745742798, 0.0006989538669586182, 0.0007591694593429565, 0.0008193850517272949, 0.0008796006441116333, 0.0009398162364959717, 0.00100003182888031, 0.0010602474212646484, 0.0011204630136489868, 0.0011806786060333252, 0.0012408941984176636, 0.001301109790802002, 0.0013613253831863403, 0.0014215409755706787, 0.001481756567955017, 0.0015419721603393555, 0.0016021877527236938, 0.0016624033451080322, 0.0017226189374923706, 0.001782834529876709, 0.0018430501222610474, 0.0019032657146453857, 0.001963481307029724, 0.0020236968994140625]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 3.0, 5.0, 3.0, 7.0, 13.0, 17.0, 23.0, 30.0, 35.0, 63.0, 79.0, 105.0, 138.0, 239.0, 396.0, 1316.0, 34286.0, 969669.0, 39554.0, 1354.0, 419.0, 230.0, 169.0, 113.0, 77.0, 58.0, 50.0, 28.0, 19.0, 15.0, 10.0, 9.0, 4.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.041168212890625, -0.03993988037109375, -0.0387115478515625, -0.03748321533203125, -0.0362548828125, -0.03502655029296875, -0.0337982177734375, -0.03256988525390625, -0.031341552734375, -0.03011322021484375, -0.0288848876953125, -0.02765655517578125, -0.02642822265625, -0.02519989013671875, -0.0239715576171875, -0.02274322509765625, -0.021514892578125, -0.02028656005859375, -0.0190582275390625, -0.01782989501953125, -0.0166015625, -0.01537322998046875, -0.0141448974609375, -0.01291656494140625, -0.011688232421875, -0.01045989990234375, -0.0092315673828125, -0.00800323486328125, -0.00677490234375, -0.00554656982421875, -0.0043182373046875, -0.00308990478515625, -0.001861572265625, -0.00063323974609375, 0.0005950927734375, 0.00182342529296875, 0.0030517578125, 0.00428009033203125, 0.0055084228515625, 0.00673675537109375, 0.007965087890625, 0.00919342041015625, 0.0104217529296875, 0.01165008544921875, 0.01287841796875, 0.01410675048828125, 0.0153350830078125, 0.01656341552734375, 0.017791748046875, 0.01902008056640625, 0.0202484130859375, 0.02147674560546875, 0.022705078125, 0.02393341064453125, 0.0251617431640625, 0.02639007568359375, 0.027618408203125, 0.02884674072265625, 0.0300750732421875, 0.03130340576171875, 0.03253173828125, 0.03376007080078125, 0.0349884033203125, 0.03621673583984375, 0.037445068359375]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 48.0, 725.0, 236.0, 9.0], "bins": [-0.0299942996352911, -0.02950856275856495, -0.02902282401919365, -0.0285370871424675, -0.02805135026574135, -0.027565613389015198, -0.027079874649643898, -0.026594137772917747, -0.026108400896191597, -0.025622664019465446, -0.025136925280094147, -0.024651188403367996, -0.024165451526641846, -0.023679714649915695, -0.023193975910544395, -0.022708239033818245, -0.022222500294446945, -0.021736763417720795, -0.021251024678349495, -0.020765287801623344, -0.020279550924897194, -0.019793814048171043, -0.019308075308799744, -0.018822338432073593, -0.018336601555347443, -0.017850864678621292, -0.017365125939249992, -0.016879389062523842, -0.01639365218579769, -0.01590791530907154, -0.015422176569700241, -0.01493643969297409, -0.014450701884925365, -0.01396496407687664, -0.01347922720015049, -0.012993489392101765, -0.012507752515375614, -0.012022014707326889, -0.011536277830600739, -0.011050540022552013, -0.010564802214503288, -0.010079064406454563, -0.009593327529728413, -0.009107589721679688, -0.008621852844953537, -0.008136115036904812, -0.007650377694517374, -0.007164640352129936, -0.006678903475403786, -0.006193166133016348, -0.00570742879062891, -0.005221690982580185, -0.004735954105854034, -0.004250216297805309, -0.0037644789554178715, -0.0032787416130304337, -0.002793004270642996, -0.002307266928255558, -0.0018215294694527984, -0.0013357920106500387, -0.0008500546682626009, -0.0003643173258751631, 0.0001214202493429184, 0.0006071575917303562, 0.001092894934117794]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 4.0, 9.0, 11.0, 13.0, 9.0, 13.0, 21.0, 29.0, 44.0, 48.0, 48.0, 54.0, 46.0, 51.0, 61.0, 63.0, 75.0, 57.0, 53.0, 67.0, 45.0, 41.0, 29.0, 20.0, 28.0, 20.0, 14.0, 7.0, 7.0, 9.0, 4.0, 3.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0011525154113769531, -0.001105966977775097, -0.0010594185441732407, -0.0010128701105713844, -0.0009663216769695282, -0.000919773243367672, -0.0008732248097658157, -0.0008266763761639595, -0.0007801279425621033, -0.000733579508960247, -0.0006870310753583908, -0.0006404826417565346, -0.0005939342081546783, -0.0005473857745528221, -0.0005008373409509659, -0.00045428890734910965, -0.0004077404737472534, -0.0003611920401453972, -0.00031464360654354095, -0.0002680951729416847, -0.0002215467393398285, -0.00017499830573797226, -0.00012844987213611603, -8.19014385342598e-05, -3.5353004932403564e-05, 1.1195428669452667e-05, 5.77438622713089e-05, 0.00010429229587316513, 0.00015084072947502136, 0.0001973891630768776, 0.00024393759667873383, 0.00029048603028059006, 0.0003370344638824463, 0.0003835828974843025, 0.00043013133108615875, 0.000476679764688015, 0.0005232281982898712, 0.0005697766318917274, 0.0006163250654935837, 0.0006628734990954399, 0.0007094219326972961, 0.0007559703662991524, 0.0008025187999010086, 0.0008490672335028648, 0.0008956156671047211, 0.0009421641007065773, 0.0009887125343084335, 0.0010352609679102898, 0.001081809401512146, 0.0011283578351140022, 0.0011749062687158585, 0.0012214547023177147, 0.001268003135919571, 0.0013145515695214272, 0.0013611000031232834, 0.0014076484367251396, 0.0014541968703269958, 0.001500745303928852, 0.0015472937375307083, 0.0015938421711325645, 0.0016403906047344208, 0.001686939038336277, 0.0017334874719381332, 0.0017800359055399895, 0.0018265843391418457]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 8.0, 14.0, 7.0, 8.0, 19.0, 14.0, 16.0, 17.0, 24.0, 25.0, 29.0, 41.0, 37.0, 37.0, 36.0, 39.0, 58.0, 41.0, 43.0, 38.0, 61.0, 45.0, 43.0, 37.0, 25.0, 32.0, 37.0, 25.0, 25.0, 21.0, 15.0, 17.0, 21.0, 10.0, 10.0, 9.0, 6.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0], "bins": [-4.0390625, -3.924896240234375, -3.81072998046875, -3.696563720703125, -3.5823974609375, -3.468231201171875, -3.35406494140625, -3.239898681640625, -3.125732421875, -3.011566162109375, -2.89739990234375, -2.783233642578125, -2.6690673828125, -2.554901123046875, -2.44073486328125, -2.326568603515625, -2.21240234375, -2.098236083984375, -1.98406982421875, -1.869903564453125, -1.7557373046875, -1.641571044921875, -1.52740478515625, -1.413238525390625, -1.299072265625, -1.184906005859375, -1.07073974609375, -0.956573486328125, -0.8424072265625, -0.728240966796875, -0.61407470703125, -0.499908447265625, -0.3857421875, -0.271575927734375, -0.15740966796875, -0.043243408203125, 0.0709228515625, 0.185089111328125, 0.29925537109375, 0.413421630859375, 0.527587890625, 0.641754150390625, 0.75592041015625, 0.870086669921875, 0.9842529296875, 1.098419189453125, 1.21258544921875, 1.326751708984375, 1.44091796875, 1.555084228515625, 1.66925048828125, 1.783416748046875, 1.8975830078125, 2.011749267578125, 2.12591552734375, 2.240081787109375, 2.354248046875, 2.468414306640625, 2.58258056640625, 2.696746826171875, 2.8109130859375, 2.925079345703125, 3.03924560546875, 3.153411865234375, 3.267578125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 15.0, 12.0, 18.0, 22.0, 37.0, 61.0, 77.0, 91.0, 142.0, 189.0, 254.0, 405.0, 557.0, 845.0, 1274.0, 1982.0, 3086.0, 5530.0, 10312.0, 24113.0, 67289.0, 229639.0, 459974.0, 154496.0, 48510.0, 18674.0, 8444.0, 4549.0, 2641.0, 1726.0, 1100.0, 767.0, 517.0, 354.0, 250.0, 180.0, 116.0, 84.0, 77.0, 46.0, 35.0, 20.0, 15.0, 9.0, 9.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-4.1953125, -4.06951904296875, -3.9437255859375, -3.81793212890625, -3.692138671875, -3.56634521484375, -3.4405517578125, -3.31475830078125, -3.18896484375, -3.06317138671875, -2.9373779296875, -2.81158447265625, -2.685791015625, -2.55999755859375, -2.4342041015625, -2.30841064453125, -2.1826171875, -2.05682373046875, -1.9310302734375, -1.80523681640625, -1.679443359375, -1.55364990234375, -1.4278564453125, -1.30206298828125, -1.17626953125, -1.05047607421875, -0.9246826171875, -0.79888916015625, -0.673095703125, -0.54730224609375, -0.4215087890625, -0.29571533203125, -0.169921875, -0.04412841796875, 0.0816650390625, 0.20745849609375, 0.333251953125, 0.45904541015625, 0.5848388671875, 0.71063232421875, 0.83642578125, 0.96221923828125, 1.0880126953125, 1.21380615234375, 1.339599609375, 1.46539306640625, 1.5911865234375, 1.71697998046875, 1.8427734375, 1.96856689453125, 2.0943603515625, 2.22015380859375, 2.345947265625, 2.47174072265625, 2.5975341796875, 2.72332763671875, 2.84912109375, 2.97491455078125, 3.1007080078125, 3.22650146484375, 3.352294921875, 3.47808837890625, 3.6038818359375, 3.72967529296875, 3.85546875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 3.0, 0.0, 4.0, 5.0, 7.0, 7.0, 6.0, 7.0, 6.0, 16.0, 15.0, 11.0, 22.0, 15.0, 30.0, 28.0, 30.0, 34.0, 39.0, 41.0, 56.0, 82.0, 125.0, 336.0, 1474.0, 169.0, 81.0, 70.0, 50.0, 38.0, 28.0, 38.0, 32.0, 30.0, 23.0, 17.0, 14.0, 13.0, 8.0, 19.0, 9.0, 5.0, 8.0, 4.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.0234375, -12.6182861328125, -12.213134765625, -11.8079833984375, -11.40283203125, -10.9976806640625, -10.592529296875, -10.1873779296875, -9.7822265625, -9.3770751953125, -8.971923828125, -8.5667724609375, -8.16162109375, -7.7564697265625, -7.351318359375, -6.9461669921875, -6.541015625, -6.1358642578125, -5.730712890625, -5.3255615234375, -4.92041015625, -4.5152587890625, -4.110107421875, -3.7049560546875, -3.2998046875, -2.8946533203125, -2.489501953125, -2.0843505859375, -1.67919921875, -1.2740478515625, -0.868896484375, -0.4637451171875, -0.05859375, 0.3465576171875, 0.751708984375, 1.1568603515625, 1.56201171875, 1.9671630859375, 2.372314453125, 2.7774658203125, 3.1826171875, 3.5877685546875, 3.992919921875, 4.3980712890625, 4.80322265625, 5.2083740234375, 5.613525390625, 6.0186767578125, 6.423828125, 6.8289794921875, 7.234130859375, 7.6392822265625, 8.04443359375, 8.4495849609375, 8.854736328125, 9.2598876953125, 9.6650390625, 10.0701904296875, 10.475341796875, 10.8804931640625, 11.28564453125, 11.6907958984375, 12.095947265625, 12.5010986328125, 12.90625]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 7.0, 9.0, 4.0, 17.0, 18.0, 23.0, 33.0, 43.0, 57.0, 95.0, 145.0, 245.0, 604.0, 2110.0, 99542.0, 3033491.0, 7400.0, 965.0, 324.0, 182.0, 116.0, 81.0, 51.0, 35.0, 31.0, 18.0, 18.0, 12.0, 16.0, 4.0, 6.0, 1.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-43.6875, -42.41162109375, -41.1357421875, -39.85986328125, -38.583984375, -37.30810546875, -36.0322265625, -34.75634765625, -33.48046875, -32.20458984375, -30.9287109375, -29.65283203125, -28.376953125, -27.10107421875, -25.8251953125, -24.54931640625, -23.2734375, -21.99755859375, -20.7216796875, -19.44580078125, -18.169921875, -16.89404296875, -15.6181640625, -14.34228515625, -13.06640625, -11.79052734375, -10.5146484375, -9.23876953125, -7.962890625, -6.68701171875, -5.4111328125, -4.13525390625, -2.859375, -1.58349609375, -0.3076171875, 0.96826171875, 2.244140625, 3.52001953125, 4.7958984375, 6.07177734375, 7.34765625, 8.62353515625, 9.8994140625, 11.17529296875, 12.451171875, 13.72705078125, 15.0029296875, 16.27880859375, 17.5546875, 18.83056640625, 20.1064453125, 21.38232421875, 22.658203125, 23.93408203125, 25.2099609375, 26.48583984375, 27.76171875, 29.03759765625, 30.3134765625, 31.58935546875, 32.865234375, 34.14111328125, 35.4169921875, 36.69287109375, 37.96875]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 39.0, 315.0, 536.0, 114.0, 8.0], "bins": [-160.869140625, -158.24110412597656, -155.6130828857422, -152.98504638671875, -150.35702514648438, -147.72898864746094, -145.10096740722656, -142.47293090820312, -139.84490966796875, -137.2168731689453, -134.58885192871094, -131.9608154296875, -129.33279418945312, -126.70475769042969, -124.07672882080078, -121.44869995117188, -118.82066345214844, -116.19263458251953, -113.56460571289062, -110.93657684326172, -108.30854797363281, -105.68051147460938, -103.05248260498047, -100.42445373535156, -97.79642486572266, -95.16839599609375, -92.54036712646484, -89.91233825683594, -87.2843017578125, -84.6562728881836, -82.02824401855469, -79.40021514892578, -76.77218627929688, -74.14415740966797, -71.51612854003906, -68.88809967041016, -66.26007080078125, -63.63203811645508, -61.004005432128906, -58.3759765625, -55.747947692871094, -53.11991882324219, -50.49188995361328, -47.86385726928711, -45.2358283996582, -42.6077995300293, -39.979766845703125, -37.35173797607422, -34.72370910644531, -32.095680236816406, -29.467649459838867, -26.839618682861328, -24.211589813232422, -21.583560943603516, -18.955530166625977, -16.327499389648438, -13.699471473693848, -11.071441650390625, -8.443411827087402, -5.81538200378418, -3.187352180480957, -0.5593223571777344, 2.0687074661254883, 4.696738243103027, 7.324767112731934]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 0.0, 1.0, 5.0, 7.0, 8.0, 12.0, 10.0, 17.0, 15.0, 17.0, 21.0, 30.0, 34.0, 43.0, 48.0, 44.0, 44.0, 50.0, 43.0, 50.0, 45.0, 64.0, 38.0, 41.0, 46.0, 38.0, 30.0, 37.0, 27.0, 28.0, 25.0, 23.0, 14.0, 15.0, 7.0, 10.0, 11.0, 3.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-41.28052520751953, -40.12986373901367, -38.97920227050781, -37.82854080200195, -36.677879333496094, -35.52721405029297, -34.376556396484375, -33.22589111328125, -32.07522964477539, -30.92456817626953, -29.773906707763672, -28.623245239257812, -27.47258186340332, -26.32192039489746, -25.1712589263916, -24.02059555053711, -22.869935989379883, -21.719274520874023, -20.568613052368164, -19.417949676513672, -18.267288208007812, -17.116626739501953, -15.965965270996094, -14.815302848815918, -13.664641380310059, -12.5139799118042, -11.363317489624023, -10.212656021118164, -9.061994552612305, -7.911332130432129, -6.7606706619262695, -5.610008239746094, -4.459346771240234, -3.308684825897217, -2.1580231189727783, -1.0073614120483398, 0.14330053329467773, 1.2939624786376953, 2.4446239471435547, 3.5952863693237305, 4.74594783782959, 5.896609783172607, 7.047271728515625, 8.197933197021484, 9.348594665527344, 10.49925708770752, 11.649918556213379, 12.800580978393555, 13.951242446899414, 15.101903915405273, 16.252565383911133, 17.403228759765625, 18.553890228271484, 19.704551696777344, 20.855213165283203, 22.005874633789062, 23.156536102294922, 24.30719757080078, 25.45785903930664, 26.6085205078125, 27.759183883666992, 28.90984535217285, 30.06050682067871, 31.211170196533203, 32.36183166503906]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 6.0, 6.0, 5.0, 7.0, 15.0, 12.0, 21.0, 12.0, 21.0, 25.0, 24.0, 24.0, 27.0, 34.0, 44.0, 39.0, 54.0, 48.0, 59.0, 44.0, 39.0, 48.0, 46.0, 35.0, 40.0, 41.0, 35.0, 33.0, 24.0, 29.0, 19.0, 17.0, 16.0, 17.0, 15.0, 11.0, 5.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.37109375, -4.2481689453125, -4.125244140625, -4.0023193359375, -3.87939453125, -3.7564697265625, -3.633544921875, -3.5106201171875, -3.3876953125, -3.2647705078125, -3.141845703125, -3.0189208984375, -2.89599609375, -2.7730712890625, -2.650146484375, -2.5272216796875, -2.404296875, -2.2813720703125, -2.158447265625, -2.0355224609375, -1.91259765625, -1.7896728515625, -1.666748046875, -1.5438232421875, -1.4208984375, -1.2979736328125, -1.175048828125, -1.0521240234375, -0.92919921875, -0.8062744140625, -0.683349609375, -0.5604248046875, -0.4375, -0.3145751953125, -0.191650390625, -0.0687255859375, 0.05419921875, 0.1771240234375, 0.300048828125, 0.4229736328125, 0.5458984375, 0.6688232421875, 0.791748046875, 0.9146728515625, 1.03759765625, 1.1605224609375, 1.283447265625, 1.4063720703125, 1.529296875, 1.6522216796875, 1.775146484375, 1.8980712890625, 2.02099609375, 2.1439208984375, 2.266845703125, 2.3897705078125, 2.5126953125, 2.6356201171875, 2.758544921875, 2.8814697265625, 3.00439453125, 3.1273193359375, 3.250244140625, 3.3731689453125, 3.49609375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 5.0, 2.0, 6.0, 10.0, 6.0, 8.0, 8.0, 18.0, 13.0, 22.0, 35.0, 29.0, 45.0, 58.0, 85.0, 128.0, 210.0, 498.0, 1557.0, 5941.0, 37733.0, 1249418.0, 2802077.0, 83297.0, 9435.0, 2158.0, 664.0, 286.0, 148.0, 108.0, 62.0, 59.0, 39.0, 29.0, 20.0, 22.0, 16.0, 12.0, 9.0, 7.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-16.03125, -15.547607421875, -15.06396484375, -14.580322265625, -14.0966796875, -13.613037109375, -13.12939453125, -12.645751953125, -12.162109375, -11.678466796875, -11.19482421875, -10.711181640625, -10.2275390625, -9.743896484375, -9.26025390625, -8.776611328125, -8.29296875, -7.809326171875, -7.32568359375, -6.842041015625, -6.3583984375, -5.874755859375, -5.39111328125, -4.907470703125, -4.423828125, -3.940185546875, -3.45654296875, -2.972900390625, -2.4892578125, -2.005615234375, -1.52197265625, -1.038330078125, -0.5546875, -0.071044921875, 0.41259765625, 0.896240234375, 1.3798828125, 1.863525390625, 2.34716796875, 2.830810546875, 3.314453125, 3.798095703125, 4.28173828125, 4.765380859375, 5.2490234375, 5.732666015625, 6.21630859375, 6.699951171875, 7.18359375, 7.667236328125, 8.15087890625, 8.634521484375, 9.1181640625, 9.601806640625, 10.08544921875, 10.569091796875, 11.052734375, 11.536376953125, 12.02001953125, 12.503662109375, 12.9873046875, 13.470947265625, 13.95458984375, 14.438232421875, 14.921875]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 5.0, 5.0, 8.0, 11.0, 22.0, 50.0, 94.0, 223.0, 430.0, 793.0, 1056.0, 727.0, 346.0, 154.0, 78.0, 33.0, 26.0, 12.0, 7.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.359375, -20.787109375, -20.21484375, -19.642578125, -19.0703125, -18.498046875, -17.92578125, -17.353515625, -16.78125, -16.208984375, -15.63671875, -15.064453125, -14.4921875, -13.919921875, -13.34765625, -12.775390625, -12.203125, -11.630859375, -11.05859375, -10.486328125, -9.9140625, -9.341796875, -8.76953125, -8.197265625, -7.625, -7.052734375, -6.48046875, -5.908203125, -5.3359375, -4.763671875, -4.19140625, -3.619140625, -3.046875, -2.474609375, -1.90234375, -1.330078125, -0.7578125, -0.185546875, 0.38671875, 0.958984375, 1.53125, 2.103515625, 2.67578125, 3.248046875, 3.8203125, 4.392578125, 4.96484375, 5.537109375, 6.109375, 6.681640625, 7.25390625, 7.826171875, 8.3984375, 8.970703125, 9.54296875, 10.115234375, 10.6875, 11.259765625, 11.83203125, 12.404296875, 12.9765625, 13.548828125, 14.12109375, 14.693359375, 15.265625]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 6.0, 9.0, 20.0, 34.0, 88.0, 162.0, 500.0, 2254.0, 101210.0, 4054662.0, 33232.0, 1432.0, 403.0, 159.0, 56.0, 25.0, 18.0, 7.0, 9.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.0, -37.5224609375, -36.044921875, -34.5673828125, -33.08984375, -31.6123046875, -30.134765625, -28.6572265625, -27.1796875, -25.7021484375, -24.224609375, -22.7470703125, -21.26953125, -19.7919921875, -18.314453125, -16.8369140625, -15.359375, -13.8818359375, -12.404296875, -10.9267578125, -9.44921875, -7.9716796875, -6.494140625, -5.0166015625, -3.5390625, -2.0615234375, -0.583984375, 0.8935546875, 2.37109375, 3.8486328125, 5.326171875, 6.8037109375, 8.28125, 9.7587890625, 11.236328125, 12.7138671875, 14.19140625, 15.6689453125, 17.146484375, 18.6240234375, 20.1015625, 21.5791015625, 23.056640625, 24.5341796875, 26.01171875, 27.4892578125, 28.966796875, 30.4443359375, 31.921875, 33.3994140625, 34.876953125, 36.3544921875, 37.83203125, 39.3095703125, 40.787109375, 42.2646484375, 43.7421875, 45.2197265625, 46.697265625, 48.1748046875, 49.65234375, 51.1298828125, 52.607421875, 54.0849609375, 55.5625]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 7.0, 16.0, 40.0, 88.0, 154.0, 208.0, 211.0, 138.0, 95.0, 40.0, 12.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.899803161621094, -20.331382751464844, -17.762962341308594, -15.194540023803711, -12.626119613647461, -10.057699203491211, -7.4892778396606445, -4.920856475830078, -2.352436065673828, 0.21598482131958008, 2.7844057083129883, 5.3528265953063965, 7.921247482299805, 10.489667892456055, 13.058089256286621, 15.626510620117188, 18.194931030273438, 20.763351440429688, 23.331771850585938, 25.90019416809082, 28.46861457824707, 31.03703498840332, 33.6054573059082, 36.17387771606445, 38.7422981262207, 41.31071853637695, 43.8791389465332, 46.44755935668945, 49.01598358154297, 51.58440399169922, 54.15282440185547, 56.72124481201172, 59.2896728515625, 61.85809326171875, 64.426513671875, 66.99493408203125, 69.5633544921875, 72.13177490234375, 74.7001953125, 77.26861572265625, 79.8370361328125, 82.40545654296875, 84.973876953125, 87.54229736328125, 90.1107177734375, 92.67913818359375, 95.24755859375, 97.81597900390625, 100.38440704345703, 102.95282745361328, 105.52124786376953, 108.08966827392578, 110.65808868408203, 113.22650909423828, 115.79492950439453, 118.36335754394531, 120.93177795410156, 123.50019836425781, 126.06861877441406, 128.6370391845703, 131.20545959472656, 133.7738800048828, 136.34230041503906, 138.9107208251953, 141.47914123535156]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 11.0, 13.0, 15.0, 18.0, 17.0, 16.0, 14.0, 19.0, 31.0, 21.0, 34.0, 37.0, 22.0, 36.0, 31.0, 49.0, 45.0, 36.0, 44.0, 40.0, 42.0, 31.0, 42.0, 38.0, 31.0, 43.0, 27.0, 18.0, 30.0, 21.0, 14.0, 16.0, 10.0, 12.0, 6.0, 14.0, 13.0, 10.0, 7.0, 4.0, 1.0, 9.0, 2.0, 3.0, 1.0, 2.0, 3.0], "bins": [-28.88116455078125, -28.062463760375977, -27.243762969970703, -26.42506217956543, -25.606361389160156, -24.787660598754883, -23.96895980834961, -23.150259017944336, -22.331558227539062, -21.51285743713379, -20.694156646728516, -19.875455856323242, -19.05675506591797, -18.238054275512695, -17.419353485107422, -16.60065269470215, -15.781950950622559, -14.963250160217285, -14.144549369812012, -13.325848579406738, -12.507147789001465, -11.688446044921875, -10.869745254516602, -10.051044464111328, -9.232343673706055, -8.413642883300781, -7.594942092895508, -6.776241302490234, -5.957540512084961, -5.138839244842529, -4.320138454437256, -3.5014376640319824, -2.682737350463867, -1.8640365600585938, -1.0453356504440308, -0.22663474082946777, 0.5920660495758057, 1.4107670783996582, 2.2294678688049316, 3.048168659210205, 3.8668694496154785, 4.685570240020752, 5.504271030426025, 6.322972297668457, 7.1416730880737305, 7.960373878479004, 8.779074668884277, 9.59777545928955, 10.416476249694824, 11.235177040100098, 12.053877830505371, 12.872578620910645, 13.691279411315918, 14.509981155395508, 15.328681945800781, 16.147382736206055, 16.966083526611328, 17.7847843170166, 18.603485107421875, 19.42218589782715, 20.240886688232422, 21.059587478637695, 21.87828826904297, 22.696989059448242, 23.515689849853516]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 5.0, 11.0, 14.0, 13.0, 17.0, 21.0, 20.0, 35.0, 29.0, 42.0, 36.0, 40.0, 43.0, 53.0, 51.0, 57.0, 46.0, 50.0, 39.0, 54.0, 35.0, 39.0, 46.0, 37.0, 30.0, 25.0, 23.0, 13.0, 14.0, 19.0, 13.0, 9.0, 4.0, 3.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.800628662109375, -4.66766357421875, -4.534698486328125, -4.4017333984375, -4.268768310546875, -4.13580322265625, -4.002838134765625, -3.869873046875, -3.736907958984375, -3.60394287109375, -3.470977783203125, -3.3380126953125, -3.205047607421875, -3.07208251953125, -2.939117431640625, -2.80615234375, -2.673187255859375, -2.54022216796875, -2.407257080078125, -2.2742919921875, -2.141326904296875, -2.00836181640625, -1.875396728515625, -1.742431640625, -1.609466552734375, -1.47650146484375, -1.343536376953125, -1.2105712890625, -1.077606201171875, -0.94464111328125, -0.811676025390625, -0.6787109375, -0.545745849609375, -0.41278076171875, -0.279815673828125, -0.1468505859375, -0.013885498046875, 0.11907958984375, 0.252044677734375, 0.385009765625, 0.517974853515625, 0.65093994140625, 0.783905029296875, 0.9168701171875, 1.049835205078125, 1.18280029296875, 1.315765380859375, 1.44873046875, 1.581695556640625, 1.71466064453125, 1.847625732421875, 1.9805908203125, 2.113555908203125, 2.24652099609375, 2.379486083984375, 2.512451171875, 2.645416259765625, 2.77838134765625, 2.911346435546875, 3.0443115234375, 3.177276611328125, 3.31024169921875, 3.443206787109375, 3.576171875]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 4.0, 3.0, 6.0, 8.0, 10.0, 16.0, 25.0, 42.0, 56.0, 89.0, 122.0, 165.0, 274.0, 423.0, 668.0, 1111.0, 1660.0, 2912.0, 4834.0, 8143.0, 13847.0, 24514.0, 44311.0, 85057.0, 173030.0, 288559.0, 191307.0, 94414.0, 48795.0, 26804.0, 15161.0, 8828.0, 5187.0, 3110.0, 1831.0, 1192.0, 707.0, 442.0, 319.0, 189.0, 127.0, 82.0, 49.0, 48.0, 17.0, 22.0, 13.0, 12.0, 9.0, 4.0, 3.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52587890625, -0.509735107421875, -0.49359130859375, -0.477447509765625, -0.4613037109375, -0.445159912109375, -0.42901611328125, -0.412872314453125, -0.396728515625, -0.380584716796875, -0.36444091796875, -0.348297119140625, -0.3321533203125, -0.316009521484375, -0.29986572265625, -0.283721923828125, -0.267578125, -0.251434326171875, -0.23529052734375, -0.219146728515625, -0.2030029296875, -0.186859130859375, -0.17071533203125, -0.154571533203125, -0.138427734375, -0.122283935546875, -0.10614013671875, -0.089996337890625, -0.0738525390625, -0.057708740234375, -0.04156494140625, -0.025421142578125, -0.00927734375, 0.006866455078125, 0.02301025390625, 0.039154052734375, 0.0552978515625, 0.071441650390625, 0.08758544921875, 0.103729248046875, 0.119873046875, 0.136016845703125, 0.15216064453125, 0.168304443359375, 0.1844482421875, 0.200592041015625, 0.21673583984375, 0.232879638671875, 0.2490234375, 0.265167236328125, 0.28131103515625, 0.297454833984375, 0.3135986328125, 0.329742431640625, 0.34588623046875, 0.362030029296875, 0.378173828125, 0.394317626953125, 0.41046142578125, 0.426605224609375, 0.4427490234375, 0.458892822265625, 0.47503662109375, 0.491180419921875, 0.50732421875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 5.0, 2.0, 6.0, 3.0, 6.0, 10.0, 13.0, 5.0, 11.0, 17.0, 13.0, 19.0, 16.0, 24.0, 24.0, 22.0, 28.0, 20.0, 28.0, 31.0, 38.0, 37.0, 49.0, 33.0, 1063.0, 35.0, 54.0, 39.0, 40.0, 33.0, 33.0, 21.0, 31.0, 30.0, 18.0, 25.0, 16.0, 23.0, 18.0, 15.0, 15.0, 8.0, 9.0, 9.0, 8.0, 3.0, 5.0, 7.0, 4.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.12109375, -2.05670166015625, -1.9923095703125, -1.92791748046875, -1.863525390625, -1.79913330078125, -1.7347412109375, -1.67034912109375, -1.60595703125, -1.54156494140625, -1.4771728515625, -1.41278076171875, -1.348388671875, -1.28399658203125, -1.2196044921875, -1.15521240234375, -1.0908203125, -1.02642822265625, -0.9620361328125, -0.89764404296875, -0.833251953125, -0.76885986328125, -0.7044677734375, -0.64007568359375, -0.57568359375, -0.51129150390625, -0.4468994140625, -0.38250732421875, -0.318115234375, -0.25372314453125, -0.1893310546875, -0.12493896484375, -0.060546875, 0.00384521484375, 0.0682373046875, 0.13262939453125, 0.197021484375, 0.26141357421875, 0.3258056640625, 0.39019775390625, 0.45458984375, 0.51898193359375, 0.5833740234375, 0.64776611328125, 0.712158203125, 0.77655029296875, 0.8409423828125, 0.90533447265625, 0.9697265625, 1.03411865234375, 1.0985107421875, 1.16290283203125, 1.227294921875, 1.29168701171875, 1.3560791015625, 1.42047119140625, 1.48486328125, 1.54925537109375, 1.6136474609375, 1.67803955078125, 1.742431640625, 1.80682373046875, 1.8712158203125, 1.93560791015625, 2.0]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 4.0, 3.0, 7.0, 10.0, 13.0, 12.0, 17.0, 41.0, 44.0, 69.0, 113.0, 175.0, 211.0, 347.0, 493.0, 670.0, 987.0, 1474.0, 2194.0, 3114.0, 4594.0, 6763.0, 9973.0, 14554.0, 21789.0, 33140.0, 50780.0, 81313.0, 129749.0, 1189267.0, 214932.0, 117980.0, 73604.0, 46420.0, 30019.0, 19918.0, 13526.0, 9094.0, 6229.0, 4314.0, 2866.0, 2042.0, 1344.0, 904.0, 632.0, 430.0, 302.0, 207.0, 146.0, 104.0, 65.0, 56.0, 24.0, 23.0, 16.0, 15.0, 4.0, 5.0, 3.0, 6.0, 0.0, 0.0, 1.0], "bins": [-0.259033203125, -0.25064849853515625, -0.2422637939453125, -0.23387908935546875, -0.225494384765625, -0.21710968017578125, -0.2087249755859375, -0.20034027099609375, -0.19195556640625, -0.18357086181640625, -0.1751861572265625, -0.16680145263671875, -0.158416748046875, -0.15003204345703125, -0.1416473388671875, -0.13326263427734375, -0.1248779296875, -0.11649322509765625, -0.1081085205078125, -0.09972381591796875, -0.091339111328125, -0.08295440673828125, -0.0745697021484375, -0.06618499755859375, -0.05780029296875, -0.04941558837890625, -0.0410308837890625, -0.03264617919921875, -0.024261474609375, -0.01587677001953125, -0.0074920654296875, 0.00089263916015625, 0.00927734375, 0.01766204833984375, 0.0260467529296875, 0.03443145751953125, 0.042816162109375, 0.05120086669921875, 0.0595855712890625, 0.06797027587890625, 0.07635498046875, 0.08473968505859375, 0.0931243896484375, 0.10150909423828125, 0.109893798828125, 0.11827850341796875, 0.1266632080078125, 0.13504791259765625, 0.1434326171875, 0.15181732177734375, 0.1602020263671875, 0.16858673095703125, 0.176971435546875, 0.18535614013671875, 0.1937408447265625, 0.20212554931640625, 0.21051025390625, 0.21889495849609375, 0.2272796630859375, 0.23566436767578125, 0.244049072265625, 0.25243377685546875, 0.2608184814453125, 0.26920318603515625, 0.277587890625]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 7.0, 9.0, 6.0, 6.0, 10.0, 14.0, 23.0, 22.0, 15.0, 31.0, 44.0, 48.0, 62.0, 90.0, 93.0, 92.0, 80.0, 73.0, 49.0, 37.0, 35.0, 22.0, 33.0, 14.0, 21.0, 15.0, 8.0, 13.0, 8.0, 2.0, 6.0, 4.0, 6.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029163360595703125, -0.002823352813720703, -0.0027303695678710938, -0.0026373863220214844, -0.002544403076171875, -0.0024514198303222656, -0.0023584365844726562, -0.002265453338623047, -0.0021724700927734375, -0.002079486846923828, -0.0019865036010742188, -0.0018935203552246094, -0.001800537109375, -0.0017075538635253906, -0.0016145706176757812, -0.0015215873718261719, -0.0014286041259765625, -0.0013356208801269531, -0.0012426376342773438, -0.0011496543884277344, -0.001056671142578125, -0.0009636878967285156, -0.0008707046508789062, -0.0007777214050292969, -0.0006847381591796875, -0.0005917549133300781, -0.0004987716674804688, -0.0004057884216308594, -0.00031280517578125, -0.00021982192993164062, -0.00012683868408203125, -3.3855438232421875e-05, 5.91278076171875e-05, 0.00015211105346679688, 0.00024509429931640625, 0.0003380775451660156, 0.000431060791015625, 0.0005240440368652344, 0.0006170272827148438, 0.0007100105285644531, 0.0008029937744140625, 0.0008959770202636719, 0.0009889602661132812, 0.0010819435119628906, 0.0011749267578125, 0.0012679100036621094, 0.0013608932495117188, 0.0014538764953613281, 0.0015468597412109375, 0.0016398429870605469, 0.0017328262329101562, 0.0018258094787597656, 0.001918792724609375, 0.0020117759704589844, 0.0021047592163085938, 0.002197742462158203, 0.0022907257080078125, 0.002383708953857422, 0.0024766921997070312, 0.0025696754455566406, 0.00266265869140625, 0.0027556419372558594, 0.0028486251831054688, 0.002941608428955078, 0.0030345916748046875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 2.0, 4.0, 4.0, 5.0, 9.0, 12.0, 12.0, 15.0, 25.0, 41.0, 65.0, 68.0, 107.0, 170.0, 296.0, 707.0, 10000.0, 993337.0, 41778.0, 921.0, 362.0, 226.0, 116.0, 84.0, 49.0, 49.0, 29.0, 18.0, 5.0, 14.0, 10.0, 10.0, 7.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.059356689453125, -0.05753755569458008, -0.055718421936035156, -0.053899288177490234, -0.05208015441894531, -0.05026102066040039, -0.04844188690185547, -0.04662275314331055, -0.044803619384765625, -0.0429844856262207, -0.04116535186767578, -0.03934621810913086, -0.03752708435058594, -0.035707950592041016, -0.033888816833496094, -0.03206968307495117, -0.03025054931640625, -0.028431415557861328, -0.026612281799316406, -0.024793148040771484, -0.022974014282226562, -0.02115488052368164, -0.01933574676513672, -0.017516613006591797, -0.015697479248046875, -0.013878345489501953, -0.012059211730957031, -0.01024007797241211, -0.008420944213867188, -0.006601810455322266, -0.004782676696777344, -0.002963542938232422, -0.0011444091796875, 0.0006747245788574219, 0.0024938583374023438, 0.004312992095947266, 0.0061321258544921875, 0.00795125961303711, 0.009770393371582031, 0.011589527130126953, 0.013408660888671875, 0.015227794647216797, 0.01704692840576172, 0.01886606216430664, 0.020685195922851562, 0.022504329681396484, 0.024323463439941406, 0.026142597198486328, 0.02796173095703125, 0.029780864715576172, 0.031599998474121094, 0.033419132232666016, 0.03523826599121094, 0.03705739974975586, 0.03887653350830078, 0.0406956672668457, 0.042514801025390625, 0.04433393478393555, 0.04615306854248047, 0.04797220230102539, 0.04979133605957031, 0.051610469818115234, 0.053429603576660156, 0.05524873733520508, 0.05706787109375]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 11.0, 17.0, 62.0, 139.0, 228.0, 265.0, 171.0, 78.0, 25.0, 8.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0029499554075300694, -0.0028038104064762592, -0.002657665405422449, -0.002511520404368639, -0.0023653756361454725, -0.0022192306350916624, -0.0020730856340378523, -0.001926940749399364, -0.0017807957483455539, -0.0016346507472917438, -0.0014885058626532555, -0.0013423608615994453, -0.0011962158605456352, -0.001050070975907147, -0.0009039259748533368, -0.0007577810902148485, -0.0006116360891610384, -0.0004654911463148892, -0.00031934617436490953, -0.00017320120241492987, -2.705625956878066e-05, 0.00011908868327736855, 0.00026523368433117867, 0.00041137856896966696, 0.0005575235700234771, 0.0007036685128696263, 0.0008498134557157755, 0.0009959584567695856, 0.0011421034578233957, 0.001288248342461884, 0.0014343933435156941, 0.0015805382281541824, 0.0017266832292079926, 0.0018728282302618027, 0.002018973231315613, 0.002165118232369423, 0.0023112630005925894, 0.0024574080016463995, 0.0026035530027002096, 0.002749697770923376, 0.002895842771977186, 0.0030419877730309963, 0.0031881327740848064, 0.0033342777751386166, 0.003480422543361783, 0.003626567544415593, 0.0037727125454694033, 0.00391885731369257, 0.00406500231474638, 0.00421114731580019, 0.004357292316854, 0.00450343731790781, 0.00464958231896162, 0.0047957273200154305, 0.004941872321069241, 0.005088016856461763, 0.005234162323176861, 0.005380307324230671, 0.005526452325284481, 0.005672597326338291, 0.005818742327392101, 0.005964887328445911, 0.0061110323294997215, 0.006257176864892244, 0.0064033218659460545]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 2.0, 2.0, 5.0, 4.0, 4.0, 6.0, 11.0, 12.0, 8.0, 17.0, 20.0, 18.0, 16.0, 23.0, 25.0, 34.0, 36.0, 34.0, 39.0, 47.0, 46.0, 44.0, 48.0, 52.0, 37.0, 35.0, 35.0, 46.0, 36.0, 32.0, 32.0, 35.0, 29.0, 22.0, 25.0, 22.0, 9.0, 14.0, 8.0, 8.0, 3.0, 5.0, 8.0, 6.0, 4.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0014315247535705566, -0.001389126293361187, -0.0013467278331518173, -0.0013043293729424477, -0.001261930912733078, -0.0012195324525237083, -0.0011771339923143387, -0.001134735532104969, -0.0010923370718955994, -0.0010499386116862297, -0.00100754015147686, -0.0009651416912674904, -0.0009227432310581207, -0.0008803447708487511, -0.0008379463106393814, -0.0007955478504300117, -0.0007531493902206421, -0.0007107509300112724, -0.0006683524698019028, -0.0006259540095925331, -0.0005835555493831635, -0.0005411570891737938, -0.0004987586289644241, -0.0004563601687550545, -0.0004139617085456848, -0.00037156324833631516, -0.0003291647881269455, -0.00028676632791757584, -0.0002443678677082062, -0.00020196940749883652, -0.00015957094728946686, -0.0001171724870800972, -7.477402687072754e-05, -3.237556666135788e-05, 1.002289354801178e-05, 5.242135375738144e-05, 9.48198139667511e-05, 0.00013721827417612076, 0.00017961673438549042, 0.00022201519459486008, 0.00026441365480422974, 0.0003068121150135994, 0.00034921057522296906, 0.0003916090354323387, 0.0004340074956417084, 0.00047640595585107803, 0.0005188044160604477, 0.0005612028762698174, 0.000603601336479187, 0.0006459997966885567, 0.0006883982568979263, 0.000730796717107296, 0.0007731951773166656, 0.0008155936375260353, 0.000857992097735405, 0.0009003905579447746, 0.0009427890181541443, 0.000985187478363514, 0.0010275859385728836, 0.0010699843987822533, 0.001112382858991623, 0.0011547813192009926, 0.0011971797794103622, 0.001239578239619732, 0.0012819766998291016]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 5.0, 4.0, 7.0, 5.0, 11.0, 14.0, 13.0, 17.0, 21.0, 20.0, 35.0, 29.0, 42.0, 36.0, 40.0, 43.0, 53.0, 51.0, 57.0, 46.0, 50.0, 39.0, 54.0, 35.0, 39.0, 46.0, 37.0, 30.0, 25.0, 23.0, 13.0, 14.0, 19.0, 13.0, 9.0, 4.0, 4.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.93359375, -4.800628662109375, -4.66766357421875, -4.534698486328125, -4.4017333984375, -4.268768310546875, -4.13580322265625, -4.002838134765625, -3.869873046875, -3.736907958984375, -3.60394287109375, -3.470977783203125, -3.3380126953125, -3.205047607421875, -3.07208251953125, -2.939117431640625, -2.80615234375, -2.673187255859375, -2.54022216796875, -2.407257080078125, -2.2742919921875, -2.141326904296875, -2.00836181640625, -1.875396728515625, -1.742431640625, -1.609466552734375, -1.47650146484375, -1.343536376953125, -1.2105712890625, -1.077606201171875, -0.94464111328125, -0.811676025390625, -0.6787109375, -0.545745849609375, -0.41278076171875, -0.279815673828125, -0.1468505859375, -0.013885498046875, 0.11907958984375, 0.252044677734375, 0.385009765625, 0.517974853515625, 0.65093994140625, 0.783905029296875, 0.9168701171875, 1.049835205078125, 1.18280029296875, 1.315765380859375, 1.44873046875, 1.581695556640625, 1.71466064453125, 1.847625732421875, 1.9805908203125, 2.113555908203125, 2.24652099609375, 2.379486083984375, 2.512451171875, 2.645416259765625, 2.77838134765625, 2.911346435546875, 3.0443115234375, 3.177276611328125, 3.31024169921875, 3.443206787109375, 3.576171875]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 3.0, 10.0, 12.0, 20.0, 30.0, 43.0, 44.0, 90.0, 93.0, 162.0, 241.0, 382.0, 556.0, 835.0, 1225.0, 2068.0, 3434.0, 6652.0, 13297.0, 29504.0, 73325.0, 246088.0, 439905.0, 139154.0, 48419.0, 20775.0, 9580.0, 5106.0, 2751.0, 1640.0, 1052.0, 685.0, 447.0, 288.0, 186.0, 137.0, 95.0, 82.0, 47.0, 30.0, 27.0, 14.0, 5.0, 5.0, 4.0, 6.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.322265625, -3.216064453125, -3.10986328125, -3.003662109375, -2.8974609375, -2.791259765625, -2.68505859375, -2.578857421875, -2.47265625, -2.366455078125, -2.26025390625, -2.154052734375, -2.0478515625, -1.941650390625, -1.83544921875, -1.729248046875, -1.623046875, -1.516845703125, -1.41064453125, -1.304443359375, -1.1982421875, -1.092041015625, -0.98583984375, -0.879638671875, -0.7734375, -0.667236328125, -0.56103515625, -0.454833984375, -0.3486328125, -0.242431640625, -0.13623046875, -0.030029296875, 0.076171875, 0.182373046875, 0.28857421875, 0.394775390625, 0.5009765625, 0.607177734375, 0.71337890625, 0.819580078125, 0.92578125, 1.031982421875, 1.13818359375, 1.244384765625, 1.3505859375, 1.456787109375, 1.56298828125, 1.669189453125, 1.775390625, 1.881591796875, 1.98779296875, 2.093994140625, 2.2001953125, 2.306396484375, 2.41259765625, 2.518798828125, 2.625, 2.731201171875, 2.83740234375, 2.943603515625, 3.0498046875, 3.156005859375, 3.26220703125, 3.368408203125, 3.474609375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 4.0, 5.0, 9.0, 5.0, 5.0, 6.0, 11.0, 9.0, 10.0, 12.0, 24.0, 12.0, 34.0, 26.0, 26.0, 41.0, 34.0, 46.0, 34.0, 41.0, 53.0, 78.0, 171.0, 1446.0, 261.0, 107.0, 75.0, 46.0, 50.0, 39.0, 26.0, 32.0, 38.0, 26.0, 28.0, 17.0, 26.0, 24.0, 21.0, 12.0, 14.0, 14.0, 9.0, 6.0, 7.0, 6.0, 5.0, 7.0, 1.0, 5.0, 2.0, 4.0, 0.0, 2.0, 2.0, 3.0], "bins": [-10.671875, -10.3350830078125, -9.998291015625, -9.6614990234375, -9.32470703125, -8.9879150390625, -8.651123046875, -8.3143310546875, -7.9775390625, -7.6407470703125, -7.303955078125, -6.9671630859375, -6.63037109375, -6.2935791015625, -5.956787109375, -5.6199951171875, -5.283203125, -4.9464111328125, -4.609619140625, -4.2728271484375, -3.93603515625, -3.5992431640625, -3.262451171875, -2.9256591796875, -2.5888671875, -2.2520751953125, -1.915283203125, -1.5784912109375, -1.24169921875, -0.9049072265625, -0.568115234375, -0.2313232421875, 0.10546875, 0.4422607421875, 0.779052734375, 1.1158447265625, 1.45263671875, 1.7894287109375, 2.126220703125, 2.4630126953125, 2.7998046875, 3.1365966796875, 3.473388671875, 3.8101806640625, 4.14697265625, 4.4837646484375, 4.820556640625, 5.1573486328125, 5.494140625, 5.8309326171875, 6.167724609375, 6.5045166015625, 6.84130859375, 7.1781005859375, 7.514892578125, 7.8516845703125, 8.1884765625, 8.5252685546875, 8.862060546875, 9.1988525390625, 9.53564453125, 9.8724365234375, 10.209228515625, 10.5460205078125, 10.8828125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 2.0, 7.0, 10.0, 5.0, 12.0, 30.0, 29.0, 48.0, 65.0, 137.0, 237.0, 474.0, 2004.0, 3052273.0, 88568.0, 1024.0, 332.0, 177.0, 109.0, 63.0, 34.0, 24.0, 11.0, 8.0, 5.0, 9.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.1875, -69.14453125, -67.1015625, -65.05859375, -63.015625, -60.97265625, -58.9296875, -56.88671875, -54.84375, -52.80078125, -50.7578125, -48.71484375, -46.671875, -44.62890625, -42.5859375, -40.54296875, -38.5, -36.45703125, -34.4140625, -32.37109375, -30.328125, -28.28515625, -26.2421875, -24.19921875, -22.15625, -20.11328125, -18.0703125, -16.02734375, -13.984375, -11.94140625, -9.8984375, -7.85546875, -5.8125, -3.76953125, -1.7265625, 0.31640625, 2.359375, 4.40234375, 6.4453125, 8.48828125, 10.53125, 12.57421875, 14.6171875, 16.66015625, 18.703125, 20.74609375, 22.7890625, 24.83203125, 26.875, 28.91796875, 30.9609375, 33.00390625, 35.046875, 37.08984375, 39.1328125, 41.17578125, 43.21875, 45.26171875, 47.3046875, 49.34765625, 51.390625, 53.43359375, 55.4765625, 57.51953125, 59.5625]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [2.0, 0.0, 10.0, 558.0, 440.0, 7.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.675748825073242, -14.715578079223633, -9.755406379699707, -4.795234680175781, 0.16493606567382812, 5.1251068115234375, 10.08527946472168, 15.045450210571289, 20.0056209564209, 24.965791702270508, 29.92596435546875, 34.88613510131836, 39.84630584716797, 44.80647659301758, 49.76664733886719, 54.72682189941406, 59.686988830566406, 64.64716339111328, 69.60733032226562, 74.5675048828125, 79.52767181396484, 84.48784637451172, 89.44801330566406, 94.40818786621094, 99.36836242675781, 104.32853698730469, 109.28870391845703, 114.2488784790039, 119.20904541015625, 124.16921997070312, 129.12939453125, 134.08956909179688, 139.0497283935547, 144.00990295410156, 148.97007751464844, 153.93023681640625, 158.89041137695312, 163.8505859375, 168.81076049804688, 173.77093505859375, 178.73109436035156, 183.69126892089844, 188.6514434814453, 193.61160278320312, 198.57177734375, 203.53195190429688, 208.49212646484375, 213.45230102539062, 218.4124755859375, 223.37265014648438, 228.33282470703125, 233.29298400878906, 238.25315856933594, 243.2133331298828, 248.1735076904297, 253.1336669921875, 258.0938415527344, 263.05401611328125, 268.0141906738281, 272.974365234375, 277.9345397949219, 282.8946838378906, 287.8548583984375, 292.8150329589844, 297.77520751953125]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 5.0, 4.0, 2.0, 5.0, 6.0, 17.0, 9.0, 13.0, 15.0, 13.0, 18.0, 15.0, 20.0, 31.0, 27.0, 30.0, 29.0, 32.0, 33.0, 35.0, 25.0, 41.0, 35.0, 48.0, 38.0, 35.0, 42.0, 42.0, 34.0, 24.0, 35.0, 36.0, 25.0, 32.0, 23.0, 25.0, 21.0, 18.0, 10.0, 8.0, 10.0, 9.0, 8.0, 7.0, 5.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-36.41526794433594, -35.305206298828125, -34.19514465332031, -33.0850830078125, -31.97502326965332, -30.864961624145508, -29.754901885986328, -28.644840240478516, -27.534778594970703, -26.42471694946289, -25.314655303955078, -24.2045955657959, -23.094533920288086, -21.984472274780273, -20.874412536621094, -19.76435089111328, -18.65428924560547, -17.544227600097656, -16.434165954589844, -15.324106216430664, -14.214044570922852, -13.103982925415039, -11.993922233581543, -10.883861541748047, -9.773799896240234, -8.663738250732422, -7.553677558898926, -6.4436163902282715, -5.333555221557617, -4.223494052886963, -3.1134328842163086, -2.0033717155456543, -0.893310546875, 0.2167506217956543, 1.3268117904663086, 2.436872959136963, 3.546934127807617, 4.6569952964782715, 5.767056465148926, 6.87711763381958, 7.987178802490234, 9.097240447998047, 10.207301139831543, 11.317361831665039, 12.427423477172852, 13.537485122680664, 14.64754581451416, 15.757606506347656, 16.86766815185547, 17.97772979736328, 19.087791442871094, 20.197851181030273, 21.307912826538086, 22.4179744720459, 23.528034210205078, 24.63809585571289, 25.748157501220703, 26.858219146728516, 27.968280792236328, 29.078340530395508, 30.18840217590332, 31.298463821411133, 32.40852355957031, 33.518585205078125, 34.62864685058594]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 5.0, 2.0, 5.0, 6.0, 11.0, 10.0, 10.0, 14.0, 16.0, 18.0, 38.0, 31.0, 28.0, 45.0, 37.0, 43.0, 38.0, 46.0, 56.0, 53.0, 43.0, 38.0, 44.0, 48.0, 41.0, 44.0, 38.0, 33.0, 30.0, 27.0, 18.0, 14.0, 20.0, 12.0, 16.0, 10.0, 4.0, 5.0, 1.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-5.02734375, -4.891265869140625, -4.75518798828125, -4.619110107421875, -4.4830322265625, -4.346954345703125, -4.21087646484375, -4.074798583984375, -3.938720703125, -3.802642822265625, -3.66656494140625, -3.530487060546875, -3.3944091796875, -3.258331298828125, -3.12225341796875, -2.986175537109375, -2.85009765625, -2.714019775390625, -2.57794189453125, -2.441864013671875, -2.3057861328125, -2.169708251953125, -2.03363037109375, -1.897552490234375, -1.761474609375, -1.625396728515625, -1.48931884765625, -1.353240966796875, -1.2171630859375, -1.081085205078125, -0.94500732421875, -0.808929443359375, -0.6728515625, -0.536773681640625, -0.40069580078125, -0.264617919921875, -0.1285400390625, 0.007537841796875, 0.14361572265625, 0.279693603515625, 0.415771484375, 0.551849365234375, 0.68792724609375, 0.824005126953125, 0.9600830078125, 1.096160888671875, 1.23223876953125, 1.368316650390625, 1.50439453125, 1.640472412109375, 1.77655029296875, 1.912628173828125, 2.0487060546875, 2.184783935546875, 2.32086181640625, 2.456939697265625, 2.593017578125, 2.729095458984375, 2.86517333984375, 3.001251220703125, 3.1373291015625, 3.273406982421875, 3.40948486328125, 3.545562744140625, 3.681640625]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 8.0, 10.0, 13.0, 21.0, 27.0, 40.0, 51.0, 51.0, 86.0, 102.0, 193.0, 321.0, 615.0, 1138.0, 2485.0, 5859.0, 15305.0, 57563.0, 387086.0, 1918020.0, 1494566.0, 247543.0, 41707.0, 12047.0, 4838.0, 2180.0, 1003.0, 542.0, 297.0, 161.0, 120.0, 86.0, 62.0, 37.0, 35.0, 25.0, 12.0, 8.0, 7.0, 6.0, 4.0, 5.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.8828125, -7.6568603515625, -7.430908203125, -7.2049560546875, -6.97900390625, -6.7530517578125, -6.527099609375, -6.3011474609375, -6.0751953125, -5.8492431640625, -5.623291015625, -5.3973388671875, -5.17138671875, -4.9454345703125, -4.719482421875, -4.4935302734375, -4.267578125, -4.0416259765625, -3.815673828125, -3.5897216796875, -3.36376953125, -3.1378173828125, -2.911865234375, -2.6859130859375, -2.4599609375, -2.2340087890625, -2.008056640625, -1.7821044921875, -1.55615234375, -1.3302001953125, -1.104248046875, -0.8782958984375, -0.65234375, -0.4263916015625, -0.200439453125, 0.0255126953125, 0.25146484375, 0.4774169921875, 0.703369140625, 0.9293212890625, 1.1552734375, 1.3812255859375, 1.607177734375, 1.8331298828125, 2.05908203125, 2.2850341796875, 2.510986328125, 2.7369384765625, 2.962890625, 3.1888427734375, 3.414794921875, 3.6407470703125, 3.86669921875, 4.0926513671875, 4.318603515625, 4.5445556640625, 4.7705078125, 4.9964599609375, 5.222412109375, 5.4483642578125, 5.67431640625, 5.9002685546875, 6.126220703125, 6.3521728515625, 6.578125]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 7.0, 7.0, 10.0, 10.0, 22.0, 28.0, 54.0, 57.0, 84.0, 151.0, 207.0, 324.0, 410.0, 547.0, 510.0, 480.0, 393.0, 237.0, 150.0, 124.0, 99.0, 55.0, 37.0, 29.0, 15.0, 12.0, 6.0, 2.0, 5.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.046875, -6.7291259765625, -6.411376953125, -6.0936279296875, -5.77587890625, -5.4581298828125, -5.140380859375, -4.8226318359375, -4.5048828125, -4.1871337890625, -3.869384765625, -3.5516357421875, -3.23388671875, -2.9161376953125, -2.598388671875, -2.2806396484375, -1.962890625, -1.6451416015625, -1.327392578125, -1.0096435546875, -0.69189453125, -0.3741455078125, -0.056396484375, 0.2613525390625, 0.5791015625, 0.8968505859375, 1.214599609375, 1.5323486328125, 1.85009765625, 2.1678466796875, 2.485595703125, 2.8033447265625, 3.12109375, 3.4388427734375, 3.756591796875, 4.0743408203125, 4.39208984375, 4.7098388671875, 5.027587890625, 5.3453369140625, 5.6630859375, 5.9808349609375, 6.298583984375, 6.6163330078125, 6.93408203125, 7.2518310546875, 7.569580078125, 7.8873291015625, 8.205078125, 8.5228271484375, 8.840576171875, 9.1583251953125, 9.47607421875, 9.7938232421875, 10.111572265625, 10.4293212890625, 10.7470703125, 11.0648193359375, 11.382568359375, 11.7003173828125, 12.01806640625, 12.3358154296875, 12.653564453125, 12.9713134765625, 13.2890625]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 10.0, 14.0, 17.0, 21.0, 42.0, 59.0, 102.0, 154.0, 221.0, 376.0, 766.0, 2622.0, 14453.0, 166687.0, 3139116.0, 820592.0, 40832.0, 5509.0, 1371.0, 539.0, 269.0, 162.0, 109.0, 87.0, 49.0, 31.0, 29.0, 19.0, 12.0, 5.0, 3.0, 3.0, 4.0, 0.0, 1.0, 1.0], "bins": [-24.984375, -24.3997802734375, -23.815185546875, -23.2305908203125, -22.64599609375, -22.0614013671875, -21.476806640625, -20.8922119140625, -20.3076171875, -19.7230224609375, -19.138427734375, -18.5538330078125, -17.96923828125, -17.3846435546875, -16.800048828125, -16.2154541015625, -15.630859375, -15.0462646484375, -14.461669921875, -13.8770751953125, -13.29248046875, -12.7078857421875, -12.123291015625, -11.5386962890625, -10.9541015625, -10.3695068359375, -9.784912109375, -9.2003173828125, -8.61572265625, -8.0311279296875, -7.446533203125, -6.8619384765625, -6.27734375, -5.6927490234375, -5.108154296875, -4.5235595703125, -3.93896484375, -3.3543701171875, -2.769775390625, -2.1851806640625, -1.6005859375, -1.0159912109375, -0.431396484375, 0.1531982421875, 0.73779296875, 1.3223876953125, 1.906982421875, 2.4915771484375, 3.076171875, 3.6607666015625, 4.245361328125, 4.8299560546875, 5.41455078125, 5.9991455078125, 6.583740234375, 7.1683349609375, 7.7529296875, 8.3375244140625, 8.922119140625, 9.5067138671875, 10.09130859375, 10.6759033203125, 11.260498046875, 11.8450927734375, 12.4296875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 21.0, 54.0, 162.0, 257.0, 238.0, 170.0, 75.0, 24.0, 8.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-143.08447265625, -139.96670532226562, -136.84893798828125, -133.7311553955078, -130.61338806152344, -127.49562072753906, -124.37785339355469, -121.26008605957031, -118.1423110961914, -115.02454376220703, -111.90676879882812, -108.78900146484375, -105.67123413085938, -102.55345916748047, -99.4356918334961, -96.31791687011719, -93.20014953613281, -90.08238220214844, -86.96460723876953, -83.84683990478516, -80.72906494140625, -77.61129760742188, -74.4935302734375, -71.37576293945312, -68.25798797607422, -65.14022064208984, -62.02244567871094, -58.90467834472656, -55.78690719604492, -52.66913604736328, -49.551368713378906, -46.433597564697266, -43.31583023071289, -40.19805908203125, -37.080291748046875, -33.962520599365234, -30.844749450683594, -27.726978302001953, -24.609209060668945, -21.491439819335938, -18.373668670654297, -15.255898475646973, -12.138128280639648, -9.020358085632324, -5.902587890625, -2.784817695617676, 0.33295249938964844, 3.4507217407226562, 6.568492889404297, 9.686263084411621, 12.804033279418945, 15.92180347442627, 19.039573669433594, 22.157344818115234, 25.275114059448242, 28.39288330078125, 31.51065444946289, 34.62842559814453, 37.746192932128906, 40.86396408081055, 43.98173522949219, 47.09950637817383, 50.21727752685547, 53.335044860839844, 56.452816009521484]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 6.0, 9.0, 6.0, 10.0, 13.0, 13.0, 20.0, 9.0, 20.0, 25.0, 30.0, 34.0, 23.0, 32.0, 52.0, 36.0, 45.0, 36.0, 38.0, 43.0, 46.0, 40.0, 53.0, 42.0, 40.0, 33.0, 22.0, 26.0, 24.0, 28.0, 21.0, 28.0, 21.0, 15.0, 10.0, 10.0, 12.0, 7.0, 11.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.38205337524414, -28.42592430114746, -27.469797134399414, -26.513668060302734, -25.557540893554688, -24.601411819458008, -23.645282745361328, -22.68915557861328, -21.7330265045166, -20.776897430419922, -19.820770263671875, -18.864641189575195, -17.90851402282715, -16.95238494873047, -15.996256828308105, -15.040128707885742, -14.084000587463379, -13.127872467041016, -12.171744346618652, -11.215616226196289, -10.25948715209961, -9.303359031677246, -8.347230911254883, -7.391102313995361, -6.434974193572998, -5.478846073150635, -4.522717475891113, -3.56658935546875, -2.6104609966278076, -1.6543326377868652, -0.698204517364502, 0.25792407989501953, 1.2140522003173828, 2.170180559158325, 3.1263089179992676, 4.082437038421631, 5.038565635681152, 5.994693756103516, 6.950821876525879, 7.9069504737854, 8.863079071044922, 9.819207191467285, 10.775335311889648, 11.731464385986328, 12.687592506408691, 13.643720626831055, 14.599848747253418, 15.555976867675781, 16.512104034423828, 17.468233108520508, 18.424360275268555, 19.380489349365234, 20.33661651611328, 21.29274559020996, 22.24887466430664, 23.205001831054688, 24.161130905151367, 25.117259979248047, 26.073387145996094, 27.029516220092773, 27.98564338684082, 28.9417724609375, 29.897899627685547, 30.854028701782227, 31.810157775878906]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 3.0, 8.0, 5.0, 14.0, 15.0, 10.0, 27.0, 29.0, 22.0, 23.0, 39.0, 37.0, 44.0, 42.0, 42.0, 51.0, 42.0, 49.0, 50.0, 46.0, 46.0, 51.0, 52.0, 36.0, 42.0, 26.0, 29.0, 20.0, 26.0, 14.0, 13.0, 16.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.01171875, -4.87109375, -4.73046875, -4.58984375, -4.44921875, -4.30859375, -4.16796875, -4.02734375, -3.88671875, -3.74609375, -3.60546875, -3.46484375, -3.32421875, -3.18359375, -3.04296875, -2.90234375, -2.76171875, -2.62109375, -2.48046875, -2.33984375, -2.19921875, -2.05859375, -1.91796875, -1.77734375, -1.63671875, -1.49609375, -1.35546875, -1.21484375, -1.07421875, -0.93359375, -0.79296875, -0.65234375, -0.51171875, -0.37109375, -0.23046875, -0.08984375, 0.05078125, 0.19140625, 0.33203125, 0.47265625, 0.61328125, 0.75390625, 0.89453125, 1.03515625, 1.17578125, 1.31640625, 1.45703125, 1.59765625, 1.73828125, 1.87890625, 2.01953125, 2.16015625, 2.30078125, 2.44140625, 2.58203125, 2.72265625, 2.86328125, 3.00390625, 3.14453125, 3.28515625, 3.42578125, 3.56640625, 3.70703125, 3.84765625, 3.98828125]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 4.0, 4.0, 6.0, 10.0, 18.0, 23.0, 32.0, 47.0, 74.0, 124.0, 162.0, 290.0, 409.0, 664.0, 1173.0, 1977.0, 3254.0, 5785.0, 10524.0, 19389.0, 36592.0, 71083.0, 143716.0, 277641.0, 235778.0, 114968.0, 57612.0, 30101.0, 16180.0, 8913.0, 4893.0, 2725.0, 1675.0, 1041.0, 597.0, 366.0, 232.0, 170.0, 96.0, 83.0, 37.0, 31.0, 23.0, 8.0, 12.0, 7.0, 4.0, 5.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.61669921875, -0.5973358154296875, -0.577972412109375, -0.5586090087890625, -0.53924560546875, -0.5198822021484375, -0.500518798828125, -0.4811553955078125, -0.4617919921875, -0.4424285888671875, -0.423065185546875, -0.4037017822265625, -0.38433837890625, -0.3649749755859375, -0.345611572265625, -0.3262481689453125, -0.306884765625, -0.2875213623046875, -0.268157958984375, -0.2487945556640625, -0.22943115234375, -0.2100677490234375, -0.190704345703125, -0.1713409423828125, -0.1519775390625, -0.1326141357421875, -0.113250732421875, -0.0938873291015625, -0.07452392578125, -0.0551605224609375, -0.035797119140625, -0.0164337158203125, 0.0029296875, 0.0222930908203125, 0.041656494140625, 0.0610198974609375, 0.08038330078125, 0.0997467041015625, 0.119110107421875, 0.1384735107421875, 0.1578369140625, 0.1772003173828125, 0.196563720703125, 0.2159271240234375, 0.23529052734375, 0.2546539306640625, 0.274017333984375, 0.2933807373046875, 0.312744140625, 0.3321075439453125, 0.351470947265625, 0.3708343505859375, 0.39019775390625, 0.4095611572265625, 0.428924560546875, 0.4482879638671875, 0.4676513671875, 0.4870147705078125, 0.506378173828125, 0.5257415771484375, 0.54510498046875, 0.5644683837890625, 0.583831787109375, 0.6031951904296875, 0.62255859375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 5.0, 1.0, 4.0, 7.0, 11.0, 11.0, 16.0, 12.0, 23.0, 20.0, 29.0, 27.0, 22.0, 30.0, 40.0, 45.0, 62.0, 39.0, 47.0, 44.0, 1069.0, 46.0, 41.0, 47.0, 39.0, 30.0, 36.0, 35.0, 27.0, 37.0, 26.0, 21.0, 19.0, 10.0, 12.0, 15.0, 10.0, 6.0, 2.0, 5.0, 2.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6328125, -2.546478271484375, -2.46014404296875, -2.373809814453125, -2.2874755859375, -2.201141357421875, -2.11480712890625, -2.028472900390625, -1.942138671875, -1.855804443359375, -1.76947021484375, -1.683135986328125, -1.5968017578125, -1.510467529296875, -1.42413330078125, -1.337799072265625, -1.25146484375, -1.165130615234375, -1.07879638671875, -0.992462158203125, -0.9061279296875, -0.819793701171875, -0.73345947265625, -0.647125244140625, -0.560791015625, -0.474456787109375, -0.38812255859375, -0.301788330078125, -0.2154541015625, -0.129119873046875, -0.04278564453125, 0.043548583984375, 0.1298828125, 0.216217041015625, 0.30255126953125, 0.388885498046875, 0.4752197265625, 0.561553955078125, 0.64788818359375, 0.734222412109375, 0.820556640625, 0.906890869140625, 0.99322509765625, 1.079559326171875, 1.1658935546875, 1.252227783203125, 1.33856201171875, 1.424896240234375, 1.51123046875, 1.597564697265625, 1.68389892578125, 1.770233154296875, 1.8565673828125, 1.942901611328125, 2.02923583984375, 2.115570068359375, 2.201904296875, 2.288238525390625, 2.37457275390625, 2.460906982421875, 2.5472412109375, 2.633575439453125, 2.71990966796875, 2.806243896484375, 2.892578125]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 7.0, 5.0, 17.0, 19.0, 29.0, 56.0, 82.0, 127.0, 193.0, 311.0, 501.0, 874.0, 1475.0, 2313.0, 3964.0, 6812.0, 11305.0, 19126.0, 32828.0, 57126.0, 105255.0, 193750.0, 1295823.0, 162855.0, 86562.0, 47860.0, 27688.0, 16112.0, 9584.0, 5816.0, 3323.0, 2072.0, 1246.0, 765.0, 487.0, 268.0, 181.0, 96.0, 76.0, 56.0, 23.0, 26.0, 13.0, 5.0, 8.0, 6.0, 4.0, 3.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.407958984375, -0.3957252502441406, -0.38349151611328125, -0.3712577819824219, -0.3590240478515625, -0.3467903137207031, -0.33455657958984375, -0.3223228454589844, -0.310089111328125, -0.2978553771972656, -0.28562164306640625, -0.2733879089355469, -0.2611541748046875, -0.24892044067382812, -0.23668670654296875, -0.22445297241210938, -0.21221923828125, -0.19998550415039062, -0.18775177001953125, -0.17551803588867188, -0.1632843017578125, -0.15105056762695312, -0.13881683349609375, -0.12658309936523438, -0.114349365234375, -0.10211563110351562, -0.08988189697265625, -0.07764816284179688, -0.0654144287109375, -0.053180694580078125, -0.04094696044921875, -0.028713226318359375, -0.0164794921875, -0.004245758056640625, 0.00798797607421875, 0.020221710205078125, 0.0324554443359375, 0.044689178466796875, 0.05692291259765625, 0.06915664672851562, 0.081390380859375, 0.09362411499023438, 0.10585784912109375, 0.11809158325195312, 0.1303253173828125, 0.14255905151367188, 0.15479278564453125, 0.16702651977539062, 0.17926025390625, 0.19149398803710938, 0.20372772216796875, 0.21596145629882812, 0.2281951904296875, 0.24042892456054688, 0.25266265869140625, 0.2648963928222656, 0.277130126953125, 0.2893638610839844, 0.30159759521484375, 0.3138313293457031, 0.3260650634765625, 0.3382987976074219, 0.35053253173828125, 0.3627662658691406, 0.375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 2.0, 3.0, 6.0, 5.0, 10.0, 6.0, 11.0, 7.0, 8.0, 19.0, 22.0, 17.0, 32.0, 34.0, 35.0, 59.0, 59.0, 80.0, 89.0, 95.0, 77.0, 49.0, 48.0, 41.0, 42.0, 27.0, 19.0, 23.0, 15.0, 5.0, 11.0, 5.0, 8.0, 9.0, 5.0, 7.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0030918121337890625, -0.0029938220977783203, -0.002895832061767578, -0.002797842025756836, -0.0026998519897460938, -0.0026018619537353516, -0.0025038719177246094, -0.002405881881713867, -0.002307891845703125, -0.002209901809692383, -0.0021119117736816406, -0.0020139217376708984, -0.0019159317016601562, -0.001817941665649414, -0.0017199516296386719, -0.0016219615936279297, -0.0015239715576171875, -0.0014259815216064453, -0.0013279914855957031, -0.001230001449584961, -0.0011320114135742188, -0.0010340213775634766, -0.0009360313415527344, -0.0008380413055419922, -0.00074005126953125, -0.0006420612335205078, -0.0005440711975097656, -0.00044608116149902344, -0.00034809112548828125, -0.00025010108947753906, -0.00015211105346679688, -5.412101745605469e-05, 4.38690185546875e-05, 0.0001418590545654297, 0.00023984909057617188, 0.00033783912658691406, 0.00043582916259765625, 0.0005338191986083984, 0.0006318092346191406, 0.0007297992706298828, 0.000827789306640625, 0.0009257793426513672, 0.0010237693786621094, 0.0011217594146728516, 0.0012197494506835938, 0.001317739486694336, 0.0014157295227050781, 0.0015137195587158203, 0.0016117095947265625, 0.0017096996307373047, 0.0018076896667480469, 0.001905679702758789, 0.0020036697387695312, 0.0021016597747802734, 0.0021996498107910156, 0.002297639846801758, 0.0023956298828125, 0.002493619918823242, 0.0025916099548339844, 0.0026895999908447266, 0.0027875900268554688, 0.002885580062866211, 0.002983570098876953, 0.0030815601348876953, 0.0031795501708984375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 5.0, 2.0, 2.0, 2.0, 2.0, 5.0, 9.0, 8.0, 9.0, 12.0, 16.0, 14.0, 30.0, 40.0, 44.0, 67.0, 112.0, 201.0, 387.0, 1865.0, 71654.0, 958322.0, 14156.0, 883.0, 267.0, 153.0, 78.0, 47.0, 38.0, 28.0, 22.0, 17.0, 16.0, 12.0, 8.0, 6.0, 6.0, 4.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0616455078125, -0.059612274169921875, -0.05757904052734375, -0.055545806884765625, -0.0535125732421875, -0.051479339599609375, -0.04944610595703125, -0.047412872314453125, -0.045379638671875, -0.043346405029296875, -0.04131317138671875, -0.039279937744140625, -0.0372467041015625, -0.035213470458984375, -0.03318023681640625, -0.031147003173828125, -0.02911376953125, -0.027080535888671875, -0.02504730224609375, -0.023014068603515625, -0.0209808349609375, -0.018947601318359375, -0.01691436767578125, -0.014881134033203125, -0.012847900390625, -0.010814666748046875, -0.00878143310546875, -0.006748199462890625, -0.0047149658203125, -0.002681732177734375, -0.00064849853515625, 0.001384735107421875, 0.00341796875, 0.005451202392578125, 0.00748443603515625, 0.009517669677734375, 0.0115509033203125, 0.013584136962890625, 0.01561737060546875, 0.017650604248046875, 0.019683837890625, 0.021717071533203125, 0.02375030517578125, 0.025783538818359375, 0.0278167724609375, 0.029850006103515625, 0.03188323974609375, 0.033916473388671875, 0.03594970703125, 0.037982940673828125, 0.04001617431640625, 0.042049407958984375, 0.0440826416015625, 0.046115875244140625, 0.04814910888671875, 0.050182342529296875, 0.052215576171875, 0.054248809814453125, 0.05628204345703125, 0.058315277099609375, 0.0603485107421875, 0.062381744384765625, 0.06441497802734375, 0.06644821166992188, 0.0684814453125]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [69.0, 793.0, 154.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013103475794196129, -0.0005017980583943427, 0.00030675146263092756, 0.0011153009254485369, 0.001923850504681468, 0.0027323998510837555, 0.0035409494303166866, 0.004349499009549618, 0.005158048588782549, 0.00596659816801548, 0.006775147747248411, 0.007583697326481342, 0.008392246440052986, 0.009200796484947205, 0.010009345598518848, 0.010817894712090492, 0.01162644475698471, 0.012434993870556355, 0.013243543915450573, 0.014052093029022217, 0.014860643073916435, 0.015669193118810654, 0.016477741301059723, 0.01728629134595394, 0.01809484139084816, 0.018903391435742378, 0.019711939617991447, 0.020520489662885666, 0.021329039707779884, 0.022137589752674103, 0.022946137934923172, 0.02375468797981739, 0.02456323616206646, 0.025371786206960678, 0.026180334389209747, 0.026988884434103966, 0.027797434478998184, 0.028605982661247253, 0.029414532706141472, 0.03022308275103569, 0.03103163279592991, 0.03184018284082413, 0.032648731023073196, 0.033457282930612564, 0.03426583111286163, 0.0350743792951107, 0.03588293120265007, 0.03669147938489914, 0.03750002756714821, 0.03830857574939728, 0.039117127656936646, 0.039925675839185715, 0.040734224021434784, 0.04154277592897415, 0.04235132411122322, 0.04315987229347229, 0.04396842420101166, 0.04477697238326073, 0.045585524290800095, 0.046394072473049164, 0.04720262065529823, 0.0480111725628376, 0.04881972074508667, 0.04962827265262604, 0.05043682083487511]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 5.0, 6.0, 9.0, 14.0, 16.0, 11.0, 19.0, 30.0, 37.0, 41.0, 46.0, 47.0, 68.0, 53.0, 61.0, 61.0, 59.0, 61.0, 54.0, 44.0, 48.0, 37.0, 38.0, 41.0, 28.0, 22.0, 16.0, 8.0, 9.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002431333065032959, -0.002360250800848007, -0.0022891685366630554, -0.0022180862724781036, -0.002147004008293152, -0.0020759217441082, -0.0020048394799232483, -0.0019337572157382965, -0.0018626749515533447, -0.001791592687368393, -0.0017205104231834412, -0.0016494281589984894, -0.0015783458948135376, -0.0015072636306285858, -0.001436181366443634, -0.0013650991022586823, -0.0012940168380737305, -0.0012229345738887787, -0.001151852309703827, -0.0010807700455188751, -0.0010096877813339233, -0.0009386055171489716, -0.0008675232529640198, -0.000796440988779068, -0.0007253587245941162, -0.0006542764604091644, -0.0005831941962242126, -0.0005121119320392609, -0.0004410296678543091, -0.0003699474036693573, -0.0002988651394844055, -0.00022778287529945374, -0.00015670061111450195, -8.561834692955017e-05, -1.4536082744598389e-05, 5.6546181440353394e-05, 0.00012762844562530518, 0.00019871070981025696, 0.00026979297399520874, 0.0003408752381801605, 0.0004119575023651123, 0.0004830397665500641, 0.0005541220307350159, 0.0006252042949199677, 0.0006962865591049194, 0.0007673688232898712, 0.000838451087474823, 0.0009095333516597748, 0.0009806156158447266, 0.0010516978800296783, 0.0011227801442146301, 0.001193862408399582, 0.0012649446725845337, 0.0013360269367694855, 0.0014071092009544373, 0.001478191465139389, 0.0015492737293243408, 0.0016203559935092926, 0.0016914382576942444, 0.0017625205218791962, 0.001833602786064148, 0.0019046850502490997, 0.0019757673144340515, 0.0020468495786190033, 0.002117931842803955]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 6.0, 3.0, 8.0, 5.0, 14.0, 15.0, 10.0, 27.0, 29.0, 22.0, 23.0, 38.0, 38.0, 44.0, 42.0, 42.0, 51.0, 42.0, 49.0, 50.0, 46.0, 46.0, 51.0, 52.0, 36.0, 42.0, 26.0, 29.0, 20.0, 26.0, 14.0, 13.0, 16.0, 14.0, 5.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.01171875, -4.87109375, -4.73046875, -4.58984375, -4.44921875, -4.30859375, -4.16796875, -4.02734375, -3.88671875, -3.74609375, -3.60546875, -3.46484375, -3.32421875, -3.18359375, -3.04296875, -2.90234375, -2.76171875, -2.62109375, -2.48046875, -2.33984375, -2.19921875, -2.05859375, -1.91796875, -1.77734375, -1.63671875, -1.49609375, -1.35546875, -1.21484375, -1.07421875, -0.93359375, -0.79296875, -0.65234375, -0.51171875, -0.37109375, -0.23046875, -0.08984375, 0.05078125, 0.19140625, 0.33203125, 0.47265625, 0.61328125, 0.75390625, 0.89453125, 1.03515625, 1.17578125, 1.31640625, 1.45703125, 1.59765625, 1.73828125, 1.87890625, 2.01953125, 2.16015625, 2.30078125, 2.44140625, 2.58203125, 2.72265625, 2.86328125, 3.00390625, 3.14453125, 3.28515625, 3.42578125, 3.56640625, 3.70703125, 3.84765625, 3.98828125]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 5.0, 2.0, 11.0, 7.0, 17.0, 31.0, 37.0, 57.0, 84.0, 84.0, 148.0, 197.0, 253.0, 399.0, 557.0, 962.0, 1449.0, 2516.0, 4684.0, 9370.0, 18674.0, 38988.0, 83114.0, 180966.0, 305364.0, 210498.0, 99059.0, 45533.0, 21886.0, 10616.0, 5347.0, 2957.0, 1646.0, 956.0, 637.0, 427.0, 329.0, 199.0, 131.0, 108.0, 84.0, 49.0, 40.0, 27.0, 13.0, 14.0, 10.0, 9.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-3.28125, -3.186431884765625, -3.09161376953125, -2.996795654296875, -2.9019775390625, -2.807159423828125, -2.71234130859375, -2.617523193359375, -2.522705078125, -2.427886962890625, -2.33306884765625, -2.238250732421875, -2.1434326171875, -2.048614501953125, -1.95379638671875, -1.858978271484375, -1.76416015625, -1.669342041015625, -1.57452392578125, -1.479705810546875, -1.3848876953125, -1.290069580078125, -1.19525146484375, -1.100433349609375, -1.005615234375, -0.910797119140625, -0.81597900390625, -0.721160888671875, -0.6263427734375, -0.531524658203125, -0.43670654296875, -0.341888427734375, -0.2470703125, -0.152252197265625, -0.05743408203125, 0.037384033203125, 0.1322021484375, 0.227020263671875, 0.32183837890625, 0.416656494140625, 0.511474609375, 0.606292724609375, 0.70111083984375, 0.795928955078125, 0.8907470703125, 0.985565185546875, 1.08038330078125, 1.175201416015625, 1.27001953125, 1.364837646484375, 1.45965576171875, 1.554473876953125, 1.6492919921875, 1.744110107421875, 1.83892822265625, 1.933746337890625, 2.028564453125, 2.123382568359375, 2.21820068359375, 2.313018798828125, 2.4078369140625, 2.502655029296875, 2.59747314453125, 2.692291259765625, 2.787109375]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 10.0, 6.0, 9.0, 21.0, 13.0, 22.0, 24.0, 23.0, 31.0, 33.0, 46.0, 64.0, 65.0, 87.0, 182.0, 1555.0, 307.0, 118.0, 63.0, 57.0, 56.0, 43.0, 31.0, 23.0, 31.0, 22.0, 24.0, 12.0, 10.0, 9.0, 6.0, 13.0, 5.0, 5.0, 6.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-17.1875, -16.678466796875, -16.16943359375, -15.660400390625, -15.1513671875, -14.642333984375, -14.13330078125, -13.624267578125, -13.115234375, -12.606201171875, -12.09716796875, -11.588134765625, -11.0791015625, -10.570068359375, -10.06103515625, -9.552001953125, -9.04296875, -8.533935546875, -8.02490234375, -7.515869140625, -7.0068359375, -6.497802734375, -5.98876953125, -5.479736328125, -4.970703125, -4.461669921875, -3.95263671875, -3.443603515625, -2.9345703125, -2.425537109375, -1.91650390625, -1.407470703125, -0.8984375, -0.389404296875, 0.11962890625, 0.628662109375, 1.1376953125, 1.646728515625, 2.15576171875, 2.664794921875, 3.173828125, 3.682861328125, 4.19189453125, 4.700927734375, 5.2099609375, 5.718994140625, 6.22802734375, 6.737060546875, 7.24609375, 7.755126953125, 8.26416015625, 8.773193359375, 9.2822265625, 9.791259765625, 10.30029296875, 10.809326171875, 11.318359375, 11.827392578125, 12.33642578125, 12.845458984375, 13.3544921875, 13.863525390625, 14.37255859375, 14.881591796875, 15.390625]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 6.0, 2.0, 3.0, 4.0, 8.0, 7.0, 9.0, 13.0, 16.0, 28.0, 36.0, 50.0, 67.0, 80.0, 120.0, 189.0, 281.0, 517.0, 1634.0, 317384.0, 2820610.0, 3063.0, 563.0, 343.0, 209.0, 140.0, 83.0, 68.0, 44.0, 37.0, 31.0, 22.0, 15.0, 8.0, 6.0, 2.0, 4.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0], "bins": [-45.21875, -43.853515625, -42.48828125, -41.123046875, -39.7578125, -38.392578125, -37.02734375, -35.662109375, -34.296875, -32.931640625, -31.56640625, -30.201171875, -28.8359375, -27.470703125, -26.10546875, -24.740234375, -23.375, -22.009765625, -20.64453125, -19.279296875, -17.9140625, -16.548828125, -15.18359375, -13.818359375, -12.453125, -11.087890625, -9.72265625, -8.357421875, -6.9921875, -5.626953125, -4.26171875, -2.896484375, -1.53125, -0.166015625, 1.19921875, 2.564453125, 3.9296875, 5.294921875, 6.66015625, 8.025390625, 9.390625, 10.755859375, 12.12109375, 13.486328125, 14.8515625, 16.216796875, 17.58203125, 18.947265625, 20.3125, 21.677734375, 23.04296875, 24.408203125, 25.7734375, 27.138671875, 28.50390625, 29.869140625, 31.234375, 32.599609375, 33.96484375, 35.330078125, 36.6953125, 38.060546875, 39.42578125, 40.791015625, 42.15625]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 65.0, 400.0, 449.0, 92.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.653289794921875, -14.306504249572754, -11.959718704223633, -9.612934112548828, -7.266148567199707, -4.919363021850586, -2.5725784301757812, -0.22579193115234375, 2.120992660522461, 4.467778205871582, 6.814563274383545, 9.161348342895508, 11.508133888244629, 13.85491943359375, 16.201704025268555, 18.548490524291992, 20.895275115966797, 23.2420597076416, 25.58884620666504, 27.935630798339844, 30.28241729736328, 32.62920379638672, 34.97598648071289, 37.32277297973633, 39.6695556640625, 42.01634216308594, 44.36312484741211, 46.70991134643555, 49.056697845458984, 51.403480529785156, 53.750267028808594, 56.09705352783203, 58.44384002685547, 60.790626525878906, 63.13740921020508, 65.48419189453125, 67.83097839355469, 70.17776489257812, 72.52455139160156, 74.871337890625, 77.21812438964844, 79.56491088867188, 81.91169738769531, 84.25848388671875, 86.60526275634766, 88.9520492553711, 91.29883575439453, 93.64562225341797, 95.99240112304688, 98.33918762207031, 100.68597412109375, 103.03276062011719, 105.3795394897461, 107.72632598876953, 110.07311248779297, 112.4198989868164, 114.76668548583984, 117.11347198486328, 119.46025848388672, 121.80703735351562, 124.15382385253906, 126.5006103515625, 128.84739685058594, 131.19418334960938, 133.5409698486328]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 1.0, 5.0, 2.0, 4.0, 7.0, 8.0, 9.0, 5.0, 13.0, 9.0, 12.0, 20.0, 19.0, 27.0, 33.0, 32.0, 28.0, 36.0, 36.0, 41.0, 40.0, 38.0, 36.0, 46.0, 37.0, 40.0, 42.0, 42.0, 38.0, 36.0, 42.0, 28.0, 24.0, 27.0, 22.0, 26.0, 23.0, 12.0, 10.0, 4.0, 16.0, 9.0, 5.0, 7.0, 5.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.362545013427734, -33.20852279663086, -32.05449676513672, -30.900474548339844, -29.746450424194336, -28.592426300048828, -27.438404083251953, -26.284379959106445, -25.130355834960938, -23.97633171081543, -22.822307586669922, -21.668285369873047, -20.51426124572754, -19.36023712158203, -18.206214904785156, -17.05219078063965, -15.89816665649414, -14.744142532348633, -13.590119361877441, -12.43609619140625, -11.282072067260742, -10.128047943115234, -8.974024772644043, -7.820001602172852, -6.665977478027344, -5.511953830718994, -4.3579301834106445, -3.203906536102295, -2.0498828887939453, -0.8958592414855957, 0.2581644058227539, 1.4121875762939453, 2.5662078857421875, 3.720231533050537, 4.874255180358887, 6.028278827667236, 7.182302474975586, 8.336326599121094, 9.490349769592285, 10.644372940063477, 11.798397064208984, 12.952421188354492, 14.106444358825684, 15.260467529296875, 16.414491653442383, 17.56851577758789, 18.722537994384766, 19.876562118530273, 21.03058624267578, 22.18461036682129, 23.338634490966797, 24.492656707763672, 25.64668083190918, 26.800704956054688, 27.954727172851562, 29.10875129699707, 30.262775421142578, 31.416799545288086, 32.570823669433594, 33.72484588623047, 34.878868103027344, 36.032894134521484, 37.18691635131836, 38.3409423828125, 39.494964599609375]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 2.0, 1.0, 4.0, 3.0, 5.0, 8.0, 10.0, 13.0, 19.0, 23.0, 22.0, 25.0, 31.0, 27.0, 34.0, 44.0, 45.0, 27.0, 36.0, 43.0, 59.0, 43.0, 46.0, 41.0, 48.0, 49.0, 30.0, 36.0, 31.0, 41.0, 32.0, 22.0, 25.0, 14.0, 14.0, 10.0, 19.0, 10.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-4.953125, -4.8131103515625, -4.673095703125, -4.5330810546875, -4.39306640625, -4.2530517578125, -4.113037109375, -3.9730224609375, -3.8330078125, -3.6929931640625, -3.552978515625, -3.4129638671875, -3.27294921875, -3.1329345703125, -2.992919921875, -2.8529052734375, -2.712890625, -2.5728759765625, -2.432861328125, -2.2928466796875, -2.15283203125, -2.0128173828125, -1.872802734375, -1.7327880859375, -1.5927734375, -1.4527587890625, -1.312744140625, -1.1727294921875, -1.03271484375, -0.8927001953125, -0.752685546875, -0.6126708984375, -0.47265625, -0.3326416015625, -0.192626953125, -0.0526123046875, 0.08740234375, 0.2274169921875, 0.367431640625, 0.5074462890625, 0.6474609375, 0.7874755859375, 0.927490234375, 1.0675048828125, 1.20751953125, 1.3475341796875, 1.487548828125, 1.6275634765625, 1.767578125, 1.9075927734375, 2.047607421875, 2.1876220703125, 2.32763671875, 2.4676513671875, 2.607666015625, 2.7476806640625, 2.8876953125, 3.0277099609375, 3.167724609375, 3.3077392578125, 3.44775390625, 3.5877685546875, 3.727783203125, 3.8677978515625, 4.0078125]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 2.0, 4.0, 1.0, 7.0, 6.0, 6.0, 11.0, 11.0, 17.0, 21.0, 16.0, 33.0, 28.0, 46.0, 44.0, 76.0, 178.0, 458.0, 1514.0, 6652.0, 50012.0, 1611722.0, 2422256.0, 88445.0, 9442.0, 2089.0, 606.0, 222.0, 90.0, 59.0, 44.0, 33.0, 19.0, 29.0, 16.0, 14.0, 16.0, 10.0, 7.0, 10.0, 6.0, 3.0, 1.0, 4.0, 0.0, 0.0, 4.0, 0.0, 1.0, 1.0, 1.0], "bins": [-16.140625, -15.6806640625, -15.220703125, -14.7607421875, -14.30078125, -13.8408203125, -13.380859375, -12.9208984375, -12.4609375, -12.0009765625, -11.541015625, -11.0810546875, -10.62109375, -10.1611328125, -9.701171875, -9.2412109375, -8.78125, -8.3212890625, -7.861328125, -7.4013671875, -6.94140625, -6.4814453125, -6.021484375, -5.5615234375, -5.1015625, -4.6416015625, -4.181640625, -3.7216796875, -3.26171875, -2.8017578125, -2.341796875, -1.8818359375, -1.421875, -0.9619140625, -0.501953125, -0.0419921875, 0.41796875, 0.8779296875, 1.337890625, 1.7978515625, 2.2578125, 2.7177734375, 3.177734375, 3.6376953125, 4.09765625, 4.5576171875, 5.017578125, 5.4775390625, 5.9375, 6.3974609375, 6.857421875, 7.3173828125, 7.77734375, 8.2373046875, 8.697265625, 9.1572265625, 9.6171875, 10.0771484375, 10.537109375, 10.9970703125, 11.45703125, 11.9169921875, 12.376953125, 12.8369140625, 13.296875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 9.0, 6.0, 11.0, 10.0, 22.0, 50.0, 49.0, 107.0, 134.0, 186.0, 281.0, 401.0, 569.0, 603.0, 496.0, 407.0, 245.0, 160.0, 108.0, 74.0, 48.0, 37.0, 27.0, 10.0, 13.0, 3.0, 6.0, 4.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-14.203125, -13.8505859375, -13.498046875, -13.1455078125, -12.79296875, -12.4404296875, -12.087890625, -11.7353515625, -11.3828125, -11.0302734375, -10.677734375, -10.3251953125, -9.97265625, -9.6201171875, -9.267578125, -8.9150390625, -8.5625, -8.2099609375, -7.857421875, -7.5048828125, -7.15234375, -6.7998046875, -6.447265625, -6.0947265625, -5.7421875, -5.3896484375, -5.037109375, -4.6845703125, -4.33203125, -3.9794921875, -3.626953125, -3.2744140625, -2.921875, -2.5693359375, -2.216796875, -1.8642578125, -1.51171875, -1.1591796875, -0.806640625, -0.4541015625, -0.1015625, 0.2509765625, 0.603515625, 0.9560546875, 1.30859375, 1.6611328125, 2.013671875, 2.3662109375, 2.71875, 3.0712890625, 3.423828125, 3.7763671875, 4.12890625, 4.4814453125, 4.833984375, 5.1865234375, 5.5390625, 5.8916015625, 6.244140625, 6.5966796875, 6.94921875, 7.3017578125, 7.654296875, 8.0068359375, 8.359375]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 5.0, 8.0, 3.0, 6.0, 13.0, 27.0, 33.0, 52.0, 73.0, 115.0, 150.0, 269.0, 540.0, 1593.0, 11425.0, 289138.0, 3694171.0, 185370.0, 8789.0, 1328.0, 454.0, 256.0, 161.0, 106.0, 59.0, 57.0, 30.0, 19.0, 19.0, 9.0, 5.0, 4.0, 2.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.328125, -17.578369140625, -16.82861328125, -16.078857421875, -15.3291015625, -14.579345703125, -13.82958984375, -13.079833984375, -12.330078125, -11.580322265625, -10.83056640625, -10.080810546875, -9.3310546875, -8.581298828125, -7.83154296875, -7.081787109375, -6.33203125, -5.582275390625, -4.83251953125, -4.082763671875, -3.3330078125, -2.583251953125, -1.83349609375, -1.083740234375, -0.333984375, 0.415771484375, 1.16552734375, 1.915283203125, 2.6650390625, 3.414794921875, 4.16455078125, 4.914306640625, 5.6640625, 6.413818359375, 7.16357421875, 7.913330078125, 8.6630859375, 9.412841796875, 10.16259765625, 10.912353515625, 11.662109375, 12.411865234375, 13.16162109375, 13.911376953125, 14.6611328125, 15.410888671875, 16.16064453125, 16.910400390625, 17.66015625, 18.409912109375, 19.15966796875, 19.909423828125, 20.6591796875, 21.408935546875, 22.15869140625, 22.908447265625, 23.658203125, 24.407958984375, 25.15771484375, 25.907470703125, 26.6572265625, 27.406982421875, 28.15673828125, 28.906494140625, 29.65625]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 7.0, 15.0, 31.0, 76.0, 167.0, 235.0, 215.0, 160.0, 62.0, 30.0, 13.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.11603355407715, -20.50728416442871, -17.898536682128906, -15.289787292480469, -12.681038856506348, -10.072290420532227, -7.463541030883789, -4.854793548583984, -2.246044158935547, 0.3627045154571533, 2.9714531898498535, 5.580202102661133, 8.188950538635254, 10.797698974609375, 13.406448364257812, 16.015195846557617, 18.623945236206055, 21.232694625854492, 23.841442108154297, 26.450191497802734, 29.058940887451172, 31.667688369750977, 34.27643585205078, 36.88518524169922, 39.493934631347656, 42.102684020996094, 44.71143341064453, 47.32018280029297, 49.92892837524414, 52.53767776489258, 55.146427154541016, 57.75517272949219, 60.363929748535156, 62.972679138183594, 65.58142852783203, 68.19017791748047, 70.7989273071289, 73.40766906738281, 76.01641845703125, 78.62516784667969, 81.23391723632812, 83.84266662597656, 86.451416015625, 89.06016540527344, 91.66891479492188, 94.27766418457031, 96.88641357421875, 99.49515533447266, 102.10391235351562, 104.71266174316406, 107.3214111328125, 109.93016052246094, 112.53890991210938, 115.14765930175781, 117.75640869140625, 120.36515045166016, 122.9738998413086, 125.58264923095703, 128.19139099121094, 130.80014038085938, 133.4088897705078, 136.01763916015625, 138.6263885498047, 141.23513793945312, 143.84388732910156]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 4.0, 7.0, 9.0, 8.0, 10.0, 16.0, 13.0, 20.0, 15.0, 13.0, 17.0, 24.0, 19.0, 28.0, 36.0, 33.0, 35.0, 43.0, 32.0, 34.0, 51.0, 30.0, 44.0, 38.0, 30.0, 32.0, 30.0, 36.0, 24.0, 25.0, 28.0, 27.0, 18.0, 25.0, 22.0, 22.0, 25.0, 8.0, 7.0, 16.0, 9.0, 5.0, 7.0, 4.0, 5.0, 9.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0], "bins": [-25.119091033935547, -24.333511352539062, -23.547929763793945, -22.76235008239746, -21.976768493652344, -21.19118881225586, -20.405609130859375, -19.620027542114258, -18.83444595336914, -18.048866271972656, -17.26328468322754, -16.477705001831055, -15.692123413085938, -14.906543731689453, -14.120963096618652, -13.335382461547852, -12.549802780151367, -11.764222145080566, -10.978641510009766, -10.193061828613281, -9.407480239868164, -8.62190055847168, -7.836319923400879, -7.050739288330078, -6.265158653259277, -5.479578018188477, -4.693997383117676, -3.908417224884033, -3.1228365898132324, -2.3372559547424316, -1.551675796508789, -0.7660951614379883, 0.0194854736328125, 0.8050659894943237, 1.590646505355835, 2.3762269020080566, 3.1618075370788574, 3.947388172149658, 4.732968330383301, 5.518548965454102, 6.304129600524902, 7.089710235595703, 7.875290870666504, 8.660871505737305, 9.446451187133789, 10.232032775878906, 11.01761245727539, 11.803193092346191, 12.588773727416992, 13.374354362487793, 14.159934997558594, 14.945514678955078, 15.731096267700195, 16.51667594909668, 17.302257537841797, 18.08783721923828, 18.873416900634766, 19.65899658203125, 20.444578170776367, 21.23015785217285, 22.01573944091797, 22.801319122314453, 23.586898803710938, 24.372480392456055, 25.158061981201172]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 6.0, 10.0, 14.0, 15.0, 17.0, 28.0, 31.0, 28.0, 26.0, 31.0, 38.0, 40.0, 26.0, 35.0, 43.0, 56.0, 38.0, 42.0, 37.0, 45.0, 46.0, 34.0, 40.0, 38.0, 29.0, 36.0, 18.0, 22.0, 26.0, 17.0, 11.0, 9.0, 7.0, 15.0, 5.0, 8.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.983917236328125, -3.85845947265625, -3.733001708984375, -3.6075439453125, -3.482086181640625, -3.35662841796875, -3.231170654296875, -3.105712890625, -2.980255126953125, -2.85479736328125, -2.729339599609375, -2.6038818359375, -2.478424072265625, -2.35296630859375, -2.227508544921875, -2.10205078125, -1.976593017578125, -1.85113525390625, -1.725677490234375, -1.6002197265625, -1.474761962890625, -1.34930419921875, -1.223846435546875, -1.098388671875, -0.972930908203125, -0.84747314453125, -0.722015380859375, -0.5965576171875, -0.471099853515625, -0.34564208984375, -0.220184326171875, -0.0947265625, 0.030731201171875, 0.15618896484375, 0.281646728515625, 0.4071044921875, 0.532562255859375, 0.65802001953125, 0.783477783203125, 0.908935546875, 1.034393310546875, 1.15985107421875, 1.285308837890625, 1.4107666015625, 1.536224365234375, 1.66168212890625, 1.787139892578125, 1.91259765625, 2.038055419921875, 2.16351318359375, 2.288970947265625, 2.4144287109375, 2.539886474609375, 2.66534423828125, 2.790802001953125, 2.916259765625, 3.041717529296875, 3.16717529296875, 3.292633056640625, 3.4180908203125, 3.543548583984375, 3.66900634765625, 3.794464111328125, 3.919921875]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 5.0, 9.0, 8.0, 13.0, 33.0, 37.0, 54.0, 82.0, 110.0, 215.0, 313.0, 448.0, 854.0, 1369.0, 2087.0, 3243.0, 5507.0, 9021.0, 15154.0, 25744.0, 44820.0, 83369.0, 167665.0, 286007.0, 189342.0, 93404.0, 49623.0, 28076.0, 16339.0, 9889.0, 5957.0, 3704.0, 2298.0, 1403.0, 873.0, 545.0, 310.0, 226.0, 143.0, 90.0, 60.0, 49.0, 20.0, 17.0, 11.0, 4.0, 3.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.55810546875, -0.5409774780273438, -0.5238494873046875, -0.5067214965820312, -0.489593505859375, -0.47246551513671875, -0.4553375244140625, -0.43820953369140625, -0.42108154296875, -0.40395355224609375, -0.3868255615234375, -0.36969757080078125, -0.352569580078125, -0.33544158935546875, -0.3183135986328125, -0.30118560791015625, -0.2840576171875, -0.26692962646484375, -0.2498016357421875, -0.23267364501953125, -0.215545654296875, -0.19841766357421875, -0.1812896728515625, -0.16416168212890625, -0.14703369140625, -0.12990570068359375, -0.1127777099609375, -0.09564971923828125, -0.078521728515625, -0.06139373779296875, -0.0442657470703125, -0.02713775634765625, -0.010009765625, 0.00711822509765625, 0.0242462158203125, 0.04137420654296875, 0.058502197265625, 0.07563018798828125, 0.0927581787109375, 0.10988616943359375, 0.12701416015625, 0.14414215087890625, 0.1612701416015625, 0.17839813232421875, 0.195526123046875, 0.21265411376953125, 0.2297821044921875, 0.24691009521484375, 0.2640380859375, 0.28116607666015625, 0.2982940673828125, 0.31542205810546875, 0.332550048828125, 0.34967803955078125, 0.3668060302734375, 0.38393402099609375, 0.40106201171875, 0.41819000244140625, 0.4353179931640625, 0.45244598388671875, 0.469573974609375, 0.48670196533203125, 0.5038299560546875, 0.5209579467773438, 0.5380859375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 3.0, 2.0, 7.0, 7.0, 11.0, 6.0, 12.0, 13.0, 15.0, 12.0, 12.0, 24.0, 30.0, 22.0, 49.0, 40.0, 43.0, 40.0, 35.0, 56.0, 33.0, 1071.0, 46.0, 44.0, 50.0, 26.0, 44.0, 39.0, 42.0, 30.0, 38.0, 25.0, 24.0, 14.0, 14.0, 9.0, 8.0, 11.0, 3.0, 6.0, 4.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.431640625, -2.348419189453125, -2.26519775390625, -2.181976318359375, -2.0987548828125, -2.015533447265625, -1.93231201171875, -1.849090576171875, -1.765869140625, -1.682647705078125, -1.59942626953125, -1.516204833984375, -1.4329833984375, -1.349761962890625, -1.26654052734375, -1.183319091796875, -1.10009765625, -1.016876220703125, -0.93365478515625, -0.850433349609375, -0.7672119140625, -0.683990478515625, -0.60076904296875, -0.517547607421875, -0.434326171875, -0.351104736328125, -0.26788330078125, -0.184661865234375, -0.1014404296875, -0.018218994140625, 0.06500244140625, 0.148223876953125, 0.2314453125, 0.314666748046875, 0.39788818359375, 0.481109619140625, 0.5643310546875, 0.647552490234375, 0.73077392578125, 0.813995361328125, 0.897216796875, 0.980438232421875, 1.06365966796875, 1.146881103515625, 1.2301025390625, 1.313323974609375, 1.39654541015625, 1.479766845703125, 1.56298828125, 1.646209716796875, 1.72943115234375, 1.812652587890625, 1.8958740234375, 1.979095458984375, 2.06231689453125, 2.145538330078125, 2.228759765625, 2.311981201171875, 2.39520263671875, 2.478424072265625, 2.5616455078125, 2.644866943359375, 2.72808837890625, 2.811309814453125, 2.89453125]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 9.0, 9.0, 16.0, 24.0, 28.0, 53.0, 83.0, 140.0, 201.0, 304.0, 504.0, 762.0, 1255.0, 2037.0, 3181.0, 5202.0, 8508.0, 14120.0, 23432.0, 39520.0, 69076.0, 125876.0, 266445.0, 1215506.0, 138029.0, 76250.0, 42690.0, 24774.0, 15023.0, 9147.0, 5512.0, 3502.0, 2182.0, 1395.0, 817.0, 547.0, 347.0, 203.0, 154.0, 90.0, 65.0, 42.0, 23.0, 19.0, 11.0, 10.0, 4.0, 5.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.393310546875, -0.3814201354980469, -0.36952972412109375, -0.3576393127441406, -0.3457489013671875, -0.3338584899902344, -0.32196807861328125, -0.3100776672363281, -0.298187255859375, -0.2862968444824219, -0.27440643310546875, -0.2625160217285156, -0.2506256103515625, -0.23873519897460938, -0.22684478759765625, -0.21495437622070312, -0.20306396484375, -0.19117355346679688, -0.17928314208984375, -0.16739273071289062, -0.1555023193359375, -0.14361190795898438, -0.13172149658203125, -0.11983108520507812, -0.107940673828125, -0.09605026245117188, -0.08415985107421875, -0.07226943969726562, -0.0603790283203125, -0.048488616943359375, -0.03659820556640625, -0.024707794189453125, -0.0128173828125, -0.000926971435546875, 0.01096343994140625, 0.022853851318359375, 0.0347442626953125, 0.046634674072265625, 0.05852508544921875, 0.07041549682617188, 0.082305908203125, 0.09419631958007812, 0.10608673095703125, 0.11797714233398438, 0.1298675537109375, 0.14175796508789062, 0.15364837646484375, 0.16553878784179688, 0.17742919921875, 0.18931961059570312, 0.20121002197265625, 0.21310043334960938, 0.2249908447265625, 0.23688125610351562, 0.24877166748046875, 0.2606620788574219, 0.272552490234375, 0.2844429016113281, 0.29633331298828125, 0.3082237243652344, 0.3201141357421875, 0.3320045471191406, 0.34389495849609375, 0.3557853698730469, 0.36767578125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 4.0, 1.0, 3.0, 3.0, 4.0, 6.0, 4.0, 10.0, 8.0, 10.0, 21.0, 17.0, 23.0, 29.0, 37.0, 38.0, 55.0, 60.0, 105.0, 109.0, 103.0, 69.0, 62.0, 35.0, 42.0, 32.0, 27.0, 16.0, 14.0, 9.0, 8.0, 6.0, 4.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.0037288665771484375, -0.0036171376705169678, -0.003505408763885498, -0.0033936798572540283, -0.0032819509506225586, -0.003170222043991089, -0.003058493137359619, -0.0029467642307281494, -0.0028350353240966797, -0.00272330641746521, -0.0026115775108337402, -0.0024998486042022705, -0.0023881196975708008, -0.002276390790939331, -0.0021646618843078613, -0.0020529329776763916, -0.0019412040710449219, -0.0018294751644134521, -0.0017177462577819824, -0.0016060173511505127, -0.001494288444519043, -0.0013825595378875732, -0.0012708306312561035, -0.0011591017246246338, -0.001047372817993164, -0.0009356439113616943, -0.0008239150047302246, -0.0007121860980987549, -0.0006004571914672852, -0.0004887282848358154, -0.0003769993782043457, -0.000265270471572876, -0.00015354156494140625, -4.1812658309936523e-05, 6.99162483215332e-05, 0.00018164515495300293, 0.00029337406158447266, 0.0004051029682159424, 0.0005168318748474121, 0.0006285607814788818, 0.0007402896881103516, 0.0008520185947418213, 0.000963747501373291, 0.0010754764080047607, 0.0011872053146362305, 0.0012989342212677002, 0.00141066312789917, 0.0015223920345306396, 0.0016341209411621094, 0.001745849847793579, 0.0018575787544250488, 0.0019693076610565186, 0.0020810365676879883, 0.002192765474319458, 0.0023044943809509277, 0.0024162232875823975, 0.002527952194213867, 0.002639681100845337, 0.0027514100074768066, 0.0028631389141082764, 0.002974867820739746, 0.003086596727371216, 0.0031983256340026855, 0.0033100545406341553, 0.003421783447265625]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 4.0, 2.0, 5.0, 3.0, 6.0, 6.0, 8.0, 6.0, 8.0, 15.0, 17.0, 28.0, 35.0, 53.0, 62.0, 99.0, 153.0, 246.0, 418.0, 1450.0, 263286.0, 779062.0, 2349.0, 456.0, 249.0, 158.0, 105.0, 69.0, 45.0, 32.0, 31.0, 20.0, 12.0, 10.0, 10.0, 8.0, 7.0, 5.0, 4.0, 3.0, 2.0, 6.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.06658935546875, -0.06444644927978516, -0.06230354309082031, -0.06016063690185547, -0.058017730712890625, -0.05587482452392578, -0.05373191833496094, -0.051589012145996094, -0.04944610595703125, -0.047303199768066406, -0.04516029357910156, -0.04301738739013672, -0.040874481201171875, -0.03873157501220703, -0.03658866882324219, -0.034445762634277344, -0.0323028564453125, -0.030159950256347656, -0.028017044067382812, -0.02587413787841797, -0.023731231689453125, -0.02158832550048828, -0.019445419311523438, -0.017302513122558594, -0.01515960693359375, -0.013016700744628906, -0.010873794555664062, -0.008730888366699219, -0.006587982177734375, -0.004445075988769531, -0.0023021697998046875, -0.00015926361083984375, 0.001983642578125, 0.004126548767089844, 0.0062694549560546875, 0.008412361145019531, 0.010555267333984375, 0.012698173522949219, 0.014841079711914062, 0.016983985900878906, 0.01912689208984375, 0.021269798278808594, 0.023412704467773438, 0.02555561065673828, 0.027698516845703125, 0.02984142303466797, 0.03198432922363281, 0.034127235412597656, 0.0362701416015625, 0.038413047790527344, 0.04055595397949219, 0.04269886016845703, 0.044841766357421875, 0.04698467254638672, 0.04912757873535156, 0.051270484924316406, 0.05341339111328125, 0.055556297302246094, 0.05769920349121094, 0.05984210968017578, 0.061985015869140625, 0.06412792205810547, 0.06627082824707031, 0.06841373443603516, 0.070556640625]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 25.0, 941.0, 50.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05297432467341423, -0.0520046204328537, -0.05103491619229317, -0.050065211951732635, -0.0490955114364624, -0.04812580719590187, -0.04715610295534134, -0.04618639871478081, -0.045216694474220276, -0.044246990233659744, -0.04327728599309921, -0.04230758175253868, -0.04133787751197815, -0.040368176996707916, -0.039398472756147385, -0.03842876851558685, -0.03745906427502632, -0.03648936003446579, -0.03551965579390526, -0.03454995155334473, -0.03358025103807449, -0.03261054679751396, -0.03164084255695343, -0.0306711383163929, -0.029701434075832367, -0.028731729835271835, -0.027762025594711304, -0.02679232321679592, -0.02582261897623539, -0.024852914735674858, -0.023883212357759476, -0.022913508117198944, -0.021943803876638412, -0.02097409963607788, -0.02000439539551735, -0.019034693017601967, -0.018064988777041435, -0.017095284536480904, -0.01612558215856552, -0.01515587791800499, -0.014186174608767033, -0.013216471299529076, -0.012246767058968544, -0.011277062818408012, -0.010307359509170055, -0.009337656199932098, -0.008367951959371567, -0.0073982481844723225, -0.006428544409573078, -0.005458840634673834, -0.0044891368597745895, -0.0035194330848753452, -0.002549729309976101, -0.0015800255350768566, -0.0006103217601776123, 0.000359382014721632, 0.0013290857896208763, 0.0022987895645201206, 0.003268493339419365, 0.004238197114318609, 0.0052079008892178535, 0.006177604664117098, 0.007147308439016342, 0.008117012679576874, 0.00908671598881483]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 1.0, 6.0, 11.0, 10.0, 11.0, 5.0, 23.0, 23.0, 30.0, 39.0, 59.0, 63.0, 61.0, 60.0, 50.0, 74.0, 57.0, 58.0, 35.0, 65.0, 38.0, 57.0, 34.0, 30.0, 24.0, 26.0, 11.0, 14.0, 10.0, 13.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0023848414421081543, -0.002305316738784313, -0.002225792035460472, -0.002146267332136631, -0.00206674262881279, -0.001987217925488949, -0.0019076932221651077, -0.0018281685188412666, -0.0017486438155174255, -0.0016691191121935844, -0.0015895944088697433, -0.0015100697055459023, -0.0014305450022220612, -0.00135102029889822, -0.001271495595574379, -0.0011919708922505379, -0.0011124461889266968, -0.0010329214856028557, -0.0009533967822790146, -0.0008738720789551735, -0.0007943473756313324, -0.0007148226723074913, -0.0006352979689836502, -0.0005557732656598091, -0.000476248562335968, -0.0003967238590121269, -0.00031719915568828583, -0.00023767445236444473, -0.00015814974904060364, -7.862504571676254e-05, 8.996576070785522e-07, 8.042436093091965e-05, 0.00015994906425476074, 0.00023947376757860184, 0.00031899847090244293, 0.000398523174226284, 0.0004780478775501251, 0.0005575725808739662, 0.0006370972841978073, 0.0007166219875216484, 0.0007961466908454895, 0.0008756713941693306, 0.0009551960974931717, 0.0010347208008170128, 0.0011142455041408539, 0.001193770207464695, 0.001273294910788536, 0.0013528196141123772, 0.0014323443174362183, 0.0015118690207600594, 0.0015913937240839005, 0.0016709184274077415, 0.0017504431307315826, 0.0018299678340554237, 0.0019094925373792648, 0.001989017240703106, 0.002068541944026947, 0.002148066647350788, 0.002227591350674629, 0.0023071160539984703, 0.0023866407573223114, 0.0024661654606461525, 0.0025456901639699936, 0.0026252148672938347, 0.0027047395706176758]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 3.0, 1.0, 2.0, 3.0, 6.0, 7.0, 7.0, 6.0, 10.0, 14.0, 15.0, 17.0, 28.0, 31.0, 28.0, 26.0, 31.0, 38.0, 40.0, 26.0, 35.0, 43.0, 56.0, 38.0, 42.0, 37.0, 45.0, 46.0, 34.0, 40.0, 38.0, 29.0, 36.0, 18.0, 22.0, 26.0, 17.0, 11.0, 9.0, 7.0, 15.0, 5.0, 8.0, 3.0, 5.0, 2.0, 4.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.109375, -3.983917236328125, -3.85845947265625, -3.733001708984375, -3.6075439453125, -3.482086181640625, -3.35662841796875, -3.231170654296875, -3.105712890625, -2.980255126953125, -2.85479736328125, -2.729339599609375, -2.6038818359375, -2.478424072265625, -2.35296630859375, -2.227508544921875, -2.10205078125, -1.976593017578125, -1.85113525390625, -1.725677490234375, -1.6002197265625, -1.474761962890625, -1.34930419921875, -1.223846435546875, -1.098388671875, -0.972930908203125, -0.84747314453125, -0.722015380859375, -0.5965576171875, -0.471099853515625, -0.34564208984375, -0.220184326171875, -0.0947265625, 0.030731201171875, 0.15618896484375, 0.281646728515625, 0.4071044921875, 0.532562255859375, 0.65802001953125, 0.783477783203125, 0.908935546875, 1.034393310546875, 1.15985107421875, 1.285308837890625, 1.4107666015625, 1.536224365234375, 1.66168212890625, 1.787139892578125, 1.91259765625, 2.038055419921875, 2.16351318359375, 2.288970947265625, 2.4144287109375, 2.539886474609375, 2.66534423828125, 2.790802001953125, 2.916259765625, 3.041717529296875, 3.16717529296875, 3.292633056640625, 3.4180908203125, 3.543548583984375, 3.66900634765625, 3.794464111328125, 3.919921875]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 7.0, 3.0, 5.0, 13.0, 28.0, 37.0, 51.0, 110.0, 193.0, 352.0, 695.0, 1412.0, 3259.0, 7638.0, 18124.0, 45359.0, 113146.0, 278578.0, 334380.0, 145848.0, 58487.0, 23770.0, 9444.0, 4056.0, 1751.0, 865.0, 425.0, 209.0, 128.0, 74.0, 34.0, 29.0, 17.0, 12.0, 11.0, 3.0, 3.0, 5.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.259765625, -3.130096435546875, -3.00042724609375, -2.870758056640625, -2.7410888671875, -2.611419677734375, -2.48175048828125, -2.352081298828125, -2.222412109375, -2.092742919921875, -1.96307373046875, -1.833404541015625, -1.7037353515625, -1.574066162109375, -1.44439697265625, -1.314727783203125, -1.18505859375, -1.055389404296875, -0.92572021484375, -0.796051025390625, -0.6663818359375, -0.536712646484375, -0.40704345703125, -0.277374267578125, -0.147705078125, -0.018035888671875, 0.11163330078125, 0.241302490234375, 0.3709716796875, 0.500640869140625, 0.63031005859375, 0.759979248046875, 0.8896484375, 1.019317626953125, 1.14898681640625, 1.278656005859375, 1.4083251953125, 1.537994384765625, 1.66766357421875, 1.797332763671875, 1.927001953125, 2.056671142578125, 2.18634033203125, 2.316009521484375, 2.4456787109375, 2.575347900390625, 2.70501708984375, 2.834686279296875, 2.96435546875, 3.094024658203125, 3.22369384765625, 3.353363037109375, 3.4830322265625, 3.612701416015625, 3.74237060546875, 3.872039794921875, 4.001708984375, 4.131378173828125, 4.26104736328125, 4.390716552734375, 4.5203857421875, 4.650054931640625, 4.77972412109375, 4.909393310546875, 5.0390625]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 6.0, 3.0, 3.0, 10.0, 9.0, 20.0, 10.0, 9.0, 18.0, 19.0, 21.0, 30.0, 30.0, 36.0, 50.0, 43.0, 52.0, 77.0, 236.0, 1603.0, 252.0, 72.0, 62.0, 59.0, 52.0, 54.0, 34.0, 26.0, 35.0, 21.0, 20.0, 13.0, 13.0, 14.0, 14.0, 10.0, 5.0, 2.0, 3.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-13.84375, -13.391357421875, -12.93896484375, -12.486572265625, -12.0341796875, -11.581787109375, -11.12939453125, -10.677001953125, -10.224609375, -9.772216796875, -9.31982421875, -8.867431640625, -8.4150390625, -7.962646484375, -7.51025390625, -7.057861328125, -6.60546875, -6.153076171875, -5.70068359375, -5.248291015625, -4.7958984375, -4.343505859375, -3.89111328125, -3.438720703125, -2.986328125, -2.533935546875, -2.08154296875, -1.629150390625, -1.1767578125, -0.724365234375, -0.27197265625, 0.180419921875, 0.6328125, 1.085205078125, 1.53759765625, 1.989990234375, 2.4423828125, 2.894775390625, 3.34716796875, 3.799560546875, 4.251953125, 4.704345703125, 5.15673828125, 5.609130859375, 6.0615234375, 6.513916015625, 6.96630859375, 7.418701171875, 7.87109375, 8.323486328125, 8.77587890625, 9.228271484375, 9.6806640625, 10.133056640625, 10.58544921875, 11.037841796875, 11.490234375, 11.942626953125, 12.39501953125, 12.847412109375, 13.2998046875, 13.752197265625, 14.20458984375, 14.656982421875, 15.109375]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 11.0, 9.0, 8.0, 14.0, 15.0, 25.0, 28.0, 47.0, 37.0, 47.0, 66.0, 81.0, 123.0, 184.0, 286.0, 515.0, 1591.0, 192737.0, 2943787.0, 4353.0, 690.0, 332.0, 200.0, 117.0, 91.0, 72.0, 52.0, 26.0, 39.0, 32.0, 23.0, 14.0, 12.0, 20.0, 8.0, 3.0, 3.0, 6.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.53125, -32.341796875, -31.15234375, -29.962890625, -28.7734375, -27.583984375, -26.39453125, -25.205078125, -24.015625, -22.826171875, -21.63671875, -20.447265625, -19.2578125, -18.068359375, -16.87890625, -15.689453125, -14.5, -13.310546875, -12.12109375, -10.931640625, -9.7421875, -8.552734375, -7.36328125, -6.173828125, -4.984375, -3.794921875, -2.60546875, -1.416015625, -0.2265625, 0.962890625, 2.15234375, 3.341796875, 4.53125, 5.720703125, 6.91015625, 8.099609375, 9.2890625, 10.478515625, 11.66796875, 12.857421875, 14.046875, 15.236328125, 16.42578125, 17.615234375, 18.8046875, 19.994140625, 21.18359375, 22.373046875, 23.5625, 24.751953125, 25.94140625, 27.130859375, 28.3203125, 29.509765625, 30.69921875, 31.888671875, 33.078125, 34.267578125, 35.45703125, 36.646484375, 37.8359375, 39.025390625, 40.21484375, 41.404296875, 42.59375]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [2.0, 3.0, 90.0, 788.0, 134.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.632203102111816, -11.252185821533203, -6.872167587280273, -2.49215030670166, 1.8878679275512695, 6.267886161804199, 10.647902488708496, 15.027920722961426, 19.407939910888672, 23.7879581451416, 28.16797637939453, 32.54799270629883, 36.928009033203125, 41.30802917480469, 45.688045501708984, 50.06806182861328, 54.448081970214844, 58.82809829711914, 63.2081184387207, 67.588134765625, 71.96815490722656, 76.34817504882812, 80.72818756103516, 85.10820770263672, 89.48822021484375, 93.86824035644531, 98.24825286865234, 102.6282730102539, 107.00829315185547, 111.3883056640625, 115.76832580566406, 120.14834594726562, 124.52836608886719, 128.90838623046875, 133.2884063720703, 137.66842651367188, 142.04843139648438, 146.42845153808594, 150.8084716796875, 155.18849182128906, 159.56851196289062, 163.9485321044922, 168.32855224609375, 172.70855712890625, 177.0885772705078, 181.46859741210938, 185.84861755371094, 190.2286376953125, 194.608642578125, 198.98866271972656, 203.36868286132812, 207.74868774414062, 212.1287078857422, 216.50872802734375, 220.8887481689453, 225.26876831054688, 229.64878845214844, 234.02880859375, 238.40882873535156, 242.78884887695312, 247.16885375976562, 251.5488739013672, 255.92889404296875, 260.30889892578125, 264.6889343261719]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 5.0, 14.0, 18.0, 9.0, 15.0, 22.0, 17.0, 18.0, 36.0, 25.0, 27.0, 30.0, 32.0, 31.0, 34.0, 36.0, 43.0, 44.0, 42.0, 39.0, 48.0, 38.0, 39.0, 43.0, 32.0, 30.0, 25.0, 32.0, 28.0, 21.0, 19.0, 23.0, 16.0, 11.0, 8.0, 10.0, 11.0, 5.0, 2.0, 4.0, 3.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-35.932838439941406, -34.80192184448242, -33.67100143432617, -32.54008483886719, -31.409164428710938, -30.27824592590332, -29.147327423095703, -28.01641082763672, -26.88549041748047, -25.75457191467285, -24.623653411865234, -23.492734909057617, -22.36181640625, -21.230897903442383, -20.099979400634766, -18.96906280517578, -17.838144302368164, -16.707225799560547, -15.57630729675293, -14.445388793945312, -13.314470291137695, -12.183551788330078, -11.052634239196777, -9.92171573638916, -8.790797233581543, -7.659878730773926, -6.528960227966309, -5.39804220199585, -4.267123699188232, -3.1362051963806152, -2.0052871704101562, -0.8743686676025391, 0.2565498352050781, 1.3874682188034058, 2.5183866024017334, 3.6493048667907715, 4.780223369598389, 5.911141872406006, 7.042059898376465, 8.172978401184082, 9.3038969039917, 10.434815406799316, 11.565733909606934, 12.696651458740234, 13.827569961547852, 14.958488464355469, 16.089406967163086, 17.220325469970703, 18.35124397277832, 19.482162475585938, 20.613080978393555, 21.743999481201172, 22.87491798400879, 24.005836486816406, 25.13675308227539, 26.26767349243164, 27.398590087890625, 28.529508590698242, 29.66042709350586, 30.791345596313477, 31.922264099121094, 33.05318069458008, 34.18410110473633, 35.31501770019531, 36.44593811035156]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 7.0, 10.0, 7.0, 14.0, 11.0, 15.0, 27.0, 26.0, 29.0, 28.0, 30.0, 29.0, 33.0, 41.0, 41.0, 38.0, 35.0, 42.0, 41.0, 42.0, 46.0, 45.0, 34.0, 28.0, 36.0, 40.0, 27.0, 37.0, 23.0, 16.0, 16.0, 18.0, 18.0, 13.0, 11.0, 9.0, 11.0, 5.0, 3.0, 2.0, 3.0, 7.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.390625, -4.2557373046875, -4.120849609375, -3.9859619140625, -3.85107421875, -3.7161865234375, -3.581298828125, -3.4464111328125, -3.3115234375, -3.1766357421875, -3.041748046875, -2.9068603515625, -2.77197265625, -2.6370849609375, -2.502197265625, -2.3673095703125, -2.232421875, -2.0975341796875, -1.962646484375, -1.8277587890625, -1.69287109375, -1.5579833984375, -1.423095703125, -1.2882080078125, -1.1533203125, -1.0184326171875, -0.883544921875, -0.7486572265625, -0.61376953125, -0.4788818359375, -0.343994140625, -0.2091064453125, -0.07421875, 0.0606689453125, 0.195556640625, 0.3304443359375, 0.46533203125, 0.6002197265625, 0.735107421875, 0.8699951171875, 1.0048828125, 1.1397705078125, 1.274658203125, 1.4095458984375, 1.54443359375, 1.6793212890625, 1.814208984375, 1.9490966796875, 2.083984375, 2.2188720703125, 2.353759765625, 2.4886474609375, 2.62353515625, 2.7584228515625, 2.893310546875, 3.0281982421875, 3.1630859375, 3.2979736328125, 3.432861328125, 3.5677490234375, 3.70263671875, 3.8375244140625, 3.972412109375, 4.1072998046875, 4.2421875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 6.0, 2.0, 4.0, 4.0, 6.0, 8.0, 9.0, 11.0, 8.0, 13.0, 27.0, 25.0, 25.0, 41.0, 40.0, 49.0, 111.0, 211.0, 434.0, 1114.0, 3561.0, 16726.0, 221324.0, 2751380.0, 1136293.0, 51797.0, 7555.0, 2019.0, 686.0, 310.0, 151.0, 90.0, 60.0, 34.0, 24.0, 20.0, 20.0, 15.0, 23.0, 3.0, 15.0, 12.0, 7.0, 2.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-13.34375, -12.9364013671875, -12.529052734375, -12.1217041015625, -11.71435546875, -11.3070068359375, -10.899658203125, -10.4923095703125, -10.0849609375, -9.6776123046875, -9.270263671875, -8.8629150390625, -8.45556640625, -8.0482177734375, -7.640869140625, -7.2335205078125, -6.826171875, -6.4188232421875, -6.011474609375, -5.6041259765625, -5.19677734375, -4.7894287109375, -4.382080078125, -3.9747314453125, -3.5673828125, -3.1600341796875, -2.752685546875, -2.3453369140625, -1.93798828125, -1.5306396484375, -1.123291015625, -0.7159423828125, -0.30859375, 0.0987548828125, 0.506103515625, 0.9134521484375, 1.32080078125, 1.7281494140625, 2.135498046875, 2.5428466796875, 2.9501953125, 3.3575439453125, 3.764892578125, 4.1722412109375, 4.57958984375, 4.9869384765625, 5.394287109375, 5.8016357421875, 6.208984375, 6.6163330078125, 7.023681640625, 7.4310302734375, 7.83837890625, 8.2457275390625, 8.653076171875, 9.0604248046875, 9.4677734375, 9.8751220703125, 10.282470703125, 10.6898193359375, 11.09716796875, 11.5045166015625, 11.911865234375, 12.3192138671875, 12.7265625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 3.0, 10.0, 17.0, 19.0, 51.0, 55.0, 111.0, 151.0, 288.0, 409.0, 614.0, 701.0, 584.0, 375.0, 262.0, 163.0, 99.0, 67.0, 36.0, 24.0, 14.0, 5.0, 12.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.265625, -17.844970703125, -17.42431640625, -17.003662109375, -16.5830078125, -16.162353515625, -15.74169921875, -15.321044921875, -14.900390625, -14.479736328125, -14.05908203125, -13.638427734375, -13.2177734375, -12.797119140625, -12.37646484375, -11.955810546875, -11.53515625, -11.114501953125, -10.69384765625, -10.273193359375, -9.8525390625, -9.431884765625, -9.01123046875, -8.590576171875, -8.169921875, -7.749267578125, -7.32861328125, -6.907958984375, -6.4873046875, -6.066650390625, -5.64599609375, -5.225341796875, -4.8046875, -4.384033203125, -3.96337890625, -3.542724609375, -3.1220703125, -2.701416015625, -2.28076171875, -1.860107421875, -1.439453125, -1.018798828125, -0.59814453125, -0.177490234375, 0.2431640625, 0.663818359375, 1.08447265625, 1.505126953125, 1.92578125, 2.346435546875, 2.76708984375, 3.187744140625, 3.6083984375, 4.029052734375, 4.44970703125, 4.870361328125, 5.291015625, 5.711669921875, 6.13232421875, 6.552978515625, 6.9736328125, 7.394287109375, 7.81494140625, 8.235595703125, 8.65625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 8.0, 4.0, 7.0, 11.0, 9.0, 24.0, 37.0, 64.0, 106.0, 201.0, 302.0, 586.0, 3387.0, 1488556.0, 2694992.0, 4572.0, 648.0, 336.0, 185.0, 94.0, 65.0, 40.0, 26.0, 19.0, 5.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.65625, -28.2470703125, -26.837890625, -25.4287109375, -24.01953125, -22.6103515625, -21.201171875, -19.7919921875, -18.3828125, -16.9736328125, -15.564453125, -14.1552734375, -12.74609375, -11.3369140625, -9.927734375, -8.5185546875, -7.109375, -5.7001953125, -4.291015625, -2.8818359375, -1.47265625, -0.0634765625, 1.345703125, 2.7548828125, 4.1640625, 5.5732421875, 6.982421875, 8.3916015625, 9.80078125, 11.2099609375, 12.619140625, 14.0283203125, 15.4375, 16.8466796875, 18.255859375, 19.6650390625, 21.07421875, 22.4833984375, 23.892578125, 25.3017578125, 26.7109375, 28.1201171875, 29.529296875, 30.9384765625, 32.34765625, 33.7568359375, 35.166015625, 36.5751953125, 37.984375, 39.3935546875, 40.802734375, 42.2119140625, 43.62109375, 45.0302734375, 46.439453125, 47.8486328125, 49.2578125, 50.6669921875, 52.076171875, 53.4853515625, 54.89453125, 56.3037109375, 57.712890625, 59.1220703125, 60.53125]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 11.0, 75.0, 261.0, 394.0, 207.0, 56.0, 10.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-159.6854248046875, -155.52272033691406, -151.36001586914062, -147.19729614257812, -143.0345916748047, -138.87188720703125, -134.70916748046875, -130.5464630126953, -126.38375854492188, -122.22105407714844, -118.05834197998047, -113.8956298828125, -109.73292541503906, -105.57022094726562, -101.40750885009766, -97.24479675292969, -93.08209228515625, -88.91938781738281, -84.75667572021484, -80.59396362304688, -76.43125915527344, -72.2685546875, -68.10584259033203, -63.94313430786133, -59.780426025390625, -55.61771774291992, -51.45500946044922, -47.292301177978516, -43.12959289550781, -38.96688461303711, -34.804176330566406, -30.641468048095703, -26.478744506835938, -22.316036224365234, -18.15332794189453, -13.990619659423828, -9.827911376953125, -5.665203094482422, -1.5024948120117188, 2.6602134704589844, 6.8229217529296875, 10.98563003540039, 15.148338317871094, 19.311046600341797, 23.4737548828125, 27.636463165283203, 31.799171447753906, 35.96187973022461, 40.12458801269531, 44.287296295166016, 48.45000457763672, 52.61271286010742, 56.775421142578125, 60.93812942504883, 65.10083770751953, 69.2635498046875, 73.42625427246094, 77.58895874023438, 81.75167083740234, 85.91438293457031, 90.07708740234375, 94.23979187011719, 98.40250396728516, 102.56521606445312, 106.72792053222656]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 8.0, 6.0, 6.0, 8.0, 7.0, 17.0, 14.0, 14.0, 20.0, 22.0, 28.0, 21.0, 33.0, 36.0, 27.0, 40.0, 35.0, 31.0, 38.0, 33.0, 39.0, 39.0, 37.0, 33.0, 42.0, 39.0, 34.0, 44.0, 35.0, 39.0, 22.0, 21.0, 20.0, 20.0, 12.0, 14.0, 16.0, 7.0, 9.0, 9.0, 3.0, 2.0, 4.0, 6.0, 3.0, 5.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-27.480281829833984, -26.63507080078125, -25.789859771728516, -24.94464874267578, -24.099437713623047, -23.254226684570312, -22.409015655517578, -21.56380271911621, -20.718591690063477, -19.873380661010742, -19.028169631958008, -18.182958602905273, -17.33774757385254, -16.492534637451172, -15.647324562072754, -14.802112579345703, -13.956902503967285, -13.11169147491455, -12.266480445861816, -11.421268463134766, -10.576057434082031, -9.730846405029297, -8.885635375976562, -8.040424346923828, -7.1952128410339355, -6.350001811981201, -5.504790306091309, -4.659579277038574, -3.8143680095672607, -2.9691567420959473, -2.123945713043213, -1.2787342071533203, -0.43352317810058594, 0.41168802976608276, 1.2568992376327515, 2.1021103858947754, 2.947321653366089, 3.7925329208374023, 4.637743949890137, 5.482955455780029, 6.328166484832764, 7.173377513885498, 8.01858901977539, 8.863800048828125, 9.70901107788086, 10.554222106933594, 11.399433135986328, 12.244645118713379, 13.089856147766113, 13.935067176818848, 14.780278205871582, 15.625490188598633, 16.470701217651367, 17.3159122467041, 18.161123275756836, 19.00633430480957, 19.851545333862305, 20.69675636291504, 21.541967391967773, 22.387178421020508, 23.232389450073242, 24.07760238647461, 24.922813415527344, 25.768024444580078, 26.613235473632812]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 8.0, 12.0, 11.0, 8.0, 9.0, 11.0, 16.0, 29.0, 27.0, 28.0, 17.0, 36.0, 27.0, 28.0, 43.0, 39.0, 48.0, 48.0, 39.0, 25.0, 38.0, 48.0, 36.0, 41.0, 42.0, 32.0, 31.0, 33.0, 18.0, 28.0, 21.0, 21.0, 12.0, 14.0, 15.0, 8.0, 13.0, 9.0, 5.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.978515625, -3.851776123046875, -3.72503662109375, -3.598297119140625, -3.4715576171875, -3.344818115234375, -3.21807861328125, -3.091339111328125, -2.964599609375, -2.837860107421875, -2.71112060546875, -2.584381103515625, -2.4576416015625, -2.330902099609375, -2.20416259765625, -2.077423095703125, -1.95068359375, -1.823944091796875, -1.69720458984375, -1.570465087890625, -1.4437255859375, -1.316986083984375, -1.19024658203125, -1.063507080078125, -0.936767578125, -0.810028076171875, -0.68328857421875, -0.556549072265625, -0.4298095703125, -0.303070068359375, -0.17633056640625, -0.049591064453125, 0.0771484375, 0.203887939453125, 0.33062744140625, 0.457366943359375, 0.5841064453125, 0.710845947265625, 0.83758544921875, 0.964324951171875, 1.091064453125, 1.217803955078125, 1.34454345703125, 1.471282958984375, 1.5980224609375, 1.724761962890625, 1.85150146484375, 1.978240966796875, 2.10498046875, 2.231719970703125, 2.35845947265625, 2.485198974609375, 2.6119384765625, 2.738677978515625, 2.86541748046875, 2.992156982421875, 3.118896484375, 3.245635986328125, 3.37237548828125, 3.499114990234375, 3.6258544921875, 3.752593994140625, 3.87933349609375, 4.006072998046875, 4.1328125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 6.0, 4.0, 13.0, 12.0, 15.0, 27.0, 45.0, 71.0, 116.0, 156.0, 226.0, 321.0, 522.0, 780.0, 1279.0, 1939.0, 2919.0, 4525.0, 7168.0, 11340.0, 17883.0, 28597.0, 46437.0, 78836.0, 137965.0, 223883.0, 197104.0, 114022.0, 65943.0, 39552.0, 24329.0, 15287.0, 9798.0, 6182.0, 4019.0, 2494.0, 1605.0, 1082.0, 722.0, 426.0, 307.0, 197.0, 138.0, 101.0, 55.0, 37.0, 32.0, 14.0, 14.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0], "bins": [-0.494873046875, -0.4798011779785156, -0.46472930908203125, -0.4496574401855469, -0.4345855712890625, -0.4195137023925781, -0.40444183349609375, -0.3893699645996094, -0.374298095703125, -0.3592262268066406, -0.34415435791015625, -0.3290824890136719, -0.3140106201171875, -0.2989387512207031, -0.28386688232421875, -0.2687950134277344, -0.25372314453125, -0.23865127563476562, -0.22357940673828125, -0.20850753784179688, -0.1934356689453125, -0.17836380004882812, -0.16329193115234375, -0.14822006225585938, -0.133148193359375, -0.11807632446289062, -0.10300445556640625, -0.08793258666992188, -0.0728607177734375, -0.057788848876953125, -0.04271697998046875, -0.027645111083984375, -0.0125732421875, 0.002498626708984375, 0.01757049560546875, 0.032642364501953125, 0.0477142333984375, 0.06278610229492188, 0.07785797119140625, 0.09292984008789062, 0.108001708984375, 0.12307357788085938, 0.13814544677734375, 0.15321731567382812, 0.1682891845703125, 0.18336105346679688, 0.19843292236328125, 0.21350479125976562, 0.22857666015625, 0.24364852905273438, 0.25872039794921875, 0.2737922668457031, 0.2888641357421875, 0.3039360046386719, 0.31900787353515625, 0.3340797424316406, 0.349151611328125, 0.3642234802246094, 0.37929534912109375, 0.3943672180175781, 0.4094390869140625, 0.4245109558105469, 0.43958282470703125, 0.4546546936035156, 0.4697265625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 1.0, 1.0, 3.0, 7.0, 12.0, 6.0, 4.0, 4.0, 12.0, 12.0, 15.0, 14.0, 15.0, 22.0, 27.0, 31.0, 24.0, 26.0, 29.0, 39.0, 24.0, 40.0, 34.0, 37.0, 33.0, 1065.0, 44.0, 39.0, 33.0, 42.0, 42.0, 35.0, 32.0, 36.0, 33.0, 29.0, 19.0, 21.0, 12.0, 13.0, 17.0, 12.0, 7.0, 9.0, 5.0, 3.0, 3.0, 6.0, 4.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.333984375, -2.25531005859375, -2.1766357421875, -2.09796142578125, -2.019287109375, -1.94061279296875, -1.8619384765625, -1.78326416015625, -1.70458984375, -1.62591552734375, -1.5472412109375, -1.46856689453125, -1.389892578125, -1.31121826171875, -1.2325439453125, -1.15386962890625, -1.0751953125, -0.99652099609375, -0.9178466796875, -0.83917236328125, -0.760498046875, -0.68182373046875, -0.6031494140625, -0.52447509765625, -0.44580078125, -0.36712646484375, -0.2884521484375, -0.20977783203125, -0.131103515625, -0.05242919921875, 0.0262451171875, 0.10491943359375, 0.18359375, 0.26226806640625, 0.3409423828125, 0.41961669921875, 0.498291015625, 0.57696533203125, 0.6556396484375, 0.73431396484375, 0.81298828125, 0.89166259765625, 0.9703369140625, 1.04901123046875, 1.127685546875, 1.20635986328125, 1.2850341796875, 1.36370849609375, 1.4423828125, 1.52105712890625, 1.5997314453125, 1.67840576171875, 1.757080078125, 1.83575439453125, 1.9144287109375, 1.99310302734375, 2.07177734375, 2.15045166015625, 2.2291259765625, 2.30780029296875, 2.386474609375, 2.46514892578125, 2.5438232421875, 2.62249755859375, 2.701171875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 10.0, 12.0, 17.0, 23.0, 39.0, 45.0, 75.0, 104.0, 175.0, 268.0, 354.0, 506.0, 750.0, 1074.0, 1599.0, 2342.0, 3437.0, 4948.0, 7409.0, 11242.0, 16991.0, 26179.0, 41382.0, 67004.0, 112149.0, 180189.0, 1246899.0, 140712.0, 85396.0, 51258.0, 32030.0, 20678.0, 13675.0, 9086.0, 6044.0, 4136.0, 2818.0, 1878.0, 1336.0, 920.0, 598.0, 422.0, 289.0, 190.0, 146.0, 93.0, 69.0, 35.0, 31.0, 34.0, 14.0, 11.0, 6.0, 5.0, 1.0, 3.0, 0.0, 1.0], "bins": [-0.343505859375, -0.33284759521484375, -0.3221893310546875, -0.31153106689453125, -0.300872802734375, -0.29021453857421875, -0.2795562744140625, -0.26889801025390625, -0.25823974609375, -0.24758148193359375, -0.2369232177734375, -0.22626495361328125, -0.215606689453125, -0.20494842529296875, -0.1942901611328125, -0.18363189697265625, -0.1729736328125, -0.16231536865234375, -0.1516571044921875, -0.14099884033203125, -0.130340576171875, -0.11968231201171875, -0.1090240478515625, -0.09836578369140625, -0.08770751953125, -0.07704925537109375, -0.0663909912109375, -0.05573272705078125, -0.045074462890625, -0.03441619873046875, -0.0237579345703125, -0.01309967041015625, -0.00244140625, 0.00821685791015625, 0.0188751220703125, 0.02953338623046875, 0.040191650390625, 0.05084991455078125, 0.0615081787109375, 0.07216644287109375, 0.08282470703125, 0.09348297119140625, 0.1041412353515625, 0.11479949951171875, 0.125457763671875, 0.13611602783203125, 0.1467742919921875, 0.15743255615234375, 0.1680908203125, 0.17874908447265625, 0.1894073486328125, 0.20006561279296875, 0.210723876953125, 0.22138214111328125, 0.2320404052734375, 0.24269866943359375, 0.25335693359375, 0.26401519775390625, 0.2746734619140625, 0.28533172607421875, 0.295989990234375, 0.30664825439453125, 0.3173065185546875, 0.32796478271484375, 0.338623046875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 1.0, 3.0, 2.0, 4.0, 11.0, 5.0, 4.0, 9.0, 14.0, 11.0, 31.0, 19.0, 26.0, 29.0, 37.0, 50.0, 56.0, 67.0, 72.0, 56.0, 77.0, 61.0, 46.0, 51.0, 32.0, 48.0, 24.0, 30.0, 31.0, 24.0, 17.0, 14.0, 8.0, 4.0, 5.0, 7.0, 5.0, 4.0, 3.0, 1.0, 2.0, 3.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00238800048828125, -0.0023109912872314453, -0.0022339820861816406, -0.002156972885131836, -0.0020799636840820312, -0.0020029544830322266, -0.0019259452819824219, -0.0018489360809326172, -0.0017719268798828125, -0.0016949176788330078, -0.0016179084777832031, -0.0015408992767333984, -0.0014638900756835938, -0.001386880874633789, -0.0013098716735839844, -0.0012328624725341797, -0.001155853271484375, -0.0010788440704345703, -0.0010018348693847656, -0.0009248256683349609, -0.0008478164672851562, -0.0007708072662353516, -0.0006937980651855469, -0.0006167888641357422, -0.0005397796630859375, -0.0004627704620361328, -0.0003857612609863281, -0.00030875205993652344, -0.00023174285888671875, -0.00015473365783691406, -7.772445678710938e-05, -7.152557373046875e-07, 7.62939453125e-05, 0.0001533031463623047, 0.00023031234741210938, 0.00030732154846191406, 0.00038433074951171875, 0.00046133995056152344, 0.0005383491516113281, 0.0006153583526611328, 0.0006923675537109375, 0.0007693767547607422, 0.0008463859558105469, 0.0009233951568603516, 0.0010004043579101562, 0.001077413558959961, 0.0011544227600097656, 0.0012314319610595703, 0.001308441162109375, 0.0013854503631591797, 0.0014624595642089844, 0.001539468765258789, 0.0016164779663085938, 0.0016934871673583984, 0.0017704963684082031, 0.0018475055694580078, 0.0019245147705078125, 0.002001523971557617, 0.002078533172607422, 0.0021555423736572266, 0.0022325515747070312, 0.002309560775756836, 0.0023865699768066406, 0.0024635791778564453, 0.00254058837890625]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 7.0, 8.0, 7.0, 2.0, 9.0, 13.0, 10.0, 20.0, 34.0, 39.0, 48.0, 73.0, 95.0, 153.0, 230.0, 527.0, 4929.0, 877764.0, 161723.0, 1754.0, 459.0, 219.0, 98.0, 89.0, 57.0, 40.0, 31.0, 32.0, 22.0, 11.0, 12.0, 8.0, 6.0, 5.0, 7.0, 1.0, 2.0, 6.0, 5.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05438232421875, -0.05272626876831055, -0.051070213317871094, -0.04941415786743164, -0.04775810241699219, -0.046102046966552734, -0.04444599151611328, -0.04278993606567383, -0.041133880615234375, -0.03947782516479492, -0.03782176971435547, -0.036165714263916016, -0.03450965881347656, -0.03285360336303711, -0.031197547912597656, -0.029541492462158203, -0.02788543701171875, -0.026229381561279297, -0.024573326110839844, -0.02291727066040039, -0.021261215209960938, -0.019605159759521484, -0.01794910430908203, -0.016293048858642578, -0.014636993408203125, -0.012980937957763672, -0.011324882507324219, -0.009668827056884766, -0.008012771606445312, -0.006356716156005859, -0.004700660705566406, -0.003044605255126953, -0.0013885498046875, 0.0002675056457519531, 0.0019235610961914062, 0.0035796165466308594, 0.0052356719970703125, 0.006891727447509766, 0.008547782897949219, 0.010203838348388672, 0.011859893798828125, 0.013515949249267578, 0.015172004699707031, 0.016828060150146484, 0.018484115600585938, 0.02014017105102539, 0.021796226501464844, 0.023452281951904297, 0.02510833740234375, 0.026764392852783203, 0.028420448303222656, 0.03007650375366211, 0.03173255920410156, 0.033388614654541016, 0.03504467010498047, 0.03670072555541992, 0.038356781005859375, 0.04001283645629883, 0.04166889190673828, 0.043324947357177734, 0.04498100280761719, 0.04663705825805664, 0.048293113708496094, 0.04994916915893555, 0.051605224609375]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 10.0, 144.0, 527.0, 299.0, 29.0, 7.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.01465591136366129, -0.014320953749120235, -0.013985995203256607, -0.013651037588715553, -0.013316079042851925, -0.012981121428310871, -0.012646162882447243, -0.012311205267906189, -0.01197624672204256, -0.011641289107501507, -0.011306330561637878, -0.010971372947096825, -0.010636414401233196, -0.010301456786692142, -0.009966498240828514, -0.00963154062628746, -0.009296583011746407, -0.008961625397205353, -0.008626666851341724, -0.00829170923680067, -0.007956750690937042, -0.007621792610734701, -0.00728683453053236, -0.006951876915991306, -0.006616918370127678, -0.006281960289925337, -0.005947002209722996, -0.005612044129520655, -0.005277086049318314, -0.0049421279691159725, -0.0046071698889136314, -0.004272212274372578, -0.003937254194170237, -0.0036022961139678955, -0.0032673380337655544, -0.0029323799535632133, -0.0025974218733608723, -0.002262463793158531, -0.0019275059457868338, -0.0015925478655844927, -0.0012575897853821516, -0.0009226317051798105, -0.0005876736831851304, -0.0002527156611904502, 8.224241901189089e-05, 0.00041720049921423197, 0.0007521584630012512, 0.0010871165432035923, 0.0014220746234059334, 0.0017570327036082745, 0.0020919907838106155, 0.0024269488640129566, 0.0027619069442152977, 0.0030968650244176388, 0.003431822871789336, 0.0037667809519916773, 0.004101739265024662, 0.004436697345227003, 0.004771655425429344, 0.005106613505631685, 0.005441571585834026, 0.005776529666036367, 0.0061114877462387085, 0.006446445360779762, 0.006781403440982103]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 0.0, 6.0, 3.0, 3.0, 8.0, 7.0, 6.0, 3.0, 12.0, 18.0, 16.0, 13.0, 19.0, 20.0, 27.0, 25.0, 25.0, 23.0, 36.0, 32.0, 35.0, 26.0, 35.0, 26.0, 32.0, 35.0, 34.0, 39.0, 38.0, 27.0, 40.0, 34.0, 42.0, 27.0, 34.0, 26.0, 24.0, 18.0, 20.0, 18.0, 20.0, 16.0, 7.0, 13.0, 11.0, 7.0, 8.0, 5.0, 2.0, 2.0, 3.0, 5.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.0011160969734191895, -0.0010811658576130867, -0.001046234741806984, -0.0010113036260008812, -0.0009763725101947784, -0.0009414413943886757, -0.0009065102785825729, -0.0008715791627764702, -0.0008366480469703674, -0.0008017169311642647, -0.0007667858153581619, -0.0007318546995520592, -0.0006969235837459564, -0.0006619924679398537, -0.0006270613521337509, -0.0005921302363276482, -0.0005571991205215454, -0.0005222680047154427, -0.0004873368889093399, -0.00045240577310323715, -0.0004174746572971344, -0.00038254354149103165, -0.0003476124256849289, -0.00031268130987882614, -0.0002777501940727234, -0.00024281907826662064, -0.00020788796246051788, -0.00017295684665441513, -0.00013802573084831238, -0.00010309461504220963, -6.816349923610687e-05, -3.323238343000412e-05, 1.6987323760986328e-06, 3.6629848182201385e-05, 7.156096398830414e-05, 0.00010649207979440689, 0.00014142319560050964, 0.0001763543114066124, 0.00021128542721271515, 0.0002462165430188179, 0.00028114765882492065, 0.0003160787746310234, 0.00035100989043712616, 0.0003859410062432289, 0.00042087212204933167, 0.0004558032378554344, 0.0004907343536615372, 0.0005256654694676399, 0.0005605965852737427, 0.0005955277010798454, 0.0006304588168859482, 0.0006653899326920509, 0.0007003210484981537, 0.0007352521643042564, 0.0007701832801103592, 0.0008051143959164619, 0.0008400455117225647, 0.0008749766275286674, 0.0009099077433347702, 0.000944838859140873, 0.0009797699749469757, 0.0010147010907530785, 0.0010496322065591812, 0.001084563322365284, 0.0011194944381713867]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 4.0, 8.0, 12.0, 11.0, 8.0, 9.0, 11.0, 16.0, 29.0, 27.0, 28.0, 17.0, 36.0, 27.0, 28.0, 43.0, 39.0, 48.0, 48.0, 39.0, 25.0, 38.0, 48.0, 36.0, 41.0, 42.0, 32.0, 31.0, 33.0, 18.0, 28.0, 21.0, 21.0, 12.0, 14.0, 15.0, 8.0, 13.0, 9.0, 5.0, 7.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.978515625, -3.851776123046875, -3.72503662109375, -3.598297119140625, -3.4715576171875, -3.344818115234375, -3.21807861328125, -3.091339111328125, -2.964599609375, -2.837860107421875, -2.71112060546875, -2.584381103515625, -2.4576416015625, -2.330902099609375, -2.20416259765625, -2.077423095703125, -1.95068359375, -1.823944091796875, -1.69720458984375, -1.570465087890625, -1.4437255859375, -1.316986083984375, -1.19024658203125, -1.063507080078125, -0.936767578125, -0.810028076171875, -0.68328857421875, -0.556549072265625, -0.4298095703125, -0.303070068359375, -0.17633056640625, -0.049591064453125, 0.0771484375, 0.203887939453125, 0.33062744140625, 0.457366943359375, 0.5841064453125, 0.710845947265625, 0.83758544921875, 0.964324951171875, 1.091064453125, 1.217803955078125, 1.34454345703125, 1.471282958984375, 1.5980224609375, 1.724761962890625, 1.85150146484375, 1.978240966796875, 2.10498046875, 2.231719970703125, 2.35845947265625, 2.485198974609375, 2.6119384765625, 2.738677978515625, 2.86541748046875, 2.992156982421875, 3.118896484375, 3.245635986328125, 3.37237548828125, 3.499114990234375, 3.6258544921875, 3.752593994140625, 3.87933349609375, 4.006072998046875, 4.1328125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 4.0, 3.0, 6.0, 8.0, 17.0, 19.0, 30.0, 41.0, 60.0, 92.0, 144.0, 209.0, 307.0, 443.0, 750.0, 1226.0, 2119.0, 3863.0, 7706.0, 17518.0, 45095.0, 123243.0, 326823.0, 320391.0, 120193.0, 44171.0, 17154.0, 7689.0, 3802.0, 2113.0, 1201.0, 741.0, 492.0, 297.0, 180.0, 128.0, 89.0, 64.0, 41.0, 27.0, 18.0, 10.0, 14.0, 7.0, 5.0, 5.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.12890625, -3.99566650390625, -3.8624267578125, -3.72918701171875, -3.595947265625, -3.46270751953125, -3.3294677734375, -3.19622802734375, -3.06298828125, -2.92974853515625, -2.7965087890625, -2.66326904296875, -2.530029296875, -2.39678955078125, -2.2635498046875, -2.13031005859375, -1.9970703125, -1.86383056640625, -1.7305908203125, -1.59735107421875, -1.464111328125, -1.33087158203125, -1.1976318359375, -1.06439208984375, -0.93115234375, -0.79791259765625, -0.6646728515625, -0.53143310546875, -0.398193359375, -0.26495361328125, -0.1317138671875, 0.00152587890625, 0.134765625, 0.26800537109375, 0.4012451171875, 0.53448486328125, 0.667724609375, 0.80096435546875, 0.9342041015625, 1.06744384765625, 1.20068359375, 1.33392333984375, 1.4671630859375, 1.60040283203125, 1.733642578125, 1.86688232421875, 2.0001220703125, 2.13336181640625, 2.2666015625, 2.39984130859375, 2.5330810546875, 2.66632080078125, 2.799560546875, 2.93280029296875, 3.0660400390625, 3.19927978515625, 3.33251953125, 3.46575927734375, 3.5989990234375, 3.73223876953125, 3.865478515625, 3.99871826171875, 4.1319580078125, 4.26519775390625, 4.3984375]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 1.0, 6.0, 4.0, 5.0, 1.0, 6.0, 11.0, 5.0, 16.0, 18.0, 23.0, 24.0, 24.0, 20.0, 37.0, 32.0, 40.0, 47.0, 64.0, 86.0, 158.0, 1430.0, 419.0, 142.0, 87.0, 56.0, 35.0, 40.0, 35.0, 35.0, 22.0, 20.0, 17.0, 16.0, 15.0, 12.0, 12.0, 7.0, 10.0, 2.0, 5.0, 3.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-15.5, -15.015380859375, -14.53076171875, -14.046142578125, -13.5615234375, -13.076904296875, -12.59228515625, -12.107666015625, -11.623046875, -11.138427734375, -10.65380859375, -10.169189453125, -9.6845703125, -9.199951171875, -8.71533203125, -8.230712890625, -7.74609375, -7.261474609375, -6.77685546875, -6.292236328125, -5.8076171875, -5.322998046875, -4.83837890625, -4.353759765625, -3.869140625, -3.384521484375, -2.89990234375, -2.415283203125, -1.9306640625, -1.446044921875, -0.96142578125, -0.476806640625, 0.0078125, 0.492431640625, 0.97705078125, 1.461669921875, 1.9462890625, 2.430908203125, 2.91552734375, 3.400146484375, 3.884765625, 4.369384765625, 4.85400390625, 5.338623046875, 5.8232421875, 6.307861328125, 6.79248046875, 7.277099609375, 7.76171875, 8.246337890625, 8.73095703125, 9.215576171875, 9.7001953125, 10.184814453125, 10.66943359375, 11.154052734375, 11.638671875, 12.123291015625, 12.60791015625, 13.092529296875, 13.5771484375, 14.061767578125, 14.54638671875, 15.031005859375, 15.515625]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 4.0, 2.0, 3.0, 5.0, 7.0, 6.0, 4.0, 17.0, 13.0, 13.0, 23.0, 27.0, 46.0, 76.0, 93.0, 120.0, 222.0, 314.0, 562.0, 3326.0, 3087336.0, 51182.0, 1036.0, 419.0, 231.0, 174.0, 118.0, 87.0, 59.0, 41.0, 37.0, 22.0, 19.0, 16.0, 6.0, 8.0, 3.0, 9.0, 7.0, 2.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 3.0, 1.0], "bins": [-60.09375, -58.412109375, -56.73046875, -55.048828125, -53.3671875, -51.685546875, -50.00390625, -48.322265625, -46.640625, -44.958984375, -43.27734375, -41.595703125, -39.9140625, -38.232421875, -36.55078125, -34.869140625, -33.1875, -31.505859375, -29.82421875, -28.142578125, -26.4609375, -24.779296875, -23.09765625, -21.416015625, -19.734375, -18.052734375, -16.37109375, -14.689453125, -13.0078125, -11.326171875, -9.64453125, -7.962890625, -6.28125, -4.599609375, -2.91796875, -1.236328125, 0.4453125, 2.126953125, 3.80859375, 5.490234375, 7.171875, 8.853515625, 10.53515625, 12.216796875, 13.8984375, 15.580078125, 17.26171875, 18.943359375, 20.625, 22.306640625, 23.98828125, 25.669921875, 27.3515625, 29.033203125, 30.71484375, 32.396484375, 34.078125, 35.759765625, 37.44140625, 39.123046875, 40.8046875, 42.486328125, 44.16796875, 45.849609375, 47.53125]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 20.0, 175.0, 489.0, 288.0, 40.0, 1.0, 1.0, 3.0, 0.0, 1.0], "bins": [-130.77835083007812, -128.47015380859375, -126.1619644165039, -123.85377502441406, -121.54557800292969, -119.23738098144531, -116.92919158935547, -114.62100219726562, -112.31280517578125, -110.00460815429688, -107.69641876220703, -105.38822937011719, -103.08003234863281, -100.77183532714844, -98.4636459350586, -96.15545654296875, -93.84725952148438, -91.5390625, -89.23087310791016, -86.92268371582031, -84.61448669433594, -82.30628967285156, -79.99810028076172, -77.68991088867188, -75.3817138671875, -73.07351684570312, -70.76532745361328, -68.45713806152344, -66.14894104003906, -63.84074783325195, -61.532554626464844, -59.224361419677734, -56.916168212890625, -54.607975006103516, -52.299781799316406, -49.9915885925293, -47.68339538574219, -45.37520217895508, -43.06700897216797, -40.75881576538086, -38.45062255859375, -36.14242935180664, -33.83423614501953, -31.526042938232422, -29.217849731445312, -26.909656524658203, -24.601463317871094, -22.293270111083984, -19.985074996948242, -17.676881790161133, -15.368688583374023, -13.060495376586914, -10.752302169799805, -8.444108963012695, -6.135915756225586, -3.8277225494384766, -1.5195293426513672, 0.7886638641357422, 3.0968570709228516, 5.405050277709961, 7.71324348449707, 10.02143669128418, 12.329629898071289, 14.637823104858398, 16.946016311645508]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 4.0, 4.0, 3.0, 9.0, 6.0, 7.0, 11.0, 15.0, 12.0, 13.0, 17.0, 23.0, 25.0, 12.0, 26.0, 24.0, 39.0, 34.0, 30.0, 33.0, 44.0, 24.0, 33.0, 28.0, 39.0, 38.0, 33.0, 38.0, 41.0, 36.0, 29.0, 42.0, 34.0, 26.0, 28.0, 20.0, 15.0, 15.0, 18.0, 12.0, 8.0, 11.0, 12.0, 11.0, 4.0, 3.0, 0.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0], "bins": [-32.98579406738281, -31.951248168945312, -30.916702270507812, -29.882158279418945, -28.847612380981445, -27.813066482543945, -26.778522491455078, -25.743976593017578, -24.709430694580078, -23.674884796142578, -22.640338897705078, -21.60579490661621, -20.57124900817871, -19.53670310974121, -18.502159118652344, -17.467613220214844, -16.433067321777344, -15.398521423339844, -14.36397647857666, -13.329431533813477, -12.294885635375977, -11.260339736938477, -10.225794792175293, -9.19124984741211, -8.15670394897461, -7.122158527374268, -6.087613105773926, -5.053067684173584, -4.018522262573242, -2.9839768409729004, -1.9494314193725586, -0.9148859977722168, 0.11965560913085938, 1.1542010307312012, 2.188746452331543, 3.2232918739318848, 4.257837295532227, 5.292382717132568, 6.32692813873291, 7.361473560333252, 8.396018981933594, 9.430564880371094, 10.465109825134277, 11.499654769897461, 12.534200668334961, 13.568746566772461, 14.603291511535645, 15.637836456298828, 16.672382354736328, 17.706928253173828, 18.741474151611328, 19.776018142700195, 20.810564041137695, 21.845109939575195, 22.879653930664062, 23.914199829101562, 24.948745727539062, 25.983291625976562, 27.017837524414062, 28.05238151550293, 29.08692741394043, 30.12147331237793, 31.156017303466797, 32.1905632019043, 33.2251091003418]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 3.0, 5.0, 2.0, 1.0, 8.0, 6.0, 7.0, 12.0, 18.0, 9.0, 12.0, 19.0, 26.0, 25.0, 19.0, 29.0, 25.0, 27.0, 35.0, 45.0, 38.0, 45.0, 44.0, 50.0, 47.0, 46.0, 31.0, 39.0, 53.0, 28.0, 24.0, 26.0, 35.0, 20.0, 17.0, 23.0, 30.0, 10.0, 11.0, 13.0, 12.0, 9.0, 8.0, 7.0, 1.0, 2.0, 2.0, 2.0, 2.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.6875, -4.5457763671875, -4.404052734375, -4.2623291015625, -4.12060546875, -3.9788818359375, -3.837158203125, -3.6954345703125, -3.5537109375, -3.4119873046875, -3.270263671875, -3.1285400390625, -2.98681640625, -2.8450927734375, -2.703369140625, -2.5616455078125, -2.419921875, -2.2781982421875, -2.136474609375, -1.9947509765625, -1.85302734375, -1.7113037109375, -1.569580078125, -1.4278564453125, -1.2861328125, -1.1444091796875, -1.002685546875, -0.8609619140625, -0.71923828125, -0.5775146484375, -0.435791015625, -0.2940673828125, -0.15234375, -0.0106201171875, 0.131103515625, 0.2728271484375, 0.41455078125, 0.5562744140625, 0.697998046875, 0.8397216796875, 0.9814453125, 1.1231689453125, 1.264892578125, 1.4066162109375, 1.54833984375, 1.6900634765625, 1.831787109375, 1.9735107421875, 2.115234375, 2.2569580078125, 2.398681640625, 2.5404052734375, 2.68212890625, 2.8238525390625, 2.965576171875, 3.1072998046875, 3.2490234375, 3.3907470703125, 3.532470703125, 3.6741943359375, 3.81591796875, 3.9576416015625, 4.099365234375, 4.2410888671875, 4.3828125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 3.0, 5.0, 5.0, 8.0, 11.0, 12.0, 12.0, 15.0, 22.0, 38.0, 56.0, 68.0, 97.0, 149.0, 234.0, 378.0, 669.0, 1315.0, 3504.0, 12667.0, 92792.0, 917364.0, 2371403.0, 708687.0, 68255.0, 10544.0, 3023.0, 1253.0, 651.0, 369.0, 202.0, 142.0, 100.0, 65.0, 31.0, 33.0, 28.0, 18.0, 9.0, 12.0, 5.0, 8.0, 6.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-8.6875, -8.4111328125, -8.134765625, -7.8583984375, -7.58203125, -7.3056640625, -7.029296875, -6.7529296875, -6.4765625, -6.2001953125, -5.923828125, -5.6474609375, -5.37109375, -5.0947265625, -4.818359375, -4.5419921875, -4.265625, -3.9892578125, -3.712890625, -3.4365234375, -3.16015625, -2.8837890625, -2.607421875, -2.3310546875, -2.0546875, -1.7783203125, -1.501953125, -1.2255859375, -0.94921875, -0.6728515625, -0.396484375, -0.1201171875, 0.15625, 0.4326171875, 0.708984375, 0.9853515625, 1.26171875, 1.5380859375, 1.814453125, 2.0908203125, 2.3671875, 2.6435546875, 2.919921875, 3.1962890625, 3.47265625, 3.7490234375, 4.025390625, 4.3017578125, 4.578125, 4.8544921875, 5.130859375, 5.4072265625, 5.68359375, 5.9599609375, 6.236328125, 6.5126953125, 6.7890625, 7.0654296875, 7.341796875, 7.6181640625, 7.89453125, 8.1708984375, 8.447265625, 8.7236328125, 9.0]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 6.0, 3.0, 3.0, 2.0, 6.0, 6.0, 3.0, 5.0, 6.0, 16.0, 25.0, 25.0, 39.0, 42.0, 48.0, 72.0, 89.0, 118.0, 162.0, 235.0, 254.0, 333.0, 395.0, 443.0, 374.0, 323.0, 268.0, 191.0, 131.0, 102.0, 78.0, 72.0, 57.0, 38.0, 25.0, 14.0, 15.0, 13.0, 12.0, 6.0, 5.0, 10.0, 3.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.984375, -7.75115966796875, -7.5179443359375, -7.28472900390625, -7.051513671875, -6.81829833984375, -6.5850830078125, -6.35186767578125, -6.11865234375, -5.88543701171875, -5.6522216796875, -5.41900634765625, -5.185791015625, -4.95257568359375, -4.7193603515625, -4.48614501953125, -4.2529296875, -4.01971435546875, -3.7864990234375, -3.55328369140625, -3.320068359375, -3.08685302734375, -2.8536376953125, -2.62042236328125, -2.38720703125, -2.15399169921875, -1.9207763671875, -1.68756103515625, -1.454345703125, -1.22113037109375, -0.9879150390625, -0.75469970703125, -0.521484375, -0.28826904296875, -0.0550537109375, 0.17816162109375, 0.411376953125, 0.64459228515625, 0.8778076171875, 1.11102294921875, 1.34423828125, 1.57745361328125, 1.8106689453125, 2.04388427734375, 2.277099609375, 2.51031494140625, 2.7435302734375, 2.97674560546875, 3.2099609375, 3.44317626953125, 3.6763916015625, 3.90960693359375, 4.142822265625, 4.37603759765625, 4.6092529296875, 4.84246826171875, 5.07568359375, 5.30889892578125, 5.5421142578125, 5.77532958984375, 6.008544921875, 6.24176025390625, 6.4749755859375, 6.70819091796875, 6.94140625]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 2.0, 9.0, 9.0, 9.0, 13.0, 17.0, 29.0, 34.0, 65.0, 69.0, 97.0, 123.0, 159.0, 210.0, 340.0, 711.0, 3388.0, 88274.0, 3755727.0, 335998.0, 6798.0, 873.0, 395.0, 245.0, 164.0, 109.0, 115.0, 69.0, 62.0, 49.0, 31.0, 28.0, 11.0, 9.0, 4.0, 7.0, 5.0, 2.0, 5.0, 2.0, 4.0, 3.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.15625, -23.34130859375, -22.5263671875, -21.71142578125, -20.896484375, -20.08154296875, -19.2666015625, -18.45166015625, -17.63671875, -16.82177734375, -16.0068359375, -15.19189453125, -14.376953125, -13.56201171875, -12.7470703125, -11.93212890625, -11.1171875, -10.30224609375, -9.4873046875, -8.67236328125, -7.857421875, -7.04248046875, -6.2275390625, -5.41259765625, -4.59765625, -3.78271484375, -2.9677734375, -2.15283203125, -1.337890625, -0.52294921875, 0.2919921875, 1.10693359375, 1.921875, 2.73681640625, 3.5517578125, 4.36669921875, 5.181640625, 5.99658203125, 6.8115234375, 7.62646484375, 8.44140625, 9.25634765625, 10.0712890625, 10.88623046875, 11.701171875, 12.51611328125, 13.3310546875, 14.14599609375, 14.9609375, 15.77587890625, 16.5908203125, 17.40576171875, 18.220703125, 19.03564453125, 19.8505859375, 20.66552734375, 21.48046875, 22.29541015625, 23.1103515625, 23.92529296875, 24.740234375, 25.55517578125, 26.3701171875, 27.18505859375, 28.0]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 10.0, 24.0, 55.0, 123.0, 200.0, 215.0, 199.0, 125.0, 53.0, 8.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-118.74240112304688, -116.43351745605469, -114.1246337890625, -111.81575012207031, -109.50686645507812, -107.19798278808594, -104.88909912109375, -102.5802230834961, -100.2713394165039, -97.96245574951172, -95.65357208251953, -93.34468841552734, -91.03580474853516, -88.7269287109375, -86.41804504394531, -84.10916137695312, -81.80027770996094, -79.49139404296875, -77.18251037597656, -74.87362670898438, -72.56474304199219, -70.255859375, -67.94697570800781, -65.63809967041016, -63.32920837402344, -61.02032470703125, -58.71144104003906, -56.402557373046875, -54.09367752075195, -51.784793853759766, -49.47591018676758, -47.167030334472656, -44.85814666748047, -42.54926300048828, -40.240379333496094, -37.931495666503906, -35.622615814208984, -33.3137321472168, -31.00484848022461, -28.695966720581055, -26.387081146240234, -24.078197479248047, -21.769315719604492, -19.460432052612305, -17.15155029296875, -14.842666625976562, -12.533782958984375, -10.22490119934082, -7.916017532348633, -5.607134819030762, -3.2982516288757324, -0.9893684387207031, 1.319514274597168, 3.628396987915039, 5.937280654907227, 8.246162414550781, 10.555046081542969, 12.86392879486084, 15.172811508178711, 17.4816951751709, 19.790576934814453, 22.09946060180664, 24.408344268798828, 26.717226028442383, 29.02610969543457]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 4.0, 5.0, 6.0, 5.0, 10.0, 8.0, 9.0, 11.0, 13.0, 20.0, 14.0, 18.0, 26.0, 28.0, 34.0, 35.0, 29.0, 48.0, 30.0, 38.0, 36.0, 43.0, 40.0, 50.0, 46.0, 36.0, 33.0, 32.0, 29.0, 25.0, 30.0, 31.0, 18.0, 34.0, 23.0, 19.0, 13.0, 13.0, 14.0, 11.0, 11.0, 8.0, 11.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-27.83289909362793, -26.98099136352539, -26.12908172607422, -25.27717399597168, -24.42526626586914, -23.57335662841797, -22.72144889831543, -21.86954116821289, -21.01763153076172, -20.16572380065918, -19.313814163208008, -18.46190643310547, -17.609996795654297, -16.758089065551758, -15.906181335449219, -15.054272651672363, -14.202363967895508, -13.350455284118652, -12.498546600341797, -11.646638870239258, -10.794730186462402, -9.942821502685547, -9.090913772583008, -8.239005088806152, -7.387096405029297, -6.535187721252441, -5.683279514312744, -4.831371307373047, -3.9794626235961914, -3.127553939819336, -2.2756457328796387, -1.4237375259399414, -0.5718307495117188, 0.2800776958465576, 1.131986141204834, 1.9838945865631104, 2.8358030319213867, 3.687711715698242, 4.5396199226379395, 5.391528129577637, 6.243436813354492, 7.095345497131348, 7.947253704071045, 8.799161911010742, 9.651070594787598, 10.502979278564453, 11.354887008666992, 12.206795692443848, 13.058704376220703, 13.910613059997559, 14.762521743774414, 15.614429473876953, 16.466339111328125, 17.318246841430664, 18.170154571533203, 19.022064208984375, 19.873971939086914, 20.725879669189453, 21.577789306640625, 22.429697036743164, 23.281604766845703, 24.133514404296875, 24.985422134399414, 25.837329864501953, 26.689239501953125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 5.0, 6.0, 9.0, 7.0, 13.0, 16.0, 15.0, 18.0, 17.0, 27.0, 21.0, 21.0, 35.0, 23.0, 34.0, 40.0, 46.0, 40.0, 50.0, 35.0, 38.0, 39.0, 43.0, 43.0, 40.0, 26.0, 30.0, 35.0, 24.0, 34.0, 19.0, 16.0, 16.0, 18.0, 25.0, 14.0, 17.0, 8.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.859375, -3.7325439453125, -3.605712890625, -3.4788818359375, -3.35205078125, -3.2252197265625, -3.098388671875, -2.9715576171875, -2.8447265625, -2.7178955078125, -2.591064453125, -2.4642333984375, -2.33740234375, -2.2105712890625, -2.083740234375, -1.9569091796875, -1.830078125, -1.7032470703125, -1.576416015625, -1.4495849609375, -1.32275390625, -1.1959228515625, -1.069091796875, -0.9422607421875, -0.8154296875, -0.6885986328125, -0.561767578125, -0.4349365234375, -0.30810546875, -0.1812744140625, -0.054443359375, 0.0723876953125, 0.19921875, 0.3260498046875, 0.452880859375, 0.5797119140625, 0.70654296875, 0.8333740234375, 0.960205078125, 1.0870361328125, 1.2138671875, 1.3406982421875, 1.467529296875, 1.5943603515625, 1.72119140625, 1.8480224609375, 1.974853515625, 2.1016845703125, 2.228515625, 2.3553466796875, 2.482177734375, 2.6090087890625, 2.73583984375, 2.8626708984375, 2.989501953125, 3.1163330078125, 3.2431640625, 3.3699951171875, 3.496826171875, 3.6236572265625, 3.75048828125, 3.8773193359375, 4.004150390625, 4.1309814453125, 4.2578125]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 6.0, 2.0, 7.0, 14.0, 28.0, 30.0, 33.0, 58.0, 75.0, 127.0, 185.0, 297.0, 411.0, 595.0, 916.0, 1304.0, 2066.0, 3118.0, 4636.0, 7010.0, 10774.0, 16829.0, 26497.0, 43568.0, 73790.0, 128233.0, 211415.0, 206387.0, 124004.0, 71084.0, 41993.0, 25703.0, 16298.0, 10656.0, 6936.0, 4443.0, 2976.0, 2018.0, 1286.0, 929.0, 627.0, 401.0, 264.0, 184.0, 95.0, 86.0, 48.0, 47.0, 28.0, 19.0, 12.0, 8.0, 6.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.47998046875, -0.4649658203125, -0.449951171875, -0.4349365234375, -0.419921875, -0.4049072265625, -0.389892578125, -0.3748779296875, -0.35986328125, -0.3448486328125, -0.329833984375, -0.3148193359375, -0.2998046875, -0.2847900390625, -0.269775390625, -0.2547607421875, -0.23974609375, -0.2247314453125, -0.209716796875, -0.1947021484375, -0.1796875, -0.1646728515625, -0.149658203125, -0.1346435546875, -0.11962890625, -0.1046142578125, -0.089599609375, -0.0745849609375, -0.0595703125, -0.0445556640625, -0.029541015625, -0.0145263671875, 0.00048828125, 0.0155029296875, 0.030517578125, 0.0455322265625, 0.060546875, 0.0755615234375, 0.090576171875, 0.1055908203125, 0.12060546875, 0.1356201171875, 0.150634765625, 0.1656494140625, 0.1806640625, 0.1956787109375, 0.210693359375, 0.2257080078125, 0.24072265625, 0.2557373046875, 0.270751953125, 0.2857666015625, 0.30078125, 0.3157958984375, 0.330810546875, 0.3458251953125, 0.36083984375, 0.3758544921875, 0.390869140625, 0.4058837890625, 0.4208984375, 0.4359130859375, 0.450927734375, 0.4659423828125, 0.48095703125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 3.0, 11.0, 8.0, 9.0, 14.0, 12.0, 17.0, 20.0, 23.0, 25.0, 33.0, 38.0, 27.0, 35.0, 39.0, 37.0, 47.0, 49.0, 39.0, 1066.0, 38.0, 47.0, 40.0, 44.0, 35.0, 41.0, 34.0, 29.0, 30.0, 20.0, 24.0, 15.0, 14.0, 10.0, 13.0, 7.0, 7.0, 11.0, 7.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.23046875, -2.141876220703125, -2.05328369140625, -1.964691162109375, -1.8760986328125, -1.787506103515625, -1.69891357421875, -1.610321044921875, -1.521728515625, -1.433135986328125, -1.34454345703125, -1.255950927734375, -1.1673583984375, -1.078765869140625, -0.99017333984375, -0.901580810546875, -0.81298828125, -0.724395751953125, -0.63580322265625, -0.547210693359375, -0.4586181640625, -0.370025634765625, -0.28143310546875, -0.192840576171875, -0.104248046875, -0.015655517578125, 0.07293701171875, 0.161529541015625, 0.2501220703125, 0.338714599609375, 0.42730712890625, 0.515899658203125, 0.6044921875, 0.693084716796875, 0.78167724609375, 0.870269775390625, 0.9588623046875, 1.047454833984375, 1.13604736328125, 1.224639892578125, 1.313232421875, 1.401824951171875, 1.49041748046875, 1.579010009765625, 1.6676025390625, 1.756195068359375, 1.84478759765625, 1.933380126953125, 2.02197265625, 2.110565185546875, 2.19915771484375, 2.287750244140625, 2.3763427734375, 2.464935302734375, 2.55352783203125, 2.642120361328125, 2.730712890625, 2.819305419921875, 2.90789794921875, 2.996490478515625, 3.0850830078125, 3.173675537109375, 3.26226806640625, 3.350860595703125, 3.439453125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 4.0, 3.0, 20.0, 14.0, 26.0, 31.0, 61.0, 78.0, 110.0, 182.0, 285.0, 399.0, 574.0, 830.0, 1222.0, 1857.0, 2726.0, 4005.0, 5845.0, 8970.0, 13531.0, 20675.0, 32202.0, 51860.0, 84627.0, 138456.0, 1240189.0, 182241.0, 114380.0, 69860.0, 42790.0, 27018.0, 17610.0, 11325.0, 7518.0, 5098.0, 3394.0, 2321.0, 1517.0, 1027.0, 730.0, 484.0, 343.0, 236.0, 163.0, 90.0, 59.0, 48.0, 33.0, 37.0, 16.0, 8.0, 6.0, 4.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.35546875, -0.3446311950683594, -0.33379364013671875, -0.3229560852050781, -0.3121185302734375, -0.3012809753417969, -0.29044342041015625, -0.2796058654785156, -0.268768310546875, -0.2579307556152344, -0.24709320068359375, -0.23625564575195312, -0.2254180908203125, -0.21458053588867188, -0.20374298095703125, -0.19290542602539062, -0.18206787109375, -0.17123031616210938, -0.16039276123046875, -0.14955520629882812, -0.1387176513671875, -0.12788009643554688, -0.11704254150390625, -0.10620498657226562, -0.095367431640625, -0.08452987670898438, -0.07369232177734375, -0.06285476684570312, -0.0520172119140625, -0.041179656982421875, -0.03034210205078125, -0.019504547119140625, -0.0086669921875, 0.002170562744140625, 0.01300811767578125, 0.023845672607421875, 0.0346832275390625, 0.045520782470703125, 0.05635833740234375, 0.06719589233398438, 0.078033447265625, 0.08887100219726562, 0.09970855712890625, 0.11054611206054688, 0.1213836669921875, 0.13222122192382812, 0.14305877685546875, 0.15389633178710938, 0.16473388671875, 0.17557144165039062, 0.18640899658203125, 0.19724655151367188, 0.2080841064453125, 0.21892166137695312, 0.22975921630859375, 0.24059677124023438, 0.251434326171875, 0.2622718811035156, 0.27310943603515625, 0.2839469909667969, 0.2947845458984375, 0.3056221008300781, 0.31645965576171875, 0.3272972106933594, 0.338134765625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 0.0, 3.0, 2.0, 4.0, 1.0, 5.0, 4.0, 5.0, 11.0, 7.0, 11.0, 19.0, 19.0, 17.0, 18.0, 37.0, 36.0, 39.0, 55.0, 64.0, 74.0, 81.0, 83.0, 74.0, 60.0, 59.0, 42.0, 38.0, 26.0, 15.0, 19.0, 17.0, 7.0, 13.0, 7.0, 4.0, 3.0, 7.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0025310516357421875, -0.0024459660053253174, -0.0023608803749084473, -0.002275794744491577, -0.002190709114074707, -0.002105623483657837, -0.002020537853240967, -0.0019354522228240967, -0.0018503665924072266, -0.0017652809619903564, -0.0016801953315734863, -0.0015951097011566162, -0.001510024070739746, -0.001424938440322876, -0.0013398528099060059, -0.0012547671794891357, -0.0011696815490722656, -0.0010845959186553955, -0.0009995102882385254, -0.0009144246578216553, -0.0008293390274047852, -0.000744253396987915, -0.0006591677665710449, -0.0005740821361541748, -0.0004889965057373047, -0.00040391087532043457, -0.00031882524490356445, -0.00023373961448669434, -0.00014865398406982422, -6.35683536529541e-05, 2.1517276763916016e-05, 0.00010660290718078613, 0.00019168853759765625, 0.00027677416801452637, 0.0003618597984313965, 0.0004469454288482666, 0.0005320310592651367, 0.0006171166896820068, 0.000702202320098877, 0.0007872879505157471, 0.0008723735809326172, 0.0009574592113494873, 0.0010425448417663574, 0.0011276304721832275, 0.0012127161026000977, 0.0012978017330169678, 0.0013828873634338379, 0.001467972993850708, 0.0015530586242675781, 0.0016381442546844482, 0.0017232298851013184, 0.0018083155155181885, 0.0018934011459350586, 0.0019784867763519287, 0.002063572406768799, 0.002148658037185669, 0.002233743667602539, 0.002318829298019409, 0.0024039149284362793, 0.0024890005588531494, 0.0025740861892700195, 0.0026591718196868896, 0.0027442574501037598, 0.00282934308052063, 0.0029144287109375]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 5.0, 4.0, 8.0, 8.0, 6.0, 7.0, 9.0, 16.0, 22.0, 24.0, 30.0, 32.0, 58.0, 88.0, 136.0, 224.0, 577.0, 5124.0, 962562.0, 77626.0, 1087.0, 323.0, 180.0, 104.0, 67.0, 50.0, 30.0, 27.0, 25.0, 18.0, 18.0, 11.0, 11.0, 7.0, 6.0, 5.0, 2.0, 4.0, 3.0, 1.0, 3.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.0611572265625, -0.059345245361328125, -0.05753326416015625, -0.055721282958984375, -0.0539093017578125, -0.052097320556640625, -0.05028533935546875, -0.048473358154296875, -0.046661376953125, -0.044849395751953125, -0.04303741455078125, -0.041225433349609375, -0.0394134521484375, -0.037601470947265625, -0.03578948974609375, -0.033977508544921875, -0.03216552734375, -0.030353546142578125, -0.02854156494140625, -0.026729583740234375, -0.0249176025390625, -0.023105621337890625, -0.02129364013671875, -0.019481658935546875, -0.017669677734375, -0.015857696533203125, -0.01404571533203125, -0.012233734130859375, -0.0104217529296875, -0.008609771728515625, -0.00679779052734375, -0.004985809326171875, -0.003173828125, -0.001361846923828125, 0.00045013427734375, 0.002262115478515625, 0.0040740966796875, 0.005886077880859375, 0.00769805908203125, 0.009510040283203125, 0.011322021484375, 0.013134002685546875, 0.01494598388671875, 0.016757965087890625, 0.0185699462890625, 0.020381927490234375, 0.02219390869140625, 0.024005889892578125, 0.02581787109375, 0.027629852294921875, 0.02944183349609375, 0.031253814697265625, 0.0330657958984375, 0.034877777099609375, 0.03668975830078125, 0.038501739501953125, 0.040313720703125, 0.042125701904296875, 0.04393768310546875, 0.045749664306640625, 0.0475616455078125, 0.049373626708984375, 0.05118560791015625, 0.052997589111328125, 0.0548095703125]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 149.0, 645.0, 203.0, 9.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.021819373592734337, -0.021404584869742393, -0.0209897980093956, -0.020575009286403656, -0.020160220563411713, -0.01974543370306492, -0.019330644980072975, -0.018915856257081032, -0.018501069396734238, -0.018086280673742294, -0.0176714938133955, -0.017256705090403557, -0.016841916367411613, -0.01642712950706482, -0.016012340784072876, -0.015597552061080933, -0.01518276333808899, -0.01476797554641962, -0.014353186823427677, -0.013938399031758308, -0.01352361124008894, -0.013108822517096996, -0.012694034725427628, -0.012279246002435684, -0.01186445914208889, -0.011449671350419521, -0.011034882627427578, -0.01062009483575821, -0.01020530704408884, -0.009790518321096897, -0.009375730529427528, -0.008960941806435585, -0.008546153083443642, -0.008131365291774273, -0.007716577034443617, -0.007301788777112961, -0.006887000519782305, -0.006472212262451649, -0.00605742447078228, -0.005642636213451624, -0.0052278488874435425, -0.004813060630112886, -0.004398272838443518, -0.003983484581112862, -0.0035686963237822056, -0.003153908299282193, -0.002739120274782181, -0.0023243320174515247, -0.0019095437601208687, -0.0014947556192055345, -0.0010799674782902002, -0.0006651794537901878, -0.0002503913128748536, 0.00016439682804048061, 0.000579184852540493, 0.000993973109871149, 0.0014087611343711615, 0.0018235492752864957, 0.00223833741620183, 0.0026531254407018423, 0.0030679134652018547, 0.0034827017225325108, 0.003897489747032523, 0.0043122777715325356, 0.004727066028863192]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 2.0, 3.0, 4.0, 2.0, 7.0, 11.0, 13.0, 9.0, 7.0, 14.0, 13.0, 19.0, 18.0, 18.0, 23.0, 20.0, 36.0, 34.0, 36.0, 39.0, 26.0, 38.0, 35.0, 46.0, 48.0, 37.0, 37.0, 42.0, 32.0, 24.0, 33.0, 21.0, 27.0, 34.0, 31.0, 21.0, 24.0, 23.0, 15.0, 12.0, 15.0, 8.0, 5.0, 10.0, 8.0, 5.0, 4.0, 4.0, 6.0, 1.0, 7.0, 1.0, 0.0, 4.0, 1.0], "bins": [-0.0013173222541809082, -0.0012782933190464973, -0.0012392643839120865, -0.0012002354487776756, -0.0011612065136432648, -0.001122177578508854, -0.001083148643374443, -0.0010441197082400322, -0.0010050907731056213, -0.0009660618379712105, -0.0009270329028367996, -0.0008880039677023888, -0.0008489750325679779, -0.000809946097433567, -0.0007709171622991562, -0.0007318882271647453, -0.0006928592920303345, -0.0006538303568959236, -0.0006148014217615128, -0.0005757724866271019, -0.000536743551492691, -0.0004977146163582802, -0.0004586856812238693, -0.00041965674608945847, -0.0003806278109550476, -0.00034159887582063675, -0.0003025699406862259, -0.00026354100555181503, -0.00022451207041740417, -0.00018548313528299332, -0.00014645420014858246, -0.0001074252650141716, -6.839632987976074e-05, -2.9367394745349884e-05, 9.661540389060974e-06, 4.869047552347183e-05, 8.771941065788269e-05, 0.00012674834579229355, 0.0001657772809267044, 0.00020480621606111526, 0.00024383515119552612, 0.000282864086329937, 0.00032189302146434784, 0.0003609219565987587, 0.00039995089173316956, 0.0004389798268675804, 0.00047800876200199127, 0.0005170376971364021, 0.000556066632270813, 0.0005950955674052238, 0.0006341245025396347, 0.0006731534376740456, 0.0007121823728084564, 0.0007512113079428673, 0.0007902402430772781, 0.000829269178211689, 0.0008682981133460999, 0.0009073270484805107, 0.0009463559836149216, 0.0009853849187493324, 0.0010244138538837433, 0.0010634427890181541, 0.001102471724152565, 0.0011415006592869759, 0.0011805295944213867]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 5.0, 6.0, 9.0, 7.0, 13.0, 16.0, 15.0, 18.0, 17.0, 27.0, 21.0, 21.0, 35.0, 23.0, 34.0, 40.0, 46.0, 40.0, 50.0, 35.0, 38.0, 39.0, 43.0, 43.0, 40.0, 26.0, 30.0, 35.0, 24.0, 34.0, 19.0, 16.0, 16.0, 18.0, 25.0, 14.0, 17.0, 8.0, 6.0, 6.0, 2.0, 3.0, 3.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.859375, -3.7325439453125, -3.605712890625, -3.4788818359375, -3.35205078125, -3.2252197265625, -3.098388671875, -2.9715576171875, -2.8447265625, -2.7178955078125, -2.591064453125, -2.4642333984375, -2.33740234375, -2.2105712890625, -2.083740234375, -1.9569091796875, -1.830078125, -1.7032470703125, -1.576416015625, -1.4495849609375, -1.32275390625, -1.1959228515625, -1.069091796875, -0.9422607421875, -0.8154296875, -0.6885986328125, -0.561767578125, -0.4349365234375, -0.30810546875, -0.1812744140625, -0.054443359375, 0.0723876953125, 0.19921875, 0.3260498046875, 0.452880859375, 0.5797119140625, 0.70654296875, 0.8333740234375, 0.960205078125, 1.0870361328125, 1.2138671875, 1.3406982421875, 1.467529296875, 1.5943603515625, 1.72119140625, 1.8480224609375, 1.974853515625, 2.1016845703125, 2.228515625, 2.3553466796875, 2.482177734375, 2.6090087890625, 2.73583984375, 2.8626708984375, 2.989501953125, 3.1163330078125, 3.2431640625, 3.3699951171875, 3.496826171875, 3.6236572265625, 3.75048828125, 3.8773193359375, 4.004150390625, 4.1309814453125, 4.2578125]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 6.0, 5.0, 13.0, 12.0, 24.0, 27.0, 27.0, 59.0, 62.0, 91.0, 135.0, 193.0, 260.0, 424.0, 643.0, 1060.0, 1638.0, 3087.0, 6173.0, 13703.0, 33423.0, 85353.0, 205300.0, 379916.0, 184744.0, 76484.0, 30521.0, 12225.0, 5616.0, 2823.0, 1606.0, 933.0, 611.0, 412.0, 257.0, 162.0, 152.0, 97.0, 76.0, 64.0, 29.0, 24.0, 27.0, 10.0, 8.0, 5.0, 9.0, 8.0, 8.0, 3.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-3.73828125, -3.615478515625, -3.49267578125, -3.369873046875, -3.2470703125, -3.124267578125, -3.00146484375, -2.878662109375, -2.755859375, -2.633056640625, -2.51025390625, -2.387451171875, -2.2646484375, -2.141845703125, -2.01904296875, -1.896240234375, -1.7734375, -1.650634765625, -1.52783203125, -1.405029296875, -1.2822265625, -1.159423828125, -1.03662109375, -0.913818359375, -0.791015625, -0.668212890625, -0.54541015625, -0.422607421875, -0.2998046875, -0.177001953125, -0.05419921875, 0.068603515625, 0.19140625, 0.314208984375, 0.43701171875, 0.559814453125, 0.6826171875, 0.805419921875, 0.92822265625, 1.051025390625, 1.173828125, 1.296630859375, 1.41943359375, 1.542236328125, 1.6650390625, 1.787841796875, 1.91064453125, 2.033447265625, 2.15625, 2.279052734375, 2.40185546875, 2.524658203125, 2.6474609375, 2.770263671875, 2.89306640625, 3.015869140625, 3.138671875, 3.261474609375, 3.38427734375, 3.507080078125, 3.6298828125, 3.752685546875, 3.87548828125, 3.998291015625, 4.12109375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 2.0, 5.0, 2.0, 6.0, 7.0, 10.0, 2.0, 9.0, 20.0, 23.0, 22.0, 19.0, 23.0, 24.0, 40.0, 39.0, 37.0, 40.0, 48.0, 58.0, 96.0, 266.0, 1520.0, 241.0, 93.0, 54.0, 39.0, 41.0, 53.0, 34.0, 31.0, 24.0, 24.0, 16.0, 15.0, 16.0, 13.0, 8.0, 6.0, 8.0, 8.0, 7.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-12.4453125, -12.00732421875, -11.5693359375, -11.13134765625, -10.693359375, -10.25537109375, -9.8173828125, -9.37939453125, -8.94140625, -8.50341796875, -8.0654296875, -7.62744140625, -7.189453125, -6.75146484375, -6.3134765625, -5.87548828125, -5.4375, -4.99951171875, -4.5615234375, -4.12353515625, -3.685546875, -3.24755859375, -2.8095703125, -2.37158203125, -1.93359375, -1.49560546875, -1.0576171875, -0.61962890625, -0.181640625, 0.25634765625, 0.6943359375, 1.13232421875, 1.5703125, 2.00830078125, 2.4462890625, 2.88427734375, 3.322265625, 3.76025390625, 4.1982421875, 4.63623046875, 5.07421875, 5.51220703125, 5.9501953125, 6.38818359375, 6.826171875, 7.26416015625, 7.7021484375, 8.14013671875, 8.578125, 9.01611328125, 9.4541015625, 9.89208984375, 10.330078125, 10.76806640625, 11.2060546875, 11.64404296875, 12.08203125, 12.52001953125, 12.9580078125, 13.39599609375, 13.833984375, 14.27197265625, 14.7099609375, 15.14794921875, 15.5859375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 2.0, 1.0, 6.0, 4.0, 4.0, 4.0, 12.0, 8.0, 12.0, 20.0, 27.0, 40.0, 39.0, 60.0, 76.0, 110.0, 172.0, 291.0, 599.0, 2128.0, 1116480.0, 2021701.0, 2380.0, 568.0, 326.0, 185.0, 120.0, 79.0, 67.0, 54.0, 31.0, 29.0, 17.0, 13.0, 9.0, 11.0, 8.0, 2.0, 5.0, 3.0, 3.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-49.5, -47.904296875, -46.30859375, -44.712890625, -43.1171875, -41.521484375, -39.92578125, -38.330078125, -36.734375, -35.138671875, -33.54296875, -31.947265625, -30.3515625, -28.755859375, -27.16015625, -25.564453125, -23.96875, -22.373046875, -20.77734375, -19.181640625, -17.5859375, -15.990234375, -14.39453125, -12.798828125, -11.203125, -9.607421875, -8.01171875, -6.416015625, -4.8203125, -3.224609375, -1.62890625, -0.033203125, 1.5625, 3.158203125, 4.75390625, 6.349609375, 7.9453125, 9.541015625, 11.13671875, 12.732421875, 14.328125, 15.923828125, 17.51953125, 19.115234375, 20.7109375, 22.306640625, 23.90234375, 25.498046875, 27.09375, 28.689453125, 30.28515625, 31.880859375, 33.4765625, 35.072265625, 36.66796875, 38.263671875, 39.859375, 41.455078125, 43.05078125, 44.646484375, 46.2421875, 47.837890625, 49.43359375, 51.029296875, 52.625]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 49.0, 280.0, 485.0, 181.0, 18.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-108.87791442871094, -106.79844665527344, -104.7189712524414, -102.6395034790039, -100.5600357055664, -98.48056030273438, -96.40109252929688, -94.32162475585938, -92.24215698242188, -90.16268920898438, -88.08321380615234, -86.00374603271484, -83.92427825927734, -81.84480285644531, -79.76533508300781, -77.68586730957031, -75.60639190673828, -73.52692413330078, -71.44744873046875, -69.36798095703125, -67.28851318359375, -65.20904541015625, -63.12957000732422, -61.05010223388672, -58.97063064575195, -56.89115905761719, -54.81169128417969, -52.73221969604492, -50.652748107910156, -48.573280334472656, -46.49380874633789, -44.414337158203125, -42.334869384765625, -40.25539779663086, -38.17593002319336, -36.096458435058594, -34.016990661621094, -31.937519073486328, -29.858047485351562, -27.77857780456543, -25.69911003112793, -23.619640350341797, -21.54016876220703, -19.4606990814209, -17.381229400634766, -15.301759719848633, -13.222289085388184, -11.142818450927734, -9.063348770141602, -6.9838786125183105, -4.9044084548950195, -2.8249382972717285, -0.7454681396484375, 1.3340015411376953, 3.4134721755981445, 5.492942810058594, 7.572412490844727, 9.65188217163086, 11.731352806091309, 13.810823440551758, 15.89029312133789, 17.969762802124023, 20.049232482910156, 22.128704071044922, 24.208173751831055]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 7.0, 8.0, 5.0, 11.0, 8.0, 20.0, 15.0, 21.0, 13.0, 29.0, 34.0, 40.0, 41.0, 47.0, 46.0, 33.0, 51.0, 53.0, 48.0, 47.0, 51.0, 44.0, 52.0, 32.0, 42.0, 31.0, 31.0, 24.0, 29.0, 24.0, 17.0, 11.0, 14.0, 6.0, 6.0, 5.0, 8.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.48274230957031, -32.26897430419922, -31.055206298828125, -29.84143829345703, -28.627670288085938, -27.413902282714844, -26.20013427734375, -24.986366271972656, -23.772598266601562, -22.55883026123047, -21.345062255859375, -20.13129425048828, -18.917526245117188, -17.703758239746094, -16.489990234375, -15.27622127532959, -14.06245231628418, -12.848684310913086, -11.634916305541992, -10.421148300170898, -9.207380294799805, -7.993611812591553, -6.779843330383301, -5.566075325012207, -4.352307319641113, -3.1385393142700195, -1.9247710704803467, -0.7110028266906738, 0.5027651786804199, 1.7165331840515137, 2.9303016662597656, 4.144069671630859, 5.357837677001953, 6.571605682373047, 7.785373687744141, 8.999141693115234, 10.212909698486328, 11.426677703857422, 12.640446662902832, 13.854214668273926, 15.06798267364502, 16.28175163269043, 17.495519638061523, 18.709287643432617, 19.92305564880371, 21.136823654174805, 22.3505916595459, 23.564359664916992, 24.778127670288086, 25.99189567565918, 27.205663681030273, 28.419431686401367, 29.63319969177246, 30.846967697143555, 32.06073760986328, 33.274505615234375, 34.48827362060547, 35.70204162597656, 36.915809631347656, 38.12957763671875, 39.343345642089844, 40.55711364746094, 41.77088165283203, 42.984649658203125, 44.19841766357422]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 2.0, 3.0, 6.0, 4.0, 2.0, 5.0, 9.0, 10.0, 12.0, 11.0, 14.0, 16.0, 30.0, 15.0, 23.0, 25.0, 29.0, 32.0, 39.0, 38.0, 36.0, 42.0, 44.0, 41.0, 40.0, 44.0, 43.0, 40.0, 28.0, 29.0, 46.0, 34.0, 28.0, 24.0, 24.0, 24.0, 21.0, 18.0, 20.0, 8.0, 9.0, 3.0, 9.0, 9.0, 6.0, 6.0, 2.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-4.51171875, -4.3729248046875, -4.234130859375, -4.0953369140625, -3.95654296875, -3.8177490234375, -3.678955078125, -3.5401611328125, -3.4013671875, -3.2625732421875, -3.123779296875, -2.9849853515625, -2.84619140625, -2.7073974609375, -2.568603515625, -2.4298095703125, -2.291015625, -2.1522216796875, -2.013427734375, -1.8746337890625, -1.73583984375, -1.5970458984375, -1.458251953125, -1.3194580078125, -1.1806640625, -1.0418701171875, -0.903076171875, -0.7642822265625, -0.62548828125, -0.4866943359375, -0.347900390625, -0.2091064453125, -0.0703125, 0.0684814453125, 0.207275390625, 0.3460693359375, 0.48486328125, 0.6236572265625, 0.762451171875, 0.9012451171875, 1.0400390625, 1.1788330078125, 1.317626953125, 1.4564208984375, 1.59521484375, 1.7340087890625, 1.872802734375, 2.0115966796875, 2.150390625, 2.2891845703125, 2.427978515625, 2.5667724609375, 2.70556640625, 2.8443603515625, 2.983154296875, 3.1219482421875, 3.2607421875, 3.3995361328125, 3.538330078125, 3.6771240234375, 3.81591796875, 3.9547119140625, 4.093505859375, 4.2322998046875, 4.37109375]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 7.0, 3.0, 7.0, 4.0, 8.0, 6.0, 11.0, 11.0, 16.0, 16.0, 21.0, 21.0, 26.0, 30.0, 29.0, 53.0, 46.0, 57.0, 62.0, 93.0, 183.0, 333.0, 824.0, 2447.0, 9948.0, 78072.0, 875148.0, 2438360.0, 712968.0, 62982.0, 8556.0, 2280.0, 710.0, 300.0, 145.0, 82.0, 75.0, 47.0, 48.0, 42.0, 35.0, 27.0, 28.0, 27.0, 20.0, 13.0, 15.0, 8.0, 16.0, 6.0, 7.0, 6.0, 1.0, 3.0, 4.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.6796875, -8.3946533203125, -8.109619140625, -7.8245849609375, -7.53955078125, -7.2545166015625, -6.969482421875, -6.6844482421875, -6.3994140625, -6.1143798828125, -5.829345703125, -5.5443115234375, -5.25927734375, -4.9742431640625, -4.689208984375, -4.4041748046875, -4.119140625, -3.8341064453125, -3.549072265625, -3.2640380859375, -2.97900390625, -2.6939697265625, -2.408935546875, -2.1239013671875, -1.8388671875, -1.5538330078125, -1.268798828125, -0.9837646484375, -0.69873046875, -0.4136962890625, -0.128662109375, 0.1563720703125, 0.44140625, 0.7264404296875, 1.011474609375, 1.2965087890625, 1.58154296875, 1.8665771484375, 2.151611328125, 2.4366455078125, 2.7216796875, 3.0067138671875, 3.291748046875, 3.5767822265625, 3.86181640625, 4.1468505859375, 4.431884765625, 4.7169189453125, 5.001953125, 5.2869873046875, 5.572021484375, 5.8570556640625, 6.14208984375, 6.4271240234375, 6.712158203125, 6.9971923828125, 7.2822265625, 7.5672607421875, 7.852294921875, 8.1373291015625, 8.42236328125, 8.7073974609375, 8.992431640625, 9.2774658203125, 9.5625]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 6.0, 5.0, 6.0, 10.0, 11.0, 17.0, 24.0, 25.0, 27.0, 30.0, 62.0, 53.0, 68.0, 104.0, 127.0, 173.0, 204.0, 272.0, 385.0, 388.0, 399.0, 354.0, 296.0, 238.0, 191.0, 148.0, 104.0, 76.0, 55.0, 53.0, 44.0, 21.0, 25.0, 19.0, 11.0, 9.0, 9.0, 3.0, 8.0, 3.0, 7.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.2421875, -6.0198974609375, -5.797607421875, -5.5753173828125, -5.35302734375, -5.1307373046875, -4.908447265625, -4.6861572265625, -4.4638671875, -4.2415771484375, -4.019287109375, -3.7969970703125, -3.57470703125, -3.3524169921875, -3.130126953125, -2.9078369140625, -2.685546875, -2.4632568359375, -2.240966796875, -2.0186767578125, -1.79638671875, -1.5740966796875, -1.351806640625, -1.1295166015625, -0.9072265625, -0.6849365234375, -0.462646484375, -0.2403564453125, -0.01806640625, 0.2042236328125, 0.426513671875, 0.6488037109375, 0.87109375, 1.0933837890625, 1.315673828125, 1.5379638671875, 1.76025390625, 1.9825439453125, 2.204833984375, 2.4271240234375, 2.6494140625, 2.8717041015625, 3.093994140625, 3.3162841796875, 3.53857421875, 3.7608642578125, 3.983154296875, 4.2054443359375, 4.427734375, 4.6500244140625, 4.872314453125, 5.0946044921875, 5.31689453125, 5.5391845703125, 5.761474609375, 5.9837646484375, 6.2060546875, 6.4283447265625, 6.650634765625, 6.8729248046875, 7.09521484375, 7.3175048828125, 7.539794921875, 7.7620849609375, 7.984375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 4.0, 1.0, 5.0, 6.0, 5.0, 7.0, 9.0, 13.0, 18.0, 21.0, 30.0, 26.0, 63.0, 61.0, 61.0, 103.0, 136.0, 224.0, 286.0, 407.0, 1374.0, 54905.0, 3983251.0, 149564.0, 2093.0, 449.0, 290.0, 242.0, 141.0, 119.0, 78.0, 62.0, 62.0, 32.0, 24.0, 23.0, 27.0, 17.0, 8.0, 12.0, 10.0, 6.0, 4.0, 4.0, 0.0, 2.0, 1.0, 3.0, 1.0, 2.0], "bins": [-37.4375, -36.414306640625, -35.39111328125, -34.367919921875, -33.3447265625, -32.321533203125, -31.29833984375, -30.275146484375, -29.251953125, -28.228759765625, -27.20556640625, -26.182373046875, -25.1591796875, -24.135986328125, -23.11279296875, -22.089599609375, -21.06640625, -20.043212890625, -19.02001953125, -17.996826171875, -16.9736328125, -15.950439453125, -14.92724609375, -13.904052734375, -12.880859375, -11.857666015625, -10.83447265625, -9.811279296875, -8.7880859375, -7.764892578125, -6.74169921875, -5.718505859375, -4.6953125, -3.672119140625, -2.64892578125, -1.625732421875, -0.6025390625, 0.420654296875, 1.44384765625, 2.467041015625, 3.490234375, 4.513427734375, 5.53662109375, 6.559814453125, 7.5830078125, 8.606201171875, 9.62939453125, 10.652587890625, 11.67578125, 12.698974609375, 13.72216796875, 14.745361328125, 15.7685546875, 16.791748046875, 17.81494140625, 18.838134765625, 19.861328125, 20.884521484375, 21.90771484375, 22.930908203125, 23.9541015625, 24.977294921875, 26.00048828125, 27.023681640625, 28.046875]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 9.0, 65.0, 304.0, 407.0, 196.0, 24.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-173.0847930908203, -169.08375549316406, -165.08270263671875, -161.0816650390625, -157.08062744140625, -153.07957458496094, -149.0785369873047, -145.07748413085938, -141.07644653320312, -137.07540893554688, -133.07435607910156, -129.0733184814453, -125.07227325439453, -121.07122802734375, -117.0701904296875, -113.06914520263672, -109.06809997558594, -105.06705474853516, -101.06600952148438, -97.06497192382812, -93.06392669677734, -89.06288146972656, -85.06184387207031, -81.06079864501953, -77.05975341796875, -73.05870819091797, -69.05766296386719, -65.05662536621094, -61.055580139160156, -57.054534912109375, -53.05349349975586, -49.052452087402344, -45.05140686035156, -41.05036163330078, -37.049320220947266, -33.04827880859375, -29.04723358154297, -25.04619026184082, -21.045146942138672, -17.044103622436523, -13.043060302734375, -9.042016983032227, -5.040973663330078, -1.0399303436279297, 2.9611129760742188, 6.962156295776367, 10.963199615478516, 14.964242935180664, 18.965286254882812, 22.96632957458496, 26.96737289428711, 30.968416213989258, 34.969459533691406, 38.97050476074219, 42.9715461730957, 46.97258758544922, 50.9736328125, 54.97467803955078, 58.9757194519043, 62.97676086425781, 66.9778060913086, 70.97885131835938, 74.97988891601562, 78.9809341430664, 82.98197937011719]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 5.0, 3.0, 5.0, 8.0, 4.0, 16.0, 14.0, 12.0, 20.0, 30.0, 28.0, 39.0, 44.0, 56.0, 42.0, 58.0, 55.0, 44.0, 60.0, 52.0, 51.0, 39.0, 47.0, 33.0, 33.0, 36.0, 31.0, 19.0, 29.0, 24.0, 17.0, 20.0, 10.0, 11.0, 6.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-40.40298080444336, -39.3249397277832, -38.24689483642578, -37.168853759765625, -36.09081268310547, -35.01276779174805, -33.93472671508789, -32.85668182373047, -31.778640747070312, -30.700597763061523, -29.622554779052734, -28.544513702392578, -27.46647071838379, -26.388427734375, -25.310386657714844, -24.232343673706055, -23.154300689697266, -22.076257705688477, -20.998214721679688, -19.92017364501953, -18.842130661010742, -17.764087677001953, -16.686046600341797, -15.608003616333008, -14.529960632324219, -13.45191764831543, -12.373875617980957, -11.295833587646484, -10.217790603637695, -9.139747619628906, -8.061705589294434, -6.983663082122803, -5.905620574951172, -4.827578067779541, -3.74953556060791, -2.6714930534362793, -1.5934505462646484, -0.5154080390930176, 0.5626344680786133, 1.6406769752502441, 2.718719482421875, 3.796761989593506, 4.874804496765137, 5.952847003936768, 7.030889511108398, 8.108932495117188, 9.18697452545166, 10.265016555786133, 11.343059539794922, 12.421102523803711, 13.499144554138184, 14.577186584472656, 15.655229568481445, 16.733272552490234, 17.81131362915039, 18.88935661315918, 19.96739959716797, 21.045442581176758, 22.123485565185547, 23.201526641845703, 24.279569625854492, 25.35761260986328, 26.435653686523438, 27.513696670532227, 28.591739654541016]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 4.0, 8.0, 10.0, 6.0, 12.0, 12.0, 24.0, 20.0, 22.0, 21.0, 30.0, 17.0, 26.0, 24.0, 30.0, 25.0, 35.0, 38.0, 37.0, 44.0, 34.0, 31.0, 30.0, 38.0, 40.0, 43.0, 34.0, 29.0, 29.0, 28.0, 19.0, 22.0, 20.0, 20.0, 22.0, 23.0, 17.0, 7.0, 9.0, 6.0, 8.0, 5.0, 2.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 6.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.5859375, -3.47100830078125, -3.3560791015625, -3.24114990234375, -3.126220703125, -3.01129150390625, -2.8963623046875, -2.78143310546875, -2.66650390625, -2.55157470703125, -2.4366455078125, -2.32171630859375, -2.206787109375, -2.09185791015625, -1.9769287109375, -1.86199951171875, -1.7470703125, -1.63214111328125, -1.5172119140625, -1.40228271484375, -1.287353515625, -1.17242431640625, -1.0574951171875, -0.94256591796875, -0.82763671875, -0.71270751953125, -0.5977783203125, -0.48284912109375, -0.367919921875, -0.25299072265625, -0.1380615234375, -0.02313232421875, 0.091796875, 0.20672607421875, 0.3216552734375, 0.43658447265625, 0.551513671875, 0.66644287109375, 0.7813720703125, 0.89630126953125, 1.01123046875, 1.12615966796875, 1.2410888671875, 1.35601806640625, 1.470947265625, 1.58587646484375, 1.7008056640625, 1.81573486328125, 1.9306640625, 2.04559326171875, 2.1605224609375, 2.27545166015625, 2.390380859375, 2.50531005859375, 2.6202392578125, 2.73516845703125, 2.85009765625, 2.96502685546875, 3.0799560546875, 3.19488525390625, 3.309814453125, 3.42474365234375, 3.5396728515625, 3.65460205078125, 3.76953125]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 5.0, 12.0, 21.0, 17.0, 27.0, 30.0, 47.0, 95.0, 123.0, 202.0, 275.0, 447.0, 690.0, 997.0, 1535.0, 2453.0, 3811.0, 6117.0, 9775.0, 16213.0, 27438.0, 47796.0, 86984.0, 166113.0, 262389.0, 187150.0, 97559.0, 52965.0, 30142.0, 17876.0, 10927.0, 6655.0, 4187.0, 2595.0, 1646.0, 1088.0, 709.0, 485.0, 324.0, 158.0, 156.0, 119.0, 70.0, 44.0, 32.0, 25.0, 14.0, 11.0, 4.0, 5.0, 0.0, 2.0, 2.0, 1.0], "bins": [-0.609375, -0.5917587280273438, -0.5741424560546875, -0.5565261840820312, -0.538909912109375, -0.5212936401367188, -0.5036773681640625, -0.48606109619140625, -0.46844482421875, -0.45082855224609375, -0.4332122802734375, -0.41559600830078125, -0.397979736328125, -0.38036346435546875, -0.3627471923828125, -0.34513092041015625, -0.3275146484375, -0.30989837646484375, -0.2922821044921875, -0.27466583251953125, -0.257049560546875, -0.23943328857421875, -0.2218170166015625, -0.20420074462890625, -0.18658447265625, -0.16896820068359375, -0.1513519287109375, -0.13373565673828125, -0.116119384765625, -0.09850311279296875, -0.0808868408203125, -0.06327056884765625, -0.045654296875, -0.02803802490234375, -0.0104217529296875, 0.00719451904296875, 0.024810791015625, 0.04242706298828125, 0.0600433349609375, 0.07765960693359375, 0.09527587890625, 0.11289215087890625, 0.1305084228515625, 0.14812469482421875, 0.165740966796875, 0.18335723876953125, 0.2009735107421875, 0.21858978271484375, 0.2362060546875, 0.25382232666015625, 0.2714385986328125, 0.28905487060546875, 0.306671142578125, 0.32428741455078125, 0.3419036865234375, 0.35951995849609375, 0.37713623046875, 0.39475250244140625, 0.4123687744140625, 0.42998504638671875, 0.447601318359375, 0.46521759033203125, 0.4828338623046875, 0.5004501342773438, 0.51806640625]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 0.0, 3.0, 2.0, 0.0, 4.0, 3.0, 5.0, 6.0, 8.0, 11.0, 7.0, 12.0, 14.0, 18.0, 25.0, 22.0, 26.0, 42.0, 32.0, 38.0, 43.0, 31.0, 27.0, 42.0, 53.0, 38.0, 1060.0, 35.0, 34.0, 26.0, 35.0, 38.0, 27.0, 30.0, 36.0, 21.0, 28.0, 24.0, 21.0, 15.0, 14.0, 13.0, 10.0, 7.0, 13.0, 5.0, 8.0, 8.0, 4.0, 2.0, 4.0, 5.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.595703125, -2.5174560546875, -2.439208984375, -2.3609619140625, -2.28271484375, -2.2044677734375, -2.126220703125, -2.0479736328125, -1.9697265625, -1.8914794921875, -1.813232421875, -1.7349853515625, -1.65673828125, -1.5784912109375, -1.500244140625, -1.4219970703125, -1.34375, -1.2655029296875, -1.187255859375, -1.1090087890625, -1.03076171875, -0.9525146484375, -0.874267578125, -0.7960205078125, -0.7177734375, -0.6395263671875, -0.561279296875, -0.4830322265625, -0.40478515625, -0.3265380859375, -0.248291015625, -0.1700439453125, -0.091796875, -0.0135498046875, 0.064697265625, 0.1429443359375, 0.22119140625, 0.2994384765625, 0.377685546875, 0.4559326171875, 0.5341796875, 0.6124267578125, 0.690673828125, 0.7689208984375, 0.84716796875, 0.9254150390625, 1.003662109375, 1.0819091796875, 1.16015625, 1.2384033203125, 1.316650390625, 1.3948974609375, 1.47314453125, 1.5513916015625, 1.629638671875, 1.7078857421875, 1.7861328125, 1.8643798828125, 1.942626953125, 2.0208740234375, 2.09912109375, 2.1773681640625, 2.255615234375, 2.3338623046875, 2.412109375]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 6.0, 3.0, 13.0, 10.0, 17.0, 31.0, 34.0, 60.0, 81.0, 109.0, 169.0, 248.0, 330.0, 507.0, 800.0, 1064.0, 1577.0, 2277.0, 3298.0, 4776.0, 6792.0, 10074.0, 14736.0, 21789.0, 33470.0, 53674.0, 88501.0, 145527.0, 1247440.0, 170923.0, 106631.0, 64120.0, 39520.0, 25353.0, 16836.0, 11237.0, 7690.0, 5279.0, 3637.0, 2625.0, 1848.0, 1220.0, 846.0, 603.0, 424.0, 308.0, 185.0, 142.0, 102.0, 63.0, 38.0, 38.0, 22.0, 12.0, 12.0, 10.0, 1.0, 2.0, 3.0, 4.0], "bins": [-0.361083984375, -0.35003662109375, -0.3389892578125, -0.32794189453125, -0.31689453125, -0.30584716796875, -0.2947998046875, -0.28375244140625, -0.272705078125, -0.26165771484375, -0.2506103515625, -0.23956298828125, -0.228515625, -0.21746826171875, -0.2064208984375, -0.19537353515625, -0.184326171875, -0.17327880859375, -0.1622314453125, -0.15118408203125, -0.14013671875, -0.12908935546875, -0.1180419921875, -0.10699462890625, -0.095947265625, -0.08489990234375, -0.0738525390625, -0.06280517578125, -0.0517578125, -0.04071044921875, -0.0296630859375, -0.01861572265625, -0.007568359375, 0.00347900390625, 0.0145263671875, 0.02557373046875, 0.03662109375, 0.04766845703125, 0.0587158203125, 0.06976318359375, 0.080810546875, 0.09185791015625, 0.1029052734375, 0.11395263671875, 0.125, 0.13604736328125, 0.1470947265625, 0.15814208984375, 0.169189453125, 0.18023681640625, 0.1912841796875, 0.20233154296875, 0.21337890625, 0.22442626953125, 0.2354736328125, 0.24652099609375, 0.257568359375, 0.26861572265625, 0.2796630859375, 0.29071044921875, 0.3017578125, 0.31280517578125, 0.3238525390625, 0.33489990234375, 0.345947265625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 3.0, 2.0, 4.0, 5.0, 9.0, 8.0, 8.0, 7.0, 10.0, 12.0, 21.0, 23.0, 33.0, 37.0, 46.0, 56.0, 81.0, 72.0, 104.0, 83.0, 71.0, 58.0, 52.0, 43.0, 23.0, 37.0, 16.0, 12.0, 14.0, 11.0, 9.0, 3.0, 15.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031642913818359375, -0.003070622682571411, -0.0029769539833068848, -0.0028832852840423584, -0.002789616584777832, -0.0026959478855133057, -0.0026022791862487793, -0.002508610486984253, -0.0024149417877197266, -0.0023212730884552, -0.002227604389190674, -0.0021339356899261475, -0.002040266990661621, -0.0019465982913970947, -0.0018529295921325684, -0.001759260892868042, -0.0016655921936035156, -0.0015719234943389893, -0.0014782547950744629, -0.0013845860958099365, -0.0012909173965454102, -0.0011972486972808838, -0.0011035799980163574, -0.001009911298751831, -0.0009162425994873047, -0.0008225739002227783, -0.000728905200958252, -0.0006352365016937256, -0.0005415678024291992, -0.00044789910316467285, -0.0003542304039001465, -0.0002605617046356201, -0.00016689300537109375, -7.322430610656738e-05, 2.0444393157958984e-05, 0.00011411309242248535, 0.00020778179168701172, 0.0003014504909515381, 0.00039511919021606445, 0.0004887878894805908, 0.0005824565887451172, 0.0006761252880096436, 0.0007697939872741699, 0.0008634626865386963, 0.0009571313858032227, 0.001050800085067749, 0.0011444687843322754, 0.0012381374835968018, 0.0013318061828613281, 0.0014254748821258545, 0.0015191435813903809, 0.0016128122806549072, 0.0017064809799194336, 0.00180014967918396, 0.0018938183784484863, 0.0019874870777130127, 0.002081155776977539, 0.0021748244762420654, 0.002268493175506592, 0.002362161874771118, 0.0024558305740356445, 0.002549499273300171, 0.0026431679725646973, 0.0027368366718292236, 0.00283050537109375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 6.0, 8.0, 12.0, 8.0, 9.0, 20.0, 18.0, 22.0, 30.0, 59.0, 82.0, 100.0, 190.0, 428.0, 4552.0, 1027018.0, 14764.0, 546.0, 239.0, 128.0, 84.0, 53.0, 47.0, 34.0, 21.0, 10.0, 17.0, 9.0, 4.0, 14.0, 8.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05767822265625, -0.05550956726074219, -0.053340911865234375, -0.05117225646972656, -0.04900360107421875, -0.04683494567871094, -0.044666290283203125, -0.04249763488769531, -0.0403289794921875, -0.03816032409667969, -0.035991668701171875, -0.03382301330566406, -0.03165435791015625, -0.029485702514648438, -0.027317047119140625, -0.025148391723632812, -0.022979736328125, -0.020811080932617188, -0.018642425537109375, -0.016473770141601562, -0.01430511474609375, -0.012136459350585938, -0.009967803955078125, -0.0077991485595703125, -0.0056304931640625, -0.0034618377685546875, -0.001293182373046875, 0.0008754730224609375, 0.00304412841796875, 0.0052127838134765625, 0.007381439208984375, 0.009550094604492188, 0.01171875, 0.013887405395507812, 0.016056060791015625, 0.018224716186523438, 0.02039337158203125, 0.022562026977539062, 0.024730682373046875, 0.026899337768554688, 0.0290679931640625, 0.031236648559570312, 0.033405303955078125, 0.03557395935058594, 0.03774261474609375, 0.03991127014160156, 0.042079925537109375, 0.04424858093261719, 0.046417236328125, 0.04858589172363281, 0.050754547119140625, 0.05292320251464844, 0.05509185791015625, 0.05726051330566406, 0.059429168701171875, 0.06159782409667969, 0.0637664794921875, 0.06593513488769531, 0.06810379028320312, 0.07027244567871094, 0.07244110107421875, 0.07460975646972656, 0.07677841186523438, 0.07894706726074219, 0.08111572265625]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 121.0, 464.0, 355.0, 59.0, 8.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0025161760859191418, -0.002234133193269372, -0.0019520905334502459, -0.001670047640800476, -0.0013880048645660281, -0.0011059620883315802, -0.0008239191956818104, -0.0005418765358626842, -0.00025983364321291447, 2.2209162125363946e-05, 0.00030425196746364236, 0.0005862948019057512, 0.0008683375781401992, 0.0011503803543746471, 0.001432423247024417, 0.001714465906843543, 0.001996508799493313, 0.0022785516921430826, 0.0025605943519622087, 0.0028426372446119785, 0.0031246799044311047, 0.0034067227970808744, 0.0036887656897306442, 0.00397080834954977, 0.0042528510093688965, 0.004534893669188023, 0.004816936794668436, 0.005098979454487562, 0.005381022114306688, 0.005663065239787102, 0.005945107899606228, 0.006227150559425354, 0.00650919321924448, 0.006791235879063606, 0.00707327900454402, 0.007355321664363146, 0.007637364324182272, 0.007919407449662685, 0.008201450109481812, 0.008483492769300938, 0.008765535429120064, 0.00904757808893919, 0.009329620748758316, 0.009611664339900017, 0.009893706999719143, 0.010175749659538269, 0.010457792319357395, 0.010739834979176521, 0.011021878570318222, 0.011303921230137348, 0.011585963889956474, 0.011868007481098175, 0.012150050140917301, 0.012432092800736427, 0.012714135460555553, 0.01299617812037468, 0.013278220780193806, 0.013560263440012932, 0.013842306099832058, 0.014124348759651184, 0.014406392350792885, 0.014688435010612011, 0.014970477670431137, 0.015252520330250263, 0.01553456299006939]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 5.0, 10.0, 5.0, 7.0, 9.0, 8.0, 12.0, 13.0, 14.0, 20.0, 23.0, 27.0, 26.0, 29.0, 17.0, 29.0, 37.0, 40.0, 42.0, 37.0, 21.0, 43.0, 47.0, 34.0, 37.0, 36.0, 38.0, 41.0, 35.0, 37.0, 39.0, 23.0, 27.0, 17.0, 18.0, 21.0, 11.0, 10.0, 17.0, 10.0, 8.0, 7.0, 3.0, 2.0, 4.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0012183189392089844, -0.001177830621600151, -0.0011373423039913177, -0.0010968539863824844, -0.0010563656687736511, -0.0010158773511648178, -0.0009753890335559845, -0.0009349007159471512, -0.0008944123983383179, -0.0008539240807294846, -0.0008134357631206512, -0.0007729474455118179, -0.0007324591279029846, -0.0006919708102941513, -0.000651482492685318, -0.0006109941750764847, -0.0005705058574676514, -0.000530017539858818, -0.0004895292222499847, -0.00044904090464115143, -0.0004085525870323181, -0.0003680642694234848, -0.0003275759518146515, -0.0002870876342058182, -0.00024659931659698486, -0.00020611099898815155, -0.00016562268137931824, -0.00012513436377048492, -8.464604616165161e-05, -4.41577285528183e-05, -3.6694109439849854e-06, 3.681890666484833e-05, 7.730722427368164e-05, 0.00011779554188251495, 0.00015828385949134827, 0.00019877217710018158, 0.0002392604947090149, 0.0002797488123178482, 0.0003202371299266815, 0.00036072544753551483, 0.00040121376514434814, 0.00044170208275318146, 0.00048219040036201477, 0.0005226787179708481, 0.0005631670355796814, 0.0006036553531885147, 0.000644143670797348, 0.0006846319884061813, 0.0007251203060150146, 0.000765608623623848, 0.0008060969412326813, 0.0008465852588415146, 0.0008870735764503479, 0.0009275618940591812, 0.0009680502116680145, 0.0010085385292768478, 0.0010490268468856812, 0.0010895151644945145, 0.0011300034821033478, 0.001170491799712181, 0.0012109801173210144, 0.0012514684349298477, 0.001291956752538681, 0.0013324450701475143, 0.0013729333877563477]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 3.0, 3.0, 3.0, 3.0, 3.0, 9.0, 4.0, 8.0, 10.0, 6.0, 12.0, 12.0, 24.0, 20.0, 22.0, 21.0, 30.0, 17.0, 26.0, 24.0, 30.0, 25.0, 35.0, 38.0, 37.0, 44.0, 34.0, 31.0, 30.0, 38.0, 40.0, 43.0, 34.0, 29.0, 29.0, 28.0, 19.0, 22.0, 20.0, 20.0, 22.0, 23.0, 17.0, 7.0, 9.0, 6.0, 8.0, 5.0, 2.0, 7.0, 6.0, 3.0, 3.0, 2.0, 2.0, 6.0, 1.0, 0.0, 0.0, 3.0], "bins": [-3.5859375, -3.47100830078125, -3.3560791015625, -3.24114990234375, -3.126220703125, -3.01129150390625, -2.8963623046875, -2.78143310546875, -2.66650390625, -2.55157470703125, -2.4366455078125, -2.32171630859375, -2.206787109375, -2.09185791015625, -1.9769287109375, -1.86199951171875, -1.7470703125, -1.63214111328125, -1.5172119140625, -1.40228271484375, -1.287353515625, -1.17242431640625, -1.0574951171875, -0.94256591796875, -0.82763671875, -0.71270751953125, -0.5977783203125, -0.48284912109375, -0.367919921875, -0.25299072265625, -0.1380615234375, -0.02313232421875, 0.091796875, 0.20672607421875, 0.3216552734375, 0.43658447265625, 0.551513671875, 0.66644287109375, 0.7813720703125, 0.89630126953125, 1.01123046875, 1.12615966796875, 1.2410888671875, 1.35601806640625, 1.470947265625, 1.58587646484375, 1.7008056640625, 1.81573486328125, 1.9306640625, 2.04559326171875, 2.1605224609375, 2.27545166015625, 2.390380859375, 2.50531005859375, 2.6202392578125, 2.73516845703125, 2.85009765625, 2.96502685546875, 3.0799560546875, 3.19488525390625, 3.309814453125, 3.42474365234375, 3.5396728515625, 3.65460205078125, 3.76953125]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 1.0, 7.0, 2.0, 5.0, 5.0, 11.0, 10.0, 8.0, 19.0, 13.0, 24.0, 32.0, 57.0, 79.0, 137.0, 274.0, 527.0, 1069.0, 2215.0, 4457.0, 9153.0, 18654.0, 40412.0, 101259.0, 277613.0, 356813.0, 136970.0, 53041.0, 23496.0, 11221.0, 5566.0, 2714.0, 1284.0, 637.0, 295.0, 182.0, 107.0, 53.0, 26.0, 29.0, 19.0, 9.0, 7.0, 15.0, 4.0, 5.0, 8.0, 3.0, 6.0, 3.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0], "bins": [-3.912109375, -3.790435791015625, -3.66876220703125, -3.547088623046875, -3.4254150390625, -3.303741455078125, -3.18206787109375, -3.060394287109375, -2.938720703125, -2.817047119140625, -2.69537353515625, -2.573699951171875, -2.4520263671875, -2.330352783203125, -2.20867919921875, -2.087005615234375, -1.96533203125, -1.843658447265625, -1.72198486328125, -1.600311279296875, -1.4786376953125, -1.356964111328125, -1.23529052734375, -1.113616943359375, -0.991943359375, -0.870269775390625, -0.74859619140625, -0.626922607421875, -0.5052490234375, -0.383575439453125, -0.26190185546875, -0.140228271484375, -0.0185546875, 0.103118896484375, 0.22479248046875, 0.346466064453125, 0.4681396484375, 0.589813232421875, 0.71148681640625, 0.833160400390625, 0.954833984375, 1.076507568359375, 1.19818115234375, 1.319854736328125, 1.4415283203125, 1.563201904296875, 1.68487548828125, 1.806549072265625, 1.92822265625, 2.049896240234375, 2.17156982421875, 2.293243408203125, 2.4149169921875, 2.536590576171875, 2.65826416015625, 2.779937744140625, 2.901611328125, 3.023284912109375, 3.14495849609375, 3.266632080078125, 3.3883056640625, 3.509979248046875, 3.63165283203125, 3.753326416015625, 3.875]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 1.0, 3.0, 4.0, 9.0, 15.0, 14.0, 11.0, 9.0, 20.0, 22.0, 25.0, 23.0, 19.0, 35.0, 40.0, 39.0, 44.0, 52.0, 88.0, 173.0, 1530.0, 320.0, 128.0, 62.0, 37.0, 52.0, 39.0, 39.0, 38.0, 25.0, 26.0, 21.0, 19.0, 12.0, 10.0, 12.0, 7.0, 7.0, 5.0, 3.0, 6.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.5078125, -12.0726318359375, -11.637451171875, -11.2022705078125, -10.76708984375, -10.3319091796875, -9.896728515625, -9.4615478515625, -9.0263671875, -8.5911865234375, -8.156005859375, -7.7208251953125, -7.28564453125, -6.8504638671875, -6.415283203125, -5.9801025390625, -5.544921875, -5.1097412109375, -4.674560546875, -4.2393798828125, -3.80419921875, -3.3690185546875, -2.933837890625, -2.4986572265625, -2.0634765625, -1.6282958984375, -1.193115234375, -0.7579345703125, -0.32275390625, 0.1124267578125, 0.547607421875, 0.9827880859375, 1.41796875, 1.8531494140625, 2.288330078125, 2.7235107421875, 3.15869140625, 3.5938720703125, 4.029052734375, 4.4642333984375, 4.8994140625, 5.3345947265625, 5.769775390625, 6.2049560546875, 6.64013671875, 7.0753173828125, 7.510498046875, 7.9456787109375, 8.380859375, 8.8160400390625, 9.251220703125, 9.6864013671875, 10.12158203125, 10.5567626953125, 10.991943359375, 11.4271240234375, 11.8623046875, 12.2974853515625, 12.732666015625, 13.1678466796875, 13.60302734375, 14.0382080078125, 14.473388671875, 14.9085693359375, 15.34375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 7.0, 5.0, 8.0, 10.0, 7.0, 16.0, 14.0, 28.0, 32.0, 41.0, 76.0, 75.0, 145.0, 168.0, 260.0, 438.0, 1272.0, 268941.0, 2870344.0, 2305.0, 511.0, 319.0, 199.0, 155.0, 80.0, 66.0, 44.0, 33.0, 25.0, 26.0, 19.0, 15.0, 6.0, 5.0, 6.0, 4.0, 2.0, 1.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.75, -41.37646484375, -40.0029296875, -38.62939453125, -37.255859375, -35.88232421875, -34.5087890625, -33.13525390625, -31.76171875, -30.38818359375, -29.0146484375, -27.64111328125, -26.267578125, -24.89404296875, -23.5205078125, -22.14697265625, -20.7734375, -19.39990234375, -18.0263671875, -16.65283203125, -15.279296875, -13.90576171875, -12.5322265625, -11.15869140625, -9.78515625, -8.41162109375, -7.0380859375, -5.66455078125, -4.291015625, -2.91748046875, -1.5439453125, -0.17041015625, 1.203125, 2.57666015625, 3.9501953125, 5.32373046875, 6.697265625, 8.07080078125, 9.4443359375, 10.81787109375, 12.19140625, 13.56494140625, 14.9384765625, 16.31201171875, 17.685546875, 19.05908203125, 20.4326171875, 21.80615234375, 23.1796875, 24.55322265625, 25.9267578125, 27.30029296875, 28.673828125, 30.04736328125, 31.4208984375, 32.79443359375, 34.16796875, 35.54150390625, 36.9150390625, 38.28857421875, 39.662109375, 41.03564453125, 42.4091796875, 43.78271484375, 45.15625]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 8.0, 83.0, 386.0, 378.0, 143.0, 17.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-36.579986572265625, -34.845088958740234, -33.110191345214844, -31.375293731689453, -29.640398025512695, -27.905500411987305, -26.170602798461914, -24.435707092285156, -22.700809478759766, -20.965911865234375, -19.231014251708984, -17.496116638183594, -15.761220932006836, -14.026323318481445, -12.291425704956055, -10.55652904510498, -8.821630477905273, -7.086733341217041, -5.351836204528809, -3.616938591003418, -1.8820414543151855, -0.14714431762695312, 1.5877532958984375, 3.3226499557495117, 5.057547569274902, 6.792444705963135, 8.527341842651367, 10.262239456176758, 11.997137069702148, 13.732033729553223, 15.466931343078613, 17.201828002929688, 18.936725616455078, 20.67162322998047, 22.40652084350586, 24.14141845703125, 25.876314163208008, 27.6112117767334, 29.34610939025879, 31.081005096435547, 32.81590270996094, 34.55080032348633, 36.28569793701172, 38.02059555053711, 39.7554931640625, 41.490386962890625, 43.22528839111328, 44.960182189941406, 46.69508361816406, 48.42998123168945, 50.164878845214844, 51.899776458740234, 53.634674072265625, 55.36956787109375, 57.104469299316406, 58.83936309814453, 60.57426071166992, 62.30915832519531, 64.04405212402344, 65.7789535522461, 67.51384735107422, 69.24874877929688, 70.983642578125, 72.71854400634766, 74.45343780517578]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 3.0, 4.0, 7.0, 3.0, 9.0, 14.0, 5.0, 10.0, 17.0, 13.0, 15.0, 23.0, 16.0, 33.0, 34.0, 25.0, 39.0, 40.0, 41.0, 45.0, 57.0, 42.0, 41.0, 45.0, 51.0, 36.0, 28.0, 39.0, 36.0, 33.0, 32.0, 25.0, 31.0, 22.0, 23.0, 11.0, 11.0, 10.0, 4.0, 10.0, 4.0, 5.0, 6.0, 6.0, 3.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.46971893310547, -29.383363723754883, -28.297008514404297, -27.21065330505371, -26.124298095703125, -25.037940979003906, -23.95158576965332, -22.865230560302734, -21.77887535095215, -20.692520141601562, -19.606164932250977, -18.51980972290039, -17.433452606201172, -16.34709930419922, -15.2607421875, -14.174386978149414, -13.088031768798828, -12.001676559448242, -10.915321350097656, -9.828965187072754, -8.742609977722168, -7.656254768371582, -6.569899082183838, -5.483543395996094, -4.397188186645508, -3.3108327388763428, -2.2244772911071777, -1.1381218433380127, -0.051766395568847656, 1.0345888137817383, 2.1209444999694824, 3.2073001861572266, 4.293651580810547, 5.380006790161133, 6.466362476348877, 7.552718162536621, 8.639073371887207, 9.725428581237793, 10.811784744262695, 11.898139953613281, 12.984495162963867, 14.070850372314453, 15.157205581665039, 16.243560791015625, 17.329917907714844, 18.416271209716797, 19.502628326416016, 20.5889835357666, 21.675338745117188, 22.761693954467773, 23.84804916381836, 24.934404373168945, 26.02075958251953, 27.10711669921875, 28.193471908569336, 29.279827117919922, 30.366182327270508, 31.452537536621094, 32.53889465332031, 33.625247955322266, 34.711605072021484, 35.79795837402344, 36.884315490722656, 37.970672607421875, 39.05702590942383]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 3.0, 7.0, 4.0, 9.0, 9.0, 13.0, 14.0, 10.0, 18.0, 19.0, 25.0, 34.0, 32.0, 30.0, 28.0, 35.0, 35.0, 30.0, 46.0, 34.0, 42.0, 42.0, 35.0, 43.0, 38.0, 39.0, 36.0, 40.0, 31.0, 25.0, 22.0, 28.0, 25.0, 12.0, 23.0, 20.0, 9.0, 6.0, 11.0, 13.0, 5.0, 3.0, 4.0, 6.0, 8.0, 5.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.896484375, -3.760589599609375, -3.62469482421875, -3.488800048828125, -3.3529052734375, -3.217010498046875, -3.08111572265625, -2.945220947265625, -2.809326171875, -2.673431396484375, -2.53753662109375, -2.401641845703125, -2.2657470703125, -2.129852294921875, -1.99395751953125, -1.858062744140625, -1.72216796875, -1.586273193359375, -1.45037841796875, -1.314483642578125, -1.1785888671875, -1.042694091796875, -0.90679931640625, -0.770904541015625, -0.635009765625, -0.499114990234375, -0.36322021484375, -0.227325439453125, -0.0914306640625, 0.044464111328125, 0.18035888671875, 0.316253662109375, 0.4521484375, 0.588043212890625, 0.72393798828125, 0.859832763671875, 0.9957275390625, 1.131622314453125, 1.26751708984375, 1.403411865234375, 1.539306640625, 1.675201416015625, 1.81109619140625, 1.946990966796875, 2.0828857421875, 2.218780517578125, 2.35467529296875, 2.490570068359375, 2.62646484375, 2.762359619140625, 2.89825439453125, 3.034149169921875, 3.1700439453125, 3.305938720703125, 3.44183349609375, 3.577728271484375, 3.713623046875, 3.849517822265625, 3.98541259765625, 4.121307373046875, 4.2572021484375, 4.393096923828125, 4.52899169921875, 4.664886474609375, 4.80078125]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 3.0, 4.0, 7.0, 11.0, 11.0, 18.0, 14.0, 21.0, 25.0, 22.0, 36.0, 45.0, 68.0, 57.0, 76.0, 127.0, 206.0, 406.0, 969.0, 3379.0, 24242.0, 513843.0, 2919059.0, 692404.0, 32704.0, 4171.0, 1119.0, 427.0, 235.0, 121.0, 92.0, 67.0, 60.0, 42.0, 33.0, 30.0, 21.0, 21.0, 14.0, 14.0, 12.0, 15.0, 8.0, 6.0, 4.0, 6.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.125, -10.7608642578125, -10.396728515625, -10.0325927734375, -9.66845703125, -9.3043212890625, -8.940185546875, -8.5760498046875, -8.2119140625, -7.8477783203125, -7.483642578125, -7.1195068359375, -6.75537109375, -6.3912353515625, -6.027099609375, -5.6629638671875, -5.298828125, -4.9346923828125, -4.570556640625, -4.2064208984375, -3.84228515625, -3.4781494140625, -3.114013671875, -2.7498779296875, -2.3857421875, -2.0216064453125, -1.657470703125, -1.2933349609375, -0.92919921875, -0.5650634765625, -0.200927734375, 0.1632080078125, 0.52734375, 0.8914794921875, 1.255615234375, 1.6197509765625, 1.98388671875, 2.3480224609375, 2.712158203125, 3.0762939453125, 3.4404296875, 3.8045654296875, 4.168701171875, 4.5328369140625, 4.89697265625, 5.2611083984375, 5.625244140625, 5.9893798828125, 6.353515625, 6.7176513671875, 7.081787109375, 7.4459228515625, 7.81005859375, 8.1741943359375, 8.538330078125, 8.9024658203125, 9.2666015625, 9.6307373046875, 9.994873046875, 10.3590087890625, 10.72314453125, 11.0872802734375, 11.451416015625, 11.8155517578125, 12.1796875]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 6.0, 3.0, 3.0, 7.0, 6.0, 9.0, 10.0, 15.0, 26.0, 12.0, 27.0, 41.0, 51.0, 67.0, 87.0, 103.0, 111.0, 174.0, 239.0, 256.0, 336.0, 351.0, 387.0, 334.0, 292.0, 259.0, 178.0, 167.0, 108.0, 75.0, 80.0, 56.0, 43.0, 30.0, 25.0, 26.0, 18.0, 9.0, 4.0, 11.0, 10.0, 5.0, 3.0, 1.0, 2.0, 3.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 2.0], "bins": [-6.390625, -6.19268798828125, -5.9947509765625, -5.79681396484375, -5.598876953125, -5.40093994140625, -5.2030029296875, -5.00506591796875, -4.80712890625, -4.60919189453125, -4.4112548828125, -4.21331787109375, -4.015380859375, -3.81744384765625, -3.6195068359375, -3.42156982421875, -3.2236328125, -3.02569580078125, -2.8277587890625, -2.62982177734375, -2.431884765625, -2.23394775390625, -2.0360107421875, -1.83807373046875, -1.64013671875, -1.44219970703125, -1.2442626953125, -1.04632568359375, -0.848388671875, -0.65045166015625, -0.4525146484375, -0.25457763671875, -0.056640625, 0.14129638671875, 0.3392333984375, 0.53717041015625, 0.735107421875, 0.93304443359375, 1.1309814453125, 1.32891845703125, 1.52685546875, 1.72479248046875, 1.9227294921875, 2.12066650390625, 2.318603515625, 2.51654052734375, 2.7144775390625, 2.91241455078125, 3.1103515625, 3.30828857421875, 3.5062255859375, 3.70416259765625, 3.902099609375, 4.10003662109375, 4.2979736328125, 4.49591064453125, 4.69384765625, 4.89178466796875, 5.0897216796875, 5.28765869140625, 5.485595703125, 5.68353271484375, 5.8814697265625, 6.07940673828125, 6.27734375]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 2.0, 0.0, 3.0, 3.0, 2.0, 5.0, 2.0, 0.0, 3.0, 4.0, 9.0, 7.0, 10.0, 6.0, 15.0, 20.0, 30.0, 30.0, 56.0, 53.0, 86.0, 96.0, 132.0, 192.0, 242.0, 339.0, 624.0, 5590.0, 891609.0, 3274412.0, 18234.0, 926.0, 428.0, 263.0, 206.0, 146.0, 139.0, 95.0, 69.0, 49.0, 27.0, 31.0, 22.0, 22.0, 8.0, 11.0, 6.0, 8.0, 7.0, 3.0, 3.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-29.5625, -28.642822265625, -27.72314453125, -26.803466796875, -25.8837890625, -24.964111328125, -24.04443359375, -23.124755859375, -22.205078125, -21.285400390625, -20.36572265625, -19.446044921875, -18.5263671875, -17.606689453125, -16.68701171875, -15.767333984375, -14.84765625, -13.927978515625, -13.00830078125, -12.088623046875, -11.1689453125, -10.249267578125, -9.32958984375, -8.409912109375, -7.490234375, -6.570556640625, -5.65087890625, -4.731201171875, -3.8115234375, -2.891845703125, -1.97216796875, -1.052490234375, -0.1328125, 0.786865234375, 1.70654296875, 2.626220703125, 3.5458984375, 4.465576171875, 5.38525390625, 6.304931640625, 7.224609375, 8.144287109375, 9.06396484375, 9.983642578125, 10.9033203125, 11.822998046875, 12.74267578125, 13.662353515625, 14.58203125, 15.501708984375, 16.42138671875, 17.341064453125, 18.2607421875, 19.180419921875, 20.10009765625, 21.019775390625, 21.939453125, 22.859130859375, 23.77880859375, 24.698486328125, 25.6181640625, 26.537841796875, 27.45751953125, 28.377197265625, 29.296875]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 5.0, 23.0, 34.0, 64.0, 105.0, 137.0, 187.0, 125.0, 146.0, 81.0, 56.0, 25.0, 14.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.84977340698242, -58.54204559326172, -57.234317779541016, -55.92658996582031, -54.61886215209961, -53.311134338378906, -52.0034065246582, -50.6956787109375, -49.38795471191406, -48.08022689819336, -46.772499084472656, -45.46477127075195, -44.15704345703125, -42.84931564331055, -41.541587829589844, -40.233863830566406, -38.92613220214844, -37.618404388427734, -36.31067657470703, -35.00294876098633, -33.695220947265625, -32.38749313354492, -31.07976722717285, -29.77203941345215, -28.464311599731445, -27.156583786010742, -25.84885597229004, -24.541128158569336, -23.233402252197266, -21.925674438476562, -20.61794662475586, -19.310218811035156, -18.002492904663086, -16.694765090942383, -15.38703727722168, -14.079310417175293, -12.77158260345459, -11.463854789733887, -10.1561279296875, -8.848400115966797, -7.540672302246094, -6.232944488525391, -4.925217151641846, -3.6174895763397217, -2.3097620010375977, -1.0020341873168945, 0.3056931495666504, 1.6134204864501953, 2.9211483001708984, 4.228876113891602, 5.5366034507751465, 6.844330787658691, 8.152058601379395, 9.459786415100098, 10.767513275146484, 12.075241088867188, 13.38296890258789, 14.690696716308594, 15.998424530029297, 17.30615234375, 18.613880157470703, 19.921607971191406, 21.229333877563477, 22.53706169128418, 23.844789505004883]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 3.0, 7.0, 3.0, 4.0, 10.0, 11.0, 7.0, 14.0, 23.0, 8.0, 17.0, 26.0, 24.0, 24.0, 32.0, 35.0, 32.0, 38.0, 32.0, 26.0, 37.0, 38.0, 51.0, 44.0, 36.0, 34.0, 49.0, 42.0, 29.0, 28.0, 44.0, 38.0, 19.0, 23.0, 17.0, 23.0, 9.0, 14.0, 7.0, 10.0, 9.0, 6.0, 9.0, 5.0, 3.0, 5.0, 0.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-23.256542205810547, -22.4775447845459, -21.698545455932617, -20.91954803466797, -20.140548706054688, -19.36155128479004, -18.58255386352539, -17.80355453491211, -17.024555206298828, -16.24555778503418, -15.466558456420898, -14.68756103515625, -13.908561706542969, -13.12956428527832, -12.350565910339355, -11.57156753540039, -10.792570114135742, -10.013571739196777, -9.234573364257812, -8.455575942993164, -7.676577091217041, -6.897578716278076, -6.1185808181762695, -5.339582443237305, -4.56058406829834, -3.781585693359375, -3.0025875568389893, -2.2235894203186035, -1.4445910453796387, -0.6655926704406738, 0.11340522766113281, 0.8924036026000977, 1.6714019775390625, 2.4504003524780273, 3.229398488998413, 4.008396625518799, 4.787395000457764, 5.5663933753967285, 6.345391273498535, 7.1243896484375, 7.903388023376465, 8.68238639831543, 9.461384773254395, 10.24038314819336, 11.019380569458008, 11.798379898071289, 12.577377319335938, 13.356375694274902, 14.135374069213867, 14.914372444152832, 15.693370819091797, 16.472368240356445, 17.251367568969727, 18.030364990234375, 18.809364318847656, 19.588361740112305, 20.367359161376953, 21.1463565826416, 21.925355911254883, 22.70435333251953, 23.483352661132812, 24.26235008239746, 25.04134750366211, 25.82034683227539, 26.599346160888672]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 4.0, 6.0, 8.0, 6.0, 16.0, 11.0, 17.0, 15.0, 17.0, 28.0, 34.0, 26.0, 33.0, 28.0, 22.0, 35.0, 23.0, 29.0, 36.0, 42.0, 40.0, 35.0, 45.0, 36.0, 44.0, 37.0, 37.0, 31.0, 30.0, 27.0, 30.0, 19.0, 19.0, 16.0, 15.0, 15.0, 17.0, 10.0, 13.0, 14.0, 4.0, 6.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5546875, -3.43316650390625, -3.3116455078125, -3.19012451171875, -3.068603515625, -2.94708251953125, -2.8255615234375, -2.70404052734375, -2.58251953125, -2.46099853515625, -2.3394775390625, -2.21795654296875, -2.096435546875, -1.97491455078125, -1.8533935546875, -1.73187255859375, -1.6103515625, -1.48883056640625, -1.3673095703125, -1.24578857421875, -1.124267578125, -1.00274658203125, -0.8812255859375, -0.75970458984375, -0.63818359375, -0.51666259765625, -0.3951416015625, -0.27362060546875, -0.152099609375, -0.03057861328125, 0.0909423828125, 0.21246337890625, 0.333984375, 0.45550537109375, 0.5770263671875, 0.69854736328125, 0.820068359375, 0.94158935546875, 1.0631103515625, 1.18463134765625, 1.30615234375, 1.42767333984375, 1.5491943359375, 1.67071533203125, 1.792236328125, 1.91375732421875, 2.0352783203125, 2.15679931640625, 2.2783203125, 2.39984130859375, 2.5213623046875, 2.64288330078125, 2.764404296875, 2.88592529296875, 3.0074462890625, 3.12896728515625, 3.25048828125, 3.37200927734375, 3.4935302734375, 3.61505126953125, 3.736572265625, 3.85809326171875, 3.9796142578125, 4.10113525390625, 4.22265625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 10.0, 12.0, 17.0, 22.0, 27.0, 41.0, 72.0, 97.0, 140.0, 212.0, 360.0, 513.0, 847.0, 1299.0, 2067.0, 3384.0, 5338.0, 9032.0, 15262.0, 25867.0, 45082.0, 82762.0, 151152.0, 250405.0, 200452.0, 110447.0, 60331.0, 33751.0, 19574.0, 11688.0, 7063.0, 4206.0, 2572.0, 1545.0, 1048.0, 617.0, 444.0, 277.0, 158.0, 133.0, 89.0, 42.0, 24.0, 25.0, 18.0, 16.0, 6.0, 5.0, 6.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.53759765625, -0.520660400390625, -0.50372314453125, -0.486785888671875, -0.4698486328125, -0.452911376953125, -0.43597412109375, -0.419036865234375, -0.402099609375, -0.385162353515625, -0.36822509765625, -0.351287841796875, -0.3343505859375, -0.317413330078125, -0.30047607421875, -0.283538818359375, -0.2666015625, -0.249664306640625, -0.23272705078125, -0.215789794921875, -0.1988525390625, -0.181915283203125, -0.16497802734375, -0.148040771484375, -0.131103515625, -0.114166259765625, -0.09722900390625, -0.080291748046875, -0.0633544921875, -0.046417236328125, -0.02947998046875, -0.012542724609375, 0.00439453125, 0.021331787109375, 0.03826904296875, 0.055206298828125, 0.0721435546875, 0.089080810546875, 0.10601806640625, 0.122955322265625, 0.139892578125, 0.156829833984375, 0.17376708984375, 0.190704345703125, 0.2076416015625, 0.224578857421875, 0.24151611328125, 0.258453369140625, 0.275390625, 0.292327880859375, 0.30926513671875, 0.326202392578125, 0.3431396484375, 0.360076904296875, 0.37701416015625, 0.393951416015625, 0.410888671875, 0.427825927734375, 0.44476318359375, 0.461700439453125, 0.4786376953125, 0.495574951171875, 0.51251220703125, 0.529449462890625, 0.54638671875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 0.0, 5.0, 3.0, 3.0, 10.0, 11.0, 11.0, 14.0, 25.0, 31.0, 20.0, 16.0, 34.0, 32.0, 43.0, 38.0, 26.0, 43.0, 35.0, 45.0, 45.0, 1067.0, 50.0, 54.0, 41.0, 28.0, 32.0, 34.0, 31.0, 32.0, 24.0, 13.0, 24.0, 21.0, 12.0, 13.0, 19.0, 14.0, 6.0, 5.0, 6.0, 4.0, 5.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.806640625, -2.717193603515625, -2.62774658203125, -2.538299560546875, -2.4488525390625, -2.359405517578125, -2.26995849609375, -2.180511474609375, -2.091064453125, -2.001617431640625, -1.91217041015625, -1.822723388671875, -1.7332763671875, -1.643829345703125, -1.55438232421875, -1.464935302734375, -1.37548828125, -1.286041259765625, -1.19659423828125, -1.107147216796875, -1.0177001953125, -0.928253173828125, -0.83880615234375, -0.749359130859375, -0.659912109375, -0.570465087890625, -0.48101806640625, -0.391571044921875, -0.3021240234375, -0.212677001953125, -0.12322998046875, -0.033782958984375, 0.0556640625, 0.145111083984375, 0.23455810546875, 0.324005126953125, 0.4134521484375, 0.502899169921875, 0.59234619140625, 0.681793212890625, 0.771240234375, 0.860687255859375, 0.95013427734375, 1.039581298828125, 1.1290283203125, 1.218475341796875, 1.30792236328125, 1.397369384765625, 1.48681640625, 1.576263427734375, 1.66571044921875, 1.755157470703125, 1.8446044921875, 1.934051513671875, 2.02349853515625, 2.112945556640625, 2.202392578125, 2.291839599609375, 2.38128662109375, 2.470733642578125, 2.5601806640625, 2.649627685546875, 2.73907470703125, 2.828521728515625, 2.91796875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 5.0, 7.0, 10.0, 17.0, 28.0, 52.0, 47.0, 114.0, 132.0, 217.0, 268.0, 407.0, 603.0, 901.0, 1209.0, 1814.0, 2595.0, 3609.0, 5234.0, 7617.0, 11098.0, 16081.0, 23391.0, 35129.0, 53639.0, 85041.0, 133336.0, 1222098.0, 173636.0, 111089.0, 69857.0, 44837.0, 29248.0, 19957.0, 13449.0, 9346.0, 6523.0, 4541.0, 3109.0, 2197.0, 1446.0, 1028.0, 672.0, 482.0, 328.0, 234.0, 162.0, 99.0, 67.0, 42.0, 29.0, 21.0, 13.0, 13.0, 6.0, 8.0, 4.0, 4.0, 0.0, 0.0, 1.0], "bins": [-0.32373046875, -0.3132171630859375, -0.302703857421875, -0.2921905517578125, -0.28167724609375, -0.2711639404296875, -0.260650634765625, -0.2501373291015625, -0.2396240234375, -0.2291107177734375, -0.218597412109375, -0.2080841064453125, -0.19757080078125, -0.1870574951171875, -0.176544189453125, -0.1660308837890625, -0.155517578125, -0.1450042724609375, -0.134490966796875, -0.1239776611328125, -0.11346435546875, -0.1029510498046875, -0.092437744140625, -0.0819244384765625, -0.0714111328125, -0.0608978271484375, -0.050384521484375, -0.0398712158203125, -0.02935791015625, -0.0188446044921875, -0.008331298828125, 0.0021820068359375, 0.0126953125, 0.0232086181640625, 0.033721923828125, 0.0442352294921875, 0.05474853515625, 0.0652618408203125, 0.075775146484375, 0.0862884521484375, 0.0968017578125, 0.1073150634765625, 0.117828369140625, 0.1283416748046875, 0.13885498046875, 0.1493682861328125, 0.159881591796875, 0.1703948974609375, 0.180908203125, 0.1914215087890625, 0.201934814453125, 0.2124481201171875, 0.22296142578125, 0.2334747314453125, 0.243988037109375, 0.2545013427734375, 0.2650146484375, 0.2755279541015625, 0.286041259765625, 0.2965545654296875, 0.30706787109375, 0.3175811767578125, 0.328094482421875, 0.3386077880859375, 0.34912109375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 4.0, 6.0, 13.0, 5.0, 10.0, 13.0, 13.0, 10.0, 29.0, 42.0, 38.0, 63.0, 71.0, 79.0, 95.0, 96.0, 83.0, 69.0, 47.0, 34.0, 45.0, 27.0, 25.0, 16.0, 16.0, 13.0, 6.0, 7.0, 8.0, 3.0, 9.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.00440216064453125, -0.004280120134353638, -0.004158079624176025, -0.004036039113998413, -0.003913998603820801, -0.0037919580936431885, -0.003669917583465576, -0.003547877073287964, -0.0034258365631103516, -0.0033037960529327393, -0.003181755542755127, -0.0030597150325775146, -0.0029376745223999023, -0.00281563401222229, -0.0026935935020446777, -0.0025715529918670654, -0.002449512481689453, -0.002327471971511841, -0.0022054314613342285, -0.002083390951156616, -0.001961350440979004, -0.0018393099308013916, -0.0017172694206237793, -0.001595228910446167, -0.0014731884002685547, -0.0013511478900909424, -0.00122910737991333, -0.0011070668697357178, -0.0009850263595581055, -0.0008629858493804932, -0.0007409453392028809, -0.0006189048290252686, -0.0004968643188476562, -0.00037482380867004395, -0.00025278329849243164, -0.00013074278831481934, -8.702278137207031e-06, 0.00011333823204040527, 0.00023537874221801758, 0.0003574192523956299, 0.0004794597625732422, 0.0006015002727508545, 0.0007235407829284668, 0.0008455812931060791, 0.0009676218032836914, 0.0010896623134613037, 0.001211702823638916, 0.0013337433338165283, 0.0014557838439941406, 0.001577824354171753, 0.0016998648643493652, 0.0018219053745269775, 0.0019439458847045898, 0.002065986394882202, 0.0021880269050598145, 0.0023100674152374268, 0.002432107925415039, 0.0025541484355926514, 0.0026761889457702637, 0.002798229455947876, 0.0029202699661254883, 0.0030423104763031006, 0.003164350986480713, 0.003286391496658325, 0.0034084320068359375]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 5.0, 3.0, 8.0, 7.0, 9.0, 13.0, 14.0, 23.0, 31.0, 32.0, 50.0, 67.0, 107.0, 178.0, 347.0, 1229.0, 760091.0, 284517.0, 977.0, 325.0, 183.0, 101.0, 71.0, 46.0, 29.0, 17.0, 19.0, 15.0, 9.0, 13.0, 6.0, 4.0, 3.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.0748291015625, -0.07215213775634766, -0.06947517395019531, -0.06679821014404297, -0.06412124633789062, -0.06144428253173828, -0.05876731872558594, -0.056090354919433594, -0.05341339111328125, -0.050736427307128906, -0.04805946350097656, -0.04538249969482422, -0.042705535888671875, -0.04002857208251953, -0.03735160827636719, -0.034674644470214844, -0.0319976806640625, -0.029320716857910156, -0.026643753051757812, -0.02396678924560547, -0.021289825439453125, -0.01861286163330078, -0.015935897827148438, -0.013258934020996094, -0.01058197021484375, -0.007905006408691406, -0.0052280426025390625, -0.0025510787963867188, 0.000125885009765625, 0.0028028488159179688, 0.0054798126220703125, 0.008156776428222656, 0.010833740234375, 0.013510704040527344, 0.016187667846679688, 0.01886463165283203, 0.021541595458984375, 0.02421855926513672, 0.026895523071289062, 0.029572486877441406, 0.03224945068359375, 0.034926414489746094, 0.03760337829589844, 0.04028034210205078, 0.042957305908203125, 0.04563426971435547, 0.04831123352050781, 0.050988197326660156, 0.0536651611328125, 0.056342124938964844, 0.05901908874511719, 0.06169605255126953, 0.06437301635742188, 0.06704998016357422, 0.06972694396972656, 0.0724039077758789, 0.07508087158203125, 0.0777578353881836, 0.08043479919433594, 0.08311176300048828, 0.08578872680664062, 0.08846569061279297, 0.09114265441894531, 0.09381961822509766, 0.09649658203125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 14.0, 158.0, 558.0, 260.0, 24.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014825855614617467, -0.0011612620437517762, -0.0008399384678341448, -0.0005186148919165134, -0.00019729137420654297, 0.0001240321435034275, 0.0004453557776287198, 0.0007666792953386903, 0.0010880028130486608, 0.0014093263307586312, 0.0017306499648839235, 0.002051973482593894, 0.0023732970003038645, 0.002694620518013835, 0.003015944268554449, 0.0033372677862644196, 0.00365859130397439, 0.0039799148216843605, 0.004301238339394331, 0.0046225618571043015, 0.004943885374814272, 0.005265208892524242, 0.0055865328758955, 0.005907855927944183, 0.006229179445654154, 0.006550502963364124, 0.006871826481074095, 0.007193149998784065, 0.007514473516494036, 0.007835797034204006, 0.008157121017575264, 0.008478444069623947, 0.008799768052995205, 0.009121092036366463, 0.009442415088415146, 0.009763739071786404, 0.010085062123835087, 0.010406386107206345, 0.010727709159255028, 0.011049033142626286, 0.011370356194674969, 0.011691680178046227, 0.01201300323009491, 0.012334327213466167, 0.01265565026551485, 0.012976974248886108, 0.013298297300934792, 0.01361962128430605, 0.013940945267677307, 0.014262269251048565, 0.014583592303097248, 0.014904916286468506, 0.015226239338517189, 0.015547563321888447, 0.015868887305259705, 0.016190210357308388, 0.01651153340935707, 0.016832856461405754, 0.017154181376099586, 0.01747550442814827, 0.017796827480196953, 0.018118150532245636, 0.01843947544693947, 0.01876079849898815, 0.019082121551036835]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 2.0, 1.0, 2.0, 4.0, 8.0, 8.0, 4.0, 19.0, 11.0, 10.0, 8.0, 14.0, 30.0, 24.0, 33.0, 24.0, 30.0, 29.0, 36.0, 41.0, 35.0, 44.0, 36.0, 42.0, 46.0, 23.0, 35.0, 31.0, 48.0, 40.0, 40.0, 29.0, 32.0, 24.0, 26.0, 26.0, 22.0, 13.0, 12.0, 9.0, 13.0, 5.0, 8.0, 5.0, 6.0, 5.0, 3.0, 0.0, 4.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00167924165725708, -0.0016269292682409286, -0.0015746168792247772, -0.0015223044902086258, -0.0014699921011924744, -0.001417679712176323, -0.0013653673231601715, -0.00131305493414402, -0.0012607425451278687, -0.0012084301561117172, -0.0011561177670955658, -0.0011038053780794144, -0.001051492989063263, -0.0009991806000471115, -0.0009468682110309601, -0.0008945558220148087, -0.0008422434329986572, -0.0007899310439825058, -0.0007376186549663544, -0.0006853062659502029, -0.0006329938769340515, -0.0005806814879179001, -0.0005283690989017487, -0.00047605670988559723, -0.0004237443208694458, -0.00037143193185329437, -0.00031911954283714294, -0.0002668071538209915, -0.0002144947648048401, -0.00016218237578868866, -0.00010986998677253723, -5.75575977563858e-05, -5.245208740234375e-06, 4.706718027591705e-05, 9.937956929206848e-05, 0.0001516919583082199, 0.00020400434732437134, 0.00025631673634052277, 0.0003086291253566742, 0.0003609415143728256, 0.00041325390338897705, 0.0004655662924051285, 0.0005178786814212799, 0.0005701910704374313, 0.0006225034594535828, 0.0006748158484697342, 0.0007271282374858856, 0.000779440626502037, 0.0008317530155181885, 0.0008840654045343399, 0.0009363777935504913, 0.0009886901825666428, 0.0010410025715827942, 0.0010933149605989456, 0.001145627349615097, 0.0011979397386312485, 0.0012502521276474, 0.0013025645166635513, 0.0013548769056797028, 0.0014071892946958542, 0.0014595016837120056, 0.001511814072728157, 0.0015641264617443085, 0.00161643885076046, 0.0016687512397766113]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 4.0, 2.0, 4.0, 4.0, 4.0, 6.0, 8.0, 7.0, 15.0, 11.0, 17.0, 15.0, 17.0, 28.0, 34.0, 26.0, 33.0, 28.0, 22.0, 35.0, 23.0, 30.0, 35.0, 42.0, 40.0, 35.0, 45.0, 36.0, 44.0, 37.0, 37.0, 31.0, 30.0, 27.0, 30.0, 19.0, 19.0, 16.0, 15.0, 15.0, 17.0, 10.0, 13.0, 14.0, 4.0, 6.0, 5.0, 6.0, 5.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.5546875, -3.43316650390625, -3.3116455078125, -3.19012451171875, -3.068603515625, -2.94708251953125, -2.8255615234375, -2.70404052734375, -2.58251953125, -2.46099853515625, -2.3394775390625, -2.21795654296875, -2.096435546875, -1.97491455078125, -1.8533935546875, -1.73187255859375, -1.6103515625, -1.48883056640625, -1.3673095703125, -1.24578857421875, -1.124267578125, -1.00274658203125, -0.8812255859375, -0.75970458984375, -0.63818359375, -0.51666259765625, -0.3951416015625, -0.27362060546875, -0.152099609375, -0.03057861328125, 0.0909423828125, 0.21246337890625, 0.333984375, 0.45550537109375, 0.5770263671875, 0.69854736328125, 0.820068359375, 0.94158935546875, 1.0631103515625, 1.18463134765625, 1.30615234375, 1.42767333984375, 1.5491943359375, 1.67071533203125, 1.792236328125, 1.91375732421875, 2.0352783203125, 2.15679931640625, 2.2783203125, 2.39984130859375, 2.5213623046875, 2.64288330078125, 2.764404296875, 2.88592529296875, 3.0074462890625, 3.12896728515625, 3.25048828125, 3.37200927734375, 3.4935302734375, 3.61505126953125, 3.736572265625, 3.85809326171875, 3.9796142578125, 4.10113525390625, 4.22265625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 4.0, 8.0, 6.0, 17.0, 19.0, 21.0, 28.0, 27.0, 35.0, 56.0, 75.0, 94.0, 109.0, 184.0, 271.0, 546.0, 1362.0, 3608.0, 10356.0, 29582.0, 80608.0, 207073.0, 406299.0, 191728.0, 74177.0, 26666.0, 9522.0, 3418.0, 1239.0, 512.0, 250.0, 170.0, 96.0, 80.0, 68.0, 50.0, 38.0, 38.0, 30.0, 15.0, 16.0, 16.0, 7.0, 12.0, 8.0, 5.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0, -3.85943603515625, -3.7188720703125, -3.57830810546875, -3.437744140625, -3.29718017578125, -3.1566162109375, -3.01605224609375, -2.87548828125, -2.73492431640625, -2.5943603515625, -2.45379638671875, -2.313232421875, -2.17266845703125, -2.0321044921875, -1.89154052734375, -1.7509765625, -1.61041259765625, -1.4698486328125, -1.32928466796875, -1.188720703125, -1.04815673828125, -0.9075927734375, -0.76702880859375, -0.62646484375, -0.48590087890625, -0.3453369140625, -0.20477294921875, -0.064208984375, 0.07635498046875, 0.2169189453125, 0.35748291015625, 0.498046875, 0.63861083984375, 0.7791748046875, 0.91973876953125, 1.060302734375, 1.20086669921875, 1.3414306640625, 1.48199462890625, 1.62255859375, 1.76312255859375, 1.9036865234375, 2.04425048828125, 2.184814453125, 2.32537841796875, 2.4659423828125, 2.60650634765625, 2.7470703125, 2.88763427734375, 3.0281982421875, 3.16876220703125, 3.309326171875, 3.44989013671875, 3.5904541015625, 3.73101806640625, 3.87158203125, 4.01214599609375, 4.1527099609375, 4.29327392578125, 4.433837890625, 4.57440185546875, 4.7149658203125, 4.85552978515625, 4.99609375]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 2.0, 2.0, 6.0, 6.0, 9.0, 5.0, 8.0, 9.0, 20.0, 21.0, 15.0, 28.0, 33.0, 30.0, 36.0, 39.0, 37.0, 45.0, 66.0, 123.0, 286.0, 1505.0, 182.0, 100.0, 71.0, 57.0, 44.0, 32.0, 32.0, 27.0, 29.0, 29.0, 30.0, 18.0, 12.0, 13.0, 9.0, 4.0, 4.0, 6.0, 5.0, 4.0, 3.0, 3.0, 6.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-11.828125, -11.4501953125, -11.072265625, -10.6943359375, -10.31640625, -9.9384765625, -9.560546875, -9.1826171875, -8.8046875, -8.4267578125, -8.048828125, -7.6708984375, -7.29296875, -6.9150390625, -6.537109375, -6.1591796875, -5.78125, -5.4033203125, -5.025390625, -4.6474609375, -4.26953125, -3.8916015625, -3.513671875, -3.1357421875, -2.7578125, -2.3798828125, -2.001953125, -1.6240234375, -1.24609375, -0.8681640625, -0.490234375, -0.1123046875, 0.265625, 0.6435546875, 1.021484375, 1.3994140625, 1.77734375, 2.1552734375, 2.533203125, 2.9111328125, 3.2890625, 3.6669921875, 4.044921875, 4.4228515625, 4.80078125, 5.1787109375, 5.556640625, 5.9345703125, 6.3125, 6.6904296875, 7.068359375, 7.4462890625, 7.82421875, 8.2021484375, 8.580078125, 8.9580078125, 9.3359375, 9.7138671875, 10.091796875, 10.4697265625, 10.84765625, 11.2255859375, 11.603515625, 11.9814453125, 12.359375]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 5.0, 3.0, 3.0, 10.0, 7.0, 10.0, 12.0, 8.0, 26.0, 36.0, 29.0, 40.0, 66.0, 88.0, 149.0, 194.0, 340.0, 750.0, 2514.0, 1647611.0, 1489624.0, 2424.0, 768.0, 352.0, 194.0, 124.0, 82.0, 54.0, 46.0, 40.0, 21.0, 21.0, 17.0, 11.0, 8.0, 4.0, 6.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-44.4375, -43.00390625, -41.5703125, -40.13671875, -38.703125, -37.26953125, -35.8359375, -34.40234375, -32.96875, -31.53515625, -30.1015625, -28.66796875, -27.234375, -25.80078125, -24.3671875, -22.93359375, -21.5, -20.06640625, -18.6328125, -17.19921875, -15.765625, -14.33203125, -12.8984375, -11.46484375, -10.03125, -8.59765625, -7.1640625, -5.73046875, -4.296875, -2.86328125, -1.4296875, 0.00390625, 1.4375, 2.87109375, 4.3046875, 5.73828125, 7.171875, 8.60546875, 10.0390625, 11.47265625, 12.90625, 14.33984375, 15.7734375, 17.20703125, 18.640625, 20.07421875, 21.5078125, 22.94140625, 24.375, 25.80859375, 27.2421875, 28.67578125, 30.109375, 31.54296875, 32.9765625, 34.41015625, 35.84375, 37.27734375, 38.7109375, 40.14453125, 41.578125, 43.01171875, 44.4453125, 45.87890625, 47.3125]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 8.0, 100.0, 340.0, 406.0, 132.0, 28.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-85.64314270019531, -83.96802520751953, -82.29290771484375, -80.61778259277344, -78.94266510009766, -77.26754760742188, -75.5924301147461, -73.91731262207031, -72.2421875, -70.56707000732422, -68.89195251464844, -67.21682739257812, -65.54170989990234, -63.86659240722656, -62.19147491455078, -60.516353607177734, -58.84123992919922, -57.16612243652344, -55.49100112915039, -53.81588363647461, -52.14076232910156, -50.46564483642578, -48.79052734375, -47.11540603637695, -45.440284729003906, -43.765167236328125, -42.09004592895508, -40.4149284362793, -38.73980712890625, -37.06468963623047, -35.38957214355469, -33.71445083618164, -32.039337158203125, -30.36421775817871, -28.689098358154297, -27.013980865478516, -25.3388614654541, -23.663742065429688, -21.988622665405273, -20.31350326538086, -18.638381958007812, -16.9632625579834, -15.2881441116333, -13.613024711608887, -11.937906265258789, -10.262786865234375, -8.587667465209961, -6.912549018859863, -5.237430572509766, -3.5623116493225098, -1.8871924877166748, -0.21207332611083984, 1.463045597076416, 3.138164520263672, 4.813283920288086, 6.488402366638184, 8.163521766662598, 9.838641166687012, 11.51375961303711, 13.188879013061523, 14.863998413085938, 16.53911590576172, 18.214237213134766, 19.889354705810547, 21.56447410583496]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 1.0, 2.0, 2.0, 6.0, 9.0, 9.0, 9.0, 13.0, 21.0, 22.0, 17.0, 12.0, 26.0, 23.0, 32.0, 30.0, 27.0, 39.0, 40.0, 39.0, 41.0, 50.0, 49.0, 36.0, 45.0, 37.0, 43.0, 28.0, 31.0, 40.0, 31.0, 21.0, 38.0, 22.0, 16.0, 13.0, 20.0, 13.0, 10.0, 11.0, 9.0, 7.0, 9.0, 3.0, 2.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.350603103637695, -28.41427230834961, -27.47793960571289, -26.541608810424805, -25.60527801513672, -24.6689453125, -23.732614517211914, -22.796283721923828, -21.85995101928711, -20.923620223999023, -19.987287521362305, -19.05095672607422, -18.1146240234375, -17.178293228149414, -16.241962432861328, -15.305630683898926, -14.369298934936523, -13.432967185974121, -12.496635437011719, -11.560304641723633, -10.62397289276123, -9.687641143798828, -8.751310348510742, -7.81497859954834, -6.8786468505859375, -5.942315101623535, -5.005983829498291, -4.069652557373047, -3.1333208084106445, -2.196989059448242, -1.260657787322998, -0.3243265151977539, 0.6120071411132812, 1.5483386516571045, 2.4846701622009277, 3.421001672744751, 4.357333183288574, 5.293664932250977, 6.229996204376221, 7.166327476501465, 8.102659225463867, 9.03899097442627, 9.975322723388672, 10.911653518676758, 11.84798526763916, 12.784317016601562, 13.720647811889648, 14.65697956085205, 15.593311309814453, 16.52964210510254, 17.465974807739258, 18.402305603027344, 19.338638305664062, 20.27496910095215, 21.211299896240234, 22.147632598876953, 23.08396339416504, 24.020294189453125, 24.956626892089844, 25.89295768737793, 26.829288482666016, 27.765621185302734, 28.70195198059082, 29.638282775878906, 30.574615478515625]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 5.0, 1.0, 3.0, 1.0, 5.0, 2.0, 3.0, 2.0, 8.0, 5.0, 10.0, 14.0, 7.0, 18.0, 13.0, 19.0, 26.0, 36.0, 26.0, 37.0, 23.0, 31.0, 16.0, 27.0, 30.0, 41.0, 50.0, 34.0, 38.0, 42.0, 35.0, 43.0, 41.0, 34.0, 26.0, 35.0, 20.0, 34.0, 17.0, 23.0, 21.0, 11.0, 13.0, 16.0, 11.0, 12.0, 7.0, 17.0, 8.0, 4.0, 6.0, 6.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.0625, -3.9332275390625, -3.803955078125, -3.6746826171875, -3.54541015625, -3.4161376953125, -3.286865234375, -3.1575927734375, -3.0283203125, -2.8990478515625, -2.769775390625, -2.6405029296875, -2.51123046875, -2.3819580078125, -2.252685546875, -2.1234130859375, -1.994140625, -1.8648681640625, -1.735595703125, -1.6063232421875, -1.47705078125, -1.3477783203125, -1.218505859375, -1.0892333984375, -0.9599609375, -0.8306884765625, -0.701416015625, -0.5721435546875, -0.44287109375, -0.3135986328125, -0.184326171875, -0.0550537109375, 0.07421875, 0.2034912109375, 0.332763671875, 0.4620361328125, 0.59130859375, 0.7205810546875, 0.849853515625, 0.9791259765625, 1.1083984375, 1.2376708984375, 1.366943359375, 1.4962158203125, 1.62548828125, 1.7547607421875, 1.884033203125, 2.0133056640625, 2.142578125, 2.2718505859375, 2.401123046875, 2.5303955078125, 2.65966796875, 2.7889404296875, 2.918212890625, 3.0474853515625, 3.1767578125, 3.3060302734375, 3.435302734375, 3.5645751953125, 3.69384765625, 3.8231201171875, 3.952392578125, 4.0816650390625, 4.2109375]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 1.0, 2.0, 0.0, 5.0, 3.0, 3.0, 1.0, 3.0, 2.0, 10.0, 10.0, 11.0, 16.0, 15.0, 21.0, 21.0, 32.0, 39.0, 47.0, 47.0, 51.0, 70.0, 83.0, 109.0, 173.0, 330.0, 864.0, 3968.0, 44362.0, 1160146.0, 2750056.0, 219843.0, 10866.0, 1743.0, 475.0, 214.0, 119.0, 102.0, 75.0, 54.0, 42.0, 42.0, 32.0, 36.0, 26.0, 21.0, 20.0, 16.0, 15.0, 13.0, 14.0, 6.0, 2.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-12.2421875, -11.8624267578125, -11.482666015625, -11.1029052734375, -10.72314453125, -10.3433837890625, -9.963623046875, -9.5838623046875, -9.2041015625, -8.8243408203125, -8.444580078125, -8.0648193359375, -7.68505859375, -7.3052978515625, -6.925537109375, -6.5457763671875, -6.166015625, -5.7862548828125, -5.406494140625, -5.0267333984375, -4.64697265625, -4.2672119140625, -3.887451171875, -3.5076904296875, -3.1279296875, -2.7481689453125, -2.368408203125, -1.9886474609375, -1.60888671875, -1.2291259765625, -0.849365234375, -0.4696044921875, -0.08984375, 0.2899169921875, 0.669677734375, 1.0494384765625, 1.42919921875, 1.8089599609375, 2.188720703125, 2.5684814453125, 2.9482421875, 3.3280029296875, 3.707763671875, 4.0875244140625, 4.46728515625, 4.8470458984375, 5.226806640625, 5.6065673828125, 5.986328125, 6.3660888671875, 6.745849609375, 7.1256103515625, 7.50537109375, 7.8851318359375, 8.264892578125, 8.6446533203125, 9.0244140625, 9.4041748046875, 9.783935546875, 10.1636962890625, 10.54345703125, 10.9232177734375, 11.302978515625, 11.6827392578125, 12.0625]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 7.0, 1.0, 5.0, 5.0, 4.0, 6.0, 18.0, 14.0, 27.0, 32.0, 50.0, 60.0, 87.0, 113.0, 190.0, 243.0, 335.0, 383.0, 466.0, 482.0, 415.0, 302.0, 243.0, 167.0, 118.0, 93.0, 60.0, 32.0, 35.0, 25.0, 22.0, 15.0, 7.0, 6.0, 3.0, 4.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.51171875, -7.2767333984375, -7.041748046875, -6.8067626953125, -6.57177734375, -6.3367919921875, -6.101806640625, -5.8668212890625, -5.6318359375, -5.3968505859375, -5.161865234375, -4.9268798828125, -4.69189453125, -4.4569091796875, -4.221923828125, -3.9869384765625, -3.751953125, -3.5169677734375, -3.281982421875, -3.0469970703125, -2.81201171875, -2.5770263671875, -2.342041015625, -2.1070556640625, -1.8720703125, -1.6370849609375, -1.402099609375, -1.1671142578125, -0.93212890625, -0.6971435546875, -0.462158203125, -0.2271728515625, 0.0078125, 0.2427978515625, 0.477783203125, 0.7127685546875, 0.94775390625, 1.1827392578125, 1.417724609375, 1.6527099609375, 1.8876953125, 2.1226806640625, 2.357666015625, 2.5926513671875, 2.82763671875, 3.0626220703125, 3.297607421875, 3.5325927734375, 3.767578125, 4.0025634765625, 4.237548828125, 4.4725341796875, 4.70751953125, 4.9425048828125, 5.177490234375, 5.4124755859375, 5.6474609375, 5.8824462890625, 6.117431640625, 6.3524169921875, 6.58740234375, 6.8223876953125, 7.057373046875, 7.2923583984375, 7.52734375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 4.0, 1.0, 3.0, 2.0, 2.0, 2.0, 6.0, 9.0, 17.0, 15.0, 25.0, 35.0, 26.0, 66.0, 105.0, 105.0, 185.0, 267.0, 362.0, 685.0, 11241.0, 3953354.0, 224703.0, 1516.0, 477.0, 314.0, 221.0, 172.0, 110.0, 69.0, 60.0, 38.0, 25.0, 24.0, 9.0, 9.0, 8.0, 4.0, 2.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.34375, -38.1416015625, -36.939453125, -35.7373046875, -34.53515625, -33.3330078125, -32.130859375, -30.9287109375, -29.7265625, -28.5244140625, -27.322265625, -26.1201171875, -24.91796875, -23.7158203125, -22.513671875, -21.3115234375, -20.109375, -18.9072265625, -17.705078125, -16.5029296875, -15.30078125, -14.0986328125, -12.896484375, -11.6943359375, -10.4921875, -9.2900390625, -8.087890625, -6.8857421875, -5.68359375, -4.4814453125, -3.279296875, -2.0771484375, -0.875, 0.3271484375, 1.529296875, 2.7314453125, 3.93359375, 5.1357421875, 6.337890625, 7.5400390625, 8.7421875, 9.9443359375, 11.146484375, 12.3486328125, 13.55078125, 14.7529296875, 15.955078125, 17.1572265625, 18.359375, 19.5615234375, 20.763671875, 21.9658203125, 23.16796875, 24.3701171875, 25.572265625, 26.7744140625, 27.9765625, 29.1787109375, 30.380859375, 31.5830078125, 32.78515625, 33.9873046875, 35.189453125, 36.3916015625, 37.59375]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 8.0, 19.0, 54.0, 83.0, 124.0, 190.0, 195.0, 136.0, 114.0, 52.0, 19.0, 13.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.29283905029297, -33.89237594604492, -32.491912841796875, -31.091447830200195, -29.690982818603516, -28.29051971435547, -26.890056610107422, -25.489593505859375, -24.089128494262695, -22.68866539001465, -21.28820037841797, -19.887737274169922, -18.487274169921875, -17.086809158325195, -15.686346054077148, -14.285881996154785, -12.885417938232422, -11.484953880310059, -10.084489822387695, -8.684026718139648, -7.283562660217285, -5.883098602294922, -4.482635498046875, -3.0821714401245117, -1.6817073822021484, -0.28124356269836426, 1.11922025680542, 2.519683837890625, 3.9201478958129883, 5.320611953735352, 6.721075057983398, 8.121539115905762, 9.52199935913086, 10.922463417053223, 12.322927474975586, 13.723390579223633, 15.123854637145996, 16.52431869506836, 17.924781799316406, 19.325244903564453, 20.725709915161133, 22.12617301940918, 23.52663803100586, 24.927101135253906, 26.327564239501953, 27.728029251098633, 29.12849235534668, 30.52895736694336, 31.929420471191406, 33.32988357543945, 34.7303466796875, 36.13081359863281, 37.53127670288086, 38.931739807128906, 40.33220291137695, 41.732666015625, 43.13313293457031, 44.53359603881836, 45.934059143066406, 47.33452606201172, 48.734989166259766, 50.13545227050781, 51.53591537475586, 52.936378479003906, 54.33684158325195]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 7.0, 5.0, 8.0, 13.0, 13.0, 21.0, 13.0, 21.0, 27.0, 23.0, 27.0, 31.0, 30.0, 32.0, 32.0, 43.0, 50.0, 38.0, 32.0, 54.0, 44.0, 51.0, 33.0, 38.0, 39.0, 33.0, 22.0, 34.0, 30.0, 15.0, 30.0, 18.0, 18.0, 19.0, 8.0, 13.0, 7.0, 3.0, 7.0, 2.0, 4.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.53048324584961, -23.79647445678711, -23.062463760375977, -22.328454971313477, -21.594444274902344, -20.860435485839844, -20.126426696777344, -19.392417907714844, -18.65840721130371, -17.92439842224121, -17.190387725830078, -16.456378936767578, -15.722369194030762, -14.988359451293945, -14.254350662231445, -13.520340919494629, -12.786331176757812, -12.052321434020996, -11.31831169128418, -10.58430290222168, -9.850293159484863, -9.116283416748047, -8.382274627685547, -7.6482648849487305, -6.914255142211914, -6.180245399475098, -5.4462361335754395, -4.712226867675781, -3.978217124938965, -3.2442076206207275, -2.5101981163024902, -1.776188850402832, -1.0421810150146484, -0.30817151069641113, 0.42583799362182617, 1.1598474979400635, 1.8938570022583008, 2.627866506576538, 3.3618760108947754, 4.095885276794434, 4.82989501953125, 5.563904762268066, 6.297914028167725, 7.031923294067383, 7.765933036804199, 8.499942779541016, 9.233951568603516, 9.967961311340332, 10.701971054077148, 11.435980796813965, 12.169990539550781, 12.903999328613281, 13.638009071350098, 14.372018814086914, 15.106027603149414, 15.84003734588623, 16.574047088623047, 17.308055877685547, 18.04206657409668, 18.77607536315918, 19.510086059570312, 20.244094848632812, 20.978103637695312, 21.712112426757812, 22.446123123168945]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 2.0, 5.0, 8.0, 10.0, 7.0, 5.0, 18.0, 19.0, 23.0, 17.0, 35.0, 24.0, 28.0, 28.0, 36.0, 25.0, 28.0, 37.0, 38.0, 37.0, 35.0, 36.0, 40.0, 34.0, 35.0, 23.0, 32.0, 26.0, 45.0, 26.0, 32.0, 28.0, 16.0, 29.0, 23.0, 14.0, 18.0, 8.0, 7.0, 13.0, 14.0, 4.0, 5.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.75390625, -3.6324462890625, -3.510986328125, -3.3895263671875, -3.26806640625, -3.1466064453125, -3.025146484375, -2.9036865234375, -2.7822265625, -2.6607666015625, -2.539306640625, -2.4178466796875, -2.29638671875, -2.1749267578125, -2.053466796875, -1.9320068359375, -1.810546875, -1.6890869140625, -1.567626953125, -1.4461669921875, -1.32470703125, -1.2032470703125, -1.081787109375, -0.9603271484375, -0.8388671875, -0.7174072265625, -0.595947265625, -0.4744873046875, -0.35302734375, -0.2315673828125, -0.110107421875, 0.0113525390625, 0.1328125, 0.2542724609375, 0.375732421875, 0.4971923828125, 0.61865234375, 0.7401123046875, 0.861572265625, 0.9830322265625, 1.1044921875, 1.2259521484375, 1.347412109375, 1.4688720703125, 1.59033203125, 1.7117919921875, 1.833251953125, 1.9547119140625, 2.076171875, 2.1976318359375, 2.319091796875, 2.4405517578125, 2.56201171875, 2.6834716796875, 2.804931640625, 2.9263916015625, 3.0478515625, 3.1693115234375, 3.290771484375, 3.4122314453125, 3.53369140625, 3.6551513671875, 3.776611328125, 3.8980712890625, 4.01953125]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [5.0, 4.0, 3.0, 7.0, 10.0, 12.0, 30.0, 39.0, 46.0, 65.0, 115.0, 136.0, 211.0, 329.0, 482.0, 688.0, 1059.0, 1535.0, 2267.0, 3379.0, 4906.0, 7365.0, 11218.0, 17336.0, 27082.0, 44360.0, 74508.0, 127787.0, 201434.0, 200828.0, 126158.0, 73574.0, 44103.0, 27044.0, 16863.0, 11017.0, 7294.0, 4919.0, 3379.0, 2250.0, 1525.0, 1077.0, 686.0, 451.0, 334.0, 235.0, 130.0, 97.0, 59.0, 48.0, 24.0, 23.0, 10.0, 7.0, 7.0, 4.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.43017578125, -0.41533660888671875, -0.4004974365234375, -0.38565826416015625, -0.370819091796875, -0.35597991943359375, -0.3411407470703125, -0.32630157470703125, -0.31146240234375, -0.29662322998046875, -0.2817840576171875, -0.26694488525390625, -0.252105712890625, -0.23726654052734375, -0.2224273681640625, -0.20758819580078125, -0.1927490234375, -0.17790985107421875, -0.1630706787109375, -0.14823150634765625, -0.133392333984375, -0.11855316162109375, -0.1037139892578125, -0.08887481689453125, -0.07403564453125, -0.05919647216796875, -0.0443572998046875, -0.02951812744140625, -0.014678955078125, 0.00016021728515625, 0.0149993896484375, 0.02983856201171875, 0.044677734375, 0.05951690673828125, 0.0743560791015625, 0.08919525146484375, 0.104034423828125, 0.11887359619140625, 0.1337127685546875, 0.14855194091796875, 0.16339111328125, 0.17823028564453125, 0.1930694580078125, 0.20790863037109375, 0.222747802734375, 0.23758697509765625, 0.2524261474609375, 0.26726531982421875, 0.2821044921875, 0.29694366455078125, 0.3117828369140625, 0.32662200927734375, 0.341461181640625, 0.35630035400390625, 0.3711395263671875, 0.38597869873046875, 0.40081787109375, 0.41565704345703125, 0.4304962158203125, 0.44533538818359375, 0.460174560546875, 0.47501373291015625, 0.4898529052734375, 0.5046920776367188, 0.51953125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 10.0, 6.0, 9.0, 13.0, 9.0, 13.0, 19.0, 15.0, 17.0, 30.0, 23.0, 26.0, 31.0, 43.0, 44.0, 52.0, 36.0, 44.0, 42.0, 1073.0, 57.0, 37.0, 45.0, 35.0, 34.0, 32.0, 40.0, 34.0, 25.0, 25.0, 22.0, 24.0, 7.0, 16.0, 15.0, 4.0, 5.0, 4.0, 4.0, 2.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.5, -2.407470703125, -2.31494140625, -2.222412109375, -2.1298828125, -2.037353515625, -1.94482421875, -1.852294921875, -1.759765625, -1.667236328125, -1.57470703125, -1.482177734375, -1.3896484375, -1.297119140625, -1.20458984375, -1.112060546875, -1.01953125, -0.927001953125, -0.83447265625, -0.741943359375, -0.6494140625, -0.556884765625, -0.46435546875, -0.371826171875, -0.279296875, -0.186767578125, -0.09423828125, -0.001708984375, 0.0908203125, 0.183349609375, 0.27587890625, 0.368408203125, 0.4609375, 0.553466796875, 0.64599609375, 0.738525390625, 0.8310546875, 0.923583984375, 1.01611328125, 1.108642578125, 1.201171875, 1.293701171875, 1.38623046875, 1.478759765625, 1.5712890625, 1.663818359375, 1.75634765625, 1.848876953125, 1.94140625, 2.033935546875, 2.12646484375, 2.218994140625, 2.3115234375, 2.404052734375, 2.49658203125, 2.589111328125, 2.681640625, 2.774169921875, 2.86669921875, 2.959228515625, 3.0517578125, 3.144287109375, 3.23681640625, 3.329345703125, 3.421875]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 3.0, 5.0, 6.0, 18.0, 8.0, 19.0, 32.0, 48.0, 69.0, 109.0, 154.0, 258.0, 351.0, 499.0, 816.0, 1130.0, 1776.0, 2754.0, 4068.0, 6143.0, 9262.0, 14487.0, 22057.0, 34403.0, 55794.0, 95796.0, 163578.0, 1267707.0, 164672.0, 95673.0, 56492.0, 34855.0, 21911.0, 14395.0, 9419.0, 6136.0, 4096.0, 2715.0, 1879.0, 1151.0, 795.0, 513.0, 349.0, 241.0, 155.0, 122.0, 78.0, 44.0, 33.0, 22.0, 16.0, 15.0, 6.0, 8.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.385498046875, -0.3728599548339844, -0.36022186279296875, -0.3475837707519531, -0.3349456787109375, -0.3223075866699219, -0.30966949462890625, -0.2970314025878906, -0.284393310546875, -0.2717552185058594, -0.25911712646484375, -0.24647903442382812, -0.2338409423828125, -0.22120285034179688, -0.20856475830078125, -0.19592666625976562, -0.18328857421875, -0.17065048217773438, -0.15801239013671875, -0.14537429809570312, -0.1327362060546875, -0.12009811401367188, -0.10746002197265625, -0.09482192993164062, -0.082183837890625, -0.06954574584960938, -0.05690765380859375, -0.044269561767578125, -0.0316314697265625, -0.018993377685546875, -0.00635528564453125, 0.006282806396484375, 0.0189208984375, 0.031558990478515625, 0.04419708251953125, 0.056835174560546875, 0.0694732666015625, 0.08211135864257812, 0.09474945068359375, 0.10738754272460938, 0.120025634765625, 0.13266372680664062, 0.14530181884765625, 0.15793991088867188, 0.1705780029296875, 0.18321609497070312, 0.19585418701171875, 0.20849227905273438, 0.22113037109375, 0.23376846313476562, 0.24640655517578125, 0.2590446472167969, 0.2716827392578125, 0.2843208312988281, 0.29695892333984375, 0.3095970153808594, 0.322235107421875, 0.3348731994628906, 0.34751129150390625, 0.3601493835449219, 0.3727874755859375, 0.3854255676269531, 0.39806365966796875, 0.4107017517089844, 0.42333984375]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 5.0, 7.0, 4.0, 8.0, 8.0, 8.0, 10.0, 15.0, 26.0, 33.0, 28.0, 30.0, 38.0, 51.0, 69.0, 50.0, 79.0, 81.0, 77.0, 70.0, 58.0, 41.0, 31.0, 31.0, 30.0, 21.0, 19.0, 16.0, 14.0, 8.0, 9.0, 7.0, 7.0, 3.0, 0.0, 4.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.00469207763671875, -0.004544198513031006, -0.004396319389343262, -0.004248440265655518, -0.0041005611419677734, -0.003952682018280029, -0.003804802894592285, -0.003656923770904541, -0.003509044647216797, -0.0033611655235290527, -0.0032132863998413086, -0.0030654072761535645, -0.0029175281524658203, -0.002769649028778076, -0.002621769905090332, -0.002473890781402588, -0.0023260116577148438, -0.0021781325340270996, -0.0020302534103393555, -0.0018823742866516113, -0.0017344951629638672, -0.001586616039276123, -0.001438736915588379, -0.0012908577919006348, -0.0011429786682128906, -0.0009950995445251465, -0.0008472204208374023, -0.0006993412971496582, -0.0005514621734619141, -0.0004035830497741699, -0.0002557039260864258, -0.00010782480239868164, 4.00543212890625e-05, 0.00018793344497680664, 0.0003358125686645508, 0.0004836916923522949, 0.0006315708160400391, 0.0007794499397277832, 0.0009273290634155273, 0.0010752081871032715, 0.0012230873107910156, 0.0013709664344787598, 0.001518845558166504, 0.001666724681854248, 0.0018146038055419922, 0.0019624829292297363, 0.0021103620529174805, 0.0022582411766052246, 0.0024061203002929688, 0.002553999423980713, 0.002701878547668457, 0.002849757671356201, 0.0029976367950439453, 0.0031455159187316895, 0.0032933950424194336, 0.0034412741661071777, 0.003589153289794922, 0.003737032413482666, 0.00388491153717041, 0.004032790660858154, 0.0041806697845458984, 0.004328548908233643, 0.004476428031921387, 0.004624307155609131, 0.004772186279296875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 3.0, 4.0, 6.0, 8.0, 17.0, 13.0, 20.0, 29.0, 25.0, 43.0, 68.0, 72.0, 117.0, 232.0, 556.0, 5695.0, 1036060.0, 4285.0, 541.0, 240.0, 134.0, 109.0, 60.0, 50.0, 42.0, 36.0, 19.0, 13.0, 12.0, 10.0, 7.0, 6.0, 8.0, 4.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.110595703125, -0.10719013214111328, -0.10378456115722656, -0.10037899017333984, -0.09697341918945312, -0.0935678482055664, -0.09016227722167969, -0.08675670623779297, -0.08335113525390625, -0.07994556427001953, -0.07653999328613281, -0.0731344223022461, -0.06972885131835938, -0.06632328033447266, -0.06291770935058594, -0.05951213836669922, -0.0561065673828125, -0.05270099639892578, -0.04929542541503906, -0.045889854431152344, -0.042484283447265625, -0.039078712463378906, -0.03567314147949219, -0.03226757049560547, -0.02886199951171875, -0.02545642852783203, -0.022050857543945312, -0.018645286560058594, -0.015239715576171875, -0.011834144592285156, -0.008428573608398438, -0.005023002624511719, -0.001617431640625, 0.0017881393432617188, 0.0051937103271484375, 0.008599281311035156, 0.012004852294921875, 0.015410423278808594, 0.018815994262695312, 0.02222156524658203, 0.02562713623046875, 0.02903270721435547, 0.03243827819824219, 0.035843849182128906, 0.039249420166015625, 0.042654991149902344, 0.04606056213378906, 0.04946613311767578, 0.0528717041015625, 0.05627727508544922, 0.05968284606933594, 0.06308841705322266, 0.06649398803710938, 0.0698995590209961, 0.07330513000488281, 0.07671070098876953, 0.08011627197265625, 0.08352184295654297, 0.08692741394042969, 0.0903329849243164, 0.09373855590820312, 0.09714412689208984, 0.10054969787597656, 0.10395526885986328, 0.10736083984375]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 8.0, 21.0, 391.0, 545.0, 45.0, 5.0, 0.0, 2.0], "bins": [-0.027752337977290154, -0.027282677590847015, -0.026813015341758728, -0.02634335495531559, -0.025873692706227303, -0.025404032319784164, -0.024934371933341026, -0.02446470968425274, -0.0239950492978096, -0.023525388911366463, -0.023055726662278175, -0.022586066275835037, -0.02211640402674675, -0.021646743640303612, -0.021177083253860474, -0.020707421004772186, -0.020237760618329048, -0.01976810023188591, -0.019298437982797623, -0.018828777596354485, -0.018359115347266197, -0.01788945496082306, -0.01741979457437992, -0.016950132325291634, -0.016480471938848495, -0.016010811552405357, -0.01554114930331707, -0.015071488916873932, -0.01460182759910822, -0.014132166281342506, -0.013662504963576794, -0.013192843645811081, -0.012723181396722794, -0.01225352007895708, -0.011783858761191368, -0.01131419837474823, -0.010844537056982517, -0.010374875739216805, -0.009905214421451092, -0.009435553103685379, -0.008965892717242241, -0.008496231399476528, -0.008026570081710815, -0.00755690922960639, -0.007087248377501965, -0.006617587059736252, -0.006147925741970539, -0.005678264889866114, -0.005208604037761688, -0.0047389427199959755, -0.00426928186789155, -0.0037996205501258373, -0.003329959698021412, -0.002860298380255699, -0.00239063729532063, -0.001920976210385561, -0.001451315125450492, -0.0009816540405154228, -0.0005119928973726928, -4.2331754229962826e-05, 0.00042732933070510626, 0.0008969905320554972, 0.0013666516169905663, 0.0018363127019256353, 0.0023059737868607044]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 5.0, 1.0, 2.0, 1.0, 3.0, 5.0, 4.0, 13.0, 9.0, 25.0, 10.0, 26.0, 19.0, 26.0, 36.0, 23.0, 27.0, 33.0, 41.0, 46.0, 38.0, 49.0, 46.0, 41.0, 45.0, 40.0, 40.0, 27.0, 38.0, 42.0, 38.0, 43.0, 31.0, 20.0, 23.0, 23.0, 17.0, 12.0, 12.0, 9.0, 5.0, 6.0, 5.0, 3.0, 5.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0021973252296447754, -0.0021203868091106415, -0.0020434483885765076, -0.0019665099680423737, -0.0018895715475082397, -0.0018126331269741058, -0.001735694706439972, -0.001658756285905838, -0.001581817865371704, -0.0015048794448375702, -0.0014279410243034363, -0.0013510026037693024, -0.0012740641832351685, -0.0011971257627010345, -0.0011201873421669006, -0.0010432489216327667, -0.0009663105010986328, -0.0008893720805644989, -0.000812433660030365, -0.0007354952394962311, -0.0006585568189620972, -0.0005816183984279633, -0.0005046799778938293, -0.00042774155735969543, -0.0003508031368255615, -0.0002738647162914276, -0.0001969262957572937, -0.00011998787522315979, -4.304945468902588e-05, 3.388896584510803e-05, 0.00011082738637924194, 0.00018776580691337585, 0.00026470422744750977, 0.0003416426479816437, 0.0004185810685157776, 0.0004955194890499115, 0.0005724579095840454, 0.0006493963301181793, 0.0007263347506523132, 0.0008032731711864471, 0.0008802115917205811, 0.000957150012254715, 0.0010340884327888489, 0.0011110268533229828, 0.0011879652738571167, 0.0012649036943912506, 0.0013418421149253845, 0.0014187805354595184, 0.0014957189559936523, 0.0015726573765277863, 0.0016495957970619202, 0.001726534217596054, 0.001803472638130188, 0.001880411058664322, 0.001957349479198456, 0.0020342878997325897, 0.0021112263202667236, 0.0021881647408008575, 0.0022651031613349915, 0.0023420415818691254, 0.0024189800024032593, 0.002495918422937393, 0.002572856843471527, 0.002649795264005661, 0.002726733684539795]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 2.0, 2.0, 5.0, 8.0, 10.0, 7.0, 5.0, 18.0, 20.0, 22.0, 17.0, 35.0, 24.0, 28.0, 28.0, 36.0, 25.0, 28.0, 37.0, 38.0, 37.0, 35.0, 36.0, 40.0, 34.0, 35.0, 23.0, 32.0, 26.0, 45.0, 26.0, 32.0, 28.0, 16.0, 29.0, 23.0, 14.0, 18.0, 8.0, 7.0, 13.0, 14.0, 4.0, 5.0, 8.0, 6.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-3.75390625, -3.6324462890625, -3.510986328125, -3.3895263671875, -3.26806640625, -3.1466064453125, -3.025146484375, -2.9036865234375, -2.7822265625, -2.6607666015625, -2.539306640625, -2.4178466796875, -2.29638671875, -2.1749267578125, -2.053466796875, -1.9320068359375, -1.810546875, -1.6890869140625, -1.567626953125, -1.4461669921875, -1.32470703125, -1.2032470703125, -1.081787109375, -0.9603271484375, -0.8388671875, -0.7174072265625, -0.595947265625, -0.4744873046875, -0.35302734375, -0.2315673828125, -0.110107421875, 0.0113525390625, 0.1328125, 0.2542724609375, 0.375732421875, 0.4971923828125, 0.61865234375, 0.7401123046875, 0.861572265625, 0.9830322265625, 1.1044921875, 1.2259521484375, 1.347412109375, 1.4688720703125, 1.59033203125, 1.7117919921875, 1.833251953125, 1.9547119140625, 2.076171875, 2.1976318359375, 2.319091796875, 2.4405517578125, 2.56201171875, 2.6834716796875, 2.804931640625, 2.9263916015625, 3.0478515625, 3.1693115234375, 3.290771484375, 3.4122314453125, 3.53369140625, 3.6551513671875, 3.776611328125, 3.8980712890625, 4.01953125]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 1.0, 3.0, 5.0, 4.0, 7.0, 8.0, 10.0, 14.0, 28.0, 29.0, 19.0, 29.0, 52.0, 69.0, 81.0, 118.0, 173.0, 241.0, 385.0, 708.0, 1533.0, 5422.0, 29159.0, 187664.0, 669056.0, 126491.0, 20148.0, 4000.0, 1289.0, 659.0, 339.0, 230.0, 133.0, 113.0, 71.0, 56.0, 37.0, 38.0, 23.0, 21.0, 17.0, 11.0, 10.0, 11.0, 13.0, 5.0, 4.0, 2.0, 6.0, 3.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-7.7421875, -7.49560546875, -7.2490234375, -7.00244140625, -6.755859375, -6.50927734375, -6.2626953125, -6.01611328125, -5.76953125, -5.52294921875, -5.2763671875, -5.02978515625, -4.783203125, -4.53662109375, -4.2900390625, -4.04345703125, -3.796875, -3.55029296875, -3.3037109375, -3.05712890625, -2.810546875, -2.56396484375, -2.3173828125, -2.07080078125, -1.82421875, -1.57763671875, -1.3310546875, -1.08447265625, -0.837890625, -0.59130859375, -0.3447265625, -0.09814453125, 0.1484375, 0.39501953125, 0.6416015625, 0.88818359375, 1.134765625, 1.38134765625, 1.6279296875, 1.87451171875, 2.12109375, 2.36767578125, 2.6142578125, 2.86083984375, 3.107421875, 3.35400390625, 3.6005859375, 3.84716796875, 4.09375, 4.34033203125, 4.5869140625, 4.83349609375, 5.080078125, 5.32666015625, 5.5732421875, 5.81982421875, 6.06640625, 6.31298828125, 6.5595703125, 6.80615234375, 7.052734375, 7.29931640625, 7.5458984375, 7.79248046875, 8.0390625]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 4.0, 7.0, 12.0, 11.0, 22.0, 22.0, 20.0, 22.0, 34.0, 28.0, 43.0, 52.0, 47.0, 77.0, 152.0, 421.0, 1473.0, 140.0, 76.0, 69.0, 56.0, 44.0, 50.0, 38.0, 27.0, 16.0, 22.0, 12.0, 15.0, 5.0, 7.0, 7.0, 6.0, 3.0, 6.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-18.28125, -17.77392578125, -17.2666015625, -16.75927734375, -16.251953125, -15.74462890625, -15.2373046875, -14.72998046875, -14.22265625, -13.71533203125, -13.2080078125, -12.70068359375, -12.193359375, -11.68603515625, -11.1787109375, -10.67138671875, -10.1640625, -9.65673828125, -9.1494140625, -8.64208984375, -8.134765625, -7.62744140625, -7.1201171875, -6.61279296875, -6.10546875, -5.59814453125, -5.0908203125, -4.58349609375, -4.076171875, -3.56884765625, -3.0615234375, -2.55419921875, -2.046875, -1.53955078125, -1.0322265625, -0.52490234375, -0.017578125, 0.48974609375, 0.9970703125, 1.50439453125, 2.01171875, 2.51904296875, 3.0263671875, 3.53369140625, 4.041015625, 4.54833984375, 5.0556640625, 5.56298828125, 6.0703125, 6.57763671875, 7.0849609375, 7.59228515625, 8.099609375, 8.60693359375, 9.1142578125, 9.62158203125, 10.12890625, 10.63623046875, 11.1435546875, 11.65087890625, 12.158203125, 12.66552734375, 13.1728515625, 13.68017578125, 14.1875]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 7.0, 3.0, 11.0, 16.0, 10.0, 17.0, 24.0, 37.0, 56.0, 68.0, 112.0, 196.0, 347.0, 1111.0, 136896.0, 3004105.0, 1688.0, 440.0, 192.0, 102.0, 73.0, 63.0, 54.0, 30.0, 22.0, 11.0, 11.0, 5.0, 4.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.375, -65.3408203125, -63.306640625, -61.2724609375, -59.23828125, -57.2041015625, -55.169921875, -53.1357421875, -51.1015625, -49.0673828125, -47.033203125, -44.9990234375, -42.96484375, -40.9306640625, -38.896484375, -36.8623046875, -34.828125, -32.7939453125, -30.759765625, -28.7255859375, -26.69140625, -24.6572265625, -22.623046875, -20.5888671875, -18.5546875, -16.5205078125, -14.486328125, -12.4521484375, -10.41796875, -8.3837890625, -6.349609375, -4.3154296875, -2.28125, -0.2470703125, 1.787109375, 3.8212890625, 5.85546875, 7.8896484375, 9.923828125, 11.9580078125, 13.9921875, 16.0263671875, 18.060546875, 20.0947265625, 22.12890625, 24.1630859375, 26.197265625, 28.2314453125, 30.265625, 32.2998046875, 34.333984375, 36.3681640625, 38.40234375, 40.4365234375, 42.470703125, 44.5048828125, 46.5390625, 48.5732421875, 50.607421875, 52.6416015625, 54.67578125, 56.7099609375, 58.744140625, 60.7783203125, 62.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 2.0, 13.0, 67.0, 201.0, 328.0, 271.0, 114.0, 19.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.601672172546387, -5.445283889770508, -4.288895606994629, -3.13250732421875, -1.976119041442871, -0.8197307586669922, 0.3366575241088867, 1.4930458068847656, 2.6494340896606445, 3.8058223724365234, 4.962210655212402, 6.118598937988281, 7.27498722076416, 8.431375503540039, 9.587763786315918, 10.744152069091797, 11.900540351867676, 13.056928634643555, 14.213316917419434, 15.369705200195312, 16.526092529296875, 17.68248176574707, 18.838871002197266, 19.995258331298828, 21.15164566040039, 22.308032989501953, 23.46442222595215, 24.620811462402344, 25.777198791503906, 26.93358612060547, 28.089975357055664, 29.24636459350586, 30.402755737304688, 31.55914306640625, 32.71553039550781, 33.87192153930664, 35.0283088684082, 36.184696197509766, 37.341087341308594, 38.497474670410156, 39.65386199951172, 40.81024932861328, 41.966636657714844, 43.12302780151367, 44.279415130615234, 45.4358024597168, 46.592193603515625, 47.74858093261719, 48.90496826171875, 50.06135559082031, 51.217742919921875, 52.3741340637207, 53.530521392822266, 54.68690872192383, 55.843299865722656, 56.99968719482422, 58.15607452392578, 59.312461853027344, 60.468849182128906, 61.625240325927734, 62.7816276550293, 63.93801498413086, 65.09440612792969, 66.25079345703125, 67.40718078613281]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 3.0, 1.0, 3.0, 2.0, 4.0, 9.0, 11.0, 11.0, 26.0, 21.0, 11.0, 23.0, 28.0, 29.0, 30.0, 26.0, 41.0, 44.0, 34.0, 40.0, 42.0, 40.0, 52.0, 55.0, 37.0, 38.0, 45.0, 39.0, 30.0, 31.0, 30.0, 30.0, 21.0, 20.0, 14.0, 13.0, 14.0, 15.0, 7.0, 7.0, 9.0, 2.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-39.07048416137695, -37.82530212402344, -36.580116271972656, -35.33493423461914, -34.089752197265625, -32.84457015991211, -31.59938621520996, -30.354202270507812, -29.109020233154297, -27.86383819580078, -26.618654251098633, -25.373470306396484, -24.12828826904297, -22.883106231689453, -21.637922286987305, -20.392738342285156, -19.14755630493164, -17.902374267578125, -16.657190322875977, -15.412007331848145, -14.166824340820312, -12.92164134979248, -11.676458358764648, -10.431275367736816, -9.186092376708984, -7.940909385681152, -6.69572639465332, -5.450543403625488, -4.205360412597656, -2.960177421569824, -1.7149944305419922, -0.46981143951416016, 0.7753753662109375, 2.0205583572387695, 3.2657413482666016, 4.510924339294434, 5.756107330322266, 7.001290321350098, 8.24647331237793, 9.491656303405762, 10.736839294433594, 11.982022285461426, 13.227205276489258, 14.47238826751709, 15.717571258544922, 16.962753295898438, 18.207937240600586, 19.453121185302734, 20.69830322265625, 21.943485260009766, 23.188669204711914, 24.433853149414062, 25.679035186767578, 26.924217224121094, 28.169401168823242, 29.41458511352539, 30.659767150878906, 31.904949188232422, 33.15013122558594, 34.39531707763672, 35.640499114990234, 36.88568115234375, 38.13086700439453, 39.37604904174805, 40.62123107910156]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0, 3.0, 3.0, 3.0, 3.0, 10.0, 12.0, 12.0, 13.0, 17.0, 20.0, 22.0, 35.0, 38.0, 33.0, 32.0, 32.0, 31.0, 34.0, 36.0, 37.0, 49.0, 51.0, 39.0, 35.0, 36.0, 34.0, 29.0, 33.0, 33.0, 36.0, 33.0, 34.0, 25.0, 25.0, 15.0, 13.0, 10.0, 13.0, 7.0, 9.0, 5.0, 7.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.7109375, -4.56219482421875, -4.4134521484375, -4.26470947265625, -4.115966796875, -3.96722412109375, -3.8184814453125, -3.66973876953125, -3.52099609375, -3.37225341796875, -3.2235107421875, -3.07476806640625, -2.926025390625, -2.77728271484375, -2.6285400390625, -2.47979736328125, -2.3310546875, -2.18231201171875, -2.0335693359375, -1.88482666015625, -1.736083984375, -1.58734130859375, -1.4385986328125, -1.28985595703125, -1.14111328125, -0.99237060546875, -0.8436279296875, -0.69488525390625, -0.546142578125, -0.39739990234375, -0.2486572265625, -0.09991455078125, 0.048828125, 0.19757080078125, 0.3463134765625, 0.49505615234375, 0.643798828125, 0.79254150390625, 0.9412841796875, 1.09002685546875, 1.23876953125, 1.38751220703125, 1.5362548828125, 1.68499755859375, 1.833740234375, 1.98248291015625, 2.1312255859375, 2.27996826171875, 2.4287109375, 2.57745361328125, 2.7261962890625, 2.87493896484375, 3.023681640625, 3.17242431640625, 3.3211669921875, 3.46990966796875, 3.61865234375, 3.76739501953125, 3.9161376953125, 4.06488037109375, 4.213623046875, 4.36236572265625, 4.5111083984375, 4.65985107421875, 4.80859375]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 5.0, 2.0, 4.0, 8.0, 6.0, 14.0, 16.0, 12.0, 22.0, 39.0, 55.0, 59.0, 92.0, 114.0, 166.0, 283.0, 452.0, 858.0, 1660.0, 4553.0, 15704.0, 67398.0, 296618.0, 951906.0, 1519574.0, 947200.0, 294888.0, 67388.0, 16155.0, 4865.0, 1931.0, 873.0, 505.0, 256.0, 168.0, 119.0, 90.0, 49.0, 47.0, 41.0, 24.0, 15.0, 16.0, 11.0, 7.0, 6.0, 11.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.28125, -5.11358642578125, -4.9459228515625, -4.77825927734375, -4.610595703125, -4.44293212890625, -4.2752685546875, -4.10760498046875, -3.93994140625, -3.77227783203125, -3.6046142578125, -3.43695068359375, -3.269287109375, -3.10162353515625, -2.9339599609375, -2.76629638671875, -2.5986328125, -2.43096923828125, -2.2633056640625, -2.09564208984375, -1.927978515625, -1.76031494140625, -1.5926513671875, -1.42498779296875, -1.25732421875, -1.08966064453125, -0.9219970703125, -0.75433349609375, -0.586669921875, -0.41900634765625, -0.2513427734375, -0.08367919921875, 0.083984375, 0.25164794921875, 0.4193115234375, 0.58697509765625, 0.754638671875, 0.92230224609375, 1.0899658203125, 1.25762939453125, 1.42529296875, 1.59295654296875, 1.7606201171875, 1.92828369140625, 2.095947265625, 2.26361083984375, 2.4312744140625, 2.59893798828125, 2.7666015625, 2.93426513671875, 3.1019287109375, 3.26959228515625, 3.437255859375, 3.60491943359375, 3.7725830078125, 3.94024658203125, 4.10791015625, 4.27557373046875, 4.4432373046875, 4.61090087890625, 4.778564453125, 4.94622802734375, 5.1138916015625, 5.28155517578125, 5.44921875]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 14.0, 14.0, 29.0, 35.0, 44.0, 75.0, 125.0, 122.0, 158.0, 269.0, 385.0, 476.0, 522.0, 478.0, 372.0, 297.0, 174.0, 132.0, 72.0, 78.0, 51.0, 41.0, 34.0, 20.0, 11.0, 10.0, 8.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.3046875, -7.0177001953125, -6.730712890625, -6.4437255859375, -6.15673828125, -5.8697509765625, -5.582763671875, -5.2957763671875, -5.0087890625, -4.7218017578125, -4.434814453125, -4.1478271484375, -3.86083984375, -3.5738525390625, -3.286865234375, -2.9998779296875, -2.712890625, -2.4259033203125, -2.138916015625, -1.8519287109375, -1.56494140625, -1.2779541015625, -0.990966796875, -0.7039794921875, -0.4169921875, -0.1300048828125, 0.156982421875, 0.4439697265625, 0.73095703125, 1.0179443359375, 1.304931640625, 1.5919189453125, 1.87890625, 2.1658935546875, 2.452880859375, 2.7398681640625, 3.02685546875, 3.3138427734375, 3.600830078125, 3.8878173828125, 4.1748046875, 4.4617919921875, 4.748779296875, 5.0357666015625, 5.32275390625, 5.6097412109375, 5.896728515625, 6.1837158203125, 6.470703125, 6.7576904296875, 7.044677734375, 7.3316650390625, 7.61865234375, 7.9056396484375, 8.192626953125, 8.4796142578125, 8.7666015625, 9.0535888671875, 9.340576171875, 9.6275634765625, 9.91455078125, 10.2015380859375, 10.488525390625, 10.7755126953125, 11.0625]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 6.0, 10.0, 6.0, 20.0, 32.0, 47.0, 43.0, 76.0, 124.0, 171.0, 255.0, 431.0, 834.0, 2288.0, 45528.0, 4024143.0, 115118.0, 2846.0, 952.0, 448.0, 297.0, 209.0, 129.0, 89.0, 54.0, 46.0, 21.0, 17.0, 10.0, 11.0, 8.0, 7.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-37.84375, -36.836669921875, -35.82958984375, -34.822509765625, -33.8154296875, -32.808349609375, -31.80126953125, -30.794189453125, -29.787109375, -28.780029296875, -27.77294921875, -26.765869140625, -25.7587890625, -24.751708984375, -23.74462890625, -22.737548828125, -21.73046875, -20.723388671875, -19.71630859375, -18.709228515625, -17.7021484375, -16.695068359375, -15.68798828125, -14.680908203125, -13.673828125, -12.666748046875, -11.65966796875, -10.652587890625, -9.6455078125, -8.638427734375, -7.63134765625, -6.624267578125, -5.6171875, -4.610107421875, -3.60302734375, -2.595947265625, -1.5888671875, -0.581787109375, 0.42529296875, 1.432373046875, 2.439453125, 3.446533203125, 4.45361328125, 5.460693359375, 6.4677734375, 7.474853515625, 8.48193359375, 9.489013671875, 10.49609375, 11.503173828125, 12.51025390625, 13.517333984375, 14.5244140625, 15.531494140625, 16.53857421875, 17.545654296875, 18.552734375, 19.559814453125, 20.56689453125, 21.573974609375, 22.5810546875, 23.588134765625, 24.59521484375, 25.602294921875, 26.609375]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 124.0, 799.0, 91.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-111.4483642578125, -103.73912811279297, -96.0298843383789, -88.32064819335938, -80.61141204833984, -72.90217590332031, -65.19293212890625, -57.48369598388672, -49.77445602416992, -42.065216064453125, -34.355979919433594, -26.646739959716797, -18.937501907348633, -11.228263854980469, -3.519023895263672, 4.190212249755859, 11.899452209472656, 19.60869026184082, 27.317928314208984, 35.02716827392578, 42.73640441894531, 50.44564437866211, 58.154884338378906, 65.86412048339844, 73.5733642578125, 81.28260040283203, 88.9918441772461, 96.70108032226562, 104.41031646728516, 112.11955261230469, 119.82879638671875, 127.53803253173828, 135.2472686767578, 142.95651245117188, 150.66574096679688, 158.37498474121094, 166.084228515625, 173.79345703125, 181.50270080566406, 189.21194458007812, 196.92117309570312, 204.6304168701172, 212.3396453857422, 220.04888916015625, 227.7581329345703, 235.4673614501953, 243.17660522460938, 250.88583374023438, 258.5950927734375, 266.3043212890625, 274.0135803222656, 281.7228088378906, 289.4320373535156, 297.14129638671875, 304.85052490234375, 312.55975341796875, 320.26898193359375, 327.97821044921875, 335.6874694824219, 343.3966979980469, 351.1059265136719, 358.815185546875, 366.5244140625, 374.233642578125, 381.9429016113281]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 7.0, 1.0, 1.0, 7.0, 9.0, 10.0, 9.0, 12.0, 20.0, 18.0, 24.0, 30.0, 35.0, 29.0, 40.0, 40.0, 45.0, 47.0, 45.0, 37.0, 40.0, 45.0, 46.0, 44.0, 51.0, 29.0, 45.0, 28.0, 28.0, 45.0, 24.0, 16.0, 12.0, 23.0, 15.0, 11.0, 12.0, 5.0, 6.0, 5.0, 4.0, 5.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.786460876464844, -25.88762664794922, -24.988794326782227, -24.0899600982666, -23.191125869750977, -22.292293548583984, -21.39345932006836, -20.494625091552734, -19.595792770385742, -18.696958541870117, -17.798126220703125, -16.8992919921875, -16.000457763671875, -15.101625442504883, -14.202791213989258, -13.30395793914795, -12.405123710632324, -11.506290435791016, -10.60745620727539, -9.708622932434082, -8.809789657592773, -7.910955905914307, -7.01212215423584, -6.113288879394531, -5.2144551277160645, -4.315621376037598, -3.416788101196289, -2.5179543495178223, -1.6191208362579346, -0.7202873229980469, 0.17854642868041992, 1.0773797035217285, 1.9762134552001953, 2.875046968460083, 3.7738804817199707, 4.6727142333984375, 5.571547508239746, 6.470381259918213, 7.36921501159668, 8.268048286437988, 9.166881561279297, 10.065714836120605, 10.96454906463623, 11.863382339477539, 12.762215614318848, 13.661048889160156, 14.559883117675781, 15.45871639251709, 16.35755157470703, 17.256385803222656, 18.15521812438965, 19.054052352905273, 19.9528865814209, 20.85171890258789, 21.750553131103516, 22.64938735961914, 23.548219680786133, 24.447053909301758, 25.34588623046875, 26.244720458984375, 27.1435546875, 28.042387008666992, 28.941221237182617, 29.84005355834961, 30.738887786865234]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 7.0, 9.0, 4.0, 8.0, 15.0, 11.0, 18.0, 23.0, 22.0, 27.0, 27.0, 23.0, 25.0, 42.0, 41.0, 46.0, 38.0, 33.0, 31.0, 42.0, 37.0, 32.0, 42.0, 29.0, 32.0, 39.0, 34.0, 25.0, 30.0, 33.0, 25.0, 24.0, 7.0, 27.0, 17.0, 7.0, 13.0, 10.0, 11.0, 6.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.29296875, -4.1630859375, -4.033203125, -3.9033203125, -3.7734375, -3.6435546875, -3.513671875, -3.3837890625, -3.25390625, -3.1240234375, -2.994140625, -2.8642578125, -2.734375, -2.6044921875, -2.474609375, -2.3447265625, -2.21484375, -2.0849609375, -1.955078125, -1.8251953125, -1.6953125, -1.5654296875, -1.435546875, -1.3056640625, -1.17578125, -1.0458984375, -0.916015625, -0.7861328125, -0.65625, -0.5263671875, -0.396484375, -0.2666015625, -0.13671875, -0.0068359375, 0.123046875, 0.2529296875, 0.3828125, 0.5126953125, 0.642578125, 0.7724609375, 0.90234375, 1.0322265625, 1.162109375, 1.2919921875, 1.421875, 1.5517578125, 1.681640625, 1.8115234375, 1.94140625, 2.0712890625, 2.201171875, 2.3310546875, 2.4609375, 2.5908203125, 2.720703125, 2.8505859375, 2.98046875, 3.1103515625, 3.240234375, 3.3701171875, 3.5, 3.6298828125, 3.759765625, 3.8896484375, 4.01953125]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 3.0, 12.0, 10.0, 10.0, 21.0, 37.0, 43.0, 59.0, 75.0, 108.0, 148.0, 213.0, 366.0, 482.0, 733.0, 1145.0, 1601.0, 2397.0, 3786.0, 5838.0, 8864.0, 13525.0, 21244.0, 34010.0, 55703.0, 93236.0, 157404.0, 226958.0, 166008.0, 97423.0, 58093.0, 35140.0, 22432.0, 14355.0, 9405.0, 5911.0, 3953.0, 2568.0, 1725.0, 1131.0, 747.0, 560.0, 324.0, 217.0, 153.0, 102.0, 81.0, 62.0, 36.0, 35.0, 28.0, 17.0, 14.0, 6.0, 4.0, 6.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.509765625, -0.4936065673828125, -0.477447509765625, -0.4612884521484375, -0.44512939453125, -0.4289703369140625, -0.412811279296875, -0.3966522216796875, -0.3804931640625, -0.3643341064453125, -0.348175048828125, -0.3320159912109375, -0.31585693359375, -0.2996978759765625, -0.283538818359375, -0.2673797607421875, -0.251220703125, -0.2350616455078125, -0.218902587890625, -0.2027435302734375, -0.18658447265625, -0.1704254150390625, -0.154266357421875, -0.1381072998046875, -0.1219482421875, -0.1057891845703125, -0.089630126953125, -0.0734710693359375, -0.05731201171875, -0.0411529541015625, -0.024993896484375, -0.0088348388671875, 0.00732421875, 0.0234832763671875, 0.039642333984375, 0.0558013916015625, 0.07196044921875, 0.0881195068359375, 0.104278564453125, 0.1204376220703125, 0.1365966796875, 0.1527557373046875, 0.168914794921875, 0.1850738525390625, 0.20123291015625, 0.2173919677734375, 0.233551025390625, 0.2497100830078125, 0.265869140625, 0.2820281982421875, 0.298187255859375, 0.3143463134765625, 0.33050537109375, 0.3466644287109375, 0.362823486328125, 0.3789825439453125, 0.3951416015625, 0.4113006591796875, 0.427459716796875, 0.4436187744140625, 0.45977783203125, 0.4759368896484375, 0.492095947265625, 0.5082550048828125, 0.5244140625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 7.0, 3.0, 4.0, 4.0, 12.0, 6.0, 14.0, 17.0, 13.0, 22.0, 22.0, 22.0, 25.0, 35.0, 40.0, 39.0, 31.0, 35.0, 43.0, 51.0, 39.0, 1068.0, 49.0, 39.0, 42.0, 39.0, 28.0, 33.0, 23.0, 30.0, 31.0, 22.0, 20.0, 24.0, 31.0, 12.0, 10.0, 7.0, 9.0, 5.0, 8.0, 5.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.8359375, -2.7486572265625, -2.661376953125, -2.5740966796875, -2.48681640625, -2.3995361328125, -2.312255859375, -2.2249755859375, -2.1376953125, -2.0504150390625, -1.963134765625, -1.8758544921875, -1.78857421875, -1.7012939453125, -1.614013671875, -1.5267333984375, -1.439453125, -1.3521728515625, -1.264892578125, -1.1776123046875, -1.09033203125, -1.0030517578125, -0.915771484375, -0.8284912109375, -0.7412109375, -0.6539306640625, -0.566650390625, -0.4793701171875, -0.39208984375, -0.3048095703125, -0.217529296875, -0.1302490234375, -0.04296875, 0.0443115234375, 0.131591796875, 0.2188720703125, 0.30615234375, 0.3934326171875, 0.480712890625, 0.5679931640625, 0.6552734375, 0.7425537109375, 0.829833984375, 0.9171142578125, 1.00439453125, 1.0916748046875, 1.178955078125, 1.2662353515625, 1.353515625, 1.4407958984375, 1.528076171875, 1.6153564453125, 1.70263671875, 1.7899169921875, 1.877197265625, 1.9644775390625, 2.0517578125, 2.1390380859375, 2.226318359375, 2.3135986328125, 2.40087890625, 2.4881591796875, 2.575439453125, 2.6627197265625, 2.75]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 7.0, 7.0, 8.0, 24.0, 29.0, 36.0, 50.0, 90.0, 106.0, 184.0, 302.0, 455.0, 657.0, 1036.0, 1625.0, 2454.0, 3866.0, 5937.0, 9371.0, 14442.0, 23008.0, 37371.0, 63270.0, 110351.0, 186852.0, 1265579.0, 151515.0, 86616.0, 50055.0, 30083.0, 18643.0, 11748.0, 7465.0, 4837.0, 3113.0, 2057.0, 1319.0, 855.0, 553.0, 391.0, 270.0, 161.0, 102.0, 82.0, 48.0, 36.0, 25.0, 14.0, 16.0, 7.0, 6.0, 2.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.4423828125, -0.4290924072265625, -0.415802001953125, -0.4025115966796875, -0.38922119140625, -0.3759307861328125, -0.362640380859375, -0.3493499755859375, -0.3360595703125, -0.3227691650390625, -0.309478759765625, -0.2961883544921875, -0.28289794921875, -0.2696075439453125, -0.256317138671875, -0.2430267333984375, -0.229736328125, -0.2164459228515625, -0.203155517578125, -0.1898651123046875, -0.17657470703125, -0.1632843017578125, -0.149993896484375, -0.1367034912109375, -0.1234130859375, -0.1101226806640625, -0.096832275390625, -0.0835418701171875, -0.07025146484375, -0.0569610595703125, -0.043670654296875, -0.0303802490234375, -0.01708984375, -0.0037994384765625, 0.009490966796875, 0.0227813720703125, 0.03607177734375, 0.0493621826171875, 0.062652587890625, 0.0759429931640625, 0.0892333984375, 0.1025238037109375, 0.115814208984375, 0.1291046142578125, 0.14239501953125, 0.1556854248046875, 0.168975830078125, 0.1822662353515625, 0.195556640625, 0.2088470458984375, 0.222137451171875, 0.2354278564453125, 0.24871826171875, 0.2620086669921875, 0.275299072265625, 0.2885894775390625, 0.3018798828125, 0.3151702880859375, 0.328460693359375, 0.3417510986328125, 0.35504150390625, 0.3683319091796875, 0.381622314453125, 0.3949127197265625, 0.408203125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 8.0, 5.0, 2.0, 12.0, 16.0, 14.0, 20.0, 24.0, 28.0, 47.0, 48.0, 65.0, 74.0, 100.0, 105.0, 95.0, 71.0, 52.0, 49.0, 28.0, 34.0, 21.0, 16.0, 10.0, 16.0, 12.0, 8.0, 4.0, 6.0, 0.0, 3.0, 7.0, 3.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00399017333984375, -0.0038677752017974854, -0.0037453770637512207, -0.003622978925704956, -0.0035005807876586914, -0.0033781826496124268, -0.003255784511566162, -0.0031333863735198975, -0.003010988235473633, -0.002888590097427368, -0.0027661919593811035, -0.002643793821334839, -0.0025213956832885742, -0.0023989975452423096, -0.002276599407196045, -0.0021542012691497803, -0.0020318031311035156, -0.001909404993057251, -0.0017870068550109863, -0.0016646087169647217, -0.001542210578918457, -0.0014198124408721924, -0.0012974143028259277, -0.001175016164779663, -0.0010526180267333984, -0.0009302198886871338, -0.0008078217506408691, -0.0006854236125946045, -0.0005630254745483398, -0.0004406273365020752, -0.00031822919845581055, -0.0001958310604095459, -7.343292236328125e-05, 4.89652156829834e-05, 0.00017136335372924805, 0.0002937614917755127, 0.00041615962982177734, 0.000538557767868042, 0.0006609559059143066, 0.0007833540439605713, 0.0009057521820068359, 0.0010281503200531006, 0.0011505484580993652, 0.0012729465961456299, 0.0013953447341918945, 0.0015177428722381592, 0.0016401410102844238, 0.0017625391483306885, 0.0018849372863769531, 0.0020073354244232178, 0.0021297335624694824, 0.002252131700515747, 0.0023745298385620117, 0.0024969279766082764, 0.002619326114654541, 0.0027417242527008057, 0.0028641223907470703, 0.002986520528793335, 0.0031089186668395996, 0.0032313168048858643, 0.003353714942932129, 0.0034761130809783936, 0.003598511219024658, 0.003720909357070923, 0.0038433074951171875]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 8.0, 5.0, 8.0, 4.0, 8.0, 16.0, 10.0, 20.0, 22.0, 32.0, 38.0, 57.0, 75.0, 142.0, 212.0, 511.0, 7494.0, 1034907.0, 3839.0, 482.0, 214.0, 113.0, 107.0, 55.0, 52.0, 24.0, 29.0, 27.0, 5.0, 9.0, 4.0, 7.0, 5.0, 2.0, 5.0, 2.0, 2.0, 0.0, 0.0, 4.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0775146484375, -0.07496833801269531, -0.07242202758789062, -0.06987571716308594, -0.06732940673828125, -0.06478309631347656, -0.062236785888671875, -0.05969047546386719, -0.0571441650390625, -0.05459785461425781, -0.052051544189453125, -0.04950523376464844, -0.04695892333984375, -0.04441261291503906, -0.041866302490234375, -0.03931999206542969, -0.036773681640625, -0.03422737121582031, -0.031681060791015625, -0.029134750366210938, -0.02658843994140625, -0.024042129516601562, -0.021495819091796875, -0.018949508666992188, -0.0164031982421875, -0.013856887817382812, -0.011310577392578125, -0.008764266967773438, -0.00621795654296875, -0.0036716461181640625, -0.001125335693359375, 0.0014209747314453125, 0.00396728515625, 0.0065135955810546875, 0.009059906005859375, 0.011606216430664062, 0.01415252685546875, 0.016698837280273438, 0.019245147705078125, 0.021791458129882812, 0.0243377685546875, 0.026884078979492188, 0.029430389404296875, 0.03197669982910156, 0.03452301025390625, 0.03706932067871094, 0.039615631103515625, 0.04216194152832031, 0.044708251953125, 0.04725456237792969, 0.049800872802734375, 0.05234718322753906, 0.05489349365234375, 0.05743980407714844, 0.059986114501953125, 0.06253242492675781, 0.0650787353515625, 0.06762504577636719, 0.07017135620117188, 0.07271766662597656, 0.07526397705078125, 0.07781028747558594, 0.08035659790039062, 0.08290290832519531, 0.08544921875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 669.0, 345.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0037546472158282995, -0.002798384288325906, -0.001842121477238834, -0.000885858666151762, 7.040426135063171e-05, 0.0010266669560223818, 0.0019829298835247755, 0.0029391928110271692, 0.003895455738529563, 0.004851718433201313, 0.005807981360703707, 0.0067642442882061005, 0.007720507215708494, 0.008676770143210888, 0.009633032605051994, 0.010589295998215675, 0.011545558460056782, 0.012501820921897888, 0.01345808431506157, 0.014414346776902676, 0.015370610170066357, 0.016326872631907463, 0.017283136025071144, 0.018239397555589676, 0.019195660948753357, 0.020151924341917038, 0.02110818587243557, 0.02206444926559925, 0.023020712658762932, 0.023976974189281464, 0.024933237582445145, 0.025889500975608826, 0.026845766231417656, 0.027802029624581337, 0.02875829115509987, 0.02971455454826355, 0.03067081794142723, 0.03162708133459091, 0.03258334472775459, 0.033539608120918274, 0.034495867788791656, 0.03545213118195534, 0.03640839457511902, 0.0373646579682827, 0.03832091763615608, 0.03927718102931976, 0.040233444422483444, 0.041189707815647125, 0.042145971208810806, 0.04310223460197449, 0.04405849799513817, 0.04501476138830185, 0.04597102105617523, 0.04692728444933891, 0.047883547842502594, 0.048839811235666275, 0.049796074628829956, 0.05075233802199364, 0.05170860141515732, 0.052664864808321, 0.05362112447619438, 0.05457738786935806, 0.055533651262521744, 0.056489914655685425, 0.057446178048849106]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 2.0, 7.0, 12.0, 16.0, 21.0, 20.0, 16.0, 36.0, 35.0, 32.0, 39.0, 35.0, 44.0, 45.0, 51.0, 44.0, 64.0, 41.0, 56.0, 59.0, 44.0, 45.0, 34.0, 35.0, 37.0, 28.0, 22.0, 23.0, 10.0, 12.0, 20.0, 7.0, 6.0, 5.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.00282210111618042, -0.002753114327788353, -0.002684127539396286, -0.002615140751004219, -0.002546153962612152, -0.002477167174220085, -0.002408180385828018, -0.0023391935974359512, -0.0022702068090438843, -0.0022012200206518173, -0.0021322332322597504, -0.0020632464438676834, -0.0019942596554756165, -0.0019252728670835495, -0.0018562860786914825, -0.0017872992902994156, -0.0017183125019073486, -0.0016493257135152817, -0.0015803389251232147, -0.0015113521367311478, -0.0014423653483390808, -0.0013733785599470139, -0.001304391771554947, -0.00123540498316288, -0.001166418194770813, -0.001097431406378746, -0.001028444617986679, -0.0009594578295946121, -0.0008904710412025452, -0.0008214842528104782, -0.0007524974644184113, -0.0006835106760263443, -0.0006145238876342773, -0.0005455370992422104, -0.00047655031085014343, -0.0004075635224580765, -0.0003385767340660095, -0.00026958994567394257, -0.0002006031572818756, -0.00013161636888980865, -6.26295804977417e-05, 6.357207894325256e-06, 7.534399628639221e-05, 0.00014433078467845917, 0.00021331757307052612, 0.0002823043614625931, 0.00035129114985466003, 0.000420277938246727, 0.0004892647266387939, 0.0005582515150308609, 0.0006272383034229279, 0.0006962250918149948, 0.0007652118802070618, 0.0008341986685991287, 0.0009031854569911957, 0.0009721722453832626, 0.0010411590337753296, 0.0011101458221673965, 0.0011791326105594635, 0.0012481193989515305, 0.0013171061873435974, 0.0013860929757356644, 0.0014550797641277313, 0.0015240665525197983, 0.0015930533409118652]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 3.0, 6.0, 7.0, 9.0, 4.0, 9.0, 14.0, 11.0, 18.0, 23.0, 22.0, 27.0, 27.0, 23.0, 25.0, 42.0, 41.0, 46.0, 38.0, 33.0, 31.0, 42.0, 37.0, 32.0, 42.0, 29.0, 32.0, 39.0, 34.0, 25.0, 30.0, 33.0, 25.0, 24.0, 7.0, 27.0, 17.0, 7.0, 13.0, 10.0, 11.0, 6.0, 8.0, 5.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-4.29296875, -4.1630859375, -4.033203125, -3.9033203125, -3.7734375, -3.6435546875, -3.513671875, -3.3837890625, -3.25390625, -3.1240234375, -2.994140625, -2.8642578125, -2.734375, -2.6044921875, -2.474609375, -2.3447265625, -2.21484375, -2.0849609375, -1.955078125, -1.8251953125, -1.6953125, -1.5654296875, -1.435546875, -1.3056640625, -1.17578125, -1.0458984375, -0.916015625, -0.7861328125, -0.65625, -0.5263671875, -0.396484375, -0.2666015625, -0.13671875, -0.0068359375, 0.123046875, 0.2529296875, 0.3828125, 0.5126953125, 0.642578125, 0.7724609375, 0.90234375, 1.0322265625, 1.162109375, 1.2919921875, 1.421875, 1.5517578125, 1.681640625, 1.8115234375, 1.94140625, 2.0712890625, 2.201171875, 2.3310546875, 2.4609375, 2.5908203125, 2.720703125, 2.8505859375, 2.98046875, 3.1103515625, 3.240234375, 3.3701171875, 3.5, 3.6298828125, 3.759765625, 3.8896484375, 4.01953125]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 5.0, 2.0, 5.0, 4.0, 4.0, 6.0, 12.0, 11.0, 11.0, 14.0, 26.0, 29.0, 46.0, 69.0, 115.0, 199.0, 422.0, 1002.0, 2430.0, 6150.0, 15252.0, 37585.0, 94860.0, 266806.0, 369250.0, 155831.0, 58669.0, 23673.0, 9449.0, 3767.0, 1487.0, 660.0, 268.0, 130.0, 104.0, 48.0, 40.0, 27.0, 16.0, 18.0, 5.0, 15.0, 11.0, 9.0, 6.0, 2.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0], "bins": [-5.10546875, -4.95635986328125, -4.8072509765625, -4.65814208984375, -4.509033203125, -4.35992431640625, -4.2108154296875, -4.06170654296875, -3.91259765625, -3.76348876953125, -3.6143798828125, -3.46527099609375, -3.316162109375, -3.16705322265625, -3.0179443359375, -2.86883544921875, -2.7197265625, -2.57061767578125, -2.4215087890625, -2.27239990234375, -2.123291015625, -1.97418212890625, -1.8250732421875, -1.67596435546875, -1.52685546875, -1.37774658203125, -1.2286376953125, -1.07952880859375, -0.930419921875, -0.78131103515625, -0.6322021484375, -0.48309326171875, -0.333984375, -0.18487548828125, -0.0357666015625, 0.11334228515625, 0.262451171875, 0.41156005859375, 0.5606689453125, 0.70977783203125, 0.85888671875, 1.00799560546875, 1.1571044921875, 1.30621337890625, 1.455322265625, 1.60443115234375, 1.7535400390625, 1.90264892578125, 2.0517578125, 2.20086669921875, 2.3499755859375, 2.49908447265625, 2.648193359375, 2.79730224609375, 2.9464111328125, 3.09552001953125, 3.24462890625, 3.39373779296875, 3.5428466796875, 3.69195556640625, 3.841064453125, 3.99017333984375, 4.1392822265625, 4.28839111328125, 4.4375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 0.0, 4.0, 3.0, 2.0, 3.0, 4.0, 3.0, 7.0, 6.0, 7.0, 13.0, 12.0, 18.0, 12.0, 19.0, 24.0, 24.0, 33.0, 26.0, 34.0, 33.0, 38.0, 48.0, 68.0, 152.0, 271.0, 1471.0, 215.0, 80.0, 56.0, 52.0, 37.0, 32.0, 34.0, 32.0, 28.0, 28.0, 21.0, 21.0, 19.0, 14.0, 11.0, 9.0, 10.0, 4.0, 7.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0], "bins": [-13.3046875, -12.8924560546875, -12.480224609375, -12.0679931640625, -11.65576171875, -11.2435302734375, -10.831298828125, -10.4190673828125, -10.0068359375, -9.5946044921875, -9.182373046875, -8.7701416015625, -8.35791015625, -7.9456787109375, -7.533447265625, -7.1212158203125, -6.708984375, -6.2967529296875, -5.884521484375, -5.4722900390625, -5.06005859375, -4.6478271484375, -4.235595703125, -3.8233642578125, -3.4111328125, -2.9989013671875, -2.586669921875, -2.1744384765625, -1.76220703125, -1.3499755859375, -0.937744140625, -0.5255126953125, -0.11328125, 0.2989501953125, 0.711181640625, 1.1234130859375, 1.53564453125, 1.9478759765625, 2.360107421875, 2.7723388671875, 3.1845703125, 3.5968017578125, 4.009033203125, 4.4212646484375, 4.83349609375, 5.2457275390625, 5.657958984375, 6.0701904296875, 6.482421875, 6.8946533203125, 7.306884765625, 7.7191162109375, 8.13134765625, 8.5435791015625, 8.955810546875, 9.3680419921875, 9.7802734375, 10.1925048828125, 10.604736328125, 11.0169677734375, 11.42919921875, 11.8414306640625, 12.253662109375, 12.6658935546875, 13.078125]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 6.0, 3.0, 6.0, 8.0, 3.0, 10.0, 11.0, 20.0, 30.0, 36.0, 39.0, 59.0, 90.0, 101.0, 187.0, 262.0, 439.0, 1027.0, 6865.0, 2740716.0, 390817.0, 3013.0, 773.0, 407.0, 244.0, 155.0, 81.0, 82.0, 55.0, 37.0, 33.0, 29.0, 10.0, 8.0, 13.0, 4.0, 8.0, 4.0, 5.0, 4.0, 0.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-31.875, -30.905029296875, -29.93505859375, -28.965087890625, -27.9951171875, -27.025146484375, -26.05517578125, -25.085205078125, -24.115234375, -23.145263671875, -22.17529296875, -21.205322265625, -20.2353515625, -19.265380859375, -18.29541015625, -17.325439453125, -16.35546875, -15.385498046875, -14.41552734375, -13.445556640625, -12.4755859375, -11.505615234375, -10.53564453125, -9.565673828125, -8.595703125, -7.625732421875, -6.65576171875, -5.685791015625, -4.7158203125, -3.745849609375, -2.77587890625, -1.805908203125, -0.8359375, 0.134033203125, 1.10400390625, 2.073974609375, 3.0439453125, 4.013916015625, 4.98388671875, 5.953857421875, 6.923828125, 7.893798828125, 8.86376953125, 9.833740234375, 10.8037109375, 11.773681640625, 12.74365234375, 13.713623046875, 14.68359375, 15.653564453125, 16.62353515625, 17.593505859375, 18.5634765625, 19.533447265625, 20.50341796875, 21.473388671875, 22.443359375, 23.413330078125, 24.38330078125, 25.353271484375, 26.3232421875, 27.293212890625, 28.26318359375, 29.233154296875, 30.203125]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 38.0, 299.0, 510.0, 152.0, 13.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.032657623291016, -59.75957107543945, -57.48648452758789, -55.21339797973633, -52.940311431884766, -50.6672248840332, -48.394134521484375, -46.12104797363281, -43.84796142578125, -41.57487487792969, -39.301788330078125, -37.02870178222656, -34.755615234375, -32.48252868652344, -30.209440231323242, -27.93635368347168, -25.66326904296875, -23.390182495117188, -21.117095947265625, -18.844009399414062, -16.5709228515625, -14.297835350036621, -12.024747848510742, -9.75166130065918, -7.478574752807617, -5.205488204956055, -2.932401180267334, -0.6593141555786133, 1.6137723922729492, 3.8868589401245117, 6.159946441650391, 8.433032989501953, 10.706123352050781, 12.979209899902344, 15.252296447753906, 17.52538299560547, 19.79846954345703, 22.071556091308594, 24.34464454650879, 26.61773109436035, 28.890817642211914, 31.163904190063477, 33.43699264526367, 35.710079193115234, 37.9831657409668, 40.25625228881836, 42.52933883666992, 44.802425384521484, 47.07551193237305, 49.34859848022461, 51.62168502807617, 53.894771575927734, 56.1678581237793, 58.44094467163086, 60.71403503417969, 62.98712158203125, 65.26020812988281, 67.53329467773438, 69.80638122558594, 72.0794677734375, 74.35255432128906, 76.62564086914062, 78.89872741699219, 81.17181396484375, 83.44490051269531]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 1.0, 3.0, 2.0, 4.0, 9.0, 8.0, 8.0, 19.0, 11.0, 12.0, 20.0, 16.0, 16.0, 25.0, 29.0, 37.0, 46.0, 26.0, 33.0, 33.0, 28.0, 47.0, 42.0, 40.0, 38.0, 40.0, 43.0, 36.0, 53.0, 28.0, 48.0, 29.0, 30.0, 18.0, 27.0, 25.0, 12.0, 7.0, 8.0, 14.0, 10.0, 9.0, 3.0, 4.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-36.25355529785156, -35.137939453125, -34.02232360839844, -32.90671157836914, -31.791095733642578, -30.675479888916016, -29.559864044189453, -28.44424819946289, -27.32863426208496, -26.2130184173584, -25.09740447998047, -23.981788635253906, -22.866172790527344, -21.750558853149414, -20.63494300842285, -19.519329071044922, -18.40371322631836, -17.288097381591797, -16.172483444213867, -15.056867599487305, -13.941252708435059, -12.825637817382812, -11.71002197265625, -10.594407081604004, -9.478792190551758, -8.363177299499512, -7.247561931610107, -6.131946563720703, -5.016331672668457, -3.900716781616211, -2.7851014137268066, -1.6694860458374023, -0.5538711547851562, 0.561743974685669, 1.6773591041564941, 2.7929742336273193, 3.9085893630981445, 5.024204254150391, 6.139819622039795, 7.255434989929199, 8.371049880981445, 9.486664772033691, 10.602279663085938, 11.7178955078125, 12.833510398864746, 13.949125289916992, 15.064741134643555, 16.180355072021484, 17.295970916748047, 18.41158676147461, 19.52720069885254, 20.6428165435791, 21.75843048095703, 22.874046325683594, 23.989662170410156, 25.10527801513672, 26.22089195251465, 27.33650779724121, 28.45212173461914, 29.567737579345703, 30.683353424072266, 31.798967361450195, 32.914581298828125, 34.03019714355469, 35.14581298828125]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 0.0, 5.0, 8.0, 1.0, 9.0, 5.0, 12.0, 15.0, 8.0, 23.0, 27.0, 22.0, 25.0, 26.0, 29.0, 31.0, 36.0, 30.0, 44.0, 45.0, 43.0, 44.0, 45.0, 45.0, 39.0, 40.0, 26.0, 37.0, 31.0, 32.0, 22.0, 29.0, 23.0, 26.0, 28.0, 10.0, 22.0, 11.0, 12.0, 9.0, 5.0, 10.0, 2.0, 4.0, 5.0, 2.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.625, -4.48272705078125, -4.3404541015625, -4.19818115234375, -4.055908203125, -3.91363525390625, -3.7713623046875, -3.62908935546875, -3.48681640625, -3.34454345703125, -3.2022705078125, -3.05999755859375, -2.917724609375, -2.77545166015625, -2.6331787109375, -2.49090576171875, -2.3486328125, -2.20635986328125, -2.0640869140625, -1.92181396484375, -1.779541015625, -1.63726806640625, -1.4949951171875, -1.35272216796875, -1.21044921875, -1.06817626953125, -0.9259033203125, -0.78363037109375, -0.641357421875, -0.49908447265625, -0.3568115234375, -0.21453857421875, -0.072265625, 0.07000732421875, 0.2122802734375, 0.35455322265625, 0.496826171875, 0.63909912109375, 0.7813720703125, 0.92364501953125, 1.06591796875, 1.20819091796875, 1.3504638671875, 1.49273681640625, 1.635009765625, 1.77728271484375, 1.9195556640625, 2.06182861328125, 2.2041015625, 2.34637451171875, 2.4886474609375, 2.63092041015625, 2.773193359375, 2.91546630859375, 3.0577392578125, 3.20001220703125, 3.34228515625, 3.48455810546875, 3.6268310546875, 3.76910400390625, 3.911376953125, 4.05364990234375, 4.1959228515625, 4.33819580078125, 4.48046875]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 4.0, 1.0, 3.0, 1.0, 7.0, 5.0, 10.0, 7.0, 15.0, 15.0, 19.0, 32.0, 29.0, 36.0, 47.0, 40.0, 62.0, 88.0, 138.0, 313.0, 1106.0, 10209.0, 411836.0, 3369962.0, 388336.0, 9959.0, 1128.0, 323.0, 129.0, 84.0, 84.0, 42.0, 39.0, 33.0, 16.0, 24.0, 20.0, 14.0, 10.0, 13.0, 8.0, 8.0, 4.0, 6.0, 8.0, 5.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.59375, -13.162109375, -12.73046875, -12.298828125, -11.8671875, -11.435546875, -11.00390625, -10.572265625, -10.140625, -9.708984375, -9.27734375, -8.845703125, -8.4140625, -7.982421875, -7.55078125, -7.119140625, -6.6875, -6.255859375, -5.82421875, -5.392578125, -4.9609375, -4.529296875, -4.09765625, -3.666015625, -3.234375, -2.802734375, -2.37109375, -1.939453125, -1.5078125, -1.076171875, -0.64453125, -0.212890625, 0.21875, 0.650390625, 1.08203125, 1.513671875, 1.9453125, 2.376953125, 2.80859375, 3.240234375, 3.671875, 4.103515625, 4.53515625, 4.966796875, 5.3984375, 5.830078125, 6.26171875, 6.693359375, 7.125, 7.556640625, 7.98828125, 8.419921875, 8.8515625, 9.283203125, 9.71484375, 10.146484375, 10.578125, 11.009765625, 11.44140625, 11.873046875, 12.3046875, 12.736328125, 13.16796875, 13.599609375, 14.03125]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 6.0, 7.0, 7.0, 14.0, 22.0, 44.0, 41.0, 65.0, 82.0, 136.0, 221.0, 356.0, 400.0, 584.0, 540.0, 455.0, 365.0, 238.0, 174.0, 93.0, 67.0, 40.0, 34.0, 23.0, 17.0, 17.0, 5.0, 6.0, 5.0, 5.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0390625, -6.7701416015625, -6.501220703125, -6.2322998046875, -5.96337890625, -5.6944580078125, -5.425537109375, -5.1566162109375, -4.8876953125, -4.6187744140625, -4.349853515625, -4.0809326171875, -3.81201171875, -3.5430908203125, -3.274169921875, -3.0052490234375, -2.736328125, -2.4674072265625, -2.198486328125, -1.9295654296875, -1.66064453125, -1.3917236328125, -1.122802734375, -0.8538818359375, -0.5849609375, -0.3160400390625, -0.047119140625, 0.2218017578125, 0.49072265625, 0.7596435546875, 1.028564453125, 1.2974853515625, 1.56640625, 1.8353271484375, 2.104248046875, 2.3731689453125, 2.64208984375, 2.9110107421875, 3.179931640625, 3.4488525390625, 3.7177734375, 3.9866943359375, 4.255615234375, 4.5245361328125, 4.79345703125, 5.0623779296875, 5.331298828125, 5.6002197265625, 5.869140625, 6.1380615234375, 6.406982421875, 6.6759033203125, 6.94482421875, 7.2137451171875, 7.482666015625, 7.7515869140625, 8.0205078125, 8.2894287109375, 8.558349609375, 8.8272705078125, 9.09619140625, 9.3651123046875, 9.634033203125, 9.9029541015625, 10.171875]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 6.0, 5.0, 12.0, 7.0, 12.0, 18.0, 26.0, 38.0, 50.0, 60.0, 109.0, 148.0, 232.0, 387.0, 757.0, 2906.0, 205071.0, 3944590.0, 36625.0, 1571.0, 579.0, 370.0, 207.0, 155.0, 99.0, 79.0, 61.0, 36.0, 27.0, 18.0, 13.0, 6.0, 3.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-35.3125, -34.366943359375, -33.42138671875, -32.475830078125, -31.5302734375, -30.584716796875, -29.63916015625, -28.693603515625, -27.748046875, -26.802490234375, -25.85693359375, -24.911376953125, -23.9658203125, -23.020263671875, -22.07470703125, -21.129150390625, -20.18359375, -19.238037109375, -18.29248046875, -17.346923828125, -16.4013671875, -15.455810546875, -14.51025390625, -13.564697265625, -12.619140625, -11.673583984375, -10.72802734375, -9.782470703125, -8.8369140625, -7.891357421875, -6.94580078125, -6.000244140625, -5.0546875, -4.109130859375, -3.16357421875, -2.218017578125, -1.2724609375, -0.326904296875, 0.61865234375, 1.564208984375, 2.509765625, 3.455322265625, 4.40087890625, 5.346435546875, 6.2919921875, 7.237548828125, 8.18310546875, 9.128662109375, 10.07421875, 11.019775390625, 11.96533203125, 12.910888671875, 13.8564453125, 14.802001953125, 15.74755859375, 16.693115234375, 17.638671875, 18.584228515625, 19.52978515625, 20.475341796875, 21.4208984375, 22.366455078125, 23.31201171875, 24.257568359375, 25.203125]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 21.0, 89.0, 248.0, 357.0, 217.0, 66.0, 14.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.732115745544434, -13.276546478271484, -10.820978164672852, -8.365409851074219, -5.9098405838012695, -3.4542722702026367, -0.9987030029296875, 1.4568662643432617, 3.9124345779418945, 6.3680033683776855, 8.823572158813477, 11.27914047241211, 13.734709739685059, 16.190277099609375, 18.64584732055664, 21.101417541503906, 23.556983947753906, 26.01255226135254, 28.468120574951172, 30.923690795898438, 33.37925720214844, 35.8348274230957, 38.29039764404297, 40.74596405029297, 43.201534271240234, 45.6571044921875, 48.1126708984375, 50.568241119384766, 53.02381134033203, 55.47937774658203, 57.9349479675293, 60.39051818847656, 62.84608459472656, 65.30165100097656, 67.7572250366211, 70.2127914428711, 72.6683578491211, 75.12393188476562, 77.57949829101562, 80.03506469726562, 82.49063110351562, 84.94619750976562, 87.40177154541016, 89.85733795166016, 92.31290435791016, 94.76847839355469, 97.22404479980469, 99.67961120605469, 102.13518524169922, 104.59075164794922, 107.04632568359375, 109.50189208984375, 111.95745849609375, 114.41302490234375, 116.86859893798828, 119.32416534423828, 121.77973937988281, 124.23530578613281, 126.69087982177734, 129.1464385986328, 131.60202026367188, 134.05758666992188, 136.51315307617188, 138.96871948242188, 141.42428588867188]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 6.0, 5.0, 4.0, 9.0, 5.0, 7.0, 8.0, 14.0, 25.0, 20.0, 13.0, 29.0, 21.0, 26.0, 31.0, 37.0, 32.0, 42.0, 26.0, 38.0, 41.0, 33.0, 43.0, 29.0, 33.0, 42.0, 42.0, 32.0, 38.0, 35.0, 30.0, 33.0, 29.0, 25.0, 14.0, 26.0, 18.0, 15.0, 16.0, 5.0, 7.0, 7.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0], "bins": [-22.40570640563965, -21.699596405029297, -20.993486404418945, -20.287376403808594, -19.581266403198242, -18.87515640258789, -18.16904640197754, -17.462936401367188, -16.756826400756836, -16.050716400146484, -15.344606399536133, -14.638496398925781, -13.93238639831543, -13.226276397705078, -12.520166397094727, -11.814056396484375, -11.107946395874023, -10.401836395263672, -9.69572639465332, -8.989616394042969, -8.283506393432617, -7.577396392822266, -6.871286392211914, -6.1651763916015625, -5.459066390991211, -4.752956390380859, -4.046846389770508, -3.3407363891601562, -2.6346263885498047, -1.9285163879394531, -1.2224063873291016, -0.51629638671875, 0.18981361389160156, 0.8959236145019531, 1.6020336151123047, 2.3081436157226562, 3.014253616333008, 3.7203636169433594, 4.426473617553711, 5.1325836181640625, 5.838693618774414, 6.544803619384766, 7.250913619995117, 7.957023620605469, 8.66313362121582, 9.369243621826172, 10.075353622436523, 10.781463623046875, 11.487573623657227, 12.193683624267578, 12.89979362487793, 13.605903625488281, 14.312013626098633, 15.018123626708984, 15.724233627319336, 16.430343627929688, 17.13645362854004, 17.84256362915039, 18.548673629760742, 19.254783630371094, 19.960893630981445, 20.667003631591797, 21.37311363220215, 22.0792236328125, 22.78533363342285]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 4.0, 10.0, 13.0, 13.0, 16.0, 22.0, 21.0, 20.0, 22.0, 27.0, 31.0, 32.0, 51.0, 38.0, 37.0, 37.0, 49.0, 50.0, 48.0, 41.0, 37.0, 39.0, 37.0, 34.0, 42.0, 23.0, 25.0, 23.0, 21.0, 18.0, 28.0, 21.0, 19.0, 8.0, 9.0, 5.0, 7.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.3056640625, -4.162109375, -4.0185546875, -3.875, -3.7314453125, -3.587890625, -3.4443359375, -3.30078125, -3.1572265625, -3.013671875, -2.8701171875, -2.7265625, -2.5830078125, -2.439453125, -2.2958984375, -2.15234375, -2.0087890625, -1.865234375, -1.7216796875, -1.578125, -1.4345703125, -1.291015625, -1.1474609375, -1.00390625, -0.8603515625, -0.716796875, -0.5732421875, -0.4296875, -0.2861328125, -0.142578125, 0.0009765625, 0.14453125, 0.2880859375, 0.431640625, 0.5751953125, 0.71875, 0.8623046875, 1.005859375, 1.1494140625, 1.29296875, 1.4365234375, 1.580078125, 1.7236328125, 1.8671875, 2.0107421875, 2.154296875, 2.2978515625, 2.44140625, 2.5849609375, 2.728515625, 2.8720703125, 3.015625, 3.1591796875, 3.302734375, 3.4462890625, 3.58984375, 3.7333984375, 3.876953125, 4.0205078125, 4.1640625, 4.3076171875, 4.451171875, 4.5947265625, 4.73828125]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 4.0, 6.0, 5.0, 10.0, 18.0, 19.0, 34.0, 46.0, 52.0, 85.0, 128.0, 193.0, 260.0, 393.0, 520.0, 878.0, 1197.0, 1760.0, 2661.0, 3790.0, 5617.0, 8284.0, 12605.0, 18817.0, 29432.0, 46442.0, 76641.0, 127421.0, 198974.0, 192283.0, 120385.0, 72708.0, 44076.0, 27956.0, 17863.0, 11887.0, 8238.0, 5277.0, 3668.0, 2512.0, 1698.0, 1198.0, 776.0, 571.0, 382.0, 242.0, 159.0, 129.0, 83.0, 64.0, 34.0, 32.0, 16.0, 13.0, 10.0, 9.0, 4.0, 2.0, 1.0, 3.0], "bins": [-0.480712890625, -0.4661216735839844, -0.45153045654296875, -0.4369392395019531, -0.4223480224609375, -0.4077568054199219, -0.39316558837890625, -0.3785743713378906, -0.363983154296875, -0.3493919372558594, -0.33480072021484375, -0.3202095031738281, -0.3056182861328125, -0.2910270690917969, -0.27643585205078125, -0.2618446350097656, -0.24725341796875, -0.23266220092773438, -0.21807098388671875, -0.20347976684570312, -0.1888885498046875, -0.17429733276367188, -0.15970611572265625, -0.14511489868164062, -0.130523681640625, -0.11593246459960938, -0.10134124755859375, -0.08675003051757812, -0.0721588134765625, -0.057567596435546875, -0.04297637939453125, -0.028385162353515625, -0.0137939453125, 0.000797271728515625, 0.01538848876953125, 0.029979705810546875, 0.0445709228515625, 0.059162139892578125, 0.07375335693359375, 0.08834457397460938, 0.102935791015625, 0.11752700805664062, 0.13211822509765625, 0.14670944213867188, 0.1613006591796875, 0.17589187622070312, 0.19048309326171875, 0.20507431030273438, 0.21966552734375, 0.23425674438476562, 0.24884796142578125, 0.2634391784667969, 0.2780303955078125, 0.2926216125488281, 0.30721282958984375, 0.3218040466308594, 0.336395263671875, 0.3509864807128906, 0.36557769775390625, 0.3801689147949219, 0.3947601318359375, 0.4093513488769531, 0.42394256591796875, 0.4385337829589844, 0.453125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 5.0, 4.0, 9.0, 13.0, 5.0, 11.0, 8.0, 13.0, 22.0, 21.0, 18.0, 31.0, 40.0, 29.0, 31.0, 27.0, 44.0, 44.0, 39.0, 43.0, 1072.0, 36.0, 56.0, 43.0, 46.0, 42.0, 31.0, 28.0, 32.0, 22.0, 15.0, 24.0, 19.0, 27.0, 15.0, 12.0, 10.0, 9.0, 13.0, 13.0, 5.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.232421875, -3.139739990234375, -3.04705810546875, -2.954376220703125, -2.8616943359375, -2.769012451171875, -2.67633056640625, -2.583648681640625, -2.490966796875, -2.398284912109375, -2.30560302734375, -2.212921142578125, -2.1202392578125, -2.027557373046875, -1.93487548828125, -1.842193603515625, -1.74951171875, -1.656829833984375, -1.56414794921875, -1.471466064453125, -1.3787841796875, -1.286102294921875, -1.19342041015625, -1.100738525390625, -1.008056640625, -0.915374755859375, -0.82269287109375, -0.730010986328125, -0.6373291015625, -0.544647216796875, -0.45196533203125, -0.359283447265625, -0.2666015625, -0.173919677734375, -0.08123779296875, 0.011444091796875, 0.1041259765625, 0.196807861328125, 0.28948974609375, 0.382171630859375, 0.474853515625, 0.567535400390625, 0.66021728515625, 0.752899169921875, 0.8455810546875, 0.938262939453125, 1.03094482421875, 1.123626708984375, 1.21630859375, 1.308990478515625, 1.40167236328125, 1.494354248046875, 1.5870361328125, 1.679718017578125, 1.77239990234375, 1.865081787109375, 1.957763671875, 2.050445556640625, 2.14312744140625, 2.235809326171875, 2.3284912109375, 2.421173095703125, 2.51385498046875, 2.606536865234375, 2.69921875]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 9.0, 22.0, 32.0, 47.0, 48.0, 92.0, 127.0, 209.0, 337.0, 534.0, 767.0, 1247.0, 1916.0, 3020.0, 4743.0, 7321.0, 11735.0, 18881.0, 31308.0, 54390.0, 96368.0, 173292.0, 1281794.0, 173350.0, 97751.0, 54498.0, 31785.0, 18941.0, 11845.0, 7483.0, 4653.0, 3097.0, 1979.0, 1229.0, 802.0, 554.0, 320.0, 201.0, 141.0, 86.0, 55.0, 50.0, 25.0, 15.0, 11.0, 8.0, 3.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.458251953125, -0.4437065124511719, -0.42916107177734375, -0.4146156311035156, -0.4000701904296875, -0.3855247497558594, -0.37097930908203125, -0.3564338684082031, -0.341888427734375, -0.3273429870605469, -0.31279754638671875, -0.2982521057128906, -0.2837066650390625, -0.2691612243652344, -0.25461578369140625, -0.24007034301757812, -0.22552490234375, -0.21097946166992188, -0.19643402099609375, -0.18188858032226562, -0.1673431396484375, -0.15279769897460938, -0.13825225830078125, -0.12370681762695312, -0.109161376953125, -0.09461593627929688, -0.08007049560546875, -0.06552505493164062, -0.0509796142578125, -0.036434173583984375, -0.02188873291015625, -0.007343292236328125, 0.0072021484375, 0.021747589111328125, 0.03629302978515625, 0.050838470458984375, 0.0653839111328125, 0.07992935180664062, 0.09447479248046875, 0.10902023315429688, 0.123565673828125, 0.13811111450195312, 0.15265655517578125, 0.16720199584960938, 0.1817474365234375, 0.19629287719726562, 0.21083831787109375, 0.22538375854492188, 0.23992919921875, 0.2544746398925781, 0.26902008056640625, 0.2835655212402344, 0.2981109619140625, 0.3126564025878906, 0.32720184326171875, 0.3417472839355469, 0.356292724609375, 0.3708381652832031, 0.38538360595703125, 0.3999290466308594, 0.4144744873046875, 0.4290199279785156, 0.44356536865234375, 0.4581108093261719, 0.47265625]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 5.0, 6.0, 7.0, 2.0, 5.0, 8.0, 11.0, 12.0, 20.0, 19.0, 38.0, 31.0, 49.0, 75.0, 78.0, 135.0, 123.0, 104.0, 63.0, 45.0, 38.0, 33.0, 17.0, 18.0, 9.0, 11.0, 12.0, 7.0, 4.0, 4.0, 9.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.006961822509765625, -0.006778717041015625, -0.006595611572265625, -0.006412506103515625, -0.006229400634765625, -0.006046295166015625, -0.005863189697265625, -0.005680084228515625, -0.005496978759765625, -0.005313873291015625, -0.005130767822265625, -0.004947662353515625, -0.004764556884765625, -0.004581451416015625, -0.004398345947265625, -0.004215240478515625, -0.004032135009765625, -0.003849029541015625, -0.003665924072265625, -0.003482818603515625, -0.003299713134765625, -0.003116607666015625, -0.002933502197265625, -0.002750396728515625, -0.002567291259765625, -0.002384185791015625, -0.002201080322265625, -0.002017974853515625, -0.001834869384765625, -0.001651763916015625, -0.001468658447265625, -0.001285552978515625, -0.001102447509765625, -0.000919342041015625, -0.000736236572265625, -0.000553131103515625, -0.000370025634765625, -0.000186920166015625, -3.814697265625e-06, 0.000179290771484375, 0.000362396240234375, 0.000545501708984375, 0.000728607177734375, 0.000911712646484375, 0.001094818115234375, 0.001277923583984375, 0.001461029052734375, 0.001644134521484375, 0.001827239990234375, 0.002010345458984375, 0.002193450927734375, 0.002376556396484375, 0.002559661865234375, 0.002742767333984375, 0.002925872802734375, 0.003108978271484375, 0.003292083740234375, 0.003475189208984375, 0.003658294677734375, 0.003841400146484375, 0.004024505615234375, 0.004207611083984375, 0.004390716552734375, 0.004573822021484375, 0.004756927490234375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 6.0, 9.0, 9.0, 10.0, 20.0, 26.0, 23.0, 43.0, 61.0, 102.0, 177.0, 384.0, 1498.0, 1041113.0, 3991.0, 477.0, 228.0, 103.0, 70.0, 61.0, 23.0, 34.0, 17.0, 16.0, 7.0, 2.0, 8.0, 5.0, 9.0, 5.0, 3.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10528564453125, -0.10117626190185547, -0.09706687927246094, -0.0929574966430664, -0.08884811401367188, -0.08473873138427734, -0.08062934875488281, -0.07651996612548828, -0.07241058349609375, -0.06830120086669922, -0.06419181823730469, -0.060082435607910156, -0.055973052978515625, -0.051863670349121094, -0.04775428771972656, -0.04364490509033203, -0.0395355224609375, -0.03542613983154297, -0.03131675720214844, -0.027207374572753906, -0.023097991943359375, -0.018988609313964844, -0.014879226684570312, -0.010769844055175781, -0.00666046142578125, -0.0025510787963867188, 0.0015583038330078125, 0.005667686462402344, 0.009777069091796875, 0.013886451721191406, 0.017995834350585938, 0.02210521697998047, 0.026214599609375, 0.03032398223876953, 0.03443336486816406, 0.038542747497558594, 0.042652130126953125, 0.046761512756347656, 0.05087089538574219, 0.05498027801513672, 0.05908966064453125, 0.06319904327392578, 0.06730842590332031, 0.07141780853271484, 0.07552719116210938, 0.0796365737915039, 0.08374595642089844, 0.08785533905029297, 0.0919647216796875, 0.09607410430908203, 0.10018348693847656, 0.1042928695678711, 0.10840225219726562, 0.11251163482666016, 0.11662101745605469, 0.12073040008544922, 0.12483978271484375, 0.12894916534423828, 0.1330585479736328, 0.13716793060302734, 0.14127731323242188, 0.1453866958618164, 0.14949607849121094, 0.15360546112060547, 0.15771484375]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 525.0, 488.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0072646173648536205, -0.006225452292710543, -0.0051862867549061775, -0.0041471216827631, -0.003107956610620022, -0.002068791538476944, -0.0010296260006725788, 9.539071470499039e-06, 0.0010487041436135769, 0.0020878692157566547, 0.0031270345207303762, 0.004166199825704098, 0.005205364897847176, 0.0062445299699902534, 0.007283695507794619, 0.008322861045598984, 0.009362025186419487, 0.010401190258562565, 0.011440355330705643, 0.012479521334171295, 0.013518685474991798, 0.01455785147845745, 0.015597016550600529, 0.016636181622743607, 0.01767534762620926, 0.01871451362967491, 0.019753677770495415, 0.020792843773961067, 0.02183200791478157, 0.022871173918247223, 0.023910339921712875, 0.02494950406253338, 0.025988668203353882, 0.027027834206819534, 0.028066998347640038, 0.02910616435110569, 0.030145328491926193, 0.031184494495391846, 0.0322236604988575, 0.03326282650232315, 0.034301988780498505, 0.03534115478396416, 0.03638032078742981, 0.037419483065605164, 0.038458649069070816, 0.03949781507253647, 0.04053698107600212, 0.04157614707946777, 0.04261530935764313, 0.04365447536110878, 0.04469364136457443, 0.045732803642749786, 0.04677196964621544, 0.04781113564968109, 0.048850301653146744, 0.049889467656612396, 0.05092863366007805, 0.0519677996635437, 0.053006965667009354, 0.05404612794518471, 0.05508529394865036, 0.05612445995211601, 0.057163625955581665, 0.05820278823375702, 0.05924195423722267]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 10.0, 11.0, 2.0, 13.0, 18.0, 15.0, 27.0, 23.0, 29.0, 25.0, 27.0, 23.0, 42.0, 36.0, 39.0, 34.0, 45.0, 44.0, 47.0, 48.0, 41.0, 36.0, 31.0, 43.0, 45.0, 36.0, 26.0, 25.0, 27.0, 14.0, 19.0, 13.0, 14.0, 14.0, 9.0, 6.0, 12.0, 9.0, 6.0, 6.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.002496957778930664, -0.002421971410512924, -0.0023469850420951843, -0.0022719986736774445, -0.0021970123052597046, -0.0021220259368419647, -0.002047039568424225, -0.001972053200006485, -0.0018970668315887451, -0.0018220804631710052, -0.0017470940947532654, -0.0016721077263355255, -0.0015971213579177856, -0.0015221349895000458, -0.001447148621082306, -0.001372162252664566, -0.0012971758842468262, -0.0012221895158290863, -0.0011472031474113464, -0.0010722167789936066, -0.0009972304105758667, -0.0009222440421581268, -0.000847257673740387, -0.0007722713053226471, -0.0006972849369049072, -0.0006222985684871674, -0.0005473122000694275, -0.0004723258316516876, -0.00039733946323394775, -0.0003223530948162079, -0.000247366726398468, -0.00017238035798072815, -9.739398956298828e-05, -2.2407621145248413e-05, 5.2578747272491455e-05, 0.00012756511569023132, 0.0002025514841079712, 0.00027753785252571106, 0.00035252422094345093, 0.0004275105893611908, 0.0005024969577789307, 0.0005774833261966705, 0.0006524696946144104, 0.0007274560630321503, 0.0008024424314498901, 0.00087742879986763, 0.0009524151682853699, 0.0010274015367031097, 0.0011023879051208496, 0.0011773742735385895, 0.0012523606419563293, 0.0013273470103740692, 0.001402333378791809, 0.001477319747209549, 0.0015523061156272888, 0.0016272924840450287, 0.0017022788524627686, 0.0017772652208805084, 0.0018522515892982483, 0.0019272379577159882, 0.002002224326133728, 0.002077210694551468, 0.0021521970629692078, 0.0022271834313869476, 0.0023021697998046875]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 7.0, 5.0, 4.0, 9.0, 14.0, 13.0, 16.0, 22.0, 21.0, 20.0, 22.0, 27.0, 31.0, 32.0, 51.0, 38.0, 37.0, 37.0, 49.0, 50.0, 48.0, 41.0, 37.0, 39.0, 37.0, 34.0, 42.0, 23.0, 25.0, 23.0, 21.0, 18.0, 28.0, 21.0, 19.0, 8.0, 9.0, 5.0, 7.0, 6.0, 2.0, 4.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.44921875, -4.3056640625, -4.162109375, -4.0185546875, -3.875, -3.7314453125, -3.587890625, -3.4443359375, -3.30078125, -3.1572265625, -3.013671875, -2.8701171875, -2.7265625, -2.5830078125, -2.439453125, -2.2958984375, -2.15234375, -2.0087890625, -1.865234375, -1.7216796875, -1.578125, -1.4345703125, -1.291015625, -1.1474609375, -1.00390625, -0.8603515625, -0.716796875, -0.5732421875, -0.4296875, -0.2861328125, -0.142578125, 0.0009765625, 0.14453125, 0.2880859375, 0.431640625, 0.5751953125, 0.71875, 0.8623046875, 1.005859375, 1.1494140625, 1.29296875, 1.4365234375, 1.580078125, 1.7236328125, 1.8671875, 2.0107421875, 2.154296875, 2.2978515625, 2.44140625, 2.5849609375, 2.728515625, 2.8720703125, 3.015625, 3.1591796875, 3.302734375, 3.4462890625, 3.58984375, 3.7333984375, 3.876953125, 4.0205078125, 4.1640625, 4.3076171875, 4.451171875, 4.5947265625, 4.73828125]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 5.0, 9.0, 15.0, 19.0, 26.0, 39.0, 41.0, 72.0, 82.0, 131.0, 203.0, 277.0, 480.0, 981.0, 3056.0, 13716.0, 68853.0, 583884.0, 323394.0, 40415.0, 8820.0, 2058.0, 738.0, 421.0, 238.0, 148.0, 118.0, 80.0, 50.0, 49.0, 35.0, 24.0, 19.0, 16.0, 10.0, 7.0, 8.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.5703125, -8.29248046875, -8.0146484375, -7.73681640625, -7.458984375, -7.18115234375, -6.9033203125, -6.62548828125, -6.34765625, -6.06982421875, -5.7919921875, -5.51416015625, -5.236328125, -4.95849609375, -4.6806640625, -4.40283203125, -4.125, -3.84716796875, -3.5693359375, -3.29150390625, -3.013671875, -2.73583984375, -2.4580078125, -2.18017578125, -1.90234375, -1.62451171875, -1.3466796875, -1.06884765625, -0.791015625, -0.51318359375, -0.2353515625, 0.04248046875, 0.3203125, 0.59814453125, 0.8759765625, 1.15380859375, 1.431640625, 1.70947265625, 1.9873046875, 2.26513671875, 2.54296875, 2.82080078125, 3.0986328125, 3.37646484375, 3.654296875, 3.93212890625, 4.2099609375, 4.48779296875, 4.765625, 5.04345703125, 5.3212890625, 5.59912109375, 5.876953125, 6.15478515625, 6.4326171875, 6.71044921875, 6.98828125, 7.26611328125, 7.5439453125, 7.82177734375, 8.099609375, 8.37744140625, 8.6552734375, 8.93310546875, 9.2109375]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 8.0, 6.0, 5.0, 8.0, 9.0, 14.0, 14.0, 21.0, 21.0, 33.0, 28.0, 39.0, 51.0, 59.0, 62.0, 96.0, 210.0, 1604.0, 283.0, 101.0, 68.0, 57.0, 48.0, 36.0, 40.0, 21.0, 26.0, 21.0, 13.0, 13.0, 7.0, 11.0, 6.0, 8.0, 5.0, 1.0, 3.0, 0.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.625, -14.095458984375, -13.56591796875, -13.036376953125, -12.5068359375, -11.977294921875, -11.44775390625, -10.918212890625, -10.388671875, -9.859130859375, -9.32958984375, -8.800048828125, -8.2705078125, -7.740966796875, -7.21142578125, -6.681884765625, -6.15234375, -5.622802734375, -5.09326171875, -4.563720703125, -4.0341796875, -3.504638671875, -2.97509765625, -2.445556640625, -1.916015625, -1.386474609375, -0.85693359375, -0.327392578125, 0.2021484375, 0.731689453125, 1.26123046875, 1.790771484375, 2.3203125, 2.849853515625, 3.37939453125, 3.908935546875, 4.4384765625, 4.968017578125, 5.49755859375, 6.027099609375, 6.556640625, 7.086181640625, 7.61572265625, 8.145263671875, 8.6748046875, 9.204345703125, 9.73388671875, 10.263427734375, 10.79296875, 11.322509765625, 11.85205078125, 12.381591796875, 12.9111328125, 13.440673828125, 13.97021484375, 14.499755859375, 15.029296875, 15.558837890625, 16.08837890625, 16.617919921875, 17.1474609375, 17.677001953125, 18.20654296875, 18.736083984375, 19.265625]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 9.0, 6.0, 13.0, 10.0, 18.0, 21.0, 22.0, 21.0, 43.0, 38.0, 72.0, 113.0, 168.0, 272.0, 605.0, 2233.0, 190258.0, 2944859.0, 5146.0, 802.0, 330.0, 195.0, 123.0, 78.0, 55.0, 52.0, 31.0, 25.0, 23.0, 15.0, 9.0, 6.0, 17.0, 3.0, 8.0, 0.0, 3.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-42.03125, -40.869140625, -39.70703125, -38.544921875, -37.3828125, -36.220703125, -35.05859375, -33.896484375, -32.734375, -31.572265625, -30.41015625, -29.248046875, -28.0859375, -26.923828125, -25.76171875, -24.599609375, -23.4375, -22.275390625, -21.11328125, -19.951171875, -18.7890625, -17.626953125, -16.46484375, -15.302734375, -14.140625, -12.978515625, -11.81640625, -10.654296875, -9.4921875, -8.330078125, -7.16796875, -6.005859375, -4.84375, -3.681640625, -2.51953125, -1.357421875, -0.1953125, 0.966796875, 2.12890625, 3.291015625, 4.453125, 5.615234375, 6.77734375, 7.939453125, 9.1015625, 10.263671875, 11.42578125, 12.587890625, 13.75, 14.912109375, 16.07421875, 17.236328125, 18.3984375, 19.560546875, 20.72265625, 21.884765625, 23.046875, 24.208984375, 25.37109375, 26.533203125, 27.6953125, 28.857421875, 30.01953125, 31.181640625, 32.34375]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 62.0, 418.0, 488.0, 43.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.65626525878906, -89.3628158569336, -87.06936645507812, -84.77591705322266, -82.48246765136719, -80.18902587890625, -77.89557647705078, -75.60212707519531, -73.30867767333984, -71.01522827148438, -68.7217788696289, -66.42832946777344, -64.1348876953125, -61.841434478759766, -59.54798889160156, -57.254539489746094, -54.961090087890625, -52.667640686035156, -50.37419128417969, -48.080745697021484, -45.787296295166016, -43.49384689331055, -41.200401306152344, -38.906951904296875, -36.613502502441406, -34.32005310058594, -32.02660369873047, -29.733158111572266, -27.439708709716797, -25.146259307861328, -22.852811813354492, -20.559364318847656, -18.265911102294922, -15.97246265411377, -13.679014205932617, -11.385565757751465, -9.092117309570312, -6.79866886138916, -4.505220413208008, -2.211772918701172, 0.08167648315429688, 2.375124931335449, 4.668573379516602, 6.962021827697754, 9.255470275878906, 11.548918724060059, 13.842367172241211, 16.135814666748047, 18.429264068603516, 20.722713470458984, 23.01616096496582, 25.309608459472656, 27.603057861328125, 29.896507263183594, 32.18995666503906, 34.483402252197266, 36.776851654052734, 39.0703010559082, 41.363746643066406, 43.657196044921875, 45.950645446777344, 48.24409484863281, 50.53754425048828, 52.830989837646484, 55.12443923950195]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 2.0, 5.0, 6.0, 10.0, 10.0, 8.0, 10.0, 10.0, 9.0, 10.0, 18.0, 25.0, 27.0, 24.0, 35.0, 40.0, 32.0, 36.0, 34.0, 35.0, 39.0, 42.0, 48.0, 42.0, 38.0, 44.0, 35.0, 30.0, 32.0, 27.0, 37.0, 35.0, 29.0, 23.0, 22.0, 17.0, 12.0, 16.0, 7.0, 7.0, 11.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 6.0, 2.0, 2.0, 0.0, 2.0, 0.0, 2.0], "bins": [-32.701820373535156, -31.70050621032715, -30.69919204711914, -29.697877883911133, -28.696563720703125, -27.695249557495117, -26.69393539428711, -25.692623138427734, -24.691307067871094, -23.689992904663086, -22.688678741455078, -21.68736457824707, -20.686050415039062, -19.684736251831055, -18.683422088623047, -17.682109832763672, -16.680795669555664, -15.679481506347656, -14.678167343139648, -13.67685317993164, -12.675539016723633, -11.674224853515625, -10.672911643981934, -9.671597480773926, -8.670283317565918, -7.66896915435791, -6.667654991149902, -5.666341304779053, -4.665027141571045, -3.663712978363037, -2.6623992919921875, -1.6610851287841797, -0.6597709655761719, 0.3415430784225464, 1.3428571224212646, 2.3441710472106934, 3.345485210418701, 4.346799373626709, 5.348113059997559, 6.349427223205566, 7.350741386413574, 8.352055549621582, 9.35336971282959, 10.354682922363281, 11.355997085571289, 12.357311248779297, 13.358625411987305, 14.359939575195312, 15.36125373840332, 16.362567901611328, 17.363882064819336, 18.365196228027344, 19.36651039123535, 20.36782455444336, 21.369136810302734, 22.370452880859375, 23.37176513671875, 24.373079299926758, 25.374393463134766, 26.375707626342773, 27.37702178955078, 28.37833595275879, 29.379650115966797, 30.380962371826172, 31.382278442382812]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 5.0, 7.0, 3.0, 4.0, 8.0, 9.0, 19.0, 15.0, 24.0, 20.0, 26.0, 19.0, 32.0, 30.0, 38.0, 28.0, 44.0, 36.0, 44.0, 40.0, 56.0, 41.0, 48.0, 49.0, 33.0, 37.0, 30.0, 39.0, 26.0, 27.0, 27.0, 27.0, 20.0, 19.0, 16.0, 12.0, 8.0, 6.0, 9.0, 11.0, 2.0, 1.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.75390625, -4.604736328125, -4.45556640625, -4.306396484375, -4.1572265625, -4.008056640625, -3.85888671875, -3.709716796875, -3.560546875, -3.411376953125, -3.26220703125, -3.113037109375, -2.9638671875, -2.814697265625, -2.66552734375, -2.516357421875, -2.3671875, -2.218017578125, -2.06884765625, -1.919677734375, -1.7705078125, -1.621337890625, -1.47216796875, -1.322998046875, -1.173828125, -1.024658203125, -0.87548828125, -0.726318359375, -0.5771484375, -0.427978515625, -0.27880859375, -0.129638671875, 0.01953125, 0.168701171875, 0.31787109375, 0.467041015625, 0.6162109375, 0.765380859375, 0.91455078125, 1.063720703125, 1.212890625, 1.362060546875, 1.51123046875, 1.660400390625, 1.8095703125, 1.958740234375, 2.10791015625, 2.257080078125, 2.40625, 2.555419921875, 2.70458984375, 2.853759765625, 3.0029296875, 3.152099609375, 3.30126953125, 3.450439453125, 3.599609375, 3.748779296875, 3.89794921875, 4.047119140625, 4.1962890625, 4.345458984375, 4.49462890625, 4.643798828125, 4.79296875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 1.0, 0.0, 5.0, 8.0, 4.0, 6.0, 12.0, 17.0, 19.0, 20.0, 30.0, 44.0, 49.0, 63.0, 78.0, 118.0, 220.0, 534.0, 1594.0, 10345.0, 230803.0, 2724111.0, 1171843.0, 48803.0, 3809.0, 884.0, 324.0, 152.0, 86.0, 55.0, 50.0, 45.0, 28.0, 28.0, 23.0, 11.0, 14.0, 13.0, 5.0, 11.0, 4.0, 6.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.59375, -11.228759765625, -10.86376953125, -10.498779296875, -10.1337890625, -9.768798828125, -9.40380859375, -9.038818359375, -8.673828125, -8.308837890625, -7.94384765625, -7.578857421875, -7.2138671875, -6.848876953125, -6.48388671875, -6.118896484375, -5.75390625, -5.388916015625, -5.02392578125, -4.658935546875, -4.2939453125, -3.928955078125, -3.56396484375, -3.198974609375, -2.833984375, -2.468994140625, -2.10400390625, -1.739013671875, -1.3740234375, -1.009033203125, -0.64404296875, -0.279052734375, 0.0859375, 0.450927734375, 0.81591796875, 1.180908203125, 1.5458984375, 1.910888671875, 2.27587890625, 2.640869140625, 3.005859375, 3.370849609375, 3.73583984375, 4.100830078125, 4.4658203125, 4.830810546875, 5.19580078125, 5.560791015625, 5.92578125, 6.290771484375, 6.65576171875, 7.020751953125, 7.3857421875, 7.750732421875, 8.11572265625, 8.480712890625, 8.845703125, 9.210693359375, 9.57568359375, 9.940673828125, 10.3056640625, 10.670654296875, 11.03564453125, 11.400634765625, 11.765625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 3.0, 6.0, 5.0, 10.0, 10.0, 10.0, 24.0, 19.0, 35.0, 37.0, 38.0, 71.0, 82.0, 105.0, 166.0, 191.0, 242.0, 330.0, 397.0, 387.0, 381.0, 340.0, 287.0, 211.0, 180.0, 147.0, 87.0, 69.0, 49.0, 36.0, 31.0, 23.0, 16.0, 15.0, 9.0, 2.0, 10.0, 6.0, 0.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.23046875, -5.04833984375, -4.8662109375, -4.68408203125, -4.501953125, -4.31982421875, -4.1376953125, -3.95556640625, -3.7734375, -3.59130859375, -3.4091796875, -3.22705078125, -3.044921875, -2.86279296875, -2.6806640625, -2.49853515625, -2.31640625, -2.13427734375, -1.9521484375, -1.77001953125, -1.587890625, -1.40576171875, -1.2236328125, -1.04150390625, -0.859375, -0.67724609375, -0.4951171875, -0.31298828125, -0.130859375, 0.05126953125, 0.2333984375, 0.41552734375, 0.59765625, 0.77978515625, 0.9619140625, 1.14404296875, 1.326171875, 1.50830078125, 1.6904296875, 1.87255859375, 2.0546875, 2.23681640625, 2.4189453125, 2.60107421875, 2.783203125, 2.96533203125, 3.1474609375, 3.32958984375, 3.51171875, 3.69384765625, 3.8759765625, 4.05810546875, 4.240234375, 4.42236328125, 4.6044921875, 4.78662109375, 4.96875, 5.15087890625, 5.3330078125, 5.51513671875, 5.697265625, 5.87939453125, 6.0615234375, 6.24365234375, 6.42578125]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 11.0, 10.0, 13.0, 16.0, 28.0, 32.0, 48.0, 81.0, 106.0, 160.0, 189.0, 284.0, 563.0, 1087.0, 5314.0, 101321.0, 3512517.0, 554683.0, 14063.0, 1894.0, 630.0, 351.0, 231.0, 153.0, 131.0, 88.0, 68.0, 55.0, 56.0, 28.0, 19.0, 16.0, 7.0, 9.0, 8.0, 4.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.375, -16.7900390625, -16.205078125, -15.6201171875, -15.03515625, -14.4501953125, -13.865234375, -13.2802734375, -12.6953125, -12.1103515625, -11.525390625, -10.9404296875, -10.35546875, -9.7705078125, -9.185546875, -8.6005859375, -8.015625, -7.4306640625, -6.845703125, -6.2607421875, -5.67578125, -5.0908203125, -4.505859375, -3.9208984375, -3.3359375, -2.7509765625, -2.166015625, -1.5810546875, -0.99609375, -0.4111328125, 0.173828125, 0.7587890625, 1.34375, 1.9287109375, 2.513671875, 3.0986328125, 3.68359375, 4.2685546875, 4.853515625, 5.4384765625, 6.0234375, 6.6083984375, 7.193359375, 7.7783203125, 8.36328125, 8.9482421875, 9.533203125, 10.1181640625, 10.703125, 11.2880859375, 11.873046875, 12.4580078125, 13.04296875, 13.6279296875, 14.212890625, 14.7978515625, 15.3828125, 15.9677734375, 16.552734375, 17.1376953125, 17.72265625, 18.3076171875, 18.892578125, 19.4775390625, 20.0625]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 9.0, 40.0, 160.0, 348.0, 318.0, 111.0, 25.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.79484558105469, -89.43700408935547, -87.07916259765625, -84.72132110595703, -82.36347961425781, -80.0056381225586, -77.64779663085938, -75.28994750976562, -72.93211364746094, -70.57427215576172, -68.2164306640625, -65.85858917236328, -63.50074768066406, -61.142906188964844, -58.78506088256836, -56.42721939086914, -54.069374084472656, -51.71153259277344, -49.35369110107422, -46.995849609375, -44.63800811767578, -42.28016662597656, -39.92232131958008, -37.56447982788086, -35.20663833618164, -32.84879684448242, -30.490955352783203, -28.13311195373535, -25.775270462036133, -23.417428970336914, -21.059585571289062, -18.701744079589844, -16.34389877319336, -13.98605728149414, -11.628214836120605, -9.27037239074707, -6.912530899047852, -4.554689407348633, -2.1968469619750977, 0.1609954833984375, 2.5188369750976562, 4.876678943634033, 7.23452091217041, 9.592363357543945, 11.950204849243164, 14.308046340942383, 16.665889739990234, 19.023731231689453, 21.381572723388672, 23.73941421508789, 26.09725570678711, 28.45509910583496, 30.81294059753418, 33.17078399658203, 35.52862548828125, 37.88646697998047, 40.24430847167969, 42.602149963378906, 44.959991455078125, 47.317832946777344, 49.67567443847656, 52.03351593017578, 54.391361236572266, 56.749202728271484, 59.1070442199707]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 4.0, 5.0, 8.0, 8.0, 13.0, 10.0, 13.0, 18.0, 22.0, 22.0, 23.0, 21.0, 33.0, 36.0, 34.0, 42.0, 40.0, 36.0, 52.0, 35.0, 34.0, 36.0, 46.0, 35.0, 42.0, 40.0, 44.0, 31.0, 25.0, 37.0, 24.0, 20.0, 23.0, 19.0, 12.0, 18.0, 16.0, 7.0, 6.0, 2.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.652366638183594, -17.94457244873047, -17.236778259277344, -16.52898406982422, -15.821189880371094, -15.113395690917969, -14.405601501464844, -13.697807312011719, -12.990013122558594, -12.282218933105469, -11.574424743652344, -10.866630554199219, -10.158836364746094, -9.451042175292969, -8.743247985839844, -8.035453796386719, -7.327659606933594, -6.619865417480469, -5.912071228027344, -5.204277038574219, -4.496482849121094, -3.7886886596679688, -3.0808944702148438, -2.3731002807617188, -1.6653060913085938, -0.9575119018554688, -0.24971771240234375, 0.45807647705078125, 1.1658706665039062, 1.8736648559570312, 2.5814590454101562, 3.2892532348632812, 3.9970455169677734, 4.704839706420898, 5.412633895874023, 6.120428085327148, 6.828222274780273, 7.536016464233398, 8.243810653686523, 8.951604843139648, 9.659399032592773, 10.367193222045898, 11.074987411499023, 11.782781600952148, 12.490575790405273, 13.198369979858398, 13.906164169311523, 14.613958358764648, 15.321752548217773, 16.0295467376709, 16.737340927124023, 17.44513511657715, 18.152929306030273, 18.8607234954834, 19.568517684936523, 20.27631187438965, 20.984106063842773, 21.6919002532959, 22.399694442749023, 23.10748863220215, 23.815282821655273, 24.5230770111084, 25.230871200561523, 25.93866539001465, 26.646459579467773]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 8.0, 3.0, 6.0, 4.0, 4.0, 10.0, 7.0, 13.0, 12.0, 17.0, 16.0, 25.0, 23.0, 23.0, 35.0, 28.0, 27.0, 32.0, 36.0, 39.0, 32.0, 46.0, 43.0, 40.0, 43.0, 41.0, 37.0, 23.0, 31.0, 38.0, 29.0, 38.0, 23.0, 17.0, 22.0, 29.0, 17.0, 17.0, 16.0, 13.0, 16.0, 5.0, 6.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.787109375, -3.650115966796875, -3.51312255859375, -3.376129150390625, -3.2391357421875, -3.102142333984375, -2.96514892578125, -2.828155517578125, -2.691162109375, -2.554168701171875, -2.41717529296875, -2.280181884765625, -2.1431884765625, -2.006195068359375, -1.86920166015625, -1.732208251953125, -1.59521484375, -1.458221435546875, -1.32122802734375, -1.184234619140625, -1.0472412109375, -0.910247802734375, -0.77325439453125, -0.636260986328125, -0.499267578125, -0.362274169921875, -0.22528076171875, -0.088287353515625, 0.0487060546875, 0.185699462890625, 0.32269287109375, 0.459686279296875, 0.5966796875, 0.733673095703125, 0.87066650390625, 1.007659912109375, 1.1446533203125, 1.281646728515625, 1.41864013671875, 1.555633544921875, 1.692626953125, 1.829620361328125, 1.96661376953125, 2.103607177734375, 2.2406005859375, 2.377593994140625, 2.51458740234375, 2.651580810546875, 2.78857421875, 2.925567626953125, 3.06256103515625, 3.199554443359375, 3.3365478515625, 3.473541259765625, 3.61053466796875, 3.747528076171875, 3.884521484375, 4.021514892578125, 4.15850830078125, 4.295501708984375, 4.4324951171875, 4.569488525390625, 4.70648193359375, 4.843475341796875, 4.98046875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 6.0, 17.0, 26.0, 42.0, 48.0, 81.0, 88.0, 148.0, 231.0, 313.0, 416.0, 611.0, 871.0, 1258.0, 1749.0, 2550.0, 3635.0, 5400.0, 7855.0, 11481.0, 17111.0, 26460.0, 40887.0, 64535.0, 103669.0, 162302.0, 200444.0, 143115.0, 90157.0, 55920.0, 35791.0, 23174.0, 15211.0, 10412.0, 6986.0, 4730.0, 3159.0, 2412.0, 1549.0, 1116.0, 783.0, 559.0, 396.0, 266.0, 179.0, 127.0, 96.0, 57.0, 42.0, 36.0, 14.0, 15.0, 8.0, 8.0, 1.0, 5.0, 2.0, 2.0], "bins": [-0.462158203125, -0.4478721618652344, -0.43358612060546875, -0.4193000793457031, -0.4050140380859375, -0.3907279968261719, -0.37644195556640625, -0.3621559143066406, -0.347869873046875, -0.3335838317871094, -0.31929779052734375, -0.3050117492675781, -0.2907257080078125, -0.2764396667480469, -0.26215362548828125, -0.24786758422851562, -0.23358154296875, -0.21929550170898438, -0.20500946044921875, -0.19072341918945312, -0.1764373779296875, -0.16215133666992188, -0.14786529541015625, -0.13357925415039062, -0.119293212890625, -0.10500717163085938, -0.09072113037109375, -0.07643508911132812, -0.0621490478515625, -0.047863006591796875, -0.03357696533203125, -0.019290924072265625, -0.0050048828125, 0.009281158447265625, 0.02356719970703125, 0.037853240966796875, 0.0521392822265625, 0.06642532348632812, 0.08071136474609375, 0.09499740600585938, 0.109283447265625, 0.12356948852539062, 0.13785552978515625, 0.15214157104492188, 0.1664276123046875, 0.18071365356445312, 0.19499969482421875, 0.20928573608398438, 0.22357177734375, 0.23785781860351562, 0.25214385986328125, 0.2664299011230469, 0.2807159423828125, 0.2950019836425781, 0.30928802490234375, 0.3235740661621094, 0.337860107421875, 0.3521461486816406, 0.36643218994140625, 0.3807182312011719, 0.3950042724609375, 0.4092903137207031, 0.42357635498046875, 0.4378623962402344, 0.4521484375]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 8.0, 2.0, 2.0, 7.0, 8.0, 6.0, 9.0, 8.0, 11.0, 10.0, 11.0, 19.0, 19.0, 14.0, 22.0, 17.0, 23.0, 32.0, 35.0, 33.0, 34.0, 33.0, 32.0, 20.0, 34.0, 1069.0, 45.0, 43.0, 39.0, 41.0, 25.0, 36.0, 30.0, 21.0, 30.0, 32.0, 26.0, 28.0, 17.0, 22.0, 13.0, 11.0, 8.0, 13.0, 12.0, 5.0, 3.0, 2.0, 2.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-2.755859375, -2.674896240234375, -2.59393310546875, -2.512969970703125, -2.4320068359375, -2.351043701171875, -2.27008056640625, -2.189117431640625, -2.108154296875, -2.027191162109375, -1.94622802734375, -1.865264892578125, -1.7843017578125, -1.703338623046875, -1.62237548828125, -1.541412353515625, -1.46044921875, -1.379486083984375, -1.29852294921875, -1.217559814453125, -1.1365966796875, -1.055633544921875, -0.97467041015625, -0.893707275390625, -0.812744140625, -0.731781005859375, -0.65081787109375, -0.569854736328125, -0.4888916015625, -0.407928466796875, -0.32696533203125, -0.246002197265625, -0.1650390625, -0.084075927734375, -0.00311279296875, 0.077850341796875, 0.1588134765625, 0.239776611328125, 0.32073974609375, 0.401702880859375, 0.482666015625, 0.563629150390625, 0.64459228515625, 0.725555419921875, 0.8065185546875, 0.887481689453125, 0.96844482421875, 1.049407958984375, 1.13037109375, 1.211334228515625, 1.29229736328125, 1.373260498046875, 1.4542236328125, 1.535186767578125, 1.61614990234375, 1.697113037109375, 1.778076171875, 1.859039306640625, 1.94000244140625, 2.020965576171875, 2.1019287109375, 2.182891845703125, 2.26385498046875, 2.344818115234375, 2.42578125]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 1.0, 2.0, 8.0, 10.0, 16.0, 23.0, 30.0, 46.0, 56.0, 107.0, 152.0, 194.0, 323.0, 504.0, 755.0, 1104.0, 1753.0, 2623.0, 4003.0, 6377.0, 9976.0, 15784.0, 24430.0, 40115.0, 68573.0, 121816.0, 269323.0, 1203939.0, 133630.0, 74650.0, 43767.0, 26574.0, 16784.0, 10533.0, 6674.0, 4264.0, 2850.0, 1781.0, 1216.0, 750.0, 506.0, 349.0, 239.0, 181.0, 111.0, 75.0, 49.0, 30.0, 36.0, 14.0, 4.0, 12.0, 9.0, 5.0, 1.0, 3.0, 0.0, 2.0], "bins": [-0.470947265625, -0.4567108154296875, -0.442474365234375, -0.4282379150390625, -0.41400146484375, -0.3997650146484375, -0.385528564453125, -0.3712921142578125, -0.3570556640625, -0.3428192138671875, -0.328582763671875, -0.3143463134765625, -0.30010986328125, -0.2858734130859375, -0.271636962890625, -0.2574005126953125, -0.2431640625, -0.2289276123046875, -0.214691162109375, -0.2004547119140625, -0.18621826171875, -0.1719818115234375, -0.157745361328125, -0.1435089111328125, -0.1292724609375, -0.1150360107421875, -0.100799560546875, -0.0865631103515625, -0.07232666015625, -0.0580902099609375, -0.043853759765625, -0.0296173095703125, -0.015380859375, -0.0011444091796875, 0.013092041015625, 0.0273284912109375, 0.04156494140625, 0.0558013916015625, 0.070037841796875, 0.0842742919921875, 0.0985107421875, 0.1127471923828125, 0.126983642578125, 0.1412200927734375, 0.15545654296875, 0.1696929931640625, 0.183929443359375, 0.1981658935546875, 0.21240234375, 0.2266387939453125, 0.240875244140625, 0.2551116943359375, 0.26934814453125, 0.2835845947265625, 0.297821044921875, 0.3120574951171875, 0.3262939453125, 0.3405303955078125, 0.354766845703125, 0.3690032958984375, 0.38323974609375, 0.3974761962890625, 0.411712646484375, 0.4259490966796875, 0.440185546875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 7.0, 5.0, 2.0, 3.0, 7.0, 7.0, 7.0, 12.0, 11.0, 13.0, 13.0, 11.0, 15.0, 23.0, 26.0, 32.0, 37.0, 61.0, 66.0, 93.0, 85.0, 97.0, 70.0, 47.0, 36.0, 41.0, 29.0, 24.0, 16.0, 18.0, 19.0, 23.0, 15.0, 14.0, 2.0, 8.0, 3.0, 3.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004329681396484375, -0.004183948040008545, -0.004038214683532715, -0.0038924813270568848, -0.0037467479705810547, -0.0036010146141052246, -0.0034552812576293945, -0.0033095479011535645, -0.0031638145446777344, -0.0030180811882019043, -0.0028723478317260742, -0.002726614475250244, -0.002580881118774414, -0.002435147762298584, -0.002289414405822754, -0.002143681049346924, -0.0019979476928710938, -0.0018522143363952637, -0.0017064809799194336, -0.0015607476234436035, -0.0014150142669677734, -0.0012692809104919434, -0.0011235475540161133, -0.0009778141975402832, -0.0008320808410644531, -0.000686347484588623, -0.000540614128112793, -0.0003948807716369629, -0.0002491474151611328, -0.00010341405868530273, 4.2319297790527344e-05, 0.00018805265426635742, 0.0003337860107421875, 0.0004795193672180176, 0.0006252527236938477, 0.0007709860801696777, 0.0009167194366455078, 0.0010624527931213379, 0.001208186149597168, 0.001353919506072998, 0.0014996528625488281, 0.0016453862190246582, 0.0017911195755004883, 0.0019368529319763184, 0.0020825862884521484, 0.0022283196449279785, 0.0023740530014038086, 0.0025197863578796387, 0.0026655197143554688, 0.002811253070831299, 0.002956986427307129, 0.003102719783782959, 0.003248453140258789, 0.003394186496734619, 0.0035399198532104492, 0.0036856532096862793, 0.0038313865661621094, 0.0039771199226379395, 0.0041228532791137695, 0.0042685866355896, 0.00441431999206543, 0.00456005334854126, 0.00470578670501709, 0.00485152006149292, 0.00499725341796875]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 9.0, 5.0, 13.0, 16.0, 27.0, 27.0, 27.0, 45.0, 55.0, 68.0, 93.0, 105.0, 214.0, 423.0, 1445.0, 910039.0, 133873.0, 989.0, 375.0, 222.0, 116.0, 73.0, 57.0, 38.0, 34.0, 30.0, 22.0, 21.0, 17.0, 15.0, 13.0, 11.0, 5.0, 5.0, 4.0, 7.0, 4.0, 3.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.1065673828125, -0.10351371765136719, -0.10046005249023438, -0.09740638732910156, -0.09435272216796875, -0.09129905700683594, -0.08824539184570312, -0.08519172668457031, -0.0821380615234375, -0.07908439636230469, -0.07603073120117188, -0.07297706604003906, -0.06992340087890625, -0.06686973571777344, -0.06381607055664062, -0.06076240539550781, -0.057708740234375, -0.05465507507324219, -0.051601409912109375, -0.04854774475097656, -0.04549407958984375, -0.04244041442871094, -0.039386749267578125, -0.03633308410644531, -0.0332794189453125, -0.030225753784179688, -0.027172088623046875, -0.024118423461914062, -0.02106475830078125, -0.018011093139648438, -0.014957427978515625, -0.011903762817382812, -0.00885009765625, -0.0057964324951171875, -0.002742767333984375, 0.0003108978271484375, 0.00336456298828125, 0.0064182281494140625, 0.009471893310546875, 0.012525558471679688, 0.0155792236328125, 0.018632888793945312, 0.021686553955078125, 0.024740219116210938, 0.02779388427734375, 0.030847549438476562, 0.033901214599609375, 0.03695487976074219, 0.040008544921875, 0.04306221008300781, 0.046115875244140625, 0.04916954040527344, 0.05222320556640625, 0.05527687072753906, 0.058330535888671875, 0.06138420104980469, 0.0644378662109375, 0.06749153137207031, 0.07054519653320312, 0.07359886169433594, 0.07665252685546875, 0.07970619201660156, 0.08275985717773438, 0.08581352233886719, 0.0888671875]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 9.0, 184.0, 750.0, 71.0, 3.0], "bins": [-0.034013669937849045, -0.03345935791730881, -0.03290504217147827, -0.032350730150938034, -0.0317964144051075, -0.03124210238456726, -0.030687788501381874, -0.030133474618196487, -0.0295791607350111, -0.029024846851825714, -0.028470532968640327, -0.02791621908545494, -0.027361907064914703, -0.026807593181729317, -0.02625327929854393, -0.025698965415358543, -0.025144651532173157, -0.02459033764898777, -0.024036023765802383, -0.023481709882616997, -0.02292739599943161, -0.022373083978891373, -0.021818770095705986, -0.0212644562125206, -0.020710142329335213, -0.020155828446149826, -0.01960151456296444, -0.019047200679779053, -0.018492888659238815, -0.01793857477605343, -0.017384260892868042, -0.016829947009682655, -0.01627563126385212, -0.015721317380666733, -0.015167003497481346, -0.014612690545618534, -0.014058376662433147, -0.01350406277924776, -0.012949749827384949, -0.012395435944199562, -0.011841122061014175, -0.011286808177828789, -0.010732494294643402, -0.01017818134278059, -0.009623867459595203, -0.009069553576409817, -0.008515240624547005, -0.007960926741361618, -0.007406613323837519, -0.006852299906313419, -0.006297986023128033, -0.005743672139942646, -0.005189358722418547, -0.004635045304894447, -0.004080731421709061, -0.0035264177713543177, -0.0029721041209995747, -0.0024177904706448317, -0.0018634768202900887, -0.0013091631699353456, -0.0007548495195806026, -0.00020053586922585964, 0.00035377778112888336, 0.0009080914314836264, 0.0014624050818383694]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 1.0, 2.0, 7.0, 6.0, 11.0, 8.0, 19.0, 12.0, 21.0, 30.0, 28.0, 30.0, 30.0, 40.0, 39.0, 55.0, 42.0, 45.0, 54.0, 47.0, 50.0, 43.0, 50.0, 48.0, 40.0, 39.0, 39.0, 22.0, 35.0, 24.0, 18.0, 20.0, 12.0, 9.0, 7.0, 8.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.003399789333343506, -0.0033113937824964523, -0.003222998231649399, -0.0031346026808023453, -0.0030462071299552917, -0.0029578115791082382, -0.0028694160282611847, -0.002781020477414131, -0.0026926249265670776, -0.002604229375720024, -0.0025158338248729706, -0.002427438274025917, -0.0023390427231788635, -0.00225064717233181, -0.0021622516214847565, -0.002073856070637703, -0.0019854605197906494, -0.0018970649689435959, -0.0018086694180965424, -0.0017202738672494888, -0.0016318783164024353, -0.0015434827655553818, -0.0014550872147083282, -0.0013666916638612747, -0.0012782961130142212, -0.0011899005621671677, -0.0011015050113201141, -0.0010131094604730606, -0.0009247139096260071, -0.0008363183587789536, -0.0007479228079319, -0.0006595272570848465, -0.000571131706237793, -0.00048273615539073944, -0.0003943406045436859, -0.0003059450536966324, -0.00021754950284957886, -0.00012915395200252533, -4.07584011554718e-05, 4.7637149691581726e-05, 0.00013603270053863525, 0.00022442825138568878, 0.0003128238022327423, 0.00040121935307979584, 0.0004896149039268494, 0.0005780104547739029, 0.0006664060056209564, 0.00075480155646801, 0.0008431971073150635, 0.000931592658162117, 0.0010199882090091705, 0.001108383759856224, 0.0011967793107032776, 0.0012851748615503311, 0.0013735704123973846, 0.0014619659632444382, 0.0015503615140914917, 0.0016387570649385452, 0.0017271526157855988, 0.0018155481666326523, 0.0019039437174797058, 0.0019923392683267593, 0.002080734819173813, 0.0021691303700208664, 0.00225752592086792]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 8.0, 3.0, 6.0, 4.0, 4.0, 10.0, 7.0, 13.0, 12.0, 17.0, 16.0, 25.0, 23.0, 23.0, 35.0, 28.0, 27.0, 32.0, 36.0, 39.0, 32.0, 46.0, 43.0, 40.0, 43.0, 41.0, 37.0, 23.0, 31.0, 38.0, 29.0, 38.0, 23.0, 17.0, 22.0, 29.0, 17.0, 17.0, 16.0, 13.0, 16.0, 5.0, 6.0, 5.0, 4.0, 6.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.787109375, -3.650115966796875, -3.51312255859375, -3.376129150390625, -3.2391357421875, -3.102142333984375, -2.96514892578125, -2.828155517578125, -2.691162109375, -2.554168701171875, -2.41717529296875, -2.280181884765625, -2.1431884765625, -2.006195068359375, -1.86920166015625, -1.732208251953125, -1.59521484375, -1.458221435546875, -1.32122802734375, -1.184234619140625, -1.0472412109375, -0.910247802734375, -0.77325439453125, -0.636260986328125, -0.499267578125, -0.362274169921875, -0.22528076171875, -0.088287353515625, 0.0487060546875, 0.185699462890625, 0.32269287109375, 0.459686279296875, 0.5966796875, 0.733673095703125, 0.87066650390625, 1.007659912109375, 1.1446533203125, 1.281646728515625, 1.41864013671875, 1.555633544921875, 1.692626953125, 1.829620361328125, 1.96661376953125, 2.103607177734375, 2.2406005859375, 2.377593994140625, 2.51458740234375, 2.651580810546875, 2.78857421875, 2.925567626953125, 3.06256103515625, 3.199554443359375, 3.3365478515625, 3.473541259765625, 3.61053466796875, 3.747528076171875, 3.884521484375, 4.021514892578125, 4.15850830078125, 4.295501708984375, 4.4324951171875, 4.569488525390625, 4.70648193359375, 4.843475341796875, 4.98046875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 5.0, 6.0, 6.0, 7.0, 6.0, 20.0, 11.0, 29.0, 34.0, 41.0, 51.0, 83.0, 112.0, 134.0, 176.0, 281.0, 339.0, 512.0, 684.0, 1274.0, 3906.0, 15743.0, 88408.0, 756704.0, 148176.0, 22226.0, 5238.0, 1643.0, 784.0, 506.0, 338.0, 270.0, 208.0, 130.0, 120.0, 107.0, 57.0, 44.0, 43.0, 20.0, 19.0, 19.0, 7.0, 9.0, 6.0, 10.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.4921875, -9.1484375, -8.8046875, -8.4609375, -8.1171875, -7.7734375, -7.4296875, -7.0859375, -6.7421875, -6.3984375, -6.0546875, -5.7109375, -5.3671875, -5.0234375, -4.6796875, -4.3359375, -3.9921875, -3.6484375, -3.3046875, -2.9609375, -2.6171875, -2.2734375, -1.9296875, -1.5859375, -1.2421875, -0.8984375, -0.5546875, -0.2109375, 0.1328125, 0.4765625, 0.8203125, 1.1640625, 1.5078125, 1.8515625, 2.1953125, 2.5390625, 2.8828125, 3.2265625, 3.5703125, 3.9140625, 4.2578125, 4.6015625, 4.9453125, 5.2890625, 5.6328125, 5.9765625, 6.3203125, 6.6640625, 7.0078125, 7.3515625, 7.6953125, 8.0390625, 8.3828125, 8.7265625, 9.0703125, 9.4140625, 9.7578125, 10.1015625, 10.4453125, 10.7890625, 11.1328125, 11.4765625, 11.8203125, 12.1640625, 12.5078125]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 6.0, 4.0, 6.0, 5.0, 16.0, 8.0, 13.0, 15.0, 23.0, 15.0, 19.0, 36.0, 37.0, 45.0, 67.0, 62.0, 78.0, 163.0, 1674.0, 289.0, 59.0, 63.0, 58.0, 34.0, 46.0, 35.0, 33.0, 31.0, 18.0, 21.0, 18.0, 12.0, 16.0, 6.0, 9.0, 5.0, 3.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 5.0, 0.0, 0.0, 1.0], "bins": [-17.59375, -17.0867919921875, -16.579833984375, -16.0728759765625, -15.56591796875, -15.0589599609375, -14.552001953125, -14.0450439453125, -13.5380859375, -13.0311279296875, -12.524169921875, -12.0172119140625, -11.51025390625, -11.0032958984375, -10.496337890625, -9.9893798828125, -9.482421875, -8.9754638671875, -8.468505859375, -7.9615478515625, -7.45458984375, -6.9476318359375, -6.440673828125, -5.9337158203125, -5.4267578125, -4.9197998046875, -4.412841796875, -3.9058837890625, -3.39892578125, -2.8919677734375, -2.385009765625, -1.8780517578125, -1.37109375, -0.8641357421875, -0.357177734375, 0.1497802734375, 0.65673828125, 1.1636962890625, 1.670654296875, 2.1776123046875, 2.6845703125, 3.1915283203125, 3.698486328125, 4.2054443359375, 4.71240234375, 5.2193603515625, 5.726318359375, 6.2332763671875, 6.740234375, 7.2471923828125, 7.754150390625, 8.2611083984375, 8.76806640625, 9.2750244140625, 9.781982421875, 10.2889404296875, 10.7958984375, 11.3028564453125, 11.809814453125, 12.3167724609375, 12.82373046875, 13.3306884765625, 13.837646484375, 14.3446044921875, 14.8515625]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 1.0, 5.0, 7.0, 4.0, 12.0, 18.0, 40.0, 46.0, 64.0, 111.0, 222.0, 462.0, 4180.0, 3122944.0, 16163.0, 850.0, 229.0, 117.0, 89.0, 54.0, 34.0, 21.0, 16.0, 8.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.6875, -79.8037109375, -76.919921875, -74.0361328125, -71.15234375, -68.2685546875, -65.384765625, -62.5009765625, -59.6171875, -56.7333984375, -53.849609375, -50.9658203125, -48.08203125, -45.1982421875, -42.314453125, -39.4306640625, -36.546875, -33.6630859375, -30.779296875, -27.8955078125, -25.01171875, -22.1279296875, -19.244140625, -16.3603515625, -13.4765625, -10.5927734375, -7.708984375, -4.8251953125, -1.94140625, 0.9423828125, 3.826171875, 6.7099609375, 9.59375, 12.4775390625, 15.361328125, 18.2451171875, 21.12890625, 24.0126953125, 26.896484375, 29.7802734375, 32.6640625, 35.5478515625, 38.431640625, 41.3154296875, 44.19921875, 47.0830078125, 49.966796875, 52.8505859375, 55.734375, 58.6181640625, 61.501953125, 64.3857421875, 67.26953125, 70.1533203125, 73.037109375, 75.9208984375, 78.8046875, 81.6884765625, 84.572265625, 87.4560546875, 90.33984375, 93.2236328125, 96.107421875, 98.9912109375, 101.875]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 309.0, 691.0, 14.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.21897888183594, -62.62183380126953, -57.024688720703125, -51.427547454833984, -45.83040237426758, -40.23325729370117, -34.63611602783203, -29.038970947265625, -23.44182586669922, -17.844680786132812, -12.247537612915039, -6.650394439697266, -1.0532493591308594, 4.543895721435547, 10.141036987304688, 15.738182067871094, 21.3353271484375, 26.932472229003906, 32.52961730957031, 38.12675857543945, 43.72390365600586, 49.321048736572266, 54.918190002441406, 60.51533508300781, 66.11248016357422, 71.70962524414062, 77.30677032470703, 82.90391540527344, 88.50105285644531, 94.09820556640625, 99.69534301757812, 105.29248809814453, 110.8896484375, 116.4867935180664, 122.08393859863281, 127.68107604980469, 133.27822875976562, 138.8753662109375, 144.47250366210938, 150.0696563720703, 155.66680908203125, 161.26394653320312, 166.86109924316406, 172.45823669433594, 178.05538940429688, 183.65252685546875, 189.24966430664062, 194.84681701660156, 200.44395446777344, 206.0410919189453, 211.63824462890625, 217.23538208007812, 222.83253479003906, 228.42967224121094, 234.02682495117188, 239.62396240234375, 245.22109985351562, 250.8182373046875, 256.4153747558594, 262.0125427246094, 267.60968017578125, 273.2068176269531, 278.803955078125, 284.401123046875, 289.9982604980469]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 9.0, 5.0, 11.0, 11.0, 13.0, 13.0, 17.0, 17.0, 21.0, 21.0, 20.0, 32.0, 34.0, 42.0, 34.0, 34.0, 44.0, 37.0, 35.0, 36.0, 39.0, 39.0, 39.0, 41.0, 36.0, 31.0, 36.0, 42.0, 33.0, 25.0, 29.0, 15.0, 15.0, 16.0, 18.0, 11.0, 8.0, 8.0, 8.0, 8.0, 3.0, 1.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-33.516639709472656, -32.56614685058594, -31.615650177001953, -30.665157318115234, -29.714662551879883, -28.76416778564453, -27.81367301940918, -26.863178253173828, -25.912683486938477, -24.962188720703125, -24.011693954467773, -23.061199188232422, -22.110706329345703, -21.16021156311035, -20.209716796875, -19.25922203063965, -18.308727264404297, -17.358232498168945, -16.407737731933594, -15.457243919372559, -14.506749153137207, -13.556255340576172, -12.60576057434082, -11.655265808105469, -10.70477294921875, -9.754278182983398, -8.803784370422363, -7.853289604187012, -6.90279483795166, -5.952300548553467, -5.001806259155273, -4.051311492919922, -3.1008167266845703, -2.150322198867798, -1.199827790260315, -0.24933338165283203, 0.7011611461639404, 1.651655673980713, 2.6021499633789062, 3.552644729614258, 4.503139019012451, 5.4536333084106445, 6.404128074645996, 7.3546223640441895, 8.305116653442383, 9.255611419677734, 10.206106185913086, 11.156600952148438, 12.107094764709473, 13.057589530944824, 14.00808334350586, 14.958578109741211, 15.909072875976562, 16.859567642211914, 17.810062408447266, 18.760555267333984, 19.711050033569336, 20.661544799804688, 21.61203956604004, 22.56253433227539, 23.51302719116211, 24.46352195739746, 25.414016723632812, 26.364511489868164, 27.315006256103516]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 3.0, 7.0, 9.0, 3.0, 6.0, 10.0, 10.0, 16.0, 22.0, 18.0, 19.0, 24.0, 23.0, 36.0, 32.0, 36.0, 43.0, 36.0, 34.0, 35.0, 50.0, 46.0, 29.0, 47.0, 35.0, 39.0, 39.0, 24.0, 38.0, 31.0, 29.0, 20.0, 27.0, 21.0, 19.0, 10.0, 13.0, 18.0, 11.0, 8.0, 9.0, 5.0, 8.0, 3.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.814453125, -3.667877197265625, -3.52130126953125, -3.374725341796875, -3.2281494140625, -3.081573486328125, -2.93499755859375, -2.788421630859375, -2.641845703125, -2.495269775390625, -2.34869384765625, -2.202117919921875, -2.0555419921875, -1.908966064453125, -1.76239013671875, -1.615814208984375, -1.46923828125, -1.322662353515625, -1.17608642578125, -1.029510498046875, -0.8829345703125, -0.736358642578125, -0.58978271484375, -0.443206787109375, -0.296630859375, -0.150054931640625, -0.00347900390625, 0.143096923828125, 0.2896728515625, 0.436248779296875, 0.58282470703125, 0.729400634765625, 0.8759765625, 1.022552490234375, 1.16912841796875, 1.315704345703125, 1.4622802734375, 1.608856201171875, 1.75543212890625, 1.902008056640625, 2.048583984375, 2.195159912109375, 2.34173583984375, 2.488311767578125, 2.6348876953125, 2.781463623046875, 2.92803955078125, 3.074615478515625, 3.22119140625, 3.367767333984375, 3.51434326171875, 3.660919189453125, 3.8074951171875, 3.954071044921875, 4.10064697265625, 4.247222900390625, 4.393798828125, 4.540374755859375, 4.68695068359375, 4.833526611328125, 4.9801025390625, 5.126678466796875, 5.27325439453125, 5.419830322265625, 5.56640625]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 7.0, 5.0, 7.0, 7.0, 9.0, 18.0, 19.0, 23.0, 32.0, 53.0, 49.0, 67.0, 82.0, 127.0, 136.0, 187.0, 306.0, 522.0, 1098.0, 3426.0, 17321.0, 145768.0, 1098626.0, 2225060.0, 621279.0, 66701.0, 8885.0, 2118.0, 876.0, 437.0, 285.0, 179.0, 121.0, 85.0, 74.0, 67.0, 39.0, 41.0, 38.0, 33.0, 12.0, 20.0, 13.0, 16.0, 2.0, 3.0, 5.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.16796875, -6.92364501953125, -6.6793212890625, -6.43499755859375, -6.190673828125, -5.94635009765625, -5.7020263671875, -5.45770263671875, -5.21337890625, -4.96905517578125, -4.7247314453125, -4.48040771484375, -4.236083984375, -3.99176025390625, -3.7474365234375, -3.50311279296875, -3.2587890625, -3.01446533203125, -2.7701416015625, -2.52581787109375, -2.281494140625, -2.03717041015625, -1.7928466796875, -1.54852294921875, -1.30419921875, -1.05987548828125, -0.8155517578125, -0.57122802734375, -0.326904296875, -0.08258056640625, 0.1617431640625, 0.40606689453125, 0.650390625, 0.89471435546875, 1.1390380859375, 1.38336181640625, 1.627685546875, 1.87200927734375, 2.1163330078125, 2.36065673828125, 2.60498046875, 2.84930419921875, 3.0936279296875, 3.33795166015625, 3.582275390625, 3.82659912109375, 4.0709228515625, 4.31524658203125, 4.5595703125, 4.80389404296875, 5.0482177734375, 5.29254150390625, 5.536865234375, 5.78118896484375, 6.0255126953125, 6.26983642578125, 6.51416015625, 6.75848388671875, 7.0028076171875, 7.24713134765625, 7.491455078125, 7.73577880859375, 7.9801025390625, 8.22442626953125, 8.46875]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 9.0, 14.0, 19.0, 37.0, 49.0, 71.0, 85.0, 151.0, 246.0, 354.0, 515.0, 592.0, 559.0, 401.0, 301.0, 226.0, 140.0, 101.0, 59.0, 38.0, 36.0, 20.0, 15.0, 8.0, 5.0, 3.0, 5.0, 3.0, 3.0, 0.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.30859375, -5.05242919921875, -4.7962646484375, -4.54010009765625, -4.283935546875, -4.02777099609375, -3.7716064453125, -3.51544189453125, -3.25927734375, -3.00311279296875, -2.7469482421875, -2.49078369140625, -2.234619140625, -1.97845458984375, -1.7222900390625, -1.46612548828125, -1.2099609375, -0.95379638671875, -0.6976318359375, -0.44146728515625, -0.185302734375, 0.07086181640625, 0.3270263671875, 0.58319091796875, 0.83935546875, 1.09552001953125, 1.3516845703125, 1.60784912109375, 1.864013671875, 2.12017822265625, 2.3763427734375, 2.63250732421875, 2.888671875, 3.14483642578125, 3.4010009765625, 3.65716552734375, 3.913330078125, 4.16949462890625, 4.4256591796875, 4.68182373046875, 4.93798828125, 5.19415283203125, 5.4503173828125, 5.70648193359375, 5.962646484375, 6.21881103515625, 6.4749755859375, 6.73114013671875, 6.9873046875, 7.24346923828125, 7.4996337890625, 7.75579833984375, 8.011962890625, 8.26812744140625, 8.5242919921875, 8.78045654296875, 9.03662109375, 9.29278564453125, 9.5489501953125, 9.80511474609375, 10.061279296875, 10.31744384765625, 10.5736083984375, 10.82977294921875, 11.0859375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 9.0, 4.0, 12.0, 17.0, 27.0, 54.0, 68.0, 107.0, 161.0, 295.0, 485.0, 1097.0, 4856.0, 161633.0, 3886289.0, 132291.0, 4640.0, 1050.0, 457.0, 237.0, 171.0, 112.0, 83.0, 35.0, 32.0, 17.0, 16.0, 12.0, 6.0, 6.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.375, -22.6552734375, -21.935546875, -21.2158203125, -20.49609375, -19.7763671875, -19.056640625, -18.3369140625, -17.6171875, -16.8974609375, -16.177734375, -15.4580078125, -14.73828125, -14.0185546875, -13.298828125, -12.5791015625, -11.859375, -11.1396484375, -10.419921875, -9.7001953125, -8.98046875, -8.2607421875, -7.541015625, -6.8212890625, -6.1015625, -5.3818359375, -4.662109375, -3.9423828125, -3.22265625, -2.5029296875, -1.783203125, -1.0634765625, -0.34375, 0.3759765625, 1.095703125, 1.8154296875, 2.53515625, 3.2548828125, 3.974609375, 4.6943359375, 5.4140625, 6.1337890625, 6.853515625, 7.5732421875, 8.29296875, 9.0126953125, 9.732421875, 10.4521484375, 11.171875, 11.8916015625, 12.611328125, 13.3310546875, 14.05078125, 14.7705078125, 15.490234375, 16.2099609375, 16.9296875, 17.6494140625, 18.369140625, 19.0888671875, 19.80859375, 20.5283203125, 21.248046875, 21.9677734375, 22.6875]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 8.0, 555.0, 452.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.07829284667969, -41.98406982421875, -34.88984680175781, -27.79561996459961, -20.701396942138672, -13.607173919677734, -6.512947082519531, 0.5812759399414062, 7.675498962402344, 14.769722938537598, 21.86394691467285, 28.958171844482422, 36.05239486694336, 43.1466178894043, 50.2408447265625, 57.33506774902344, 64.42929077148438, 71.52351379394531, 78.61773681640625, 85.71195983886719, 92.80618286132812, 99.90040588378906, 106.99463653564453, 114.08885955810547, 121.1830825805664, 128.27731323242188, 135.3715362548828, 142.46575927734375, 149.5599822998047, 156.65420532226562, 163.74842834472656, 170.8426513671875, 177.93685913085938, 185.0310821533203, 192.12530517578125, 199.2195281982422, 206.31375122070312, 213.40797424316406, 220.502197265625, 227.596435546875, 234.69064331054688, 241.7848663330078, 248.87908935546875, 255.9733123779297, 263.0675354003906, 270.1617736816406, 277.2559814453125, 284.3502197265625, 291.4444580078125, 298.5386962890625, 305.6329040527344, 312.7271423339844, 319.82135009765625, 326.91558837890625, 334.0097961425781, 341.1040344238281, 348.1982421875, 355.29248046875, 362.3866882324219, 369.4809265136719, 376.57513427734375, 383.66937255859375, 390.7635803222656, 397.8578186035156, 404.9520263671875]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 7.0, 2.0, 8.0, 10.0, 12.0, 9.0, 15.0, 17.0, 11.0, 22.0, 14.0, 29.0, 31.0, 27.0, 27.0, 36.0, 26.0, 23.0, 39.0, 30.0, 34.0, 45.0, 55.0, 44.0, 39.0, 30.0, 31.0, 35.0, 29.0, 29.0, 32.0, 24.0, 20.0, 24.0, 17.0, 21.0, 18.0, 9.0, 13.0, 7.0, 10.0, 12.0, 7.0, 6.0, 5.0, 4.0, 3.0, 2.0, 5.0], "bins": [-22.164546966552734, -21.55539321899414, -20.946239471435547, -20.337085723876953, -19.72793197631836, -19.118778228759766, -18.509624481201172, -17.900470733642578, -17.291316986083984, -16.68216323852539, -16.073009490966797, -15.463855743408203, -14.85470199584961, -14.245548248291016, -13.636393547058105, -13.027239799499512, -12.418085098266602, -11.808931350708008, -11.199777603149414, -10.59062385559082, -9.981470108032227, -9.372316360473633, -8.763161659240723, -8.154007911682129, -7.544854164123535, -6.935700416564941, -6.326546669006348, -5.717392444610596, -5.108238697052002, -4.499084949493408, -3.8899309635162354, -3.2807769775390625, -2.6716232299804688, -2.062469482421875, -1.4533154964447021, -0.8441616296768188, -0.23500776290893555, 0.3741459846496582, 0.983299970626831, 1.592453956604004, 2.2016077041625977, 2.8107614517211914, 3.4199154376983643, 4.029069423675537, 4.638223171234131, 5.247376918792725, 5.856531143188477, 6.46568489074707, 7.074838638305664, 7.683992385864258, 8.293146133422852, 8.902299880981445, 9.511453628540039, 10.120607376098633, 10.729762077331543, 11.338915824890137, 11.94806957244873, 12.557223320007324, 13.166377067565918, 13.775530815124512, 14.384685516357422, 14.993839263916016, 15.60299301147461, 16.212146759033203, 16.821300506591797]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 9.0, 13.0, 7.0, 15.0, 24.0, 16.0, 19.0, 16.0, 37.0, 24.0, 42.0, 35.0, 41.0, 30.0, 38.0, 35.0, 48.0, 50.0, 51.0, 51.0, 31.0, 52.0, 43.0, 39.0, 36.0, 26.0, 29.0, 24.0, 21.0, 18.0, 13.0, 11.0, 14.0, 8.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.88739013671875, -3.7357177734375, -3.58404541015625, -3.432373046875, -3.28070068359375, -3.1290283203125, -2.97735595703125, -2.82568359375, -2.67401123046875, -2.5223388671875, -2.37066650390625, -2.218994140625, -2.06732177734375, -1.9156494140625, -1.76397705078125, -1.6123046875, -1.46063232421875, -1.3089599609375, -1.15728759765625, -1.005615234375, -0.85394287109375, -0.7022705078125, -0.55059814453125, -0.39892578125, -0.24725341796875, -0.0955810546875, 0.05609130859375, 0.207763671875, 0.35943603515625, 0.5111083984375, 0.66278076171875, 0.814453125, 0.96612548828125, 1.1177978515625, 1.26947021484375, 1.421142578125, 1.57281494140625, 1.7244873046875, 1.87615966796875, 2.02783203125, 2.17950439453125, 2.3311767578125, 2.48284912109375, 2.634521484375, 2.78619384765625, 2.9378662109375, 3.08953857421875, 3.2412109375, 3.39288330078125, 3.5445556640625, 3.69622802734375, 3.847900390625, 3.99957275390625, 4.1512451171875, 4.30291748046875, 4.45458984375, 4.60626220703125, 4.7579345703125, 4.90960693359375, 5.061279296875, 5.21295166015625, 5.3646240234375, 5.51629638671875, 5.66796875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [4.0, 7.0, 7.0, 13.0, 9.0, 10.0, 18.0, 46.0, 51.0, 61.0, 91.0, 136.0, 195.0, 270.0, 375.0, 518.0, 737.0, 1061.0, 1542.0, 2013.0, 3007.0, 4234.0, 6105.0, 8795.0, 12972.0, 19313.0, 30099.0, 48016.0, 77739.0, 125786.0, 185842.0, 183640.0, 123241.0, 75747.0, 46609.0, 29405.0, 19296.0, 12654.0, 8720.0, 6098.0, 4145.0, 2913.0, 2052.0, 1481.0, 1014.0, 734.0, 513.0, 348.0, 271.0, 196.0, 121.0, 95.0, 65.0, 46.0, 33.0, 25.0, 16.0, 13.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.435791015625, -0.421722412109375, -0.40765380859375, -0.393585205078125, -0.3795166015625, -0.365447998046875, -0.35137939453125, -0.337310791015625, -0.3232421875, -0.309173583984375, -0.29510498046875, -0.281036376953125, -0.2669677734375, -0.252899169921875, -0.23883056640625, -0.224761962890625, -0.210693359375, -0.196624755859375, -0.18255615234375, -0.168487548828125, -0.1544189453125, -0.140350341796875, -0.12628173828125, -0.112213134765625, -0.09814453125, -0.084075927734375, -0.07000732421875, -0.055938720703125, -0.0418701171875, -0.027801513671875, -0.01373291015625, 0.000335693359375, 0.014404296875, 0.028472900390625, 0.04254150390625, 0.056610107421875, 0.0706787109375, 0.084747314453125, 0.09881591796875, 0.112884521484375, 0.126953125, 0.141021728515625, 0.15509033203125, 0.169158935546875, 0.1832275390625, 0.197296142578125, 0.21136474609375, 0.225433349609375, 0.239501953125, 0.253570556640625, 0.26763916015625, 0.281707763671875, 0.2957763671875, 0.309844970703125, 0.32391357421875, 0.337982177734375, 0.35205078125, 0.366119384765625, 0.38018798828125, 0.394256591796875, 0.4083251953125, 0.422393798828125, 0.43646240234375, 0.450531005859375, 0.464599609375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 4.0, 6.0, 8.0, 10.0, 17.0, 15.0, 22.0, 10.0, 25.0, 14.0, 25.0, 23.0, 30.0, 34.0, 30.0, 38.0, 37.0, 45.0, 40.0, 35.0, 36.0, 1051.0, 43.0, 38.0, 41.0, 32.0, 31.0, 34.0, 25.0, 20.0, 24.0, 22.0, 23.0, 24.0, 23.0, 16.0, 11.0, 14.0, 10.0, 9.0, 4.0, 6.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0], "bins": [-2.880859375, -2.79644775390625, -2.7120361328125, -2.62762451171875, -2.543212890625, -2.45880126953125, -2.3743896484375, -2.28997802734375, -2.20556640625, -2.12115478515625, -2.0367431640625, -1.95233154296875, -1.867919921875, -1.78350830078125, -1.6990966796875, -1.61468505859375, -1.5302734375, -1.44586181640625, -1.3614501953125, -1.27703857421875, -1.192626953125, -1.10821533203125, -1.0238037109375, -0.93939208984375, -0.85498046875, -0.77056884765625, -0.6861572265625, -0.60174560546875, -0.517333984375, -0.43292236328125, -0.3485107421875, -0.26409912109375, -0.1796875, -0.09527587890625, -0.0108642578125, 0.07354736328125, 0.157958984375, 0.24237060546875, 0.3267822265625, 0.41119384765625, 0.49560546875, 0.58001708984375, 0.6644287109375, 0.74884033203125, 0.833251953125, 0.91766357421875, 1.0020751953125, 1.08648681640625, 1.1708984375, 1.25531005859375, 1.3397216796875, 1.42413330078125, 1.508544921875, 1.59295654296875, 1.6773681640625, 1.76177978515625, 1.84619140625, 1.93060302734375, 2.0150146484375, 2.09942626953125, 2.183837890625, 2.26824951171875, 2.3526611328125, 2.43707275390625, 2.521484375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 17.0, 19.0, 25.0, 33.0, 57.0, 65.0, 125.0, 171.0, 286.0, 404.0, 573.0, 900.0, 1315.0, 2010.0, 3042.0, 4551.0, 7126.0, 10994.0, 16981.0, 27507.0, 44426.0, 73670.0, 124521.0, 321545.0, 1124100.0, 130610.0, 76942.0, 45859.0, 28334.0, 17759.0, 11504.0, 7358.0, 4804.0, 3163.0, 2222.0, 1393.0, 879.0, 625.0, 417.0, 272.0, 190.0, 105.0, 84.0, 53.0, 31.0, 27.0, 14.0, 9.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.412109375, -0.398834228515625, -0.38555908203125, -0.372283935546875, -0.3590087890625, -0.345733642578125, -0.33245849609375, -0.319183349609375, -0.305908203125, -0.292633056640625, -0.27935791015625, -0.266082763671875, -0.2528076171875, -0.239532470703125, -0.22625732421875, -0.212982177734375, -0.19970703125, -0.186431884765625, -0.17315673828125, -0.159881591796875, -0.1466064453125, -0.133331298828125, -0.12005615234375, -0.106781005859375, -0.093505859375, -0.080230712890625, -0.06695556640625, -0.053680419921875, -0.0404052734375, -0.027130126953125, -0.01385498046875, -0.000579833984375, 0.0126953125, 0.025970458984375, 0.03924560546875, 0.052520751953125, 0.0657958984375, 0.079071044921875, 0.09234619140625, 0.105621337890625, 0.118896484375, 0.132171630859375, 0.14544677734375, 0.158721923828125, 0.1719970703125, 0.185272216796875, 0.19854736328125, 0.211822509765625, 0.22509765625, 0.238372802734375, 0.25164794921875, 0.264923095703125, 0.2781982421875, 0.291473388671875, 0.30474853515625, 0.318023681640625, 0.331298828125, 0.344573974609375, 0.35784912109375, 0.371124267578125, 0.3843994140625, 0.397674560546875, 0.41094970703125, 0.424224853515625, 0.4375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 4.0, 0.0, 3.0, 7.0, 4.0, 9.0, 6.0, 14.0, 13.0, 15.0, 17.0, 30.0, 33.0, 35.0, 50.0, 48.0, 60.0, 94.0, 112.0, 80.0, 62.0, 53.0, 47.0, 28.0, 27.0, 30.0, 21.0, 11.0, 19.0, 11.0, 9.0, 11.0, 7.0, 4.0, 2.0, 2.0, 5.0, 5.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-0.003856658935546875, -0.0037377476692199707, -0.0036188364028930664, -0.003499925136566162, -0.003381013870239258, -0.0032621026039123535, -0.0031431913375854492, -0.003024280071258545, -0.0029053688049316406, -0.0027864575386047363, -0.002667546272277832, -0.0025486350059509277, -0.0024297237396240234, -0.002310812473297119, -0.002191901206970215, -0.0020729899406433105, -0.0019540786743164062, -0.001835167407989502, -0.0017162561416625977, -0.0015973448753356934, -0.001478433609008789, -0.0013595223426818848, -0.0012406110763549805, -0.0011216998100280762, -0.0010027885437011719, -0.0008838772773742676, -0.0007649660110473633, -0.000646054744720459, -0.0005271434783935547, -0.0004082322120666504, -0.0002893209457397461, -0.0001704096794128418, -5.14984130859375e-05, 6.74128532409668e-05, 0.0001863241195678711, 0.0003052353858947754, 0.0004241466522216797, 0.000543057918548584, 0.0006619691848754883, 0.0007808804512023926, 0.0008997917175292969, 0.0010187029838562012, 0.0011376142501831055, 0.0012565255165100098, 0.001375436782836914, 0.0014943480491638184, 0.0016132593154907227, 0.001732170581817627, 0.0018510818481445312, 0.0019699931144714355, 0.00208890438079834, 0.002207815647125244, 0.0023267269134521484, 0.0024456381797790527, 0.002564549446105957, 0.0026834607124328613, 0.0028023719787597656, 0.00292128324508667, 0.0030401945114135742, 0.0031591057777404785, 0.003278017044067383, 0.003396928310394287, 0.0035158395767211914, 0.0036347508430480957, 0.003753662109375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 2.0, 1.0, 3.0, 2.0, 8.0, 10.0, 10.0, 8.0, 13.0, 8.0, 17.0, 25.0, 26.0, 35.0, 50.0, 57.0, 66.0, 107.0, 177.0, 320.0, 719.0, 14640.0, 1026785.0, 4066.0, 568.0, 242.0, 172.0, 93.0, 89.0, 46.0, 36.0, 29.0, 21.0, 22.0, 13.0, 11.0, 6.0, 8.0, 10.0, 9.0, 5.0, 1.0, 7.0, 4.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.0760498046875, -0.07362651824951172, -0.07120323181152344, -0.06877994537353516, -0.06635665893554688, -0.0639333724975586, -0.06151008605957031, -0.05908679962158203, -0.05666351318359375, -0.05424022674560547, -0.05181694030761719, -0.049393653869628906, -0.046970367431640625, -0.044547080993652344, -0.04212379455566406, -0.03970050811767578, -0.0372772216796875, -0.03485393524169922, -0.03243064880371094, -0.030007362365722656, -0.027584075927734375, -0.025160789489746094, -0.022737503051757812, -0.02031421661376953, -0.01789093017578125, -0.015467643737792969, -0.013044357299804688, -0.010621070861816406, -0.008197784423828125, -0.005774497985839844, -0.0033512115478515625, -0.0009279251098632812, 0.001495361328125, 0.003918647766113281, 0.0063419342041015625, 0.008765220642089844, 0.011188507080078125, 0.013611793518066406, 0.016035079956054688, 0.01845836639404297, 0.02088165283203125, 0.02330493927001953, 0.025728225708007812, 0.028151512145996094, 0.030574798583984375, 0.032998085021972656, 0.03542137145996094, 0.03784465789794922, 0.0402679443359375, 0.04269123077392578, 0.04511451721191406, 0.047537803649902344, 0.049961090087890625, 0.052384376525878906, 0.05480766296386719, 0.05723094940185547, 0.05965423583984375, 0.06207752227783203, 0.06450080871582031, 0.0669240951538086, 0.06934738159179688, 0.07177066802978516, 0.07419395446777344, 0.07661724090576172, 0.07904052734375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 15.0, 100.0, 317.0, 354.0, 164.0, 55.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004567306954413652, -0.004370035603642464, -0.004172763787209988, -0.003975492436438799, -0.0037782208528369665, -0.003580949269235134, -0.0033836779184639454, -0.003186406334862113, -0.0029891347512602806, -0.0027918631676584482, -0.002594591584056616, -0.002397320233285427, -0.0022000486496835947, -0.0020027770660817623, -0.0018055055988952518, -0.0016082341317087412, -0.0014109625481069088, -0.0012136909645050764, -0.0010164194973185658, -0.0008191479719243944, -0.0006218764465302229, -0.0004246048629283905, -0.00022733339574187994, -3.0061928555369377e-05, 0.000167209655046463, 0.0003644811804406345, 0.000561752705834806, 0.0007590242312289774, 0.0009562957566231489, 0.0011535673402249813, 0.0013508388074114919, 0.0015481102745980024, 0.0017453813925385475, 0.00194265297614038, 0.0021399245597422123, 0.002337195910513401, 0.0025344674941152334, 0.002731739077717066, 0.0029290104284882545, 0.003126282012090087, 0.0033235535956919193, 0.0035208251792937517, 0.003718096762895584, 0.003915368113666773, 0.004112639464437962, 0.004309911280870438, 0.004507182631641626, 0.004704453982412815, 0.004901725798845291, 0.00509899714961648, 0.005296268966048956, 0.005493540316820145, 0.005690812133252621, 0.005888083484023809, 0.006085354834794998, 0.006282626651227474, 0.006479898001998663, 0.006677169352769852, 0.006874441169202328, 0.0070717125199735165, 0.007268983870744705, 0.007466255687177181, 0.00766352703794837, 0.007860798388719559, 0.008058070205152035]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 6.0, 5.0, 9.0, 9.0, 13.0, 14.0, 14.0, 22.0, 22.0, 23.0, 28.0, 24.0, 32.0, 38.0, 38.0, 38.0, 31.0, 48.0, 35.0, 52.0, 48.0, 44.0, 40.0, 52.0, 33.0, 30.0, 30.0, 26.0, 30.0, 24.0, 20.0, 20.0, 25.0, 23.0, 13.0, 7.0, 11.0, 6.0, 6.0, 4.0, 3.0, 3.0, 4.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019146203994750977, -0.0018517421558499336, -0.0017888639122247696, -0.0017259856685996056, -0.0016631074249744415, -0.0016002291813492775, -0.0015373509377241135, -0.0014744726940989494, -0.0014115944504737854, -0.0013487162068486214, -0.0012858379632234573, -0.0012229597195982933, -0.0011600814759731293, -0.0010972032323479652, -0.0010343249887228012, -0.0009714467450976372, -0.0009085685014724731, -0.0008456902578473091, -0.0007828120142221451, -0.000719933770596981, -0.000657055526971817, -0.000594177283346653, -0.000531299039721489, -0.0004684207960963249, -0.0004055425524711609, -0.00034266430884599686, -0.0002797860652208328, -0.0002169078215956688, -0.00015402957797050476, -9.115133434534073e-05, -2.8273090720176697e-05, 3.4605152904987335e-05, 9.748339653015137e-05, 0.0001603616401553154, 0.00022323988378047943, 0.00028611812740564346, 0.0003489963710308075, 0.0004118746146559715, 0.00047475285828113556, 0.0005376311019062996, 0.0006005093455314636, 0.0006633875891566277, 0.0007262658327817917, 0.0007891440764069557, 0.0008520223200321198, 0.0009149005636572838, 0.0009777788072824478, 0.0010406570509076118, 0.0011035352945327759, 0.00116641353815794, 0.001229291781783104, 0.001292170025408268, 0.001355048269033432, 0.001417926512658596, 0.00148080475628376, 0.001543682999908924, 0.0016065612435340881, 0.0016694394871592522, 0.0017323177307844162, 0.0017951959744095802, 0.0018580742180347443, 0.0019209524616599083, 0.0019838307052850723, 0.0020467089489102364, 0.0021095871925354004]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 2.0, 3.0, 7.0, 9.0, 13.0, 7.0, 15.0, 24.0, 16.0, 19.0, 16.0, 37.0, 24.0, 42.0, 35.0, 41.0, 30.0, 38.0, 35.0, 48.0, 50.0, 51.0, 51.0, 31.0, 52.0, 43.0, 39.0, 36.0, 26.0, 29.0, 24.0, 21.0, 19.0, 12.0, 11.0, 14.0, 8.0, 6.0, 7.0, 5.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0390625, -3.88739013671875, -3.7357177734375, -3.58404541015625, -3.432373046875, -3.28070068359375, -3.1290283203125, -2.97735595703125, -2.82568359375, -2.67401123046875, -2.5223388671875, -2.37066650390625, -2.218994140625, -2.06732177734375, -1.9156494140625, -1.76397705078125, -1.6123046875, -1.46063232421875, -1.3089599609375, -1.15728759765625, -1.005615234375, -0.85394287109375, -0.7022705078125, -0.55059814453125, -0.39892578125, -0.24725341796875, -0.0955810546875, 0.05609130859375, 0.207763671875, 0.35943603515625, 0.5111083984375, 0.66278076171875, 0.814453125, 0.96612548828125, 1.1177978515625, 1.26947021484375, 1.421142578125, 1.57281494140625, 1.7244873046875, 1.87615966796875, 2.02783203125, 2.17950439453125, 2.3311767578125, 2.48284912109375, 2.634521484375, 2.78619384765625, 2.9378662109375, 3.08953857421875, 3.2412109375, 3.39288330078125, 3.5445556640625, 3.69622802734375, 3.847900390625, 3.99957275390625, 4.1512451171875, 4.30291748046875, 4.45458984375, 4.60626220703125, 4.7579345703125, 4.90960693359375, 5.061279296875, 5.21295166015625, 5.3646240234375, 5.51629638671875, 5.66796875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 8.0, 7.0, 19.0, 21.0, 17.0, 42.0, 62.0, 69.0, 107.0, 146.0, 236.0, 374.0, 662.0, 1156.0, 2436.0, 5221.0, 12951.0, 34644.0, 97787.0, 301242.0, 384699.0, 131734.0, 45207.0, 16655.0, 6718.0, 2875.0, 1424.0, 764.0, 441.0, 273.0, 183.0, 101.0, 87.0, 50.0, 29.0, 28.0, 18.0, 15.0, 12.0, 11.0, 7.0, 5.0, 4.0, 4.0, 1.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.140625, -4.951171875, -4.76171875, -4.572265625, -4.3828125, -4.193359375, -4.00390625, -3.814453125, -3.625, -3.435546875, -3.24609375, -3.056640625, -2.8671875, -2.677734375, -2.48828125, -2.298828125, -2.109375, -1.919921875, -1.73046875, -1.541015625, -1.3515625, -1.162109375, -0.97265625, -0.783203125, -0.59375, -0.404296875, -0.21484375, -0.025390625, 0.1640625, 0.353515625, 0.54296875, 0.732421875, 0.921875, 1.111328125, 1.30078125, 1.490234375, 1.6796875, 1.869140625, 2.05859375, 2.248046875, 2.4375, 2.626953125, 2.81640625, 3.005859375, 3.1953125, 3.384765625, 3.57421875, 3.763671875, 3.953125, 4.142578125, 4.33203125, 4.521484375, 4.7109375, 4.900390625, 5.08984375, 5.279296875, 5.46875, 5.658203125, 5.84765625, 6.037109375, 6.2265625, 6.416015625, 6.60546875, 6.794921875, 6.984375]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [3.0, 2.0, 6.0, 2.0, 1.0, 5.0, 5.0, 5.0, 2.0, 6.0, 10.0, 15.0, 8.0, 12.0, 17.0, 19.0, 33.0, 33.0, 39.0, 35.0, 37.0, 45.0, 74.0, 63.0, 109.0, 146.0, 1363.0, 316.0, 159.0, 99.0, 66.0, 45.0, 32.0, 37.0, 29.0, 33.0, 22.0, 26.0, 16.0, 12.0, 12.0, 12.0, 13.0, 5.0, 5.0, 9.0, 5.0, 4.0, 2.0, 3.0, 6.0, 2.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4375, -9.0877685546875, -8.738037109375, -8.3883056640625, -8.03857421875, -7.6888427734375, -7.339111328125, -6.9893798828125, -6.6396484375, -6.2899169921875, -5.940185546875, -5.5904541015625, -5.24072265625, -4.8909912109375, -4.541259765625, -4.1915283203125, -3.841796875, -3.4920654296875, -3.142333984375, -2.7926025390625, -2.44287109375, -2.0931396484375, -1.743408203125, -1.3936767578125, -1.0439453125, -0.6942138671875, -0.344482421875, 0.0052490234375, 0.35498046875, 0.7047119140625, 1.054443359375, 1.4041748046875, 1.75390625, 2.1036376953125, 2.453369140625, 2.8031005859375, 3.15283203125, 3.5025634765625, 3.852294921875, 4.2020263671875, 4.5517578125, 4.9014892578125, 5.251220703125, 5.6009521484375, 5.95068359375, 6.3004150390625, 6.650146484375, 6.9998779296875, 7.349609375, 7.6993408203125, 8.049072265625, 8.3988037109375, 8.74853515625, 9.0982666015625, 9.447998046875, 9.7977294921875, 10.1474609375, 10.4971923828125, 10.846923828125, 11.1966552734375, 11.54638671875, 11.8961181640625, 12.245849609375, 12.5955810546875, 12.9453125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 5.0, 9.0, 13.0, 18.0, 20.0, 32.0, 38.0, 82.0, 94.0, 185.0, 307.0, 502.0, 1117.0, 10350.0, 2471397.0, 653942.0, 5369.0, 960.0, 477.0, 293.0, 176.0, 96.0, 74.0, 52.0, 21.0, 17.0, 14.0, 15.0, 12.0, 5.0, 4.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.53125, -29.680908203125, -28.83056640625, -27.980224609375, -27.1298828125, -26.279541015625, -25.42919921875, -24.578857421875, -23.728515625, -22.878173828125, -22.02783203125, -21.177490234375, -20.3271484375, -19.476806640625, -18.62646484375, -17.776123046875, -16.92578125, -16.075439453125, -15.22509765625, -14.374755859375, -13.5244140625, -12.674072265625, -11.82373046875, -10.973388671875, -10.123046875, -9.272705078125, -8.42236328125, -7.572021484375, -6.7216796875, -5.871337890625, -5.02099609375, -4.170654296875, -3.3203125, -2.469970703125, -1.61962890625, -0.769287109375, 0.0810546875, 0.931396484375, 1.78173828125, 2.632080078125, 3.482421875, 4.332763671875, 5.18310546875, 6.033447265625, 6.8837890625, 7.734130859375, 8.58447265625, 9.434814453125, 10.28515625, 11.135498046875, 11.98583984375, 12.836181640625, 13.6865234375, 14.536865234375, 15.38720703125, 16.237548828125, 17.087890625, 17.938232421875, 18.78857421875, 19.638916015625, 20.4892578125, 21.339599609375, 22.18994140625, 23.040283203125, 23.890625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 7.0, 47.0, 138.0, 298.0, 305.0, 159.0, 50.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.042195320129395, -11.737531661987305, -10.432867050170898, -9.128203392028809, -7.823539733886719, -6.518876075744629, -5.214211940765381, -3.909547805786133, -2.604884147644043, -1.300220251083374, 0.004443645477294922, 1.3091075420379639, 2.613771438598633, 3.9184350967407227, 5.223099231719971, 6.527763366699219, 7.832427024841309, 9.137090682983398, 10.441755294799805, 11.746418952941895, 13.051082611083984, 14.355746269226074, 15.660409927368164, 16.96507453918457, 18.269737243652344, 19.57440185546875, 20.879064559936523, 22.18372917175293, 23.488391876220703, 24.79305648803711, 26.097721099853516, 27.402385711669922, 28.707046508789062, 30.01171112060547, 31.316373825073242, 32.621036529541016, 33.92570114135742, 35.23036575317383, 36.535030364990234, 37.83969497680664, 39.14435577392578, 40.44902038574219, 41.753684997558594, 43.058345794677734, 44.36301040649414, 45.66767501831055, 46.97233963012695, 48.27700424194336, 49.581668853759766, 50.88633346557617, 52.19099807739258, 53.49565887451172, 54.800323486328125, 56.10498809814453, 57.40965270996094, 58.714317321777344, 60.01898193359375, 61.323646545410156, 62.62831115722656, 63.9329719543457, 65.23764038085938, 66.54229736328125, 67.84696197509766, 69.15162658691406, 70.45629119873047]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 4.0, 2.0, 5.0, 3.0, 5.0, 4.0, 0.0, 6.0, 7.0, 14.0, 21.0, 12.0, 16.0, 26.0, 24.0, 25.0, 38.0, 36.0, 34.0, 32.0, 28.0, 36.0, 36.0, 32.0, 44.0, 39.0, 38.0, 30.0, 36.0, 51.0, 44.0, 28.0, 25.0, 35.0, 27.0, 17.0, 27.0, 20.0, 17.0, 18.0, 8.0, 10.0, 12.0, 9.0, 5.0, 6.0, 7.0, 5.0, 4.0, 1.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-24.70195960998535, -23.914472579956055, -23.12698745727539, -22.339500427246094, -21.552013397216797, -20.7645263671875, -19.977039337158203, -19.18955421447754, -18.402067184448242, -17.614580154418945, -16.82709503173828, -16.039608001708984, -15.252120971679688, -14.46463394165039, -13.67714786529541, -12.88966178894043, -12.102174758911133, -11.314687728881836, -10.527201652526855, -9.739715576171875, -8.952228546142578, -8.164741516113281, -7.377255439758301, -6.589768886566162, -5.802282333374023, -5.014795780181885, -4.227309226989746, -3.4398226737976074, -2.6523361206054688, -1.86484956741333, -1.0773630142211914, -0.28987646102905273, 0.49761199951171875, 1.2850985527038574, 2.072585105895996, 2.8600716590881348, 3.6475582122802734, 4.435044765472412, 5.222531318664551, 6.0100178718566895, 6.797504425048828, 7.584990978240967, 8.372477531433105, 9.159963607788086, 9.947450637817383, 10.73493766784668, 11.52242374420166, 12.30990982055664, 13.097396850585938, 13.884883880615234, 14.672369956970215, 15.459856033325195, 16.247343063354492, 17.03483009338379, 17.822315216064453, 18.60980224609375, 19.397289276123047, 20.184776306152344, 20.97226333618164, 21.759748458862305, 22.5472354888916, 23.3347225189209, 24.122207641601562, 24.90969467163086, 25.697181701660156]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 1.0, 5.0, 8.0, 8.0, 6.0, 11.0, 14.0, 20.0, 12.0, 13.0, 15.0, 25.0, 25.0, 27.0, 26.0, 20.0, 30.0, 39.0, 42.0, 44.0, 41.0, 57.0, 43.0, 47.0, 39.0, 45.0, 38.0, 36.0, 32.0, 28.0, 25.0, 29.0, 32.0, 19.0, 16.0, 12.0, 17.0, 14.0, 8.0, 13.0, 9.0, 4.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.25390625, -4.11395263671875, -3.9739990234375, -3.83404541015625, -3.694091796875, -3.55413818359375, -3.4141845703125, -3.27423095703125, -3.13427734375, -2.99432373046875, -2.8543701171875, -2.71441650390625, -2.574462890625, -2.43450927734375, -2.2945556640625, -2.15460205078125, -2.0146484375, -1.87469482421875, -1.7347412109375, -1.59478759765625, -1.454833984375, -1.31488037109375, -1.1749267578125, -1.03497314453125, -0.89501953125, -0.75506591796875, -0.6151123046875, -0.47515869140625, -0.335205078125, -0.19525146484375, -0.0552978515625, 0.08465576171875, 0.224609375, 0.36456298828125, 0.5045166015625, 0.64447021484375, 0.784423828125, 0.92437744140625, 1.0643310546875, 1.20428466796875, 1.34423828125, 1.48419189453125, 1.6241455078125, 1.76409912109375, 1.904052734375, 2.04400634765625, 2.1839599609375, 2.32391357421875, 2.4638671875, 2.60382080078125, 2.7437744140625, 2.88372802734375, 3.023681640625, 3.16363525390625, 3.3035888671875, 3.44354248046875, 3.58349609375, 3.72344970703125, 3.8634033203125, 4.00335693359375, 4.143310546875, 4.28326416015625, 4.4232177734375, 4.56317138671875, 4.703125]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 7.0, 2.0, 6.0, 1.0, 7.0, 5.0, 8.0, 15.0, 8.0, 11.0, 7.0, 25.0, 23.0, 44.0, 37.0, 64.0, 110.0, 202.0, 401.0, 852.0, 2404.0, 9689.0, 60396.0, 493554.0, 2137555.0, 1276496.0, 181396.0, 23439.0, 4790.0, 1416.0, 553.0, 284.0, 165.0, 83.0, 63.0, 47.0, 29.0, 24.0, 17.0, 20.0, 12.0, 5.0, 5.0, 4.0, 6.0, 3.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.28125, -7.0445556640625, -6.807861328125, -6.5711669921875, -6.33447265625, -6.0977783203125, -5.861083984375, -5.6243896484375, -5.3876953125, -5.1510009765625, -4.914306640625, -4.6776123046875, -4.44091796875, -4.2042236328125, -3.967529296875, -3.7308349609375, -3.494140625, -3.2574462890625, -3.020751953125, -2.7840576171875, -2.54736328125, -2.3106689453125, -2.073974609375, -1.8372802734375, -1.6005859375, -1.3638916015625, -1.127197265625, -0.8905029296875, -0.65380859375, -0.4171142578125, -0.180419921875, 0.0562744140625, 0.29296875, 0.5296630859375, 0.766357421875, 1.0030517578125, 1.23974609375, 1.4764404296875, 1.713134765625, 1.9498291015625, 2.1865234375, 2.4232177734375, 2.659912109375, 2.8966064453125, 3.13330078125, 3.3699951171875, 3.606689453125, 3.8433837890625, 4.080078125, 4.3167724609375, 4.553466796875, 4.7901611328125, 5.02685546875, 5.2635498046875, 5.500244140625, 5.7369384765625, 5.9736328125, 6.2103271484375, 6.447021484375, 6.6837158203125, 6.92041015625, 7.1571044921875, 7.393798828125, 7.6304931640625, 7.8671875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 3.0, 2.0, 4.0, 9.0, 11.0, 10.0, 39.0, 48.0, 68.0, 91.0, 161.0, 250.0, 374.0, 597.0, 628.0, 577.0, 424.0, 287.0, 174.0, 125.0, 67.0, 49.0, 27.0, 17.0, 13.0, 11.0, 9.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.66015625, -7.40106201171875, -7.1419677734375, -6.88287353515625, -6.623779296875, -6.36468505859375, -6.1055908203125, -5.84649658203125, -5.58740234375, -5.32830810546875, -5.0692138671875, -4.81011962890625, -4.551025390625, -4.29193115234375, -4.0328369140625, -3.77374267578125, -3.5146484375, -3.25555419921875, -2.9964599609375, -2.73736572265625, -2.478271484375, -2.21917724609375, -1.9600830078125, -1.70098876953125, -1.44189453125, -1.18280029296875, -0.9237060546875, -0.66461181640625, -0.405517578125, -0.14642333984375, 0.1126708984375, 0.37176513671875, 0.630859375, 0.88995361328125, 1.1490478515625, 1.40814208984375, 1.667236328125, 1.92633056640625, 2.1854248046875, 2.44451904296875, 2.70361328125, 2.96270751953125, 3.2218017578125, 3.48089599609375, 3.739990234375, 3.99908447265625, 4.2581787109375, 4.51727294921875, 4.7763671875, 5.03546142578125, 5.2945556640625, 5.55364990234375, 5.812744140625, 6.07183837890625, 6.3309326171875, 6.59002685546875, 6.84912109375, 7.10821533203125, 7.3673095703125, 7.62640380859375, 7.885498046875, 8.14459228515625, 8.4036865234375, 8.66278076171875, 8.921875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 6.0, 1.0, 11.0, 4.0, 15.0, 15.0, 42.0, 41.0, 63.0, 77.0, 160.0, 304.0, 544.0, 1124.0, 3247.0, 12687.0, 75961.0, 814283.0, 2884927.0, 348488.0, 40411.0, 7792.0, 2134.0, 857.0, 441.0, 241.0, 145.0, 85.0, 53.0, 38.0, 29.0, 16.0, 11.0, 10.0, 4.0, 11.0, 4.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0], "bins": [-11.4140625, -11.091064453125, -10.76806640625, -10.445068359375, -10.1220703125, -9.799072265625, -9.47607421875, -9.153076171875, -8.830078125, -8.507080078125, -8.18408203125, -7.861083984375, -7.5380859375, -7.215087890625, -6.89208984375, -6.569091796875, -6.24609375, -5.923095703125, -5.60009765625, -5.277099609375, -4.9541015625, -4.631103515625, -4.30810546875, -3.985107421875, -3.662109375, -3.339111328125, -3.01611328125, -2.693115234375, -2.3701171875, -2.047119140625, -1.72412109375, -1.401123046875, -1.078125, -0.755126953125, -0.43212890625, -0.109130859375, 0.2138671875, 0.536865234375, 0.85986328125, 1.182861328125, 1.505859375, 1.828857421875, 2.15185546875, 2.474853515625, 2.7978515625, 3.120849609375, 3.44384765625, 3.766845703125, 4.08984375, 4.412841796875, 4.73583984375, 5.058837890625, 5.3818359375, 5.704833984375, 6.02783203125, 6.350830078125, 6.673828125, 6.996826171875, 7.31982421875, 7.642822265625, 7.9658203125, 8.288818359375, 8.61181640625, 8.934814453125, 9.2578125]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 6.0, 26.0, 61.0, 184.0, 282.0, 240.0, 144.0, 52.0, 18.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.89398956298828, -47.25218963623047, -45.610389709472656, -43.968589782714844, -42.32678985595703, -40.68498992919922, -39.04318618774414, -37.40138626098633, -35.759586334228516, -34.1177864074707, -32.47598648071289, -30.834184646606445, -29.192384719848633, -27.55058479309082, -25.908782958984375, -24.266983032226562, -22.62518310546875, -20.983383178710938, -19.341583251953125, -17.69978141784668, -16.057981491088867, -14.416181564331055, -12.774380683898926, -11.132579803466797, -9.490779876708984, -7.848979473114014, -6.207179069519043, -4.565378665924072, -2.9235782623291016, -1.281778335571289, 0.36002254486083984, 2.0018234252929688, 3.643627166748047, 5.285427570343018, 6.927227973937988, 8.569028854370117, 10.21082878112793, 11.852628707885742, 13.494429588317871, 15.13623046875, 16.778030395507812, 18.419830322265625, 20.061630249023438, 21.703432083129883, 23.345232009887695, 24.987031936645508, 26.628833770751953, 28.270633697509766, 29.912433624267578, 31.55423355102539, 33.1960334777832, 34.837833404541016, 36.479637145996094, 38.121437072753906, 39.76323699951172, 41.40503692626953, 43.046836853027344, 44.688636779785156, 46.33043670654297, 47.97223663330078, 49.614036560058594, 51.255836486816406, 52.897640228271484, 54.5394401550293, 56.18124008178711]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 5.0, 4.0, 5.0, 11.0, 6.0, 13.0, 12.0, 14.0, 21.0, 25.0, 23.0, 18.0, 20.0, 32.0, 28.0, 28.0, 34.0, 29.0, 42.0, 47.0, 35.0, 33.0, 51.0, 32.0, 47.0, 39.0, 34.0, 33.0, 36.0, 34.0, 31.0, 30.0, 22.0, 16.0, 15.0, 9.0, 16.0, 13.0, 12.0, 7.0, 8.0, 8.0, 6.0, 1.0, 4.0, 1.0, 7.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-18.254837036132812, -17.63751220703125, -17.020187377929688, -16.402860641479492, -15.78553581237793, -15.168210983276367, -14.550885200500488, -13.93355941772461, -13.316234588623047, -12.698909759521484, -12.081583976745605, -11.464258193969727, -10.846933364868164, -10.229608535766602, -9.612282752990723, -8.994956970214844, -8.377632141113281, -7.7603068351745605, -7.14298152923584, -6.525656223297119, -5.908330917358398, -5.291005611419678, -4.673680305480957, -4.056354999542236, -3.4390296936035156, -2.821704387664795, -2.204379081726074, -1.5870537757873535, -0.9697284698486328, -0.3524031639099121, 0.2649221420288086, 0.8822474479675293, 1.49957275390625, 2.1168980598449707, 2.7342233657836914, 3.351548671722412, 3.968873977661133, 4.5861992835998535, 5.203524589538574, 5.820849895477295, 6.438175201416016, 7.055500507354736, 7.672825813293457, 8.290151596069336, 8.907476425170898, 9.524801254272461, 10.14212703704834, 10.759452819824219, 11.376777648925781, 11.994102478027344, 12.611428260803223, 13.228754043579102, 13.846078872680664, 14.463403701782227, 15.080729484558105, 15.698055267333984, 16.315380096435547, 16.93270492553711, 17.550029754638672, 18.167356491088867, 18.78468132019043, 19.402006149291992, 20.019332885742188, 20.63665771484375, 21.253982543945312]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 11.0, 7.0, 11.0, 21.0, 19.0, 12.0, 21.0, 15.0, 22.0, 22.0, 28.0, 36.0, 40.0, 40.0, 37.0, 38.0, 34.0, 46.0, 44.0, 58.0, 33.0, 31.0, 35.0, 30.0, 31.0, 35.0, 44.0, 19.0, 31.0, 20.0, 19.0, 17.0, 14.0, 9.0, 8.0, 14.0, 11.0, 5.0, 6.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.94647216796875, -3.8031005859375, -3.65972900390625, -3.516357421875, -3.37298583984375, -3.2296142578125, -3.08624267578125, -2.94287109375, -2.79949951171875, -2.6561279296875, -2.51275634765625, -2.369384765625, -2.22601318359375, -2.0826416015625, -1.93927001953125, -1.7958984375, -1.65252685546875, -1.5091552734375, -1.36578369140625, -1.222412109375, -1.07904052734375, -0.9356689453125, -0.79229736328125, -0.64892578125, -0.50555419921875, -0.3621826171875, -0.21881103515625, -0.075439453125, 0.06793212890625, 0.2113037109375, 0.35467529296875, 0.498046875, 0.64141845703125, 0.7847900390625, 0.92816162109375, 1.071533203125, 1.21490478515625, 1.3582763671875, 1.50164794921875, 1.64501953125, 1.78839111328125, 1.9317626953125, 2.07513427734375, 2.218505859375, 2.36187744140625, 2.5052490234375, 2.64862060546875, 2.7919921875, 2.93536376953125, 3.0787353515625, 3.22210693359375, 3.365478515625, 3.50885009765625, 3.6522216796875, 3.79559326171875, 3.93896484375, 4.08233642578125, 4.2257080078125, 4.36907958984375, 4.512451171875, 4.65582275390625, 4.7991943359375, 4.94256591796875, 5.0859375]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 3.0, 5.0, 10.0, 12.0, 18.0, 20.0, 37.0, 41.0, 76.0, 110.0, 139.0, 235.0, 295.0, 386.0, 532.0, 778.0, 1099.0, 1521.0, 2146.0, 2890.0, 4088.0, 5814.0, 8163.0, 11489.0, 17176.0, 25073.0, 38476.0, 59573.0, 94212.0, 147067.0, 192237.0, 151806.0, 97244.0, 61707.0, 39265.0, 26285.0, 17255.0, 12212.0, 8350.0, 5928.0, 4210.0, 2974.0, 2170.0, 1535.0, 1105.0, 824.0, 570.0, 421.0, 294.0, 212.0, 163.0, 102.0, 70.0, 52.0, 35.0, 19.0, 16.0, 9.0, 7.0, 7.0, 4.0, 1.0, 1.0], "bins": [-0.42431640625, -0.4108619689941406, -0.39740753173828125, -0.3839530944824219, -0.3704986572265625, -0.3570442199707031, -0.34358978271484375, -0.3301353454589844, -0.316680908203125, -0.3032264709472656, -0.28977203369140625, -0.2763175964355469, -0.2628631591796875, -0.24940872192382812, -0.23595428466796875, -0.22249984741210938, -0.20904541015625, -0.19559097290039062, -0.18213653564453125, -0.16868209838867188, -0.1552276611328125, -0.14177322387695312, -0.12831878662109375, -0.11486434936523438, -0.101409912109375, -0.08795547485351562, -0.07450103759765625, -0.061046600341796875, -0.0475921630859375, -0.034137725830078125, -0.02068328857421875, -0.007228851318359375, 0.0062255859375, 0.019680023193359375, 0.03313446044921875, 0.046588897705078125, 0.0600433349609375, 0.07349777221679688, 0.08695220947265625, 0.10040664672851562, 0.113861083984375, 0.12731552124023438, 0.14076995849609375, 0.15422439575195312, 0.1676788330078125, 0.18113327026367188, 0.19458770751953125, 0.20804214477539062, 0.22149658203125, 0.23495101928710938, 0.24840545654296875, 0.2618598937988281, 0.2753143310546875, 0.2887687683105469, 0.30222320556640625, 0.3156776428222656, 0.329132080078125, 0.3425865173339844, 0.35604095458984375, 0.3694953918457031, 0.3829498291015625, 0.3964042663574219, 0.40985870361328125, 0.4233131408691406, 0.436767578125]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 3.0, 3.0, 6.0, 3.0, 7.0, 4.0, 12.0, 14.0, 16.0, 14.0, 13.0, 19.0, 14.0, 26.0, 31.0, 27.0, 23.0, 34.0, 29.0, 40.0, 31.0, 35.0, 32.0, 34.0, 1052.0, 44.0, 32.0, 39.0, 37.0, 21.0, 38.0, 45.0, 32.0, 25.0, 26.0, 28.0, 23.0, 17.0, 18.0, 19.0, 17.0, 12.0, 8.0, 5.0, 6.0, 5.0, 7.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.6875, -2.6002197265625, -2.512939453125, -2.4256591796875, -2.33837890625, -2.2510986328125, -2.163818359375, -2.0765380859375, -1.9892578125, -1.9019775390625, -1.814697265625, -1.7274169921875, -1.64013671875, -1.5528564453125, -1.465576171875, -1.3782958984375, -1.291015625, -1.2037353515625, -1.116455078125, -1.0291748046875, -0.94189453125, -0.8546142578125, -0.767333984375, -0.6800537109375, -0.5927734375, -0.5054931640625, -0.418212890625, -0.3309326171875, -0.24365234375, -0.1563720703125, -0.069091796875, 0.0181884765625, 0.10546875, 0.1927490234375, 0.280029296875, 0.3673095703125, 0.45458984375, 0.5418701171875, 0.629150390625, 0.7164306640625, 0.8037109375, 0.8909912109375, 0.978271484375, 1.0655517578125, 1.15283203125, 1.2401123046875, 1.327392578125, 1.4146728515625, 1.501953125, 1.5892333984375, 1.676513671875, 1.7637939453125, 1.85107421875, 1.9383544921875, 2.025634765625, 2.1129150390625, 2.2001953125, 2.2874755859375, 2.374755859375, 2.4620361328125, 2.54931640625, 2.6365966796875, 2.723876953125, 2.8111572265625, 2.8984375]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 2.0, 11.0, 8.0, 9.0, 9.0, 30.0, 42.0, 43.0, 82.0, 102.0, 186.0, 252.0, 374.0, 565.0, 770.0, 1205.0, 1760.0, 2673.0, 4024.0, 6009.0, 9181.0, 13987.0, 21119.0, 32897.0, 52231.0, 86670.0, 145085.0, 1244387.0, 182651.0, 109724.0, 65260.0, 40375.0, 25594.0, 17026.0, 10943.0, 7248.0, 4785.0, 3231.0, 2122.0, 1449.0, 983.0, 651.0, 433.0, 292.0, 202.0, 151.0, 104.0, 68.0, 46.0, 28.0, 25.0, 12.0, 8.0, 6.0, 5.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.400390625, -0.387359619140625, -0.37432861328125, -0.361297607421875, -0.3482666015625, -0.335235595703125, -0.32220458984375, -0.309173583984375, -0.296142578125, -0.283111572265625, -0.27008056640625, -0.257049560546875, -0.2440185546875, -0.230987548828125, -0.21795654296875, -0.204925537109375, -0.19189453125, -0.178863525390625, -0.16583251953125, -0.152801513671875, -0.1397705078125, -0.126739501953125, -0.11370849609375, -0.100677490234375, -0.087646484375, -0.074615478515625, -0.06158447265625, -0.048553466796875, -0.0355224609375, -0.022491455078125, -0.00946044921875, 0.003570556640625, 0.0166015625, 0.029632568359375, 0.04266357421875, 0.055694580078125, 0.0687255859375, 0.081756591796875, 0.09478759765625, 0.107818603515625, 0.120849609375, 0.133880615234375, 0.14691162109375, 0.159942626953125, 0.1729736328125, 0.186004638671875, 0.19903564453125, 0.212066650390625, 0.22509765625, 0.238128662109375, 0.25115966796875, 0.264190673828125, 0.2772216796875, 0.290252685546875, 0.30328369140625, 0.316314697265625, 0.329345703125, 0.342376708984375, 0.35540771484375, 0.368438720703125, 0.3814697265625, 0.394500732421875, 0.40753173828125, 0.420562744140625, 0.43359375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 5.0, 9.0, 9.0, 10.0, 14.0, 16.0, 24.0, 30.0, 57.0, 63.0, 126.0, 169.0, 130.0, 79.0, 54.0, 55.0, 34.0, 18.0, 13.0, 14.0, 18.0, 2.0, 9.0, 5.0, 3.0, 4.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.006191253662109375, -0.005989968776702881, -0.005788683891296387, -0.005587399005889893, -0.0053861141204833984, -0.005184829235076904, -0.00498354434967041, -0.004782259464263916, -0.004580974578857422, -0.004379689693450928, -0.004178404808044434, -0.0039771199226379395, -0.0037758350372314453, -0.003574550151824951, -0.003373265266418457, -0.003171980381011963, -0.0029706954956054688, -0.0027694106101989746, -0.0025681257247924805, -0.0023668408393859863, -0.002165555953979492, -0.001964271068572998, -0.001762986183166504, -0.0015617012977600098, -0.0013604164123535156, -0.0011591315269470215, -0.0009578466415405273, -0.0007565617561340332, -0.0005552768707275391, -0.0003539919853210449, -0.00015270709991455078, 4.857778549194336e-05, 0.0002498626708984375, 0.00045114755630493164, 0.0006524324417114258, 0.0008537173271179199, 0.001055002212524414, 0.0012562870979309082, 0.0014575719833374023, 0.0016588568687438965, 0.0018601417541503906, 0.0020614266395568848, 0.002262711524963379, 0.002463996410369873, 0.002665281295776367, 0.0028665661811828613, 0.0030678510665893555, 0.0032691359519958496, 0.0034704208374023438, 0.003671705722808838, 0.003872990608215332, 0.004074275493621826, 0.00427556037902832, 0.0044768452644348145, 0.004678130149841309, 0.004879415035247803, 0.005080699920654297, 0.005281984806060791, 0.005483269691467285, 0.005684554576873779, 0.0058858394622802734, 0.006087124347686768, 0.006288409233093262, 0.006489694118499756, 0.00669097900390625]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 1.0, 4.0, 5.0, 2.0, 2.0, 6.0, 10.0, 8.0, 17.0, 27.0, 30.0, 44.0, 53.0, 79.0, 130.0, 242.0, 482.0, 7215.0, 1037888.0, 1388.0, 353.0, 177.0, 112.0, 81.0, 40.0, 39.0, 26.0, 20.0, 8.0, 5.0, 7.0, 11.0, 4.0, 7.0, 6.0, 3.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.13623046875, -0.1321430206298828, -0.12805557250976562, -0.12396812438964844, -0.11988067626953125, -0.11579322814941406, -0.11170578002929688, -0.10761833190917969, -0.1035308837890625, -0.09944343566894531, -0.09535598754882812, -0.09126853942871094, -0.08718109130859375, -0.08309364318847656, -0.07900619506835938, -0.07491874694824219, -0.070831298828125, -0.06674385070800781, -0.06265640258789062, -0.05856895446777344, -0.05448150634765625, -0.05039405822753906, -0.046306610107421875, -0.04221916198730469, -0.0381317138671875, -0.03404426574707031, -0.029956817626953125, -0.025869369506835938, -0.02178192138671875, -0.017694473266601562, -0.013607025146484375, -0.009519577026367188, -0.00543212890625, -0.0013446807861328125, 0.002742767333984375, 0.0068302154541015625, 0.01091766357421875, 0.015005111694335938, 0.019092559814453125, 0.023180007934570312, 0.0272674560546875, 0.03135490417480469, 0.035442352294921875, 0.03952980041503906, 0.04361724853515625, 0.04770469665527344, 0.051792144775390625, 0.05587959289550781, 0.059967041015625, 0.06405448913574219, 0.06814193725585938, 0.07222938537597656, 0.07631683349609375, 0.08040428161621094, 0.08449172973632812, 0.08857917785644531, 0.0926666259765625, 0.09675407409667969, 0.10084152221679688, 0.10492897033691406, 0.10901641845703125, 0.11310386657714844, 0.11719131469726562, 0.12127876281738281, 0.1253662109375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 32.0, 504.0, 443.0, 34.0, 1.0], "bins": [-0.026273921132087708, -0.025842947885394096, -0.025411974638700485, -0.024981001392006874, -0.024550028145313263, -0.024119054898619652, -0.02368808165192604, -0.02325710840523243, -0.02282613515853882, -0.022395161911845207, -0.021964188665151596, -0.021533215418457985, -0.021102242171764374, -0.020671268925070763, -0.02024029567837715, -0.01980932243168354, -0.01937834732234478, -0.01894737407565117, -0.018516400828957558, -0.018085427582263947, -0.017654454335570335, -0.017223481088876724, -0.016792507842183113, -0.016361534595489502, -0.01593056134879589, -0.01549958810210228, -0.015068614855408669, -0.014637641608715057, -0.014206668362021446, -0.013775695115327835, -0.013344721868634224, -0.012913747690618038, -0.012482775375247002, -0.01205180212855339, -0.01162082888185978, -0.011189855635166168, -0.010758882388472557, -0.010327909141778946, -0.009896935895085335, -0.009465961717069149, -0.009034988470375538, -0.008604015223681927, -0.008173041976988316, -0.0077420687302947044, -0.007311095017939806, -0.006880121771246195, -0.006449148524552584, -0.006018174812197685, -0.005587201565504074, -0.005156228318810463, -0.004725255072116852, -0.004294281825423241, -0.003863308113068342, -0.003432334866374731, -0.00300136161968112, -0.002570388140156865, -0.0021394151262938976, -0.0017084417631849647, -0.0012774684000760317, -0.0008464951533824205, -0.00041552179027348757, 1.5451572835445404e-05, 0.00044642481952905655, 0.0008773982990533113, 0.0013083716621622443]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 9.0, 5.0, 5.0, 11.0, 11.0, 11.0, 8.0, 15.0, 21.0, 14.0, 24.0, 28.0, 36.0, 34.0, 35.0, 31.0, 47.0, 41.0, 52.0, 42.0, 57.0, 39.0, 49.0, 39.0, 38.0, 33.0, 43.0, 34.0, 29.0, 29.0, 29.0, 19.0, 22.0, 10.0, 15.0, 12.0, 7.0, 5.0, 1.0, 7.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002485930919647217, -0.0023978641256690025, -0.0023097973316907883, -0.002221730537712574, -0.0021336637437343597, -0.0020455969497561455, -0.001957530155777931, -0.001869463361799717, -0.0017813965678215027, -0.0016933297738432884, -0.0016052629798650742, -0.00151719618588686, -0.0014291293919086456, -0.0013410625979304314, -0.001252995803952217, -0.0011649290099740028, -0.0010768622159957886, -0.0009887954220175743, -0.00090072862803936, -0.0008126618340611458, -0.0007245950400829315, -0.0006365282461047173, -0.000548461452126503, -0.0004603946581482887, -0.00037232786417007446, -0.0002842610701918602, -0.00019619427621364594, -0.00010812748223543167, -2.0060688257217407e-05, 6.800610572099686e-05, 0.00015607289969921112, 0.00024413969367742538, 0.00033220648765563965, 0.0004202732816338539, 0.0005083400756120682, 0.0005964068695902824, 0.0006844736635684967, 0.000772540457546711, 0.0008606072515249252, 0.0009486740455031395, 0.0010367408394813538, 0.001124807633459568, 0.0012128744274377823, 0.0013009412214159966, 0.0013890080153942108, 0.001477074809372425, 0.0015651416033506393, 0.0016532083973288536, 0.0017412751913070679, 0.0018293419852852821, 0.0019174087792634964, 0.0020054755732417107, 0.002093542367219925, 0.002181609161198139, 0.0022696759551763535, 0.0023577427491545677, 0.002445809543132782, 0.0025338763371109962, 0.0026219431310892105, 0.0027100099250674248, 0.002798076719045639, 0.0028861435130238533, 0.0029742103070020676, 0.003062277100980282, 0.003150343894958496]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 7.0, 6.0, 11.0, 7.0, 11.0, 21.0, 19.0, 12.0, 21.0, 15.0, 22.0, 22.0, 28.0, 36.0, 40.0, 40.0, 37.0, 38.0, 34.0, 46.0, 44.0, 58.0, 33.0, 31.0, 35.0, 30.0, 31.0, 35.0, 44.0, 19.0, 31.0, 20.0, 19.0, 17.0, 14.0, 9.0, 8.0, 14.0, 11.0, 5.0, 6.0, 8.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.08984375, -3.94647216796875, -3.8031005859375, -3.65972900390625, -3.516357421875, -3.37298583984375, -3.2296142578125, -3.08624267578125, -2.94287109375, -2.79949951171875, -2.6561279296875, -2.51275634765625, -2.369384765625, -2.22601318359375, -2.0826416015625, -1.93927001953125, -1.7958984375, -1.65252685546875, -1.5091552734375, -1.36578369140625, -1.222412109375, -1.07904052734375, -0.9356689453125, -0.79229736328125, -0.64892578125, -0.50555419921875, -0.3621826171875, -0.21881103515625, -0.075439453125, 0.06793212890625, 0.2113037109375, 0.35467529296875, 0.498046875, 0.64141845703125, 0.7847900390625, 0.92816162109375, 1.071533203125, 1.21490478515625, 1.3582763671875, 1.50164794921875, 1.64501953125, 1.78839111328125, 1.9317626953125, 2.07513427734375, 2.218505859375, 2.36187744140625, 2.5052490234375, 2.64862060546875, 2.7919921875, 2.93536376953125, 3.0787353515625, 3.22210693359375, 3.365478515625, 3.50885009765625, 3.6522216796875, 3.79559326171875, 3.93896484375, 4.08233642578125, 4.2257080078125, 4.36907958984375, 4.512451171875, 4.65582275390625, 4.7991943359375, 4.94256591796875, 5.0859375]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 6.0, 8.0, 16.0, 17.0, 22.0, 26.0, 43.0, 40.0, 47.0, 89.0, 117.0, 186.0, 233.0, 297.0, 473.0, 701.0, 1161.0, 2267.0, 5139.0, 13790.0, 41392.0, 130940.0, 344971.0, 326684.0, 119013.0, 37912.0, 12592.0, 4909.0, 2157.0, 1158.0, 614.0, 436.0, 281.0, 199.0, 165.0, 106.0, 95.0, 66.0, 59.0, 45.0, 24.0, 16.0, 9.0, 7.0, 6.0, 6.0, 5.0, 4.0, 6.0, 2.0, 0.0, 2.0], "bins": [-6.66796875, -6.47723388671875, -6.2864990234375, -6.09576416015625, -5.905029296875, -5.71429443359375, -5.5235595703125, -5.33282470703125, -5.14208984375, -4.95135498046875, -4.7606201171875, -4.56988525390625, -4.379150390625, -4.18841552734375, -3.9976806640625, -3.80694580078125, -3.6162109375, -3.42547607421875, -3.2347412109375, -3.04400634765625, -2.853271484375, -2.66253662109375, -2.4718017578125, -2.28106689453125, -2.09033203125, -1.89959716796875, -1.7088623046875, -1.51812744140625, -1.327392578125, -1.13665771484375, -0.9459228515625, -0.75518798828125, -0.564453125, -0.37371826171875, -0.1829833984375, 0.00775146484375, 0.198486328125, 0.38922119140625, 0.5799560546875, 0.77069091796875, 0.96142578125, 1.15216064453125, 1.3428955078125, 1.53363037109375, 1.724365234375, 1.91510009765625, 2.1058349609375, 2.29656982421875, 2.4873046875, 2.67803955078125, 2.8687744140625, 3.05950927734375, 3.250244140625, 3.44097900390625, 3.6317138671875, 3.82244873046875, 4.01318359375, 4.20391845703125, 4.3946533203125, 4.58538818359375, 4.776123046875, 4.96685791015625, 5.1575927734375, 5.34832763671875, 5.5390625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 3.0, 7.0, 5.0, 9.0, 22.0, 8.0, 16.0, 16.0, 6.0, 11.0, 15.0, 12.0, 35.0, 24.0, 35.0, 33.0, 46.0, 42.0, 78.0, 101.0, 166.0, 280.0, 1362.0, 180.0, 113.0, 58.0, 53.0, 37.0, 33.0, 35.0, 19.0, 24.0, 29.0, 15.0, 19.0, 18.0, 13.0, 8.0, 9.0, 10.0, 6.0, 8.0, 5.0, 6.0, 4.0, 5.0, 5.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-11.0, -10.67724609375, -10.3544921875, -10.03173828125, -9.708984375, -9.38623046875, -9.0634765625, -8.74072265625, -8.41796875, -8.09521484375, -7.7724609375, -7.44970703125, -7.126953125, -6.80419921875, -6.4814453125, -6.15869140625, -5.8359375, -5.51318359375, -5.1904296875, -4.86767578125, -4.544921875, -4.22216796875, -3.8994140625, -3.57666015625, -3.25390625, -2.93115234375, -2.6083984375, -2.28564453125, -1.962890625, -1.64013671875, -1.3173828125, -0.99462890625, -0.671875, -0.34912109375, -0.0263671875, 0.29638671875, 0.619140625, 0.94189453125, 1.2646484375, 1.58740234375, 1.91015625, 2.23291015625, 2.5556640625, 2.87841796875, 3.201171875, 3.52392578125, 3.8466796875, 4.16943359375, 4.4921875, 4.81494140625, 5.1376953125, 5.46044921875, 5.783203125, 6.10595703125, 6.4287109375, 6.75146484375, 7.07421875, 7.39697265625, 7.7197265625, 8.04248046875, 8.365234375, 8.68798828125, 9.0107421875, 9.33349609375, 9.65625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 6.0, 5.0, 8.0, 8.0, 10.0, 7.0, 19.0, 30.0, 42.0, 49.0, 69.0, 101.0, 147.0, 183.0, 309.0, 512.0, 966.0, 3650.0, 231762.0, 2882535.0, 21741.0, 1689.0, 648.0, 363.0, 241.0, 178.0, 115.0, 102.0, 53.0, 41.0, 39.0, 20.0, 13.0, 17.0, 10.0, 6.0, 4.0, 4.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.703125, -23.912841796875, -23.12255859375, -22.332275390625, -21.5419921875, -20.751708984375, -19.96142578125, -19.171142578125, -18.380859375, -17.590576171875, -16.80029296875, -16.010009765625, -15.2197265625, -14.429443359375, -13.63916015625, -12.848876953125, -12.05859375, -11.268310546875, -10.47802734375, -9.687744140625, -8.8974609375, -8.107177734375, -7.31689453125, -6.526611328125, -5.736328125, -4.946044921875, -4.15576171875, -3.365478515625, -2.5751953125, -1.784912109375, -0.99462890625, -0.204345703125, 0.5859375, 1.376220703125, 2.16650390625, 2.956787109375, 3.7470703125, 4.537353515625, 5.32763671875, 6.117919921875, 6.908203125, 7.698486328125, 8.48876953125, 9.279052734375, 10.0693359375, 10.859619140625, 11.64990234375, 12.440185546875, 13.23046875, 14.020751953125, 14.81103515625, 15.601318359375, 16.3916015625, 17.181884765625, 17.97216796875, 18.762451171875, 19.552734375, 20.343017578125, 21.13330078125, 21.923583984375, 22.7138671875, 23.504150390625, 24.29443359375, 25.084716796875, 25.875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 125.0, 611.0, 257.0, 18.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-141.9075469970703, -138.8685760498047, -135.82958984375, -132.79061889648438, -129.75164794921875, -126.7126693725586, -123.67369079589844, -120.63471984863281, -117.59574127197266, -114.5567626953125, -111.51779174804688, -108.47881317138672, -105.43983459472656, -102.40086364746094, -99.36188507080078, -96.32290649414062, -93.283935546875, -90.24495697021484, -87.20598602294922, -84.16700744628906, -81.12803649902344, -78.08905792236328, -75.05007934570312, -72.0111083984375, -68.97212982177734, -65.93315124511719, -62.89418029785156, -59.855201721191406, -56.816226959228516, -53.777252197265625, -50.73827362060547, -47.69929885864258, -44.66033172607422, -41.62135696411133, -38.58238220214844, -35.54340362548828, -32.50442886352539, -29.4654541015625, -26.426477432250977, -23.387500762939453, -20.348526000976562, -17.309551239013672, -14.270574569702148, -11.231598854064941, -8.192623138427734, -5.153647422790527, -2.1146717071533203, 0.9243049621582031, 3.9632797241210938, 7.002255439758301, 10.041231155395508, 13.080206871032715, 16.119182586669922, 19.158157348632812, 22.197134017944336, 25.23611068725586, 28.27508544921875, 31.31406021118164, 34.35303497314453, 37.39201354980469, 40.43098831176758, 43.46996307373047, 46.508941650390625, 49.547916412353516, 52.586891174316406]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 5.0, 3.0, 6.0, 2.0, 4.0, 5.0, 9.0, 13.0, 11.0, 15.0, 18.0, 24.0, 15.0, 21.0, 24.0, 38.0, 28.0, 46.0, 34.0, 33.0, 35.0, 41.0, 39.0, 45.0, 32.0, 44.0, 42.0, 31.0, 33.0, 44.0, 33.0, 31.0, 28.0, 25.0, 26.0, 24.0, 19.0, 21.0, 13.0, 9.0, 14.0, 13.0, 7.0, 5.0, 7.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.42733383178711, -22.633399963378906, -21.839466094970703, -21.0455322265625, -20.251598358154297, -19.457664489746094, -18.66373062133789, -17.869796752929688, -17.075862884521484, -16.28192901611328, -15.487995147705078, -14.694061279296875, -13.900127410888672, -13.106193542480469, -12.312259674072266, -11.518325805664062, -10.724392890930176, -9.930459022521973, -9.13652515411377, -8.342591285705566, -7.548657417297363, -6.75472354888916, -5.960790157318115, -5.166856288909912, -4.372922420501709, -3.578988552093506, -2.7850546836853027, -1.9911210536956787, -1.1971871852874756, -0.40325331687927246, 0.39068031311035156, 1.1846141815185547, 1.9785480499267578, 2.772481918334961, 3.566415786743164, 4.360349655151367, 5.15428352355957, 5.948217391967773, 6.742150783538818, 7.5360846519470215, 8.330018997192383, 9.123952865600586, 9.917886734008789, 10.711820602416992, 11.505754470825195, 12.299688339233398, 13.093622207641602, 13.887556076049805, 14.681488990783691, 15.475422859191895, 16.26935577392578, 17.063289642333984, 17.857223510742188, 18.65115737915039, 19.445091247558594, 20.239025115966797, 21.032958984375, 21.826892852783203, 22.620826721191406, 23.41476058959961, 24.208694458007812, 25.002628326416016, 25.79656219482422, 26.590496063232422, 27.384429931640625]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 4.0, 4.0, 6.0, 10.0, 13.0, 12.0, 10.0, 15.0, 13.0, 24.0, 24.0, 16.0, 24.0, 26.0, 34.0, 29.0, 38.0, 38.0, 45.0, 43.0, 39.0, 58.0, 51.0, 40.0, 35.0, 37.0, 29.0, 33.0, 28.0, 29.0, 26.0, 31.0, 25.0, 12.0, 17.0, 13.0, 10.0, 9.0, 10.0, 11.0, 9.0, 4.0, 4.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-4.57421875, -4.42938232421875, -4.2845458984375, -4.13970947265625, -3.994873046875, -3.85003662109375, -3.7052001953125, -3.56036376953125, -3.41552734375, -3.27069091796875, -3.1258544921875, -2.98101806640625, -2.836181640625, -2.69134521484375, -2.5465087890625, -2.40167236328125, -2.2568359375, -2.11199951171875, -1.9671630859375, -1.82232666015625, -1.677490234375, -1.53265380859375, -1.3878173828125, -1.24298095703125, -1.09814453125, -0.95330810546875, -0.8084716796875, -0.66363525390625, -0.518798828125, -0.37396240234375, -0.2291259765625, -0.08428955078125, 0.060546875, 0.20538330078125, 0.3502197265625, 0.49505615234375, 0.639892578125, 0.78472900390625, 0.9295654296875, 1.07440185546875, 1.21923828125, 1.36407470703125, 1.5089111328125, 1.65374755859375, 1.798583984375, 1.94342041015625, 2.0882568359375, 2.23309326171875, 2.3779296875, 2.52276611328125, 2.6676025390625, 2.81243896484375, 2.957275390625, 3.10211181640625, 3.2469482421875, 3.39178466796875, 3.53662109375, 3.68145751953125, 3.8262939453125, 3.97113037109375, 4.115966796875, 4.26080322265625, 4.4056396484375, 4.55047607421875, 4.6953125]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 2.0, 6.0, 5.0, 4.0, 6.0, 5.0, 6.0, 13.0, 11.0, 7.0, 17.0, 19.0, 17.0, 36.0, 31.0, 33.0, 51.0, 82.0, 100.0, 136.0, 164.0, 231.0, 288.0, 462.0, 1648.0, 4062382.0, 126181.0, 734.0, 405.0, 304.0, 251.0, 172.0, 107.0, 92.0, 64.0, 53.0, 18.0, 40.0, 26.0, 21.0, 17.0, 16.0, 8.0, 1.0, 8.0, 4.0, 7.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.46875, -54.57373046875, -52.6787109375, -50.78369140625, -48.888671875, -46.99365234375, -45.0986328125, -43.20361328125, -41.30859375, -39.41357421875, -37.5185546875, -35.62353515625, -33.728515625, -31.83349609375, -29.9384765625, -28.04345703125, -26.1484375, -24.25341796875, -22.3583984375, -20.46337890625, -18.568359375, -16.67333984375, -14.7783203125, -12.88330078125, -10.98828125, -9.09326171875, -7.1982421875, -5.30322265625, -3.408203125, -1.51318359375, 0.3818359375, 2.27685546875, 4.171875, 6.06689453125, 7.9619140625, 9.85693359375, 11.751953125, 13.64697265625, 15.5419921875, 17.43701171875, 19.33203125, 21.22705078125, 23.1220703125, 25.01708984375, 26.912109375, 28.80712890625, 30.7021484375, 32.59716796875, 34.4921875, 36.38720703125, 38.2822265625, 40.17724609375, 42.072265625, 43.96728515625, 45.8623046875, 47.75732421875, 49.65234375, 51.54736328125, 53.4423828125, 55.33740234375, 57.232421875, 59.12744140625, 61.0224609375, 62.91748046875, 64.8125]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 3.0, 8.0, 4.0, 2.0, 6.0, 9.0, 8.0, 10.0, 17.0, 19.0, 20.0, 34.0, 39.0, 36.0, 79.0, 90.0, 128.0, 178.0, 227.0, 333.0, 415.0, 518.0, 467.0, 371.0, 273.0, 192.0, 151.0, 101.0, 75.0, 58.0, 43.0, 32.0, 39.0, 25.0, 12.0, 12.0, 11.0, 5.0, 5.0, 4.0, 6.0, 3.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-7.0546875, -6.85693359375, -6.6591796875, -6.46142578125, -6.263671875, -6.06591796875, -5.8681640625, -5.67041015625, -5.47265625, -5.27490234375, -5.0771484375, -4.87939453125, -4.681640625, -4.48388671875, -4.2861328125, -4.08837890625, -3.890625, -3.69287109375, -3.4951171875, -3.29736328125, -3.099609375, -2.90185546875, -2.7041015625, -2.50634765625, -2.30859375, -2.11083984375, -1.9130859375, -1.71533203125, -1.517578125, -1.31982421875, -1.1220703125, -0.92431640625, -0.7265625, -0.52880859375, -0.3310546875, -0.13330078125, 0.064453125, 0.26220703125, 0.4599609375, 0.65771484375, 0.85546875, 1.05322265625, 1.2509765625, 1.44873046875, 1.646484375, 1.84423828125, 2.0419921875, 2.23974609375, 2.4375, 2.63525390625, 2.8330078125, 3.03076171875, 3.228515625, 3.42626953125, 3.6240234375, 3.82177734375, 4.01953125, 4.21728515625, 4.4150390625, 4.61279296875, 4.810546875, 5.00830078125, 5.2060546875, 5.40380859375, 5.6015625]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 8.0, 8.0, 5.0, 5.0, 7.0, 7.0, 15.0, 25.0, 15.0, 25.0, 48.0, 47.0, 67.0, 123.0, 248.0, 1064.0, 33329.0, 4035742.0, 120849.0, 1848.0, 338.0, 139.0, 75.0, 53.0, 39.0, 36.0, 24.0, 24.0, 15.0, 10.0, 14.0, 12.0, 4.0, 6.0, 4.0, 5.0, 0.0, 2.0, 2.0, 4.0, 1.0], "bins": [-44.8125, -43.709228515625, -42.60595703125, -41.502685546875, -40.3994140625, -39.296142578125, -38.19287109375, -37.089599609375, -35.986328125, -34.883056640625, -33.77978515625, -32.676513671875, -31.5732421875, -30.469970703125, -29.36669921875, -28.263427734375, -27.16015625, -26.056884765625, -24.95361328125, -23.850341796875, -22.7470703125, -21.643798828125, -20.54052734375, -19.437255859375, -18.333984375, -17.230712890625, -16.12744140625, -15.024169921875, -13.9208984375, -12.817626953125, -11.71435546875, -10.611083984375, -9.5078125, -8.404541015625, -7.30126953125, -6.197998046875, -5.0947265625, -3.991455078125, -2.88818359375, -1.784912109375, -0.681640625, 0.421630859375, 1.52490234375, 2.628173828125, 3.7314453125, 4.834716796875, 5.93798828125, 7.041259765625, 8.14453125, 9.247802734375, 10.35107421875, 11.454345703125, 12.5576171875, 13.660888671875, 14.76416015625, 15.867431640625, 16.970703125, 18.073974609375, 19.17724609375, 20.280517578125, 21.3837890625, 22.487060546875, 23.59033203125, 24.693603515625, 25.796875]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 20.0, 29.0, 46.0, 65.0, 95.0, 110.0, 134.0, 134.0, 121.0, 102.0, 61.0, 34.0, 26.0, 11.0, 7.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.66743087768555, -33.81975173950195, -32.97207260131836, -32.124393463134766, -31.27671241760254, -30.429031372070312, -29.58135223388672, -28.733673095703125, -27.88599395751953, -27.038314819335938, -26.19063377380371, -25.342954635620117, -24.495275497436523, -23.647594451904297, -22.799915313720703, -21.95223617553711, -21.104557037353516, -20.256877899169922, -19.409196853637695, -18.5615177154541, -17.713838577270508, -16.86615753173828, -16.018478393554688, -15.170799255371094, -14.323118209838867, -13.475438117980957, -12.627758979797363, -11.780078887939453, -10.93239974975586, -10.08471965789795, -9.237039566040039, -8.389360427856445, -7.541681289672852, -6.6940016746521, -5.846322059631348, -4.9986419677734375, -4.150962829589844, -3.3032827377319336, -2.4556031227111816, -1.6079235076904297, -0.7602438926696777, 0.087435781955719, 0.9351154565811157, 1.7827951908111572, 2.630474805831909, 3.4781546592712402, 4.325834274291992, 5.173513889312744, 6.021193504333496, 6.868873119354248, 7.716552734375, 8.56423282623291, 9.411911964416504, 10.259592056274414, 11.107271194458008, 11.954951286315918, 12.802631378173828, 13.650311470031738, 14.497990608215332, 15.345670700073242, 16.193349838256836, 17.041030883789062, 17.888710021972656, 18.73638916015625, 19.584068298339844]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 8.0, 0.0, 5.0, 4.0, 7.0, 10.0, 9.0, 9.0, 8.0, 11.0, 17.0, 15.0, 11.0, 27.0, 27.0, 24.0, 29.0, 30.0, 35.0, 40.0, 41.0, 38.0, 28.0, 36.0, 47.0, 42.0, 38.0, 47.0, 24.0, 33.0, 37.0, 41.0, 28.0, 27.0, 26.0, 24.0, 18.0, 16.0, 14.0, 16.0, 12.0, 11.0, 8.0, 14.0, 8.0, 4.0, 2.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.676345825195312, -18.025131225585938, -17.373916625976562, -16.722702026367188, -16.071487426757812, -15.420272827148438, -14.769057273864746, -14.117842674255371, -13.466628074645996, -12.815413475036621, -12.164198875427246, -11.512984275817871, -10.86176872253418, -10.210554122924805, -9.55933952331543, -8.908124923706055, -8.25691032409668, -7.605695724487305, -6.95448112487793, -6.3032660484313965, -5.6520514488220215, -5.0008368492126465, -4.349621772766113, -3.6984071731567383, -3.0471925735473633, -2.3959779739379883, -1.7447631359100342, -1.0935484170913696, -0.4423336982727051, 0.20888090133666992, 0.860095739364624, 1.5113105773925781, 2.162525177001953, 2.813739776611328, 3.4649546146392822, 4.116169452667236, 4.767384052276611, 5.418598651885986, 6.0698137283325195, 6.7210283279418945, 7.3722429275512695, 8.023457527160645, 8.67467212677002, 9.325886726379395, 9.977102279663086, 10.628316879272461, 11.279531478881836, 11.930746078491211, 12.581960678100586, 13.233175277709961, 13.884389877319336, 14.535604476928711, 15.186819076538086, 15.838033676147461, 16.489248275756836, 17.140464782714844, 17.79167938232422, 18.442893981933594, 19.09410858154297, 19.745323181152344, 20.39653778076172, 21.047752380371094, 21.69896697998047, 22.350181579589844, 23.00139617919922]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 3.0, 6.0, 7.0, 11.0, 14.0, 23.0, 16.0, 16.0, 20.0, 24.0, 26.0, 40.0, 33.0, 46.0, 47.0, 33.0, 54.0, 38.0, 59.0, 43.0, 53.0, 41.0, 41.0, 41.0, 34.0, 33.0, 24.0, 29.0, 24.0, 20.0, 18.0, 16.0, 11.0, 10.0, 13.0, 11.0, 9.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.3828125, -5.22418212890625, -5.0655517578125, -4.90692138671875, -4.748291015625, -4.58966064453125, -4.4310302734375, -4.27239990234375, -4.11376953125, -3.95513916015625, -3.7965087890625, -3.63787841796875, -3.479248046875, -3.32061767578125, -3.1619873046875, -3.00335693359375, -2.8447265625, -2.68609619140625, -2.5274658203125, -2.36883544921875, -2.210205078125, -2.05157470703125, -1.8929443359375, -1.73431396484375, -1.57568359375, -1.41705322265625, -1.2584228515625, -1.09979248046875, -0.941162109375, -0.78253173828125, -0.6239013671875, -0.46527099609375, -0.306640625, -0.14801025390625, 0.0106201171875, 0.16925048828125, 0.327880859375, 0.48651123046875, 0.6451416015625, 0.80377197265625, 0.96240234375, 1.12103271484375, 1.2796630859375, 1.43829345703125, 1.596923828125, 1.75555419921875, 1.9141845703125, 2.07281494140625, 2.2314453125, 2.39007568359375, 2.5487060546875, 2.70733642578125, 2.865966796875, 3.02459716796875, 3.1832275390625, 3.34185791015625, 3.50048828125, 3.65911865234375, 3.8177490234375, 3.97637939453125, 4.135009765625, 4.29364013671875, 4.4522705078125, 4.61090087890625, 4.76953125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 13.0, 7.0, 14.0, 28.0, 39.0, 51.0, 68.0, 93.0, 152.0, 251.0, 337.0, 537.0, 739.0, 1186.0, 1764.0, 2736.0, 4255.0, 6630.0, 10273.0, 17034.0, 27752.0, 48423.0, 87994.0, 168047.0, 256930.0, 183981.0, 96908.0, 52713.0, 30347.0, 18013.0, 11174.0, 7002.0, 4531.0, 2863.0, 1911.0, 1234.0, 861.0, 540.0, 361.0, 239.0, 173.0, 123.0, 70.0, 47.0, 37.0, 26.0, 16.0, 13.0, 8.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0], "bins": [-0.58203125, -0.5641632080078125, -0.546295166015625, -0.5284271240234375, -0.51055908203125, -0.4926910400390625, -0.474822998046875, -0.4569549560546875, -0.4390869140625, -0.4212188720703125, -0.403350830078125, -0.3854827880859375, -0.36761474609375, -0.3497467041015625, -0.331878662109375, -0.3140106201171875, -0.296142578125, -0.2782745361328125, -0.260406494140625, -0.2425384521484375, -0.22467041015625, -0.2068023681640625, -0.188934326171875, -0.1710662841796875, -0.1531982421875, -0.1353302001953125, -0.117462158203125, -0.0995941162109375, -0.08172607421875, -0.0638580322265625, -0.045989990234375, -0.0281219482421875, -0.01025390625, 0.0076141357421875, 0.025482177734375, 0.0433502197265625, 0.06121826171875, 0.0790863037109375, 0.096954345703125, 0.1148223876953125, 0.1326904296875, 0.1505584716796875, 0.168426513671875, 0.1862945556640625, 0.20416259765625, 0.2220306396484375, 0.239898681640625, 0.2577667236328125, 0.275634765625, 0.2935028076171875, 0.311370849609375, 0.3292388916015625, 0.34710693359375, 0.3649749755859375, 0.382843017578125, 0.4007110595703125, 0.4185791015625, 0.4364471435546875, 0.454315185546875, 0.4721832275390625, 0.49005126953125, 0.5079193115234375, 0.525787353515625, 0.5436553955078125, 0.5615234375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 5.0, 4.0, 1.0, 2.0, 6.0, 6.0, 8.0, 14.0, 7.0, 17.0, 17.0, 19.0, 26.0, 16.0, 22.0, 30.0, 30.0, 31.0, 37.0, 31.0, 43.0, 37.0, 51.0, 45.0, 1064.0, 49.0, 38.0, 34.0, 41.0, 39.0, 23.0, 31.0, 34.0, 27.0, 23.0, 20.0, 19.0, 21.0, 13.0, 15.0, 5.0, 11.0, 9.0, 10.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.94921875, -2.854949951171875, -2.76068115234375, -2.666412353515625, -2.5721435546875, -2.477874755859375, -2.38360595703125, -2.289337158203125, -2.195068359375, -2.100799560546875, -2.00653076171875, -1.912261962890625, -1.8179931640625, -1.723724365234375, -1.62945556640625, -1.535186767578125, -1.44091796875, -1.346649169921875, -1.25238037109375, -1.158111572265625, -1.0638427734375, -0.969573974609375, -0.87530517578125, -0.781036376953125, -0.686767578125, -0.592498779296875, -0.49822998046875, -0.403961181640625, -0.3096923828125, -0.215423583984375, -0.12115478515625, -0.026885986328125, 0.0673828125, 0.161651611328125, 0.25592041015625, 0.350189208984375, 0.4444580078125, 0.538726806640625, 0.63299560546875, 0.727264404296875, 0.821533203125, 0.915802001953125, 1.01007080078125, 1.104339599609375, 1.1986083984375, 1.292877197265625, 1.38714599609375, 1.481414794921875, 1.57568359375, 1.669952392578125, 1.76422119140625, 1.858489990234375, 1.9527587890625, 2.047027587890625, 2.14129638671875, 2.235565185546875, 2.329833984375, 2.424102783203125, 2.51837158203125, 2.612640380859375, 2.7069091796875, 2.801177978515625, 2.89544677734375, 2.989715576171875, 3.083984375]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 2.0, 1.0, 10.0, 11.0, 14.0, 21.0, 31.0, 51.0, 77.0, 98.0, 148.0, 229.0, 358.0, 483.0, 686.0, 1055.0, 1641.0, 2334.0, 3644.0, 5458.0, 8392.0, 12645.0, 19546.0, 30559.0, 48061.0, 79099.0, 133509.0, 1201122.0, 240482.0, 117041.0, 69338.0, 42656.0, 26931.0, 17809.0, 11510.0, 7567.0, 4900.0, 3322.0, 2132.0, 1399.0, 913.0, 624.0, 400.0, 254.0, 178.0, 137.0, 82.0, 61.0, 39.0, 30.0, 14.0, 10.0, 7.0, 6.0, 7.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.404541015625, -0.3914375305175781, -0.37833404541015625, -0.3652305603027344, -0.3521270751953125, -0.3390235900878906, -0.32592010498046875, -0.3128166198730469, -0.299713134765625, -0.2866096496582031, -0.27350616455078125, -0.2604026794433594, -0.2472991943359375, -0.23419570922851562, -0.22109222412109375, -0.20798873901367188, -0.19488525390625, -0.18178176879882812, -0.16867828369140625, -0.15557479858398438, -0.1424713134765625, -0.12936782836914062, -0.11626434326171875, -0.10316085815429688, -0.090057373046875, -0.07695388793945312, -0.06385040283203125, -0.050746917724609375, -0.0376434326171875, -0.024539947509765625, -0.01143646240234375, 0.001667022705078125, 0.0147705078125, 0.027873992919921875, 0.04097747802734375, 0.054080963134765625, 0.0671844482421875, 0.08028793334960938, 0.09339141845703125, 0.10649490356445312, 0.119598388671875, 0.13270187377929688, 0.14580535888671875, 0.15890884399414062, 0.1720123291015625, 0.18511581420898438, 0.19821929931640625, 0.21132278442382812, 0.22442626953125, 0.23752975463867188, 0.25063323974609375, 0.2637367248535156, 0.2768402099609375, 0.2899436950683594, 0.30304718017578125, 0.3161506652832031, 0.329254150390625, 0.3423576354980469, 0.35546112060546875, 0.3685646057128906, 0.3816680908203125, 0.3947715759277344, 0.40787506103515625, 0.4209785461425781, 0.43408203125]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 3.0, 3.0, 8.0, 3.0, 4.0, 7.0, 15.0, 12.0, 20.0, 14.0, 21.0, 26.0, 39.0, 45.0, 84.0, 115.0, 139.0, 127.0, 88.0, 56.0, 25.0, 18.0, 23.0, 10.0, 19.0, 16.0, 9.0, 17.0, 9.0, 6.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.00799560546875, -0.007756650447845459, -0.007517695426940918, -0.007278740406036377, -0.007039785385131836, -0.006800830364227295, -0.006561875343322754, -0.006322920322418213, -0.006083965301513672, -0.005845010280609131, -0.00560605525970459, -0.005367100238800049, -0.005128145217895508, -0.004889190196990967, -0.004650235176086426, -0.004411280155181885, -0.004172325134277344, -0.003933370113372803, -0.0036944150924682617, -0.0034554600715637207, -0.0032165050506591797, -0.0029775500297546387, -0.0027385950088500977, -0.0024996399879455566, -0.0022606849670410156, -0.0020217299461364746, -0.0017827749252319336, -0.0015438199043273926, -0.0013048648834228516, -0.0010659098625183105, -0.0008269548416137695, -0.0005879998207092285, -0.0003490447998046875, -0.00011008977890014648, 0.00012886524200439453, 0.00036782026290893555, 0.0006067752838134766, 0.0008457303047180176, 0.0010846853256225586, 0.0013236403465270996, 0.0015625953674316406, 0.0018015503883361816, 0.0020405054092407227, 0.0022794604301452637, 0.0025184154510498047, 0.0027573704719543457, 0.0029963254928588867, 0.0032352805137634277, 0.0034742355346679688, 0.0037131905555725098, 0.003952145576477051, 0.004191100597381592, 0.004430055618286133, 0.004669010639190674, 0.004907965660095215, 0.005146920680999756, 0.005385875701904297, 0.005624830722808838, 0.005863785743713379, 0.00610274076461792, 0.006341695785522461, 0.006580650806427002, 0.006819605827331543, 0.007058560848236084, 0.007297515869140625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 3.0, 2.0, 2.0, 3.0, 2.0, 13.0, 21.0, 25.0, 36.0, 35.0, 49.0, 45.0, 67.0, 93.0, 163.0, 368.0, 713.0, 13084.0, 1031042.0, 1493.0, 491.0, 242.0, 158.0, 98.0, 59.0, 53.0, 42.0, 33.0, 21.0, 17.0, 11.0, 8.0, 7.0, 9.0, 7.0, 7.0, 5.0, 5.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0], "bins": [-0.1318359375, -0.12748146057128906, -0.12312698364257812, -0.11877250671386719, -0.11441802978515625, -0.11006355285644531, -0.10570907592773438, -0.10135459899902344, -0.0970001220703125, -0.09264564514160156, -0.08829116821289062, -0.08393669128417969, -0.07958221435546875, -0.07522773742675781, -0.07087326049804688, -0.06651878356933594, -0.062164306640625, -0.05780982971191406, -0.053455352783203125, -0.04910087585449219, -0.04474639892578125, -0.04039192199707031, -0.036037445068359375, -0.03168296813964844, -0.0273284912109375, -0.022974014282226562, -0.018619537353515625, -0.014265060424804688, -0.00991058349609375, -0.0055561065673828125, -0.001201629638671875, 0.0031528472900390625, 0.00750732421875, 0.011861801147460938, 0.016216278076171875, 0.020570755004882812, 0.02492523193359375, 0.029279708862304688, 0.033634185791015625, 0.03798866271972656, 0.0423431396484375, 0.04669761657714844, 0.051052093505859375, 0.05540657043457031, 0.05976104736328125, 0.06411552429199219, 0.06847000122070312, 0.07282447814941406, 0.077178955078125, 0.08153343200683594, 0.08588790893554688, 0.09024238586425781, 0.09459686279296875, 0.09895133972167969, 0.10330581665039062, 0.10766029357910156, 0.1120147705078125, 0.11636924743652344, 0.12072372436523438, 0.1250782012939453, 0.12943267822265625, 0.1337871551513672, 0.13814163208007812, 0.14249610900878906, 0.1468505859375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 11.0, 267.0, 706.0, 29.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.03649342060089111, -0.03584413602948189, -0.03519485145807266, -0.034545570611953735, -0.03389628604054451, -0.033247001469135284, -0.03259771689772606, -0.031948432326316833, -0.031299151480197906, -0.03064986690878868, -0.030000584200024605, -0.02935129962861538, -0.028702016919851303, -0.028052732348442078, -0.027403447777032852, -0.026754165068268776, -0.0261048786342144, -0.025455594062805176, -0.0248063113540411, -0.024157026782631874, -0.023507744073867798, -0.022858459502458572, -0.022209174931049347, -0.02155989222228527, -0.020910609513521194, -0.02026132494211197, -0.019612042233347893, -0.018962757661938667, -0.01831347495317459, -0.017664190381765366, -0.01701490581035614, -0.016365623101592064, -0.01571633853018284, -0.015067054890096188, -0.014417771250009537, -0.013768486678600311, -0.01311920303851366, -0.01246991939842701, -0.011820635758340359, -0.011171352118253708, -0.010522067546844482, -0.009872783906757832, -0.00922350026667118, -0.008574215695261955, -0.007924932055175304, -0.0072756484150886536, -0.006626364775002003, -0.0059770806692540646, -0.005327797029167414, -0.004678513389080763, -0.004029229283332825, -0.003379945643246174, -0.0027306617703288794, -0.002081377897411585, -0.001432094257324934, -0.0007828101515769958, -0.000133526511490345, 0.0005157573032192886, 0.0011650411179289222, 0.0018143248744308949, 0.0024636087473481894, 0.003112892620265484, 0.0037621762603521347, 0.004411460366100073, 0.005060744006186724]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 6.0, 3.0, 5.0, 5.0, 8.0, 9.0, 10.0, 12.0, 15.0, 24.0, 19.0, 29.0, 33.0, 32.0, 31.0, 40.0, 40.0, 38.0, 48.0, 38.0, 36.0, 41.0, 54.0, 35.0, 54.0, 45.0, 36.0, 31.0, 24.0, 38.0, 26.0, 34.0, 19.0, 22.0, 19.0, 14.0, 9.0, 4.0, 7.0, 7.0, 9.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.004114091396331787, -0.00399754848331213, -0.003881005570292473, -0.0037644626572728157, -0.0036479197442531586, -0.0035313768312335014, -0.0034148339182138443, -0.003298291005194187, -0.00318174809217453, -0.003065205179154873, -0.0029486622661352158, -0.0028321193531155586, -0.0027155764400959015, -0.0025990335270762444, -0.0024824906140565872, -0.00236594770103693, -0.002249404788017273, -0.002132861874997616, -0.0020163189619779587, -0.0018997760489583015, -0.0017832331359386444, -0.0016666902229189873, -0.0015501473098993301, -0.001433604396879673, -0.0013170614838600159, -0.0012005185708403587, -0.0010839756578207016, -0.0009674327448010445, -0.0008508898317813873, -0.0007343469187617302, -0.0006178040057420731, -0.0005012610927224159, -0.0003847181797027588, -0.00026817526668310165, -0.00015163235366344452, -3.5089440643787384e-05, 8.145347237586975e-05, 0.00019799638539552689, 0.000314539298415184, 0.00043108221143484116, 0.0005476251244544983, 0.0006641680374741554, 0.0007807109504938126, 0.0008972538635134697, 0.0010137967765331268, 0.001130339689552784, 0.001246882602572441, 0.0013634255155920982, 0.0014799684286117554, 0.0015965113416314125, 0.0017130542546510696, 0.0018295971676707268, 0.001946140080690384, 0.002062682993710041, 0.002179225906729698, 0.0022957688197493553, 0.0024123117327690125, 0.0025288546457886696, 0.0026453975588083267, 0.002761940471827984, 0.002878483384847641, 0.002995026297867298, 0.0031115692108869553, 0.0032281121239066124, 0.0033446550369262695]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 6.0, 3.0, 6.0, 7.0, 10.0, 15.0, 23.0, 16.0, 16.0, 20.0, 24.0, 26.0, 41.0, 32.0, 46.0, 47.0, 33.0, 54.0, 38.0, 59.0, 43.0, 53.0, 41.0, 41.0, 41.0, 34.0, 33.0, 24.0, 29.0, 24.0, 20.0, 18.0, 16.0, 11.0, 10.0, 13.0, 11.0, 9.0, 5.0, 5.0, 4.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-5.3828125, -5.22418212890625, -5.0655517578125, -4.90692138671875, -4.748291015625, -4.58966064453125, -4.4310302734375, -4.27239990234375, -4.11376953125, -3.95513916015625, -3.7965087890625, -3.63787841796875, -3.479248046875, -3.32061767578125, -3.1619873046875, -3.00335693359375, -2.8447265625, -2.68609619140625, -2.5274658203125, -2.36883544921875, -2.210205078125, -2.05157470703125, -1.8929443359375, -1.73431396484375, -1.57568359375, -1.41705322265625, -1.2584228515625, -1.09979248046875, -0.941162109375, -0.78253173828125, -0.6239013671875, -0.46527099609375, -0.306640625, -0.14801025390625, 0.0106201171875, 0.16925048828125, 0.327880859375, 0.48651123046875, 0.6451416015625, 0.80377197265625, 0.96240234375, 1.12103271484375, 1.2796630859375, 1.43829345703125, 1.596923828125, 1.75555419921875, 1.9141845703125, 2.07281494140625, 2.2314453125, 2.39007568359375, 2.5487060546875, 2.70733642578125, 2.865966796875, 3.02459716796875, 3.1832275390625, 3.34185791015625, 3.50048828125, 3.65911865234375, 3.8177490234375, 3.97637939453125, 4.135009765625, 4.29364013671875, 4.4522705078125, 4.61090087890625, 4.76953125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 14.0, 11.0, 16.0, 26.0, 36.0, 51.0, 86.0, 84.0, 125.0, 158.0, 221.0, 309.0, 416.0, 548.0, 761.0, 1171.0, 1776.0, 3814.0, 21678.0, 176603.0, 604534.0, 200831.0, 25144.0, 4187.0, 1746.0, 1183.0, 777.0, 623.0, 449.0, 340.0, 236.0, 154.0, 122.0, 87.0, 59.0, 57.0, 40.0, 20.0, 14.0, 14.0, 3.0, 9.0, 12.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.484375, -10.162109375, -9.83984375, -9.517578125, -9.1953125, -8.873046875, -8.55078125, -8.228515625, -7.90625, -7.583984375, -7.26171875, -6.939453125, -6.6171875, -6.294921875, -5.97265625, -5.650390625, -5.328125, -5.005859375, -4.68359375, -4.361328125, -4.0390625, -3.716796875, -3.39453125, -3.072265625, -2.75, -2.427734375, -2.10546875, -1.783203125, -1.4609375, -1.138671875, -0.81640625, -0.494140625, -0.171875, 0.150390625, 0.47265625, 0.794921875, 1.1171875, 1.439453125, 1.76171875, 2.083984375, 2.40625, 2.728515625, 3.05078125, 3.373046875, 3.6953125, 4.017578125, 4.33984375, 4.662109375, 4.984375, 5.306640625, 5.62890625, 5.951171875, 6.2734375, 6.595703125, 6.91796875, 7.240234375, 7.5625, 7.884765625, 8.20703125, 8.529296875, 8.8515625, 9.173828125, 9.49609375, 9.818359375, 10.140625]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 7.0, 6.0, 2.0, 15.0, 11.0, 12.0, 9.0, 17.0, 23.0, 25.0, 34.0, 27.0, 39.0, 47.0, 56.0, 51.0, 85.0, 231.0, 1449.0, 332.0, 154.0, 94.0, 64.0, 44.0, 45.0, 35.0, 27.0, 19.0, 21.0, 17.0, 18.0, 7.0, 10.0, 6.0, 8.0, 3.0, 3.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.7734375, -12.3846435546875, -11.995849609375, -11.6070556640625, -11.21826171875, -10.8294677734375, -10.440673828125, -10.0518798828125, -9.6630859375, -9.2742919921875, -8.885498046875, -8.4967041015625, -8.10791015625, -7.7191162109375, -7.330322265625, -6.9415283203125, -6.552734375, -6.1639404296875, -5.775146484375, -5.3863525390625, -4.99755859375, -4.6087646484375, -4.219970703125, -3.8311767578125, -3.4423828125, -3.0535888671875, -2.664794921875, -2.2760009765625, -1.88720703125, -1.4984130859375, -1.109619140625, -0.7208251953125, -0.33203125, 0.0567626953125, 0.445556640625, 0.8343505859375, 1.22314453125, 1.6119384765625, 2.000732421875, 2.3895263671875, 2.7783203125, 3.1671142578125, 3.555908203125, 3.9447021484375, 4.33349609375, 4.7222900390625, 5.111083984375, 5.4998779296875, 5.888671875, 6.2774658203125, 6.666259765625, 7.0550537109375, 7.44384765625, 7.8326416015625, 8.221435546875, 8.6102294921875, 8.9990234375, 9.3878173828125, 9.776611328125, 10.1654052734375, 10.55419921875, 10.9429931640625, 11.331787109375, 11.7205810546875, 12.109375]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 2.0, 1.0, 6.0, 4.0, 6.0, 3.0, 3.0, 20.0, 14.0, 11.0, 20.0, 33.0, 45.0, 69.0, 97.0, 144.0, 225.0, 329.0, 551.0, 1267.0, 8232.0, 3128729.0, 3365.0, 1065.0, 535.0, 284.0, 190.0, 128.0, 77.0, 64.0, 49.0, 36.0, 23.0, 15.0, 11.0, 18.0, 5.0, 7.0, 4.0, 3.0, 6.0, 6.0, 2.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.4375, -43.8369140625, -42.236328125, -40.6357421875, -39.03515625, -37.4345703125, -35.833984375, -34.2333984375, -32.6328125, -31.0322265625, -29.431640625, -27.8310546875, -26.23046875, -24.6298828125, -23.029296875, -21.4287109375, -19.828125, -18.2275390625, -16.626953125, -15.0263671875, -13.42578125, -11.8251953125, -10.224609375, -8.6240234375, -7.0234375, -5.4228515625, -3.822265625, -2.2216796875, -0.62109375, 0.9794921875, 2.580078125, 4.1806640625, 5.78125, 7.3818359375, 8.982421875, 10.5830078125, 12.18359375, 13.7841796875, 15.384765625, 16.9853515625, 18.5859375, 20.1865234375, 21.787109375, 23.3876953125, 24.98828125, 26.5888671875, 28.189453125, 29.7900390625, 31.390625, 32.9912109375, 34.591796875, 36.1923828125, 37.79296875, 39.3935546875, 40.994140625, 42.5947265625, 44.1953125, 45.7958984375, 47.396484375, 48.9970703125, 50.59765625, 52.1982421875, 53.798828125, 55.3994140625, 57.0]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 29.0, 85.0, 185.0, 246.0, 259.0, 133.0, 48.0, 14.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-56.310787200927734, -55.0550537109375, -53.799320220947266, -52.5435905456543, -51.28785705566406, -50.03212356567383, -48.776390075683594, -47.52065658569336, -46.264923095703125, -45.00918960571289, -43.753456115722656, -42.49772644042969, -41.24199295043945, -39.98625946044922, -38.730525970458984, -37.47479248046875, -36.21906280517578, -34.96332931518555, -33.70759582519531, -32.451866149902344, -31.19613265991211, -29.940399169921875, -28.68466567993164, -27.428932189941406, -26.173200607299805, -24.91746711730957, -23.66173553466797, -22.406002044677734, -21.1502685546875, -19.8945369720459, -18.638803482055664, -17.383071899414062, -16.127338409423828, -14.87160587310791, -13.615873336791992, -12.360139846801758, -11.10440731048584, -9.848674774169922, -8.592941284179688, -7.3372087478637695, -6.081476211547852, -4.825743675231934, -3.5700106620788574, -2.3142778873443604, -1.0585451126098633, 0.1971874237060547, 1.4529204368591309, 2.708653450012207, 3.964385986328125, 5.220118522644043, 6.475851535797119, 7.731584548950195, 8.987317085266113, 10.243049621582031, 11.498783111572266, 12.754515647888184, 14.010248184204102, 15.26598072052002, 16.521713256835938, 17.777446746826172, 19.033180236816406, 20.288911819458008, 21.544645309448242, 22.800376892089844, 24.056110382080078]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 4.0, 4.0, 7.0, 4.0, 2.0, 14.0, 8.0, 12.0, 12.0, 23.0, 23.0, 20.0, 26.0, 33.0, 31.0, 46.0, 49.0, 42.0, 37.0, 43.0, 33.0, 49.0, 47.0, 47.0, 42.0, 49.0, 29.0, 30.0, 23.0, 22.0, 33.0, 31.0, 29.0, 18.0, 15.0, 10.0, 16.0, 9.0, 11.0, 9.0, 8.0, 2.0, 5.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.812789916992188, -24.927526473999023, -24.04226303100586, -23.157001495361328, -22.271738052368164, -21.386474609375, -20.50121307373047, -19.615949630737305, -18.73068618774414, -17.845422744750977, -16.960159301757812, -16.07489776611328, -15.189634323120117, -14.304370880126953, -13.419108390808105, -12.533845901489258, -11.648582458496094, -10.76331901550293, -9.878056526184082, -8.992794036865234, -8.10753059387207, -7.2222676277160645, -6.337004661560059, -5.451741695404053, -4.566478729248047, -3.681215763092041, -2.795952796936035, -1.9106898307800293, -1.0254268646240234, -0.14016389846801758, 0.7450990676879883, 1.6303620338439941, 2.515625, 3.400887966156006, 4.286150932312012, 5.171413898468018, 6.056676864624023, 6.941939830780029, 7.827202796936035, 8.712465286254883, 9.597728729248047, 10.482992172241211, 11.368254661560059, 12.253517150878906, 13.13878059387207, 14.024044036865234, 14.909306526184082, 15.79456901550293, 16.679832458496094, 17.565095901489258, 18.450359344482422, 19.335620880126953, 20.220884323120117, 21.10614776611328, 21.991409301757812, 22.876672744750977, 23.76193618774414, 24.647199630737305, 25.53246307373047, 26.417724609375, 27.302988052368164, 28.188251495361328, 29.07351303100586, 29.958776473999023, 30.844039916992188]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 5.0, 4.0, 8.0, 14.0, 17.0, 15.0, 14.0, 16.0, 16.0, 20.0, 13.0, 37.0, 29.0, 44.0, 37.0, 44.0, 45.0, 40.0, 73.0, 45.0, 32.0, 45.0, 56.0, 44.0, 27.0, 33.0, 30.0, 23.0, 25.0, 25.0, 23.0, 20.0, 11.0, 14.0, 11.0, 11.0, 14.0, 7.0, 7.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-5.22265625, -5.06268310546875, -4.9027099609375, -4.74273681640625, -4.582763671875, -4.42279052734375, -4.2628173828125, -4.10284423828125, -3.94287109375, -3.78289794921875, -3.6229248046875, -3.46295166015625, -3.302978515625, -3.14300537109375, -2.9830322265625, -2.82305908203125, -2.6630859375, -2.50311279296875, -2.3431396484375, -2.18316650390625, -2.023193359375, -1.86322021484375, -1.7032470703125, -1.54327392578125, -1.38330078125, -1.22332763671875, -1.0633544921875, -0.90338134765625, -0.743408203125, -0.58343505859375, -0.4234619140625, -0.26348876953125, -0.103515625, 0.05645751953125, 0.2164306640625, 0.37640380859375, 0.536376953125, 0.69635009765625, 0.8563232421875, 1.01629638671875, 1.17626953125, 1.33624267578125, 1.4962158203125, 1.65618896484375, 1.816162109375, 1.97613525390625, 2.1361083984375, 2.29608154296875, 2.4560546875, 2.61602783203125, 2.7760009765625, 2.93597412109375, 3.095947265625, 3.25592041015625, 3.4158935546875, 3.57586669921875, 3.73583984375, 3.89581298828125, 4.0557861328125, 4.21575927734375, 4.375732421875, 4.53570556640625, 4.6956787109375, 4.85565185546875, 5.015625]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 4.0, 5.0, 10.0, 8.0, 17.0, 22.0, 35.0, 33.0, 47.0, 99.0, 103.0, 159.0, 223.0, 282.0, 462.0, 727.0, 1199.0, 2414.0, 5491.0, 15756.0, 62922.0, 320062.0, 1279867.0, 1789632.0, 563748.0, 110919.0, 24928.0, 7704.0, 3264.0, 1575.0, 854.0, 570.0, 346.0, 240.0, 155.0, 134.0, 81.0, 56.0, 43.0, 32.0, 25.0, 10.0, 6.0, 6.0, 9.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-6.5234375, -6.30731201171875, -6.0911865234375, -5.87506103515625, -5.658935546875, -5.44281005859375, -5.2266845703125, -5.01055908203125, -4.79443359375, -4.57830810546875, -4.3621826171875, -4.14605712890625, -3.929931640625, -3.71380615234375, -3.4976806640625, -3.28155517578125, -3.0654296875, -2.84930419921875, -2.6331787109375, -2.41705322265625, -2.200927734375, -1.98480224609375, -1.7686767578125, -1.55255126953125, -1.33642578125, -1.12030029296875, -0.9041748046875, -0.68804931640625, -0.471923828125, -0.25579833984375, -0.0396728515625, 0.17645263671875, 0.392578125, 0.60870361328125, 0.8248291015625, 1.04095458984375, 1.257080078125, 1.47320556640625, 1.6893310546875, 1.90545654296875, 2.12158203125, 2.33770751953125, 2.5538330078125, 2.76995849609375, 2.986083984375, 3.20220947265625, 3.4183349609375, 3.63446044921875, 3.8505859375, 4.06671142578125, 4.2828369140625, 4.49896240234375, 4.715087890625, 4.93121337890625, 5.1473388671875, 5.36346435546875, 5.57958984375, 5.79571533203125, 6.0118408203125, 6.22796630859375, 6.444091796875, 6.66021728515625, 6.8763427734375, 7.09246826171875, 7.30859375]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 2.0, 9.0, 10.0, 13.0, 13.0, 26.0, 29.0, 55.0, 56.0, 94.0, 121.0, 169.0, 256.0, 345.0, 555.0, 599.0, 567.0, 334.0, 262.0, 152.0, 107.0, 77.0, 59.0, 44.0, 39.0, 28.0, 20.0, 12.0, 13.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-11.90625, -11.596923828125, -11.28759765625, -10.978271484375, -10.6689453125, -10.359619140625, -10.05029296875, -9.740966796875, -9.431640625, -9.122314453125, -8.81298828125, -8.503662109375, -8.1943359375, -7.885009765625, -7.57568359375, -7.266357421875, -6.95703125, -6.647705078125, -6.33837890625, -6.029052734375, -5.7197265625, -5.410400390625, -5.10107421875, -4.791748046875, -4.482421875, -4.173095703125, -3.86376953125, -3.554443359375, -3.2451171875, -2.935791015625, -2.62646484375, -2.317138671875, -2.0078125, -1.698486328125, -1.38916015625, -1.079833984375, -0.7705078125, -0.461181640625, -0.15185546875, 0.157470703125, 0.466796875, 0.776123046875, 1.08544921875, 1.394775390625, 1.7041015625, 2.013427734375, 2.32275390625, 2.632080078125, 2.94140625, 3.250732421875, 3.56005859375, 3.869384765625, 4.1787109375, 4.488037109375, 4.79736328125, 5.106689453125, 5.416015625, 5.725341796875, 6.03466796875, 6.343994140625, 6.6533203125, 6.962646484375, 7.27197265625, 7.581298828125, 7.890625]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 5.0, 1.0, 1.0, 3.0, 4.0, 10.0, 12.0, 17.0, 26.0, 43.0, 68.0, 104.0, 188.0, 316.0, 619.0, 1238.0, 3673.0, 25552.0, 586579.0, 3390204.0, 170427.0, 10736.0, 2367.0, 936.0, 485.0, 274.0, 141.0, 94.0, 59.0, 29.0, 29.0, 20.0, 13.0, 5.0, 7.0, 1.0, 3.0, 2.0, 0.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.140625, -15.590087890625, -15.03955078125, -14.489013671875, -13.9384765625, -13.387939453125, -12.83740234375, -12.286865234375, -11.736328125, -11.185791015625, -10.63525390625, -10.084716796875, -9.5341796875, -8.983642578125, -8.43310546875, -7.882568359375, -7.33203125, -6.781494140625, -6.23095703125, -5.680419921875, -5.1298828125, -4.579345703125, -4.02880859375, -3.478271484375, -2.927734375, -2.377197265625, -1.82666015625, -1.276123046875, -0.7255859375, -0.175048828125, 0.37548828125, 0.926025390625, 1.4765625, 2.027099609375, 2.57763671875, 3.128173828125, 3.6787109375, 4.229248046875, 4.77978515625, 5.330322265625, 5.880859375, 6.431396484375, 6.98193359375, 7.532470703125, 8.0830078125, 8.633544921875, 9.18408203125, 9.734619140625, 10.28515625, 10.835693359375, 11.38623046875, 11.936767578125, 12.4873046875, 13.037841796875, 13.58837890625, 14.138916015625, 14.689453125, 15.239990234375, 15.79052734375, 16.341064453125, 16.8916015625, 17.442138671875, 17.99267578125, 18.543212890625, 19.09375]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 46.0, 938.0, 31.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.70046997070312, -69.92110443115234, -57.14173889160156, -44.36237335205078, -31.5830078125, -18.80364227294922, -6.0242767333984375, 6.755088806152344, 19.534454345703125, 32.313819885253906, 45.09318542480469, 57.87255096435547, 70.65191650390625, 83.43128204345703, 96.21064758300781, 108.9900131225586, 121.76937866210938, 134.54873657226562, 147.32810974121094, 160.10748291015625, 172.8868408203125, 185.66619873046875, 198.44557189941406, 211.22494506835938, 224.00430297851562, 236.78366088867188, 249.5630340576172, 262.3424072265625, 275.12176513671875, 287.901123046875, 300.68048095703125, 313.4598693847656, 326.23919677734375, 339.0185546875, 351.79791259765625, 364.5773010253906, 377.3566589355469, 390.1360168457031, 402.9154052734375, 415.69476318359375, 428.47412109375, 441.25347900390625, 454.0328369140625, 466.8122253417969, 479.5915832519531, 492.3709411621094, 505.15032958984375, 517.9296875, 530.7090454101562, 543.4884033203125, 556.2677612304688, 569.047119140625, 581.8265380859375, 594.6058959960938, 607.38525390625, 620.1646118164062, 632.9439697265625, 645.7233276367188, 658.502685546875, 671.2820434570312, 684.0614013671875, 696.8408203125, 709.6201782226562, 722.3995361328125, 735.1788940429688]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 6.0, 5.0, 10.0, 5.0, 12.0, 23.0, 10.0, 24.0, 27.0, 24.0, 31.0, 35.0, 51.0, 44.0, 39.0, 49.0, 57.0, 48.0, 46.0, 48.0, 64.0, 37.0, 40.0, 39.0, 39.0, 29.0, 26.0, 26.0, 16.0, 19.0, 17.0, 10.0, 9.0, 10.0, 8.0, 12.0, 3.0, 2.0, 3.0, 0.0, 4.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-39.01042938232422, -37.89729690551758, -36.7841682434082, -35.67103576660156, -34.55790328979492, -33.44477081298828, -32.331642150878906, -31.218509674072266, -30.105379104614258, -28.99224853515625, -27.87911605834961, -26.7659854888916, -25.652854919433594, -24.539722442626953, -23.426591873168945, -22.313461303710938, -21.200328826904297, -20.08719825744629, -18.97406578063965, -17.86093521118164, -16.747802734375, -15.634672164916992, -14.521541595458984, -13.40841007232666, -12.295278549194336, -11.182147026062012, -10.069015502929688, -8.95588493347168, -7.8427534103393555, -6.729621887207031, -5.616490840911865, -4.503359794616699, -3.390228271484375, -2.27709698677063, -1.1639657020568848, -0.05083441734313965, 1.0622968673706055, 2.1754283905029297, 3.2885594367980957, 4.401690483093262, 5.514822006225586, 6.62795352935791, 7.741084575653076, 8.854215621948242, 9.967347145080566, 11.08047866821289, 12.193609237670898, 13.306740760803223, 14.419872283935547, 15.533003807067871, 16.646135330200195, 17.759265899658203, 18.872398376464844, 19.98552894592285, 21.09865951538086, 22.2117919921875, 23.324922561645508, 24.438053131103516, 25.551185607910156, 26.664316177368164, 27.777446746826172, 28.890579223632812, 30.00370979309082, 31.116840362548828, 32.22997283935547]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 6.0, 13.0, 7.0, 16.0, 13.0, 14.0, 17.0, 16.0, 15.0, 12.0, 18.0, 30.0, 29.0, 29.0, 31.0, 28.0, 36.0, 46.0, 41.0, 41.0, 43.0, 41.0, 33.0, 42.0, 41.0, 34.0, 32.0, 26.0, 23.0, 31.0, 23.0, 27.0, 18.0, 18.0, 11.0, 11.0, 16.0, 18.0, 12.0, 14.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-3.556640625, -3.44537353515625, -3.3341064453125, -3.22283935546875, -3.111572265625, -3.00030517578125, -2.8890380859375, -2.77777099609375, -2.66650390625, -2.55523681640625, -2.4439697265625, -2.33270263671875, -2.221435546875, -2.11016845703125, -1.9989013671875, -1.88763427734375, -1.7763671875, -1.66510009765625, -1.5538330078125, -1.44256591796875, -1.331298828125, -1.22003173828125, -1.1087646484375, -0.99749755859375, -0.88623046875, -0.77496337890625, -0.6636962890625, -0.55242919921875, -0.441162109375, -0.32989501953125, -0.2186279296875, -0.10736083984375, 0.00390625, 0.11517333984375, 0.2264404296875, 0.33770751953125, 0.448974609375, 0.56024169921875, 0.6715087890625, 0.78277587890625, 0.89404296875, 1.00531005859375, 1.1165771484375, 1.22784423828125, 1.339111328125, 1.45037841796875, 1.5616455078125, 1.67291259765625, 1.7841796875, 1.89544677734375, 2.0067138671875, 2.11798095703125, 2.229248046875, 2.34051513671875, 2.4517822265625, 2.56304931640625, 2.67431640625, 2.78558349609375, 2.8968505859375, 3.00811767578125, 3.119384765625, 3.23065185546875, 3.3419189453125, 3.45318603515625, 3.564453125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 7.0, 5.0, 13.0, 18.0, 21.0, 43.0, 52.0, 83.0, 111.0, 161.0, 247.0, 357.0, 504.0, 705.0, 1170.0, 1839.0, 2831.0, 4580.0, 7524.0, 12384.0, 20747.0, 36328.0, 64299.0, 119523.0, 226165.0, 244745.0, 133865.0, 71219.0, 40183.0, 23206.0, 13750.0, 8045.0, 4972.0, 3134.0, 1975.0, 1238.0, 830.0, 508.0, 347.0, 236.0, 177.0, 136.0, 87.0, 47.0, 40.0, 27.0, 16.0, 13.0, 14.0, 3.0, 8.0, 6.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0], "bins": [-0.470458984375, -0.4553260803222656, -0.44019317626953125, -0.4250602722167969, -0.4099273681640625, -0.3947944641113281, -0.37966156005859375, -0.3645286560058594, -0.349395751953125, -0.3342628479003906, -0.31912994384765625, -0.3039970397949219, -0.2888641357421875, -0.2737312316894531, -0.25859832763671875, -0.24346542358398438, -0.22833251953125, -0.21319961547851562, -0.19806671142578125, -0.18293380737304688, -0.1678009033203125, -0.15266799926757812, -0.13753509521484375, -0.12240219116210938, -0.107269287109375, -0.09213638305664062, -0.07700347900390625, -0.061870574951171875, -0.0467376708984375, -0.031604766845703125, -0.01647186279296875, -0.001338958740234375, 0.0137939453125, 0.028926849365234375, 0.04405975341796875, 0.059192657470703125, 0.0743255615234375, 0.08945846557617188, 0.10459136962890625, 0.11972427368164062, 0.134857177734375, 0.14999008178710938, 0.16512298583984375, 0.18025588989257812, 0.1953887939453125, 0.21052169799804688, 0.22565460205078125, 0.24078750610351562, 0.25592041015625, 0.2710533142089844, 0.28618621826171875, 0.3013191223144531, 0.3164520263671875, 0.3315849304199219, 0.34671783447265625, 0.3618507385253906, 0.376983642578125, 0.3921165466308594, 0.40724945068359375, 0.4223823547363281, 0.4375152587890625, 0.4526481628417969, 0.46778106689453125, 0.4829139709472656, 0.498046875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 4.0, 6.0, 5.0, 6.0, 9.0, 9.0, 8.0, 9.0, 11.0, 17.0, 16.0, 20.0, 22.0, 33.0, 33.0, 37.0, 38.0, 32.0, 34.0, 50.0, 38.0, 47.0, 1064.0, 35.0, 43.0, 48.0, 33.0, 33.0, 27.0, 34.0, 38.0, 38.0, 22.0, 22.0, 22.0, 20.0, 14.0, 12.0, 9.0, 9.0, 7.0, 4.0, 1.0, 5.0, 1.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.619140625, -2.539276123046875, -2.45941162109375, -2.379547119140625, -2.2996826171875, -2.219818115234375, -2.13995361328125, -2.060089111328125, -1.980224609375, -1.900360107421875, -1.82049560546875, -1.740631103515625, -1.6607666015625, -1.580902099609375, -1.50103759765625, -1.421173095703125, -1.34130859375, -1.261444091796875, -1.18157958984375, -1.101715087890625, -1.0218505859375, -0.941986083984375, -0.86212158203125, -0.782257080078125, -0.702392578125, -0.622528076171875, -0.54266357421875, -0.462799072265625, -0.3829345703125, -0.303070068359375, -0.22320556640625, -0.143341064453125, -0.0634765625, 0.016387939453125, 0.09625244140625, 0.176116943359375, 0.2559814453125, 0.335845947265625, 0.41571044921875, 0.495574951171875, 0.575439453125, 0.655303955078125, 0.73516845703125, 0.815032958984375, 0.8948974609375, 0.974761962890625, 1.05462646484375, 1.134490966796875, 1.21435546875, 1.294219970703125, 1.37408447265625, 1.453948974609375, 1.5338134765625, 1.613677978515625, 1.69354248046875, 1.773406982421875, 1.853271484375, 1.933135986328125, 2.01300048828125, 2.092864990234375, 2.1727294921875, 2.252593994140625, 2.33245849609375, 2.412322998046875, 2.4921875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 10.0, 17.0, 26.0, 33.0, 42.0, 80.0, 108.0, 155.0, 257.0, 422.0, 658.0, 1012.0, 1464.0, 2240.0, 3499.0, 5339.0, 8177.0, 12678.0, 19617.0, 31480.0, 52415.0, 90900.0, 160951.0, 1275831.0, 176736.0, 101498.0, 58006.0, 33923.0, 20988.0, 13450.0, 8740.0, 5649.0, 3751.0, 2445.0, 1584.0, 1040.0, 649.0, 467.0, 305.0, 176.0, 104.0, 83.0, 42.0, 38.0, 22.0, 12.0, 7.0, 6.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.35791015625, -0.34658050537109375, -0.3352508544921875, -0.32392120361328125, -0.312591552734375, -0.30126190185546875, -0.2899322509765625, -0.27860260009765625, -0.26727294921875, -0.25594329833984375, -0.2446136474609375, -0.23328399658203125, -0.221954345703125, -0.21062469482421875, -0.1992950439453125, -0.18796539306640625, -0.1766357421875, -0.16530609130859375, -0.1539764404296875, -0.14264678955078125, -0.131317138671875, -0.11998748779296875, -0.1086578369140625, -0.09732818603515625, -0.08599853515625, -0.07466888427734375, -0.0633392333984375, -0.05200958251953125, -0.040679931640625, -0.02935028076171875, -0.0180206298828125, -0.00669097900390625, 0.004638671875, 0.01596832275390625, 0.0272979736328125, 0.03862762451171875, 0.049957275390625, 0.06128692626953125, 0.0726165771484375, 0.08394622802734375, 0.09527587890625, 0.10660552978515625, 0.1179351806640625, 0.12926483154296875, 0.140594482421875, 0.15192413330078125, 0.1632537841796875, 0.17458343505859375, 0.1859130859375, 0.19724273681640625, 0.2085723876953125, 0.21990203857421875, 0.231231689453125, 0.24256134033203125, 0.2538909912109375, 0.26522064208984375, 0.27655029296875, 0.28787994384765625, 0.2992095947265625, 0.31053924560546875, 0.321868896484375, 0.33319854736328125, 0.3445281982421875, 0.35585784912109375, 0.3671875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 10.0, 10.0, 20.0, 19.0, 32.0, 30.0, 53.0, 46.0, 83.0, 81.0, 81.0, 89.0, 90.0, 79.0, 69.0, 51.0, 43.0, 31.0, 19.0, 14.0, 9.0, 16.0, 6.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.005435943603515625, -0.005289316177368164, -0.005142688751220703, -0.004996061325073242, -0.004849433898925781, -0.00470280647277832, -0.004556179046630859, -0.0044095516204833984, -0.0042629241943359375, -0.0041162967681884766, -0.003969669342041016, -0.0038230419158935547, -0.0036764144897460938, -0.003529787063598633, -0.003383159637451172, -0.003236532211303711, -0.00308990478515625, -0.002943277359008789, -0.002796649932861328, -0.002650022506713867, -0.0025033950805664062, -0.0023567676544189453, -0.0022101402282714844, -0.0020635128021240234, -0.0019168853759765625, -0.0017702579498291016, -0.0016236305236816406, -0.0014770030975341797, -0.0013303756713867188, -0.0011837482452392578, -0.0010371208190917969, -0.0008904933929443359, -0.000743865966796875, -0.0005972385406494141, -0.0004506111145019531, -0.0003039836883544922, -0.00015735626220703125, -1.0728836059570312e-05, 0.00013589859008789062, 0.00028252601623535156, 0.0004291534423828125, 0.0005757808685302734, 0.0007224082946777344, 0.0008690357208251953, 0.0010156631469726562, 0.0011622905731201172, 0.0013089179992675781, 0.001455545425415039, 0.0016021728515625, 0.001748800277709961, 0.0018954277038574219, 0.002042055130004883, 0.0021886825561523438, 0.0023353099822998047, 0.0024819374084472656, 0.0026285648345947266, 0.0027751922607421875, 0.0029218196868896484, 0.0030684471130371094, 0.0032150745391845703, 0.0033617019653320312, 0.003508329391479492, 0.003654956817626953, 0.003801584243774414, 0.003948211669921875]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 1.0, 2.0, 1.0, 4.0, 7.0, 9.0, 4.0, 10.0, 11.0, 21.0, 26.0, 28.0, 45.0, 62.0, 103.0, 157.0, 255.0, 483.0, 1236.0, 733200.0, 310728.0, 1053.0, 478.0, 207.0, 132.0, 83.0, 67.0, 38.0, 36.0, 25.0, 15.0, 11.0, 9.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07122802734375, -0.06858634948730469, -0.06594467163085938, -0.06330299377441406, -0.06066131591796875, -0.05801963806152344, -0.055377960205078125, -0.05273628234863281, -0.0500946044921875, -0.04745292663574219, -0.044811248779296875, -0.04216957092285156, -0.03952789306640625, -0.03688621520996094, -0.034244537353515625, -0.03160285949707031, -0.028961181640625, -0.026319503784179688, -0.023677825927734375, -0.021036148071289062, -0.01839447021484375, -0.015752792358398438, -0.013111114501953125, -0.010469436645507812, -0.0078277587890625, -0.0051860809326171875, -0.002544403076171875, 9.72747802734375e-05, 0.00273895263671875, 0.0053806304931640625, 0.008022308349609375, 0.010663986206054688, 0.0133056640625, 0.015947341918945312, 0.018589019775390625, 0.021230697631835938, 0.02387237548828125, 0.026514053344726562, 0.029155731201171875, 0.03179740905761719, 0.0344390869140625, 0.03708076477050781, 0.039722442626953125, 0.04236412048339844, 0.04500579833984375, 0.04764747619628906, 0.050289154052734375, 0.05293083190917969, 0.055572509765625, 0.05821418762207031, 0.060855865478515625, 0.06349754333496094, 0.06613922119140625, 0.06878089904785156, 0.07142257690429688, 0.07406425476074219, 0.0767059326171875, 0.07934761047363281, 0.08198928833007812, 0.08463096618652344, 0.08727264404296875, 0.08991432189941406, 0.09255599975585938, 0.09519767761230469, 0.09783935546875]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 199.0, 805.0, 11.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0014879964292049408, -0.000816896150354296, -0.00014579587150365114, 0.0005253043491393328, 0.0011964046861976385, 0.0018675050232559443, 0.0025386051274836063, 0.003209705464541912, 0.003880805801600218, 0.0045519061386585236, 0.005223006475716829, 0.005894106812775135, 0.0065652066841721535, 0.0072363074868917465, 0.007907407358288765, 0.008578507229685783, 0.009249608032405376, 0.009920707903802395, 0.010591808706521988, 0.011262908577919006, 0.0119340093806386, 0.012605109252035618, 0.013276210054755211, 0.01394730992615223, 0.014618409797549248, 0.015289509668946266, 0.015960609540343285, 0.016631711274385452, 0.01730281114578247, 0.01797391101717949, 0.018645010888576508, 0.019316110759973526, 0.019987212494015694, 0.020658312365412712, 0.02132941223680973, 0.022000513970851898, 0.022671613842248917, 0.023342713713645935, 0.024013813585042953, 0.024684913456439972, 0.02535601519048214, 0.026027115061879158, 0.026698214933276176, 0.027369316667318344, 0.028040416538715363, 0.02871151641011238, 0.0293826162815094, 0.030053716152906418, 0.030724816024303436, 0.031395915895700455, 0.03206701576709747, 0.03273811563849449, 0.03340921550989151, 0.03408031910657883, 0.034751418977975845, 0.035422518849372864, 0.03609361872076988, 0.0367647185921669, 0.03743581846356392, 0.03810691833496094, 0.038778018206357956, 0.03944912180304527, 0.04012022167444229, 0.04079132154583931, 0.04146242141723633]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 6.0, 1.0, 6.0, 10.0, 7.0, 8.0, 14.0, 12.0, 21.0, 10.0, 26.0, 42.0, 42.0, 39.0, 51.0, 41.0, 54.0, 53.0, 65.0, 48.0, 46.0, 55.0, 55.0, 41.0, 60.0, 33.0, 31.0, 22.0, 24.0, 25.0, 14.0, 10.0, 11.0, 6.0, 7.0, 5.0, 6.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0028805136680603027, -0.002806234173476696, -0.0027319546788930893, -0.0026576751843094826, -0.002583395689725876, -0.002509116195142269, -0.0024348367005586624, -0.0023605572059750557, -0.002286277711391449, -0.0022119982168078423, -0.0021377187222242355, -0.002063439227640629, -0.001989159733057022, -0.0019148802384734154, -0.0018406007438898087, -0.001766321249306202, -0.0016920417547225952, -0.0016177622601389885, -0.0015434827655553818, -0.001469203270971775, -0.0013949237763881683, -0.0013206442818045616, -0.001246364787220955, -0.0011720852926373482, -0.0010978057980537415, -0.0010235263034701347, -0.000949246808886528, -0.0008749673143029213, -0.0008006878197193146, -0.0007264083251357079, -0.0006521288305521011, -0.0005778493359684944, -0.0005035698413848877, -0.000429290346801281, -0.00035501085221767426, -0.00028073135763406754, -0.00020645186305046082, -0.0001321723684668541, -5.7892873883247375e-05, 1.6386620700359344e-05, 9.066611528396606e-05, 0.00016494560986757278, 0.0002392251044511795, 0.0003135045990347862, 0.00038778409361839294, 0.00046206358820199966, 0.0005363430827856064, 0.0006106225773692131, 0.0006849020719528198, 0.0007591815665364265, 0.0008334610611200333, 0.00090774055570364, 0.0009820200502872467, 0.0010562995448708534, 0.0011305790394544601, 0.0012048585340380669, 0.0012791380286216736, 0.0013534175232052803, 0.001427697017788887, 0.0015019765123724937, 0.0015762560069561005, 0.0016505355015397072, 0.001724814996123314, 0.0017990944907069206, 0.0018733739852905273]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 2.0, 6.0, 13.0, 7.0, 16.0, 13.0, 14.0, 17.0, 16.0, 15.0, 12.0, 18.0, 30.0, 29.0, 29.0, 31.0, 27.0, 36.0, 47.0, 41.0, 41.0, 43.0, 41.0, 33.0, 42.0, 41.0, 34.0, 32.0, 26.0, 23.0, 31.0, 23.0, 27.0, 18.0, 18.0, 11.0, 12.0, 15.0, 18.0, 12.0, 14.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 4.0, 1.0, 1.0, 1.0], "bins": [-3.556640625, -3.44537353515625, -3.3341064453125, -3.22283935546875, -3.111572265625, -3.00030517578125, -2.8890380859375, -2.77777099609375, -2.66650390625, -2.55523681640625, -2.4439697265625, -2.33270263671875, -2.221435546875, -2.11016845703125, -1.9989013671875, -1.88763427734375, -1.7763671875, -1.66510009765625, -1.5538330078125, -1.44256591796875, -1.331298828125, -1.22003173828125, -1.1087646484375, -0.99749755859375, -0.88623046875, -0.77496337890625, -0.6636962890625, -0.55242919921875, -0.441162109375, -0.32989501953125, -0.2186279296875, -0.10736083984375, 0.00390625, 0.11517333984375, 0.2264404296875, 0.33770751953125, 0.448974609375, 0.56024169921875, 0.6715087890625, 0.78277587890625, 0.89404296875, 1.00531005859375, 1.1165771484375, 1.22784423828125, 1.339111328125, 1.45037841796875, 1.5616455078125, 1.67291259765625, 1.7841796875, 1.89544677734375, 2.0067138671875, 2.11798095703125, 2.229248046875, 2.34051513671875, 2.4517822265625, 2.56304931640625, 2.67431640625, 2.78558349609375, 2.8968505859375, 3.00811767578125, 3.119384765625, 3.23065185546875, 3.3419189453125, 3.45318603515625, 3.564453125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 5.0, 5.0, 6.0, 12.0, 13.0, 18.0, 25.0, 34.0, 41.0, 65.0, 96.0, 116.0, 146.0, 173.0, 237.0, 303.0, 421.0, 557.0, 709.0, 858.0, 1207.0, 1702.0, 2486.0, 3861.0, 9578.0, 58705.0, 502318.0, 399764.0, 44474.0, 8141.0, 3541.0, 2444.0, 1602.0, 1171.0, 877.0, 641.0, 528.0, 403.0, 280.0, 233.0, 182.0, 157.0, 105.0, 90.0, 51.0, 49.0, 39.0, 27.0, 17.0, 12.0, 13.0, 5.0, 8.0, 6.0, 1.0, 3.0, 1.0, 1.0], "bins": [-9.3359375, -9.052490234375, -8.76904296875, -8.485595703125, -8.2021484375, -7.918701171875, -7.63525390625, -7.351806640625, -7.068359375, -6.784912109375, -6.50146484375, -6.218017578125, -5.9345703125, -5.651123046875, -5.36767578125, -5.084228515625, -4.80078125, -4.517333984375, -4.23388671875, -3.950439453125, -3.6669921875, -3.383544921875, -3.10009765625, -2.816650390625, -2.533203125, -2.249755859375, -1.96630859375, -1.682861328125, -1.3994140625, -1.115966796875, -0.83251953125, -0.549072265625, -0.265625, 0.017822265625, 0.30126953125, 0.584716796875, 0.8681640625, 1.151611328125, 1.43505859375, 1.718505859375, 2.001953125, 2.285400390625, 2.56884765625, 2.852294921875, 3.1357421875, 3.419189453125, 3.70263671875, 3.986083984375, 4.26953125, 4.552978515625, 4.83642578125, 5.119873046875, 5.4033203125, 5.686767578125, 5.97021484375, 6.253662109375, 6.537109375, 6.820556640625, 7.10400390625, 7.387451171875, 7.6708984375, 7.954345703125, 8.23779296875, 8.521240234375, 8.8046875]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 6.0, 8.0, 7.0, 8.0, 11.0, 8.0, 15.0, 17.0, 19.0, 28.0, 29.0, 33.0, 36.0, 40.0, 40.0, 56.0, 62.0, 139.0, 310.0, 1524.0, 193.0, 84.0, 45.0, 48.0, 48.0, 35.0, 31.0, 39.0, 20.0, 20.0, 14.0, 12.0, 10.0, 11.0, 8.0, 9.0, 5.0, 5.0, 5.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 3.0], "bins": [-10.2265625, -9.9188232421875, -9.611083984375, -9.3033447265625, -8.99560546875, -8.6878662109375, -8.380126953125, -8.0723876953125, -7.7646484375, -7.4569091796875, -7.149169921875, -6.8414306640625, -6.53369140625, -6.2259521484375, -5.918212890625, -5.6104736328125, -5.302734375, -4.9949951171875, -4.687255859375, -4.3795166015625, -4.07177734375, -3.7640380859375, -3.456298828125, -3.1485595703125, -2.8408203125, -2.5330810546875, -2.225341796875, -1.9176025390625, -1.60986328125, -1.3021240234375, -0.994384765625, -0.6866455078125, -0.37890625, -0.0711669921875, 0.236572265625, 0.5443115234375, 0.85205078125, 1.1597900390625, 1.467529296875, 1.7752685546875, 2.0830078125, 2.3907470703125, 2.698486328125, 3.0062255859375, 3.31396484375, 3.6217041015625, 3.929443359375, 4.2371826171875, 4.544921875, 4.8526611328125, 5.160400390625, 5.4681396484375, 5.77587890625, 6.0836181640625, 6.391357421875, 6.6990966796875, 7.0068359375, 7.3145751953125, 7.622314453125, 7.9300537109375, 8.23779296875, 8.5455322265625, 8.853271484375, 9.1610107421875, 9.46875]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 4.0, 4.0, 1.0, 6.0, 9.0, 3.0, 8.0, 10.0, 16.0, 24.0, 19.0, 22.0, 43.0, 45.0, 55.0, 81.0, 128.0, 202.0, 229.0, 438.0, 768.0, 1798.0, 16647.0, 3116768.0, 5140.0, 1406.0, 622.0, 372.0, 240.0, 134.0, 119.0, 91.0, 61.0, 41.0, 36.0, 27.0, 25.0, 17.0, 15.0, 10.0, 3.0, 6.0, 5.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-33.8125, -32.734375, -31.65625, -30.578125, -29.5, -28.421875, -27.34375, -26.265625, -25.1875, -24.109375, -23.03125, -21.953125, -20.875, -19.796875, -18.71875, -17.640625, -16.5625, -15.484375, -14.40625, -13.328125, -12.25, -11.171875, -10.09375, -9.015625, -7.9375, -6.859375, -5.78125, -4.703125, -3.625, -2.546875, -1.46875, -0.390625, 0.6875, 1.765625, 2.84375, 3.921875, 5.0, 6.078125, 7.15625, 8.234375, 9.3125, 10.390625, 11.46875, 12.546875, 13.625, 14.703125, 15.78125, 16.859375, 17.9375, 19.015625, 20.09375, 21.171875, 22.25, 23.328125, 24.40625, 25.484375, 26.5625, 27.640625, 28.71875, 29.796875, 30.875, 31.953125, 33.03125, 34.109375, 35.1875]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 20.0, 74.0, 233.0, 341.0, 258.0, 63.0, 16.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.02975082397461, -56.35121154785156, -54.672672271728516, -52.99413299560547, -51.31559371948242, -49.637054443359375, -47.958518981933594, -46.27997589111328, -44.6014404296875, -42.92290115356445, -41.244361877441406, -39.56582260131836, -37.88728332519531, -36.208744049072266, -34.53020477294922, -32.85166931152344, -31.173126220703125, -29.494586944580078, -27.81604766845703, -26.137508392333984, -24.458969116210938, -22.78042984008789, -21.101892471313477, -19.42335319519043, -17.744813919067383, -16.066274642944336, -14.387735366821289, -12.709197044372559, -11.030657768249512, -9.352118492126465, -7.673580169677734, -5.9950408935546875, -4.316497802734375, -2.6379587650299072, -0.9594197273254395, 0.7191190719604492, 2.397658348083496, 4.076197624206543, 5.754735946655273, 7.43327522277832, 9.111814498901367, 10.790353775024414, 12.468893051147461, 14.147431373596191, 15.825970649719238, 17.50450897216797, 19.183048248291016, 20.861587524414062, 22.54012680053711, 24.218666076660156, 25.897205352783203, 27.57574462890625, 29.254283905029297, 30.932823181152344, 32.611358642578125, 34.28990173339844, 35.96843719482422, 37.646976470947266, 39.32551574707031, 41.00405502319336, 42.682594299316406, 44.36113357543945, 46.0396728515625, 47.71820831298828, 49.396751403808594]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 3.0, 6.0, 8.0, 7.0, 6.0, 11.0, 13.0, 24.0, 14.0, 9.0, 20.0, 17.0, 22.0, 20.0, 25.0, 32.0, 23.0, 20.0, 29.0, 30.0, 37.0, 36.0, 41.0, 40.0, 39.0, 33.0, 43.0, 44.0, 27.0, 32.0, 30.0, 28.0, 29.0, 25.0, 26.0, 21.0, 18.0, 16.0, 26.0, 16.0, 6.0, 9.0, 10.0, 5.0, 7.0, 3.0, 9.0, 0.0, 4.0, 2.0, 2.0, 1.0, 1.0, 2.0, 5.0], "bins": [-22.19858741760254, -21.534862518310547, -20.871137619018555, -20.207414627075195, -19.543689727783203, -18.87996482849121, -18.21623992919922, -17.55251693725586, -16.888792037963867, -16.225067138671875, -15.5613431930542, -14.897618293762207, -14.233894348144531, -13.570169448852539, -12.906444549560547, -12.242720603942871, -11.578995704650879, -10.915270805358887, -10.251546859741211, -9.587821960449219, -8.924098014831543, -8.26037311553955, -7.596648693084717, -6.932924270629883, -6.269199848175049, -5.605475425720215, -4.941751003265381, -4.278026580810547, -3.614301919937134, -2.9505774974823, -2.2868528366088867, -1.6231284141540527, -0.9594039916992188, -0.29567950963974, 0.36804497241973877, 1.0317695140838623, 1.6954939365386963, 2.3592183589935303, 3.0229430198669434, 3.6866674423217773, 4.350391864776611, 5.014116287231445, 5.677840709686279, 6.341565132141113, 7.0052900314331055, 7.669013977050781, 8.332738876342773, 8.996463775634766, 9.660187721252441, 10.323912620544434, 10.98763656616211, 11.651361465454102, 12.315085411071777, 12.97881031036377, 13.642534255981445, 14.306259155273438, 14.96998405456543, 15.633708953857422, 16.297433853149414, 16.961156845092773, 17.624881744384766, 18.288606643676758, 18.95233154296875, 19.61605453491211, 20.2797794342041]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 8.0, 3.0, 6.0, 4.0, 11.0, 9.0, 14.0, 10.0, 14.0, 15.0, 23.0, 16.0, 22.0, 18.0, 22.0, 28.0, 26.0, 29.0, 29.0, 45.0, 59.0, 44.0, 38.0, 50.0, 37.0, 51.0, 41.0, 31.0, 33.0, 35.0, 25.0, 23.0, 24.0, 30.0, 18.0, 20.0, 21.0, 11.0, 14.0, 9.0, 11.0, 9.0, 7.0, 5.0, 4.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-3.73828125, -3.61480712890625, -3.4913330078125, -3.36785888671875, -3.244384765625, -3.12091064453125, -2.9974365234375, -2.87396240234375, -2.75048828125, -2.62701416015625, -2.5035400390625, -2.38006591796875, -2.256591796875, -2.13311767578125, -2.0096435546875, -1.88616943359375, -1.7626953125, -1.63922119140625, -1.5157470703125, -1.39227294921875, -1.268798828125, -1.14532470703125, -1.0218505859375, -0.89837646484375, -0.77490234375, -0.65142822265625, -0.5279541015625, -0.40447998046875, -0.281005859375, -0.15753173828125, -0.0340576171875, 0.08941650390625, 0.212890625, 0.33636474609375, 0.4598388671875, 0.58331298828125, 0.706787109375, 0.83026123046875, 0.9537353515625, 1.07720947265625, 1.20068359375, 1.32415771484375, 1.4476318359375, 1.57110595703125, 1.694580078125, 1.81805419921875, 1.9415283203125, 2.06500244140625, 2.1884765625, 2.31195068359375, 2.4354248046875, 2.55889892578125, 2.682373046875, 2.80584716796875, 2.9293212890625, 3.05279541015625, 3.17626953125, 3.29974365234375, 3.4232177734375, 3.54669189453125, 3.670166015625, 3.79364013671875, 3.9171142578125, 4.04058837890625, 4.1640625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 11.0, 3.0, 10.0, 11.0, 23.0, 32.0, 29.0, 33.0, 49.0, 83.0, 134.0, 190.0, 349.0, 636.0, 1187.0, 2836.0, 7659.0, 42341.0, 584278.0, 2843338.0, 651883.0, 45312.0, 8310.0, 2752.0, 1225.0, 621.0, 334.0, 222.0, 103.0, 70.0, 47.0, 37.0, 33.0, 24.0, 14.0, 16.0, 7.0, 9.0, 7.0, 7.0, 3.0, 5.0, 8.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.296875, -8.98193359375, -8.6669921875, -8.35205078125, -8.037109375, -7.72216796875, -7.4072265625, -7.09228515625, -6.77734375, -6.46240234375, -6.1474609375, -5.83251953125, -5.517578125, -5.20263671875, -4.8876953125, -4.57275390625, -4.2578125, -3.94287109375, -3.6279296875, -3.31298828125, -2.998046875, -2.68310546875, -2.3681640625, -2.05322265625, -1.73828125, -1.42333984375, -1.1083984375, -0.79345703125, -0.478515625, -0.16357421875, 0.1513671875, 0.46630859375, 0.78125, 1.09619140625, 1.4111328125, 1.72607421875, 2.041015625, 2.35595703125, 2.6708984375, 2.98583984375, 3.30078125, 3.61572265625, 3.9306640625, 4.24560546875, 4.560546875, 4.87548828125, 5.1904296875, 5.50537109375, 5.8203125, 6.13525390625, 6.4501953125, 6.76513671875, 7.080078125, 7.39501953125, 7.7099609375, 8.02490234375, 8.33984375, 8.65478515625, 8.9697265625, 9.28466796875, 9.599609375, 9.91455078125, 10.2294921875, 10.54443359375, 10.859375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 4.0, 2.0, 5.0, 6.0, 20.0, 9.0, 30.0, 40.0, 41.0, 71.0, 87.0, 108.0, 146.0, 207.0, 266.0, 362.0, 416.0, 550.0, 419.0, 309.0, 244.0, 214.0, 149.0, 124.0, 64.0, 42.0, 49.0, 23.0, 21.0, 16.0, 9.0, 6.0, 7.0, 2.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3515625, -7.130859375, -6.91015625, -6.689453125, -6.46875, -6.248046875, -6.02734375, -5.806640625, -5.5859375, -5.365234375, -5.14453125, -4.923828125, -4.703125, -4.482421875, -4.26171875, -4.041015625, -3.8203125, -3.599609375, -3.37890625, -3.158203125, -2.9375, -2.716796875, -2.49609375, -2.275390625, -2.0546875, -1.833984375, -1.61328125, -1.392578125, -1.171875, -0.951171875, -0.73046875, -0.509765625, -0.2890625, -0.068359375, 0.15234375, 0.373046875, 0.59375, 0.814453125, 1.03515625, 1.255859375, 1.4765625, 1.697265625, 1.91796875, 2.138671875, 2.359375, 2.580078125, 2.80078125, 3.021484375, 3.2421875, 3.462890625, 3.68359375, 3.904296875, 4.125, 4.345703125, 4.56640625, 4.787109375, 5.0078125, 5.228515625, 5.44921875, 5.669921875, 5.890625, 6.111328125, 6.33203125, 6.552734375, 6.7734375]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 3.0, 2.0, 3.0, 6.0, 4.0, 0.0, 5.0, 6.0, 8.0, 11.0, 12.0, 20.0, 31.0, 66.0, 69.0, 92.0, 189.0, 298.0, 479.0, 950.0, 2086.0, 7310.0, 113168.0, 3535490.0, 512717.0, 15535.0, 2948.0, 1171.0, 617.0, 344.0, 212.0, 138.0, 97.0, 66.0, 37.0, 24.0, 19.0, 16.0, 12.0, 4.0, 10.0, 1.0, 3.0, 6.0, 4.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.921875, -12.455078125, -11.98828125, -11.521484375, -11.0546875, -10.587890625, -10.12109375, -9.654296875, -9.1875, -8.720703125, -8.25390625, -7.787109375, -7.3203125, -6.853515625, -6.38671875, -5.919921875, -5.453125, -4.986328125, -4.51953125, -4.052734375, -3.5859375, -3.119140625, -2.65234375, -2.185546875, -1.71875, -1.251953125, -0.78515625, -0.318359375, 0.1484375, 0.615234375, 1.08203125, 1.548828125, 2.015625, 2.482421875, 2.94921875, 3.416015625, 3.8828125, 4.349609375, 4.81640625, 5.283203125, 5.75, 6.216796875, 6.68359375, 7.150390625, 7.6171875, 8.083984375, 8.55078125, 9.017578125, 9.484375, 9.951171875, 10.41796875, 10.884765625, 11.3515625, 11.818359375, 12.28515625, 12.751953125, 13.21875, 13.685546875, 14.15234375, 14.619140625, 15.0859375, 15.552734375, 16.01953125, 16.486328125, 16.953125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 8.0, 184.0, 700.0, 120.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.82880401611328, -94.09553527832031, -88.36226654052734, -82.62899780273438, -76.8957290649414, -71.16246032714844, -65.42919158935547, -59.6959228515625, -53.96265411376953, -48.22938537597656, -42.496116638183594, -36.762847900390625, -31.029579162597656, -25.296310424804688, -19.56304168701172, -13.82977294921875, -8.096504211425781, -2.3632354736328125, 3.3700332641601562, 9.103302001953125, 14.836570739746094, 20.569839477539062, 26.30310821533203, 32.036376953125, 37.76964569091797, 43.50291442871094, 49.236183166503906, 54.969451904296875, 60.702720642089844, 66.43598937988281, 72.16925811767578, 77.90252685546875, 83.63580322265625, 89.36907196044922, 95.10234069824219, 100.83560943603516, 106.56887817382812, 112.3021469116211, 118.03541564941406, 123.76868438720703, 129.501953125, 135.2352294921875, 140.96849060058594, 146.70175170898438, 152.43502807617188, 158.16830444335938, 163.9015655517578, 169.63482666015625, 175.36810302734375, 181.10137939453125, 186.8346405029297, 192.56790161132812, 198.30117797851562, 204.03445434570312, 209.76771545410156, 215.5009765625, 221.2342529296875, 226.967529296875, 232.70079040527344, 238.43405151367188, 244.16732788085938, 249.90060424804688, 255.6338653564453, 261.36712646484375, 267.10040283203125]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 6.0, 1.0, 0.0, 3.0, 5.0, 5.0, 4.0, 9.0, 12.0, 7.0, 12.0, 22.0, 24.0, 24.0, 23.0, 19.0, 28.0, 25.0, 31.0, 43.0, 33.0, 44.0, 46.0, 39.0, 33.0, 38.0, 48.0, 32.0, 38.0, 50.0, 24.0, 41.0, 32.0, 37.0, 26.0, 21.0, 13.0, 21.0, 19.0, 16.0, 14.0, 5.0, 10.0, 9.0, 6.0, 2.0, 4.0, 6.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-23.582292556762695, -22.773160934448242, -21.96402931213379, -21.154897689819336, -20.34576416015625, -19.536632537841797, -18.727500915527344, -17.91836929321289, -17.109237670898438, -16.300106048583984, -15.490974426269531, -14.681841850280762, -13.872710227966309, -13.063578605651855, -12.254446029663086, -11.445314407348633, -10.63618278503418, -9.827051162719727, -9.017919540405273, -8.208786964416504, -7.399655342102051, -6.590523719787598, -5.781391620635986, -4.972259521484375, -4.163127899169922, -3.3539960384368896, -2.5448641777038574, -1.7357323169708252, -0.926600456237793, -0.11746883392333984, 0.6916632652282715, 1.5007953643798828, 2.3099288940429688, 3.119060754776001, 3.928192615509033, 4.7373247146606445, 5.546456336975098, 6.355587959289551, 7.164720058441162, 7.973852157592773, 8.782983779907227, 9.59211540222168, 10.401247024536133, 11.210379600524902, 12.019511222839355, 12.828642845153809, 13.637775421142578, 14.446907043457031, 15.256038665771484, 16.065170288085938, 16.87430191040039, 17.683433532714844, 18.492565155029297, 19.30169677734375, 20.110830307006836, 20.91996192932129, 21.729093551635742, 22.538225173950195, 23.34735679626465, 24.1564884185791, 24.965621948242188, 25.77475357055664, 26.583885192871094, 27.393016815185547, 28.2021484375]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 9.0, 1.0, 8.0, 11.0, 12.0, 14.0, 15.0, 16.0, 14.0, 20.0, 21.0, 29.0, 23.0, 26.0, 29.0, 38.0, 35.0, 46.0, 38.0, 42.0, 38.0, 35.0, 41.0, 42.0, 32.0, 32.0, 34.0, 21.0, 36.0, 30.0, 33.0, 18.0, 23.0, 20.0, 16.0, 28.0, 13.0, 13.0, 11.0, 6.0, 7.0, 1.0, 7.0, 5.0, 4.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.939453125, -2.848785400390625, -2.75811767578125, -2.667449951171875, -2.5767822265625, -2.486114501953125, -2.39544677734375, -2.304779052734375, -2.214111328125, -2.123443603515625, -2.03277587890625, -1.942108154296875, -1.8514404296875, -1.760772705078125, -1.67010498046875, -1.579437255859375, -1.48876953125, -1.398101806640625, -1.30743408203125, -1.216766357421875, -1.1260986328125, -1.035430908203125, -0.94476318359375, -0.854095458984375, -0.763427734375, -0.672760009765625, -0.58209228515625, -0.491424560546875, -0.4007568359375, -0.310089111328125, -0.21942138671875, -0.128753662109375, -0.0380859375, 0.052581787109375, 0.14324951171875, 0.233917236328125, 0.3245849609375, 0.415252685546875, 0.50592041015625, 0.596588134765625, 0.687255859375, 0.777923583984375, 0.86859130859375, 0.959259033203125, 1.0499267578125, 1.140594482421875, 1.23126220703125, 1.321929931640625, 1.41259765625, 1.503265380859375, 1.59393310546875, 1.684600830078125, 1.7752685546875, 1.865936279296875, 1.95660400390625, 2.047271728515625, 2.137939453125, 2.228607177734375, 2.31927490234375, 2.409942626953125, 2.5006103515625, 2.591278076171875, 2.68194580078125, 2.772613525390625, 2.86328125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 7.0, 6.0, 11.0, 8.0, 18.0, 32.0, 51.0, 71.0, 130.0, 176.0, 236.0, 365.0, 573.0, 850.0, 1264.0, 1886.0, 2858.0, 4134.0, 6224.0, 9097.0, 13777.0, 21194.0, 33403.0, 55100.0, 94589.0, 165611.0, 236475.0, 160730.0, 92082.0, 53278.0, 32526.0, 20895.0, 13576.0, 9022.0, 6010.0, 4029.0, 2791.0, 1795.0, 1233.0, 757.0, 567.0, 390.0, 273.0, 173.0, 90.0, 58.0, 51.0, 43.0, 22.0, 14.0, 5.0, 4.0, 4.0, 1.0, 4.0, 2.0, 1.0], "bins": [-0.34130859375, -0.3311119079589844, -0.32091522216796875, -0.3107185363769531, -0.3005218505859375, -0.2903251647949219, -0.28012847900390625, -0.2699317932128906, -0.259735107421875, -0.24953842163085938, -0.23934173583984375, -0.22914505004882812, -0.2189483642578125, -0.20875167846679688, -0.19855499267578125, -0.18835830688476562, -0.17816162109375, -0.16796493530273438, -0.15776824951171875, -0.14757156372070312, -0.1373748779296875, -0.12717819213867188, -0.11698150634765625, -0.10678482055664062, -0.096588134765625, -0.08639144897460938, -0.07619476318359375, -0.06599807739257812, -0.0558013916015625, -0.045604705810546875, -0.03540802001953125, -0.025211334228515625, -0.0150146484375, -0.004817962646484375, 0.00537872314453125, 0.015575408935546875, 0.0257720947265625, 0.035968780517578125, 0.04616546630859375, 0.056362152099609375, 0.066558837890625, 0.07675552368164062, 0.08695220947265625, 0.09714889526367188, 0.1073455810546875, 0.11754226684570312, 0.12773895263671875, 0.13793563842773438, 0.14813232421875, 0.15832901000976562, 0.16852569580078125, 0.17872238159179688, 0.1889190673828125, 0.19911575317382812, 0.20931243896484375, 0.21950912475585938, 0.229705810546875, 0.23990249633789062, 0.25009918212890625, 0.2602958679199219, 0.2704925537109375, 0.2806892395019531, 0.29088592529296875, 0.3010826110839844, 0.311279296875]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 10.0, 10.0, 13.0, 15.0, 10.0, 18.0, 17.0, 26.0, 21.0, 23.0, 27.0, 31.0, 26.0, 40.0, 54.0, 36.0, 50.0, 45.0, 1060.0, 51.0, 36.0, 42.0, 42.0, 31.0, 30.0, 46.0, 32.0, 25.0, 27.0, 28.0, 12.0, 17.0, 16.0, 12.0, 6.0, 8.0, 8.0, 4.0, 5.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.95703125, -1.894927978515625, -1.83282470703125, -1.770721435546875, -1.7086181640625, -1.646514892578125, -1.58441162109375, -1.522308349609375, -1.460205078125, -1.398101806640625, -1.33599853515625, -1.273895263671875, -1.2117919921875, -1.149688720703125, -1.08758544921875, -1.025482177734375, -0.96337890625, -0.901275634765625, -0.83917236328125, -0.777069091796875, -0.7149658203125, -0.652862548828125, -0.59075927734375, -0.528656005859375, -0.466552734375, -0.404449462890625, -0.34234619140625, -0.280242919921875, -0.2181396484375, -0.156036376953125, -0.09393310546875, -0.031829833984375, 0.0302734375, 0.092376708984375, 0.15447998046875, 0.216583251953125, 0.2786865234375, 0.340789794921875, 0.40289306640625, 0.464996337890625, 0.527099609375, 0.589202880859375, 0.65130615234375, 0.713409423828125, 0.7755126953125, 0.837615966796875, 0.89971923828125, 0.961822509765625, 1.02392578125, 1.086029052734375, 1.14813232421875, 1.210235595703125, 1.2723388671875, 1.334442138671875, 1.39654541015625, 1.458648681640625, 1.520751953125, 1.582855224609375, 1.64495849609375, 1.707061767578125, 1.7691650390625, 1.831268310546875, 1.89337158203125, 1.955474853515625, 2.017578125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 5.0, 4.0, 7.0, 12.0, 21.0, 20.0, 46.0, 64.0, 89.0, 114.0, 172.0, 258.0, 372.0, 569.0, 806.0, 1159.0, 1647.0, 2381.0, 3410.0, 5001.0, 7170.0, 10757.0, 15756.0, 23922.0, 36662.0, 57351.0, 94025.0, 152590.0, 1246176.0, 161540.0, 99169.0, 61030.0, 38414.0, 24915.0, 16427.0, 10966.0, 7449.0, 5188.0, 3599.0, 2406.0, 1652.0, 1148.0, 808.0, 589.0, 419.0, 267.0, 176.0, 132.0, 82.0, 66.0, 53.0, 27.0, 19.0, 12.0, 7.0, 8.0, 4.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.2393798828125, -0.2317943572998047, -0.22420883178710938, -0.21662330627441406, -0.20903778076171875, -0.20145225524902344, -0.19386672973632812, -0.1862812042236328, -0.1786956787109375, -0.1711101531982422, -0.16352462768554688, -0.15593910217285156, -0.14835357666015625, -0.14076805114746094, -0.13318252563476562, -0.1255970001220703, -0.118011474609375, -0.11042594909667969, -0.10284042358398438, -0.09525489807128906, -0.08766937255859375, -0.08008384704589844, -0.07249832153320312, -0.06491279602050781, -0.0573272705078125, -0.04974174499511719, -0.042156219482421875, -0.03457069396972656, -0.02698516845703125, -0.019399642944335938, -0.011814117431640625, -0.0042285919189453125, 0.00335693359375, 0.010942459106445312, 0.018527984619140625, 0.026113510131835938, 0.03369903564453125, 0.04128456115722656, 0.048870086669921875, 0.05645561218261719, 0.0640411376953125, 0.07162666320800781, 0.07921218872070312, 0.08679771423339844, 0.09438323974609375, 0.10196876525878906, 0.10955429077148438, 0.11713981628417969, 0.124725341796875, 0.1323108673095703, 0.13989639282226562, 0.14748191833496094, 0.15506744384765625, 0.16265296936035156, 0.17023849487304688, 0.1778240203857422, 0.1854095458984375, 0.1929950714111328, 0.20058059692382812, 0.20816612243652344, 0.21575164794921875, 0.22333717346191406, 0.23092269897460938, 0.2385082244873047, 0.24609375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 2.0, 4.0, 3.0, 1.0, 5.0, 6.0, 5.0, 7.0, 5.0, 12.0, 10.0, 13.0, 29.0, 21.0, 28.0, 42.0, 54.0, 99.0, 139.0, 136.0, 118.0, 70.0, 44.0, 37.0, 23.0, 20.0, 12.0, 8.0, 10.0, 11.0, 6.0, 6.0, 4.0, 2.0, 2.0, 3.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0036907196044921875, -0.0035716593265533447, -0.003452599048614502, -0.003333538770675659, -0.0032144784927368164, -0.0030954182147979736, -0.002976357936859131, -0.002857297658920288, -0.0027382373809814453, -0.0026191771030426025, -0.0025001168251037598, -0.002381056547164917, -0.0022619962692260742, -0.0021429359912872314, -0.0020238757133483887, -0.001904815435409546, -0.0017857551574707031, -0.0016666948795318604, -0.0015476346015930176, -0.0014285743236541748, -0.001309514045715332, -0.0011904537677764893, -0.0010713934898376465, -0.0009523332118988037, -0.0008332729339599609, -0.0007142126560211182, -0.0005951523780822754, -0.0004760921001434326, -0.00035703182220458984, -0.00023797154426574707, -0.0001189112663269043, 1.4901161193847656e-07, 0.00011920928955078125, 0.00023826956748962402, 0.0003573298454284668, 0.00047639012336730957, 0.0005954504013061523, 0.0007145106792449951, 0.0008335709571838379, 0.0009526312351226807, 0.0010716915130615234, 0.0011907517910003662, 0.001309812068939209, 0.0014288723468780518, 0.0015479326248168945, 0.0016669929027557373, 0.00178605318069458, 0.0019051134586334229, 0.0020241737365722656, 0.0021432340145111084, 0.002262294292449951, 0.002381354570388794, 0.0025004148483276367, 0.0026194751262664795, 0.0027385354042053223, 0.002857595682144165, 0.002976655960083008, 0.0030957162380218506, 0.0032147765159606934, 0.003333836793899536, 0.003452897071838379, 0.0035719573497772217, 0.0036910176277160645, 0.0038100779056549072, 0.00392913818359375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 0.0, 2.0, 2.0, 5.0, 5.0, 3.0, 7.0, 8.0, 14.0, 12.0, 16.0, 22.0, 22.0, 33.0, 50.0, 67.0, 116.0, 153.0, 286.0, 642.0, 3409.0, 1035182.0, 6916.0, 689.0, 306.0, 176.0, 101.0, 69.0, 50.0, 42.0, 32.0, 25.0, 9.0, 19.0, 13.0, 13.0, 3.0, 8.0, 5.0, 2.0, 5.0, 7.0, 4.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0645751953125, -0.0625295639038086, -0.06048393249511719, -0.05843830108642578, -0.056392669677734375, -0.05434703826904297, -0.05230140686035156, -0.050255775451660156, -0.04821014404296875, -0.046164512634277344, -0.04411888122558594, -0.04207324981689453, -0.040027618408203125, -0.03798198699951172, -0.03593635559082031, -0.033890724182128906, -0.0318450927734375, -0.029799461364746094, -0.027753829956054688, -0.02570819854736328, -0.023662567138671875, -0.02161693572998047, -0.019571304321289062, -0.017525672912597656, -0.01548004150390625, -0.013434410095214844, -0.011388778686523438, -0.009343147277832031, -0.007297515869140625, -0.005251884460449219, -0.0032062530517578125, -0.0011606216430664062, 0.000885009765625, 0.0029306411743164062, 0.0049762725830078125, 0.007021903991699219, 0.009067535400390625, 0.011113166809082031, 0.013158798217773438, 0.015204429626464844, 0.01725006103515625, 0.019295692443847656, 0.021341323852539062, 0.02338695526123047, 0.025432586669921875, 0.02747821807861328, 0.029523849487304688, 0.031569480895996094, 0.0336151123046875, 0.035660743713378906, 0.03770637512207031, 0.03975200653076172, 0.041797637939453125, 0.04384326934814453, 0.04588890075683594, 0.047934532165527344, 0.04998016357421875, 0.052025794982910156, 0.05407142639160156, 0.05611705780029297, 0.058162689208984375, 0.06020832061767578, 0.06225395202636719, 0.0642995834350586, 0.06634521484375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 385.0, 625.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0017025572014972568, -0.0011482036206871271, -0.0005938500398769975, -3.949645906686783e-05, 0.0005148571217432618, 0.0010692105861380696, 0.001623564283363521, 0.0021779178641736507, 0.0027322713285684586, 0.0032866247929632664, 0.003840978490188718, 0.004395332187414169, 0.004949685651808977, 0.005504039116203785, 0.00605839304625988, 0.006612746510654688, 0.007167099975049496, 0.0077214534394443035, 0.008275806903839111, 0.008830160833895206, 0.009384514763951302, 0.009938867762684822, 0.010493221692740917, 0.011047575622797012, 0.011601928621530533, 0.012156282551586628, 0.012710635550320148, 0.013264989480376244, 0.013819342479109764, 0.01437369640916586, 0.014928050339221954, 0.015482403337955475, 0.016036756336688995, 0.016591109335422516, 0.017145464196801186, 0.017699817195534706, 0.018254170194268227, 0.018808525055646896, 0.019362878054380417, 0.019917231053113937, 0.020471584051847458, 0.02102593705058098, 0.021580291911959648, 0.02213464491069317, 0.02268899790942669, 0.02324335277080536, 0.02379770576953888, 0.0243520587682724, 0.02490641362965107, 0.02546076662838459, 0.02601512148976326, 0.02656947448849678, 0.0271238274872303, 0.02767818048596382, 0.02823253534734249, 0.02878688834607601, 0.02934124320745468, 0.029895596206188202, 0.03044995106756687, 0.031004304066300392, 0.03155865892767906, 0.03211301192641258, 0.0326673649251461, 0.03322171792387962, 0.033776070922613144]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 5.0, 2.0, 6.0, 3.0, 6.0, 7.0, 7.0, 12.0, 21.0, 16.0, 10.0, 18.0, 25.0, 24.0, 31.0, 41.0, 44.0, 48.0, 50.0, 34.0, 44.0, 42.0, 43.0, 56.0, 42.0, 40.0, 57.0, 43.0, 40.0, 34.0, 22.0, 20.0, 19.0, 26.0, 24.0, 5.0, 19.0, 5.0, 4.0, 6.0, 3.0, 1.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.002093017101287842, -0.0020349686965346336, -0.0019769202917814255, -0.0019188718870282173, -0.0018608234822750092, -0.001802775077521801, -0.0017447266727685928, -0.0016866782680153847, -0.0016286298632621765, -0.0015705814585089684, -0.0015125330537557602, -0.001454484649002552, -0.0013964362442493439, -0.0013383878394961357, -0.0012803394347429276, -0.0012222910299897194, -0.0011642426252365112, -0.001106194220483303, -0.001048145815730095, -0.0009900974109768867, -0.0009320490062236786, -0.0008740006014704704, -0.0008159521967172623, -0.0007579037919640541, -0.000699855387210846, -0.0006418069824576378, -0.0005837585777044296, -0.0005257101729512215, -0.0004676617681980133, -0.00040961336344480515, -0.000351564958691597, -0.0002935165539383888, -0.00023546814918518066, -0.0001774197444319725, -0.00011937133967876434, -6.132293492555618e-05, -3.2745301723480225e-06, 5.477387458086014e-05, 0.0001128222793340683, 0.00017087068408727646, 0.00022891908884048462, 0.0002869674935936928, 0.00034501589834690094, 0.0004030643031001091, 0.00046111270785331726, 0.0005191611126065254, 0.0005772095173597336, 0.0006352579221129417, 0.0006933063268661499, 0.0007513547316193581, 0.0008094031363725662, 0.0008674515411257744, 0.0009254999458789825, 0.0009835483506321907, 0.0010415967553853989, 0.001099645160138607, 0.0011576935648918152, 0.0012157419696450233, 0.0012737903743982315, 0.0013318387791514397, 0.0013898871839046478, 0.001447935588657856, 0.0015059839934110641, 0.0015640323981642723, 0.0016220808029174805]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 9.0, 1.0, 8.0, 11.0, 12.0, 14.0, 15.0, 16.0, 14.0, 20.0, 21.0, 29.0, 23.0, 26.0, 29.0, 38.0, 35.0, 46.0, 38.0, 42.0, 38.0, 35.0, 41.0, 42.0, 32.0, 32.0, 34.0, 21.0, 36.0, 30.0, 33.0, 18.0, 23.0, 20.0, 16.0, 28.0, 13.0, 13.0, 11.0, 6.0, 7.0, 1.0, 7.0, 5.0, 4.0, 0.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0], "bins": [-2.939453125, -2.848785400390625, -2.75811767578125, -2.667449951171875, -2.5767822265625, -2.486114501953125, -2.39544677734375, -2.304779052734375, -2.214111328125, -2.123443603515625, -2.03277587890625, -1.942108154296875, -1.8514404296875, -1.760772705078125, -1.67010498046875, -1.579437255859375, -1.48876953125, -1.398101806640625, -1.30743408203125, -1.216766357421875, -1.1260986328125, -1.035430908203125, -0.94476318359375, -0.854095458984375, -0.763427734375, -0.672760009765625, -0.58209228515625, -0.491424560546875, -0.4007568359375, -0.310089111328125, -0.21942138671875, -0.128753662109375, -0.0380859375, 0.052581787109375, 0.14324951171875, 0.233917236328125, 0.3245849609375, 0.415252685546875, 0.50592041015625, 0.596588134765625, 0.687255859375, 0.777923583984375, 0.86859130859375, 0.959259033203125, 1.0499267578125, 1.140594482421875, 1.23126220703125, 1.321929931640625, 1.41259765625, 1.503265380859375, 1.59393310546875, 1.684600830078125, 1.7752685546875, 1.865936279296875, 1.95660400390625, 2.047271728515625, 2.137939453125, 2.228607177734375, 2.31927490234375, 2.409942626953125, 2.5006103515625, 2.591278076171875, 2.68194580078125, 2.772613525390625, 2.86328125]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 6.0, 5.0, 4.0, 9.0, 10.0, 12.0, 24.0, 27.0, 44.0, 37.0, 71.0, 76.0, 110.0, 139.0, 158.0, 220.0, 282.0, 371.0, 524.0, 846.0, 1393.0, 2520.0, 5282.0, 13505.0, 47669.0, 233753.0, 540339.0, 147761.0, 32983.0, 10090.0, 4219.0, 2134.0, 1214.0, 723.0, 499.0, 337.0, 261.0, 233.0, 149.0, 120.0, 93.0, 66.0, 64.0, 52.0, 31.0, 29.0, 21.0, 16.0, 11.0, 8.0, 1.0, 5.0, 2.0, 1.0, 5.0, 1.0, 0.0, 2.0], "bins": [-5.21484375, -5.0537109375, -4.892578125, -4.7314453125, -4.5703125, -4.4091796875, -4.248046875, -4.0869140625, -3.92578125, -3.7646484375, -3.603515625, -3.4423828125, -3.28125, -3.1201171875, -2.958984375, -2.7978515625, -2.63671875, -2.4755859375, -2.314453125, -2.1533203125, -1.9921875, -1.8310546875, -1.669921875, -1.5087890625, -1.34765625, -1.1865234375, -1.025390625, -0.8642578125, -0.703125, -0.5419921875, -0.380859375, -0.2197265625, -0.05859375, 0.1025390625, 0.263671875, 0.4248046875, 0.5859375, 0.7470703125, 0.908203125, 1.0693359375, 1.23046875, 1.3916015625, 1.552734375, 1.7138671875, 1.875, 2.0361328125, 2.197265625, 2.3583984375, 2.51953125, 2.6806640625, 2.841796875, 3.0029296875, 3.1640625, 3.3251953125, 3.486328125, 3.6474609375, 3.80859375, 3.9697265625, 4.130859375, 4.2919921875, 4.453125, 4.6142578125, 4.775390625, 4.9365234375, 5.09765625]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 2.0, 4.0, 5.0, 3.0, 6.0, 8.0, 8.0, 14.0, 11.0, 22.0, 27.0, 27.0, 27.0, 43.0, 42.0, 49.0, 64.0, 144.0, 321.0, 1536.0, 222.0, 91.0, 80.0, 50.0, 52.0, 35.0, 29.0, 28.0, 21.0, 23.0, 14.0, 12.0, 7.0, 9.0, 6.0, 4.0, 3.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.7890625, -9.4957275390625, -9.202392578125, -8.9090576171875, -8.61572265625, -8.3223876953125, -8.029052734375, -7.7357177734375, -7.4423828125, -7.1490478515625, -6.855712890625, -6.5623779296875, -6.26904296875, -5.9757080078125, -5.682373046875, -5.3890380859375, -5.095703125, -4.8023681640625, -4.509033203125, -4.2156982421875, -3.92236328125, -3.6290283203125, -3.335693359375, -3.0423583984375, -2.7490234375, -2.4556884765625, -2.162353515625, -1.8690185546875, -1.57568359375, -1.2823486328125, -0.989013671875, -0.6956787109375, -0.40234375, -0.1090087890625, 0.184326171875, 0.4776611328125, 0.77099609375, 1.0643310546875, 1.357666015625, 1.6510009765625, 1.9443359375, 2.2376708984375, 2.531005859375, 2.8243408203125, 3.11767578125, 3.4110107421875, 3.704345703125, 3.9976806640625, 4.291015625, 4.5843505859375, 4.877685546875, 5.1710205078125, 5.46435546875, 5.7576904296875, 6.051025390625, 6.3443603515625, 6.6376953125, 6.9310302734375, 7.224365234375, 7.5177001953125, 7.81103515625, 8.1043701171875, 8.397705078125, 8.6910400390625, 8.984375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 4.0, 8.0, 10.0, 10.0, 21.0, 15.0, 31.0, 39.0, 50.0, 54.0, 99.0, 164.0, 253.0, 401.0, 784.0, 3283.0, 2860629.0, 276112.0, 2089.0, 634.0, 363.0, 179.0, 126.0, 97.0, 55.0, 52.0, 33.0, 20.0, 30.0, 23.0, 7.0, 9.0, 6.0, 5.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-16.953125, -16.322509765625, -15.69189453125, -15.061279296875, -14.4306640625, -13.800048828125, -13.16943359375, -12.538818359375, -11.908203125, -11.277587890625, -10.64697265625, -10.016357421875, -9.3857421875, -8.755126953125, -8.12451171875, -7.493896484375, -6.86328125, -6.232666015625, -5.60205078125, -4.971435546875, -4.3408203125, -3.710205078125, -3.07958984375, -2.448974609375, -1.818359375, -1.187744140625, -0.55712890625, 0.073486328125, 0.7041015625, 1.334716796875, 1.96533203125, 2.595947265625, 3.2265625, 3.857177734375, 4.48779296875, 5.118408203125, 5.7490234375, 6.379638671875, 7.01025390625, 7.640869140625, 8.271484375, 8.902099609375, 9.53271484375, 10.163330078125, 10.7939453125, 11.424560546875, 12.05517578125, 12.685791015625, 13.31640625, 13.947021484375, 14.57763671875, 15.208251953125, 15.8388671875, 16.469482421875, 17.10009765625, 17.730712890625, 18.361328125, 18.991943359375, 19.62255859375, 20.253173828125, 20.8837890625, 21.514404296875, 22.14501953125, 22.775634765625, 23.40625]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 5.0, 219.0, 731.0, 58.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.713550567626953, -16.55266761779785, -13.391783714294434, -10.230899810791016, -7.070016860961914, -3.9091339111328125, -0.7482490539550781, 2.4126338958740234, 5.573516845703125, 8.734399795532227, 11.895283699035645, 15.056167602539062, 18.217050552368164, 21.377933502197266, 24.538818359375, 27.6997013092041, 30.860584259033203, 34.02146911621094, 37.182350158691406, 40.34323501586914, 43.504119873046875, 46.665000915527344, 49.82588577270508, 52.98677062988281, 56.14765167236328, 59.308536529541016, 62.469417572021484, 65.63030242919922, 68.79118347167969, 71.95207214355469, 75.11295318603516, 78.27383422851562, 81.43472290039062, 84.5956039428711, 87.7564926147461, 90.91737365722656, 94.07825469970703, 97.2391357421875, 100.4000244140625, 103.56090545654297, 106.72178649902344, 109.8826675415039, 113.0435562133789, 116.20443725585938, 119.36531829833984, 122.52619934082031, 125.68708801269531, 128.8479766845703, 132.00885009765625, 135.16973876953125, 138.3306121826172, 141.4915008544922, 144.6523895263672, 147.81326293945312, 150.97415161132812, 154.13504028320312, 157.29592895507812, 160.45681762695312, 163.61769104003906, 166.77857971191406, 169.93946838378906, 173.100341796875, 176.26123046875, 179.422119140625, 182.58299255371094]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 4.0, 6.0, 6.0, 4.0, 8.0, 8.0, 5.0, 16.0, 7.0, 6.0, 16.0, 14.0, 19.0, 28.0, 18.0, 28.0, 18.0, 31.0, 32.0, 31.0, 37.0, 31.0, 26.0, 40.0, 30.0, 34.0, 51.0, 32.0, 37.0, 31.0, 35.0, 35.0, 36.0, 21.0, 24.0, 24.0, 28.0, 19.0, 21.0, 15.0, 12.0, 14.0, 14.0, 8.0, 5.0, 15.0, 10.0, 5.0, 4.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-13.828346252441406, -13.355687141418457, -12.883027076721191, -12.410367965698242, -11.937707901000977, -11.465048789978027, -10.992389678955078, -10.519729614257812, -10.047070503234863, -9.574411392211914, -9.101751327514648, -8.6290922164917, -8.15643310546875, -7.683773040771484, -7.211113929748535, -6.738454341888428, -6.26579475402832, -5.793135166168213, -5.3204755783081055, -4.847816467285156, -4.375156879425049, -3.9024972915649414, -3.429837942123413, -2.9571785926818848, -2.4845190048217773, -2.01185941696167, -1.5392000675201416, -1.0665405988693237, -0.5938811302185059, -0.12122154235839844, 0.3514378070831299, 0.8240971565246582, 1.2967567443847656, 1.7694162130355835, 2.2420756816864014, 2.7147350311279297, 3.187394618988037, 3.6600542068481445, 4.132713317871094, 4.605372905731201, 5.078032493591309, 5.550692081451416, 6.023351669311523, 6.496010780334473, 6.96867036819458, 7.4413299560546875, 7.913989067077637, 8.386648178100586, 8.859308242797852, 9.3319673538208, 9.804627418518066, 10.277286529541016, 10.749946594238281, 11.22260570526123, 11.69526481628418, 12.167924880981445, 12.640583992004395, 13.113243103027344, 13.58590316772461, 14.058562278747559, 14.531221389770508, 15.003881454467773, 15.476540565490723, 15.949199676513672, 16.421859741210938]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 2.0, 1.0, 3.0, 6.0, 7.0, 7.0, 5.0, 10.0, 12.0, 12.0, 14.0, 14.0, 18.0, 22.0, 32.0, 28.0, 36.0, 28.0, 34.0, 34.0, 36.0, 39.0, 45.0, 42.0, 39.0, 40.0, 35.0, 40.0, 34.0, 29.0, 34.0, 26.0, 38.0, 28.0, 20.0, 22.0, 22.0, 18.0, 18.0, 13.0, 14.0, 9.0, 15.0, 3.0, 3.0, 6.0, 4.0, 6.0, 2.0, 2.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.421875, -3.3170166015625, -3.212158203125, -3.1072998046875, -3.00244140625, -2.8975830078125, -2.792724609375, -2.6878662109375, -2.5830078125, -2.4781494140625, -2.373291015625, -2.2684326171875, -2.16357421875, -2.0587158203125, -1.953857421875, -1.8489990234375, -1.744140625, -1.6392822265625, -1.534423828125, -1.4295654296875, -1.32470703125, -1.2198486328125, -1.114990234375, -1.0101318359375, -0.9052734375, -0.8004150390625, -0.695556640625, -0.5906982421875, -0.48583984375, -0.3809814453125, -0.276123046875, -0.1712646484375, -0.06640625, 0.0384521484375, 0.143310546875, 0.2481689453125, 0.35302734375, 0.4578857421875, 0.562744140625, 0.6676025390625, 0.7724609375, 0.8773193359375, 0.982177734375, 1.0870361328125, 1.19189453125, 1.2967529296875, 1.401611328125, 1.5064697265625, 1.611328125, 1.7161865234375, 1.821044921875, 1.9259033203125, 2.03076171875, 2.1356201171875, 2.240478515625, 2.3453369140625, 2.4501953125, 2.5550537109375, 2.659912109375, 2.7647705078125, 2.86962890625, 2.9744873046875, 3.079345703125, 3.1842041015625, 3.2890625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 3.0, 6.0, 9.0, 10.0, 12.0, 19.0, 22.0, 27.0, 26.0, 42.0, 48.0, 83.0, 108.0, 141.0, 204.0, 282.0, 432.0, 708.0, 1316.0, 3583.0, 18743.0, 438419.0, 3517771.0, 193720.0, 12628.0, 2774.0, 1093.0, 635.0, 427.0, 272.0, 187.0, 132.0, 97.0, 74.0, 55.0, 50.0, 33.0, 23.0, 18.0, 14.0, 14.0, 9.0, 3.0, 6.0, 2.0, 5.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-19.5625, -18.993896484375, -18.42529296875, -17.856689453125, -17.2880859375, -16.719482421875, -16.15087890625, -15.582275390625, -15.013671875, -14.445068359375, -13.87646484375, -13.307861328125, -12.7392578125, -12.170654296875, -11.60205078125, -11.033447265625, -10.46484375, -9.896240234375, -9.32763671875, -8.759033203125, -8.1904296875, -7.621826171875, -7.05322265625, -6.484619140625, -5.916015625, -5.347412109375, -4.77880859375, -4.210205078125, -3.6416015625, -3.072998046875, -2.50439453125, -1.935791015625, -1.3671875, -0.798583984375, -0.22998046875, 0.338623046875, 0.9072265625, 1.475830078125, 2.04443359375, 2.613037109375, 3.181640625, 3.750244140625, 4.31884765625, 4.887451171875, 5.4560546875, 6.024658203125, 6.59326171875, 7.161865234375, 7.73046875, 8.299072265625, 8.86767578125, 9.436279296875, 10.0048828125, 10.573486328125, 11.14208984375, 11.710693359375, 12.279296875, 12.847900390625, 13.41650390625, 13.985107421875, 14.5537109375, 15.122314453125, 15.69091796875, 16.259521484375, 16.828125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 4.0, 5.0, 2.0, 6.0, 8.0, 12.0, 10.0, 23.0, 24.0, 37.0, 40.0, 75.0, 75.0, 140.0, 182.0, 294.0, 429.0, 534.0, 576.0, 503.0, 336.0, 244.0, 158.0, 115.0, 75.0, 38.0, 41.0, 27.0, 11.0, 20.0, 11.0, 8.0, 7.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.55859375, -7.30072021484375, -7.0428466796875, -6.78497314453125, -6.527099609375, -6.26922607421875, -6.0113525390625, -5.75347900390625, -5.49560546875, -5.23773193359375, -4.9798583984375, -4.72198486328125, -4.464111328125, -4.20623779296875, -3.9483642578125, -3.69049072265625, -3.4326171875, -3.17474365234375, -2.9168701171875, -2.65899658203125, -2.401123046875, -2.14324951171875, -1.8853759765625, -1.62750244140625, -1.36962890625, -1.11175537109375, -0.8538818359375, -0.59600830078125, -0.338134765625, -0.08026123046875, 0.1776123046875, 0.43548583984375, 0.693359375, 0.95123291015625, 1.2091064453125, 1.46697998046875, 1.724853515625, 1.98272705078125, 2.2406005859375, 2.49847412109375, 2.75634765625, 3.01422119140625, 3.2720947265625, 3.52996826171875, 3.787841796875, 4.04571533203125, 4.3035888671875, 4.56146240234375, 4.8193359375, 5.07720947265625, 5.3350830078125, 5.59295654296875, 5.850830078125, 6.10870361328125, 6.3665771484375, 6.62445068359375, 6.88232421875, 7.14019775390625, 7.3980712890625, 7.65594482421875, 7.913818359375, 8.17169189453125, 8.4295654296875, 8.68743896484375, 8.9453125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 3.0, 2.0, 8.0, 12.0, 11.0, 14.0, 18.0, 42.0, 74.0, 94.0, 166.0, 250.0, 431.0, 758.0, 1233.0, 2474.0, 4935.0, 10732.0, 26564.0, 76573.0, 278134.0, 1266117.0, 1881156.0, 463519.0, 116112.0, 37096.0, 14469.0, 6342.0, 3170.0, 1533.0, 882.0, 523.0, 311.0, 185.0, 107.0, 87.0, 56.0, 32.0, 19.0, 10.0, 12.0, 7.0, 6.0, 2.0, 5.0, 3.0, 4.0], "bins": [-6.6875, -6.51678466796875, -6.3460693359375, -6.17535400390625, -6.004638671875, -5.83392333984375, -5.6632080078125, -5.49249267578125, -5.32177734375, -5.15106201171875, -4.9803466796875, -4.80963134765625, -4.638916015625, -4.46820068359375, -4.2974853515625, -4.12677001953125, -3.9560546875, -3.78533935546875, -3.6146240234375, -3.44390869140625, -3.273193359375, -3.10247802734375, -2.9317626953125, -2.76104736328125, -2.59033203125, -2.41961669921875, -2.2489013671875, -2.07818603515625, -1.907470703125, -1.73675537109375, -1.5660400390625, -1.39532470703125, -1.224609375, -1.05389404296875, -0.8831787109375, -0.71246337890625, -0.541748046875, -0.37103271484375, -0.2003173828125, -0.02960205078125, 0.14111328125, 0.31182861328125, 0.4825439453125, 0.65325927734375, 0.823974609375, 0.99468994140625, 1.1654052734375, 1.33612060546875, 1.5068359375, 1.67755126953125, 1.8482666015625, 2.01898193359375, 2.189697265625, 2.36041259765625, 2.5311279296875, 2.70184326171875, 2.87255859375, 3.04327392578125, 3.2139892578125, 3.38470458984375, 3.555419921875, 3.72613525390625, 3.8968505859375, 4.06756591796875, 4.23828125]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 4.0, 4.0, 4.0, 5.0, 5.0, 9.0, 6.0, 11.0, 16.0, 20.0, 24.0, 39.0, 40.0, 38.0, 52.0, 65.0, 61.0, 81.0, 62.0, 82.0, 68.0, 64.0, 46.0, 49.0, 39.0, 28.0, 26.0, 15.0, 16.0, 8.0, 8.0, 6.0, 2.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-43.69527816772461, -42.381736755371094, -41.06819534301758, -39.75465393066406, -38.44111251831055, -37.12757110595703, -35.814029693603516, -34.50048828125, -33.186946868896484, -31.87340545654297, -30.559864044189453, -29.246322631835938, -27.932781219482422, -26.619239807128906, -25.30569839477539, -23.992156982421875, -22.67861557006836, -21.365074157714844, -20.051532745361328, -18.737991333007812, -17.424449920654297, -16.11090850830078, -14.797367095947266, -13.48382568359375, -12.170284271240234, -10.856742858886719, -9.543201446533203, -8.229660034179688, -6.916118621826172, -5.602577209472656, -4.289035797119141, -2.975494384765625, -1.6619529724121094, -0.34841156005859375, 0.9651298522949219, 2.2786712646484375, 3.592212677001953, 4.905754089355469, 6.219295501708984, 7.5328369140625, 8.846378326416016, 10.159919738769531, 11.473461151123047, 12.787002563476562, 14.100543975830078, 15.414085388183594, 16.72762680053711, 18.041168212890625, 19.35470962524414, 20.668251037597656, 21.981792449951172, 23.295333862304688, 24.608875274658203, 25.92241668701172, 27.235958099365234, 28.54949951171875, 29.863040924072266, 31.17658233642578, 32.4901237487793, 33.80366516113281, 35.11720657348633, 36.430747985839844, 37.74428939819336, 39.057830810546875, 40.37137222290039]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 7.0, 9.0, 10.0, 15.0, 21.0, 22.0, 23.0, 26.0, 23.0, 38.0, 46.0, 46.0, 43.0, 40.0, 48.0, 53.0, 45.0, 55.0, 32.0, 42.0, 50.0, 34.0, 43.0, 36.0, 32.0, 29.0, 23.0, 20.0, 13.0, 23.0, 13.0, 11.0, 8.0, 4.0, 3.0, 5.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.803714752197266, -37.73438262939453, -36.6650505065918, -35.59571838378906, -34.52638244628906, -33.45705032348633, -32.387718200683594, -31.31838607788086, -30.249053955078125, -29.17972183227539, -28.110387802124023, -27.04105567932129, -25.971723556518555, -24.902389526367188, -23.833057403564453, -22.76372528076172, -21.69439125061035, -20.625059127807617, -19.55572509765625, -18.486392974853516, -17.41706085205078, -16.347728729248047, -15.27839469909668, -14.209062576293945, -13.139729499816895, -12.070396423339844, -11.00106430053711, -9.931731224060059, -8.862398147583008, -7.793066024780273, -6.723732948303223, -5.65440034866333, -4.58506965637207, -3.5157370567321777, -2.446404218673706, -1.3770713806152344, -0.3077387809753418, 0.7615938186645508, 1.8309268951416016, 2.900259494781494, 3.9695920944213867, 5.038924694061279, 6.108257293701172, 7.177590370178223, 8.246923446655273, 9.316255569458008, 10.385588645935059, 11.45492172241211, 12.524253845214844, 13.593586921691895, 14.662919044494629, 15.73225212097168, 16.801584243774414, 17.87091827392578, 18.940250396728516, 20.00958251953125, 21.078914642333984, 22.14824676513672, 23.217580795288086, 24.28691291809082, 25.356245040893555, 26.425579071044922, 27.494911193847656, 28.56424331665039, 29.633577346801758]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 11.0, 11.0, 8.0, 12.0, 21.0, 21.0, 13.0, 22.0, 32.0, 29.0, 30.0, 35.0, 36.0, 36.0, 49.0, 46.0, 43.0, 50.0, 43.0, 40.0, 52.0, 34.0, 43.0, 34.0, 35.0, 37.0, 24.0, 23.0, 27.0, 22.0, 16.0, 19.0, 9.0, 11.0, 11.0, 5.0, 4.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-61.0, -59.29638671875, -57.5927734375, -55.88916015625, -54.185546875, -52.48193359375, -50.7783203125, -49.07470703125, -47.37109375, -45.66748046875, -43.9638671875, -42.26025390625, -40.556640625, -38.85302734375, -37.1494140625, -35.44580078125, -33.7421875, -32.03857421875, -30.3349609375, -28.63134765625, -26.927734375, -25.22412109375, -23.5205078125, -21.81689453125, -20.11328125, -18.40966796875, -16.7060546875, -15.00244140625, -13.298828125, -11.59521484375, -9.8916015625, -8.18798828125, -6.484375, -4.78076171875, -3.0771484375, -1.37353515625, 0.330078125, 2.03369140625, 3.7373046875, 5.44091796875, 7.14453125, 8.84814453125, 10.5517578125, 12.25537109375, 13.958984375, 15.66259765625, 17.3662109375, 19.06982421875, 20.7734375, 22.47705078125, 24.1806640625, 25.88427734375, 27.587890625, 29.29150390625, 30.9951171875, 32.69873046875, 34.40234375, 36.10595703125, 37.8095703125, 39.51318359375, 41.216796875, 42.92041015625, 44.6240234375, 46.32763671875, 48.03125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 3.0, 6.0, 12.0, 18.0, 19.0, 38.0, 59.0, 84.0, 124.0, 167.0, 238.0, 367.0, 484.0, 706.0, 1052.0, 1577.0, 2293.0, 3493.0, 5232.0, 8359.0, 12716.0, 19970.0, 31785.0, 51304.0, 82083.0, 128609.0, 182123.0, 177637.0, 124464.0, 78577.0, 49163.0, 30494.0, 19447.0, 12334.0, 7999.0, 5022.0, 3461.0, 2196.0, 1575.0, 1008.0, 665.0, 465.0, 365.0, 226.0, 158.0, 130.0, 85.0, 60.0, 38.0, 26.0, 17.0, 9.0, 9.0, 7.0, 3.0, 3.0], "bins": [-3.888671875, -3.777435302734375, -3.66619873046875, -3.554962158203125, -3.4437255859375, -3.332489013671875, -3.22125244140625, -3.110015869140625, -2.998779296875, -2.887542724609375, -2.77630615234375, -2.665069580078125, -2.5538330078125, -2.442596435546875, -2.33135986328125, -2.220123291015625, -2.10888671875, -1.997650146484375, -1.88641357421875, -1.775177001953125, -1.6639404296875, -1.552703857421875, -1.44146728515625, -1.330230712890625, -1.218994140625, -1.107757568359375, -0.99652099609375, -0.885284423828125, -0.7740478515625, -0.662811279296875, -0.55157470703125, -0.440338134765625, -0.3291015625, -0.217864990234375, -0.10662841796875, 0.004608154296875, 0.1158447265625, 0.227081298828125, 0.33831787109375, 0.449554443359375, 0.560791015625, 0.672027587890625, 0.78326416015625, 0.894500732421875, 1.0057373046875, 1.116973876953125, 1.22821044921875, 1.339447021484375, 1.45068359375, 1.561920166015625, 1.67315673828125, 1.784393310546875, 1.8956298828125, 2.006866455078125, 2.11810302734375, 2.229339599609375, 2.340576171875, 2.451812744140625, 2.56304931640625, 2.674285888671875, 2.7855224609375, 2.896759033203125, 3.00799560546875, 3.119232177734375, 3.23046875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 5.0, 6.0, 8.0, 13.0, 7.0, 3.0, 6.0, 17.0, 12.0, 18.0, 16.0, 28.0, 28.0, 20.0, 22.0, 28.0, 29.0, 36.0, 36.0, 38.0, 37.0, 45.0, 1070.0, 42.0, 47.0, 32.0, 40.0, 34.0, 43.0, 31.0, 24.0, 38.0, 19.0, 28.0, 21.0, 25.0, 16.0, 12.0, 9.0, 8.0, 8.0, 5.0, 6.0, 5.0, 2.0, 4.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-28.15625, -27.218994140625, -26.28173828125, -25.344482421875, -24.4072265625, -23.469970703125, -22.53271484375, -21.595458984375, -20.658203125, -19.720947265625, -18.78369140625, -17.846435546875, -16.9091796875, -15.971923828125, -15.03466796875, -14.097412109375, -13.16015625, -12.222900390625, -11.28564453125, -10.348388671875, -9.4111328125, -8.473876953125, -7.53662109375, -6.599365234375, -5.662109375, -4.724853515625, -3.78759765625, -2.850341796875, -1.9130859375, -0.975830078125, -0.03857421875, 0.898681640625, 1.8359375, 2.773193359375, 3.71044921875, 4.647705078125, 5.5849609375, 6.522216796875, 7.45947265625, 8.396728515625, 9.333984375, 10.271240234375, 11.20849609375, 12.145751953125, 13.0830078125, 14.020263671875, 14.95751953125, 15.894775390625, 16.83203125, 17.769287109375, 18.70654296875, 19.643798828125, 20.5810546875, 21.518310546875, 22.45556640625, 23.392822265625, 24.330078125, 25.267333984375, 26.20458984375, 27.141845703125, 28.0791015625, 29.016357421875, 29.95361328125, 30.890869140625, 31.828125]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 11.0, 11.0, 15.0, 39.0, 52.0, 77.0, 109.0, 180.0, 240.0, 363.0, 535.0, 843.0, 1198.0, 1724.0, 2580.0, 3804.0, 5631.0, 8525.0, 12363.0, 18277.0, 26508.0, 39914.0, 61740.0, 94770.0, 142652.0, 1220102.0, 153629.0, 102210.0, 66164.0, 43622.0, 29099.0, 19735.0, 13036.0, 8897.0, 5982.0, 4060.0, 2810.0, 1809.0, 1228.0, 872.0, 581.0, 369.0, 279.0, 171.0, 107.0, 70.0, 49.0, 38.0, 21.0, 13.0, 8.0, 7.0, 5.0, 4.0, 2.0], "bins": [-3.392578125, -3.29449462890625, -3.1964111328125, -3.09832763671875, -3.000244140625, -2.90216064453125, -2.8040771484375, -2.70599365234375, -2.60791015625, -2.50982666015625, -2.4117431640625, -2.31365966796875, -2.215576171875, -2.11749267578125, -2.0194091796875, -1.92132568359375, -1.8232421875, -1.72515869140625, -1.6270751953125, -1.52899169921875, -1.430908203125, -1.33282470703125, -1.2347412109375, -1.13665771484375, -1.03857421875, -0.94049072265625, -0.8424072265625, -0.74432373046875, -0.646240234375, -0.54815673828125, -0.4500732421875, -0.35198974609375, -0.25390625, -0.15582275390625, -0.0577392578125, 0.04034423828125, 0.138427734375, 0.23651123046875, 0.3345947265625, 0.43267822265625, 0.53076171875, 0.62884521484375, 0.7269287109375, 0.82501220703125, 0.923095703125, 1.02117919921875, 1.1192626953125, 1.21734619140625, 1.3154296875, 1.41351318359375, 1.5115966796875, 1.60968017578125, 1.707763671875, 1.80584716796875, 1.9039306640625, 2.00201416015625, 2.10009765625, 2.19818115234375, 2.2962646484375, 2.39434814453125, 2.492431640625, 2.59051513671875, 2.6885986328125, 2.78668212890625, 2.884765625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 10.0, 10.0, 16.0, 17.0, 17.0, 27.0, 27.0, 16.0, 26.0, 31.0, 34.0, 32.0, 39.0, 64.0, 80.0, 108.0, 98.0, 72.0, 42.0, 27.0, 39.0, 22.0, 20.0, 22.0, 17.0, 12.0, 15.0, 11.0, 5.0, 9.0, 6.0, 3.0, 8.0, 3.0, 4.0, 0.0, 3.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0848388671875, -0.08196353912353516, -0.07908821105957031, -0.07621288299560547, -0.07333755493164062, -0.07046222686767578, -0.06758689880371094, -0.0647115707397461, -0.06183624267578125, -0.058960914611816406, -0.05608558654785156, -0.05321025848388672, -0.050334930419921875, -0.04745960235595703, -0.04458427429199219, -0.041708946228027344, -0.0388336181640625, -0.035958290100097656, -0.03308296203613281, -0.03020763397216797, -0.027332305908203125, -0.02445697784423828, -0.021581649780273438, -0.018706321716308594, -0.01583099365234375, -0.012955665588378906, -0.010080337524414062, -0.007205009460449219, -0.004329681396484375, -0.0014543533325195312, 0.0014209747314453125, 0.004296302795410156, 0.007171630859375, 0.010046958923339844, 0.012922286987304688, 0.01579761505126953, 0.018672943115234375, 0.02154827117919922, 0.024423599243164062, 0.027298927307128906, 0.03017425537109375, 0.033049583435058594, 0.03592491149902344, 0.03880023956298828, 0.041675567626953125, 0.04455089569091797, 0.04742622375488281, 0.050301551818847656, 0.0531768798828125, 0.056052207946777344, 0.05892753601074219, 0.06180286407470703, 0.06467819213867188, 0.06755352020263672, 0.07042884826660156, 0.0733041763305664, 0.07617950439453125, 0.0790548324584961, 0.08193016052246094, 0.08480548858642578, 0.08768081665039062, 0.09055614471435547, 0.09343147277832031, 0.09630680084228516, 0.09918212890625]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 4.0, 7.0, 6.0, 14.0, 18.0, 19.0, 28.0, 40.0, 50.0, 50.0, 88.0, 117.0, 162.0, 230.0, 391.0, 711.0, 1326.0, 3074.0, 7161.0, 18687.0, 54156.0, 186007.0, 540865.0, 159054.0, 47203.0, 16535.0, 6506.0, 2855.0, 1298.0, 630.0, 402.0, 222.0, 169.0, 112.0, 112.0, 65.0, 45.0, 38.0, 25.0, 14.0, 18.0, 11.0, 6.0, 6.0, 6.0, 4.0, 5.0, 2.0, 3.0, 2.0, 4.0, 1.0], "bins": [-0.53515625, -0.5196189880371094, -0.5040817260742188, -0.4885444641113281, -0.4730072021484375, -0.4574699401855469, -0.44193267822265625, -0.4263954162597656, -0.410858154296875, -0.3953208923339844, -0.37978363037109375, -0.3642463684082031, -0.3487091064453125, -0.3331718444824219, -0.31763458251953125, -0.3020973205566406, -0.28656005859375, -0.2710227966308594, -0.25548553466796875, -0.23994827270507812, -0.2244110107421875, -0.20887374877929688, -0.19333648681640625, -0.17779922485351562, -0.162261962890625, -0.14672470092773438, -0.13118743896484375, -0.11565017700195312, -0.1001129150390625, -0.08457565307617188, -0.06903839111328125, -0.053501129150390625, -0.0379638671875, -0.022426605224609375, -0.00688934326171875, 0.008647918701171875, 0.0241851806640625, 0.039722442626953125, 0.05525970458984375, 0.07079696655273438, 0.086334228515625, 0.10187149047851562, 0.11740875244140625, 0.13294601440429688, 0.1484832763671875, 0.16402053833007812, 0.17955780029296875, 0.19509506225585938, 0.21063232421875, 0.22616958618164062, 0.24170684814453125, 0.2572441101074219, 0.2727813720703125, 0.2883186340332031, 0.30385589599609375, 0.3193931579589844, 0.334930419921875, 0.3504676818847656, 0.36600494384765625, 0.3815422058105469, 0.3970794677734375, 0.4126167297363281, 0.42815399169921875, 0.4436912536621094, 0.459228515625]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 1.0, 2.0, 5.0, 2.0, 6.0, 10.0, 25.0, 25.0, 44.0, 63.0, 105.0, 137.0, 150.0, 140.0, 124.0, 73.0, 45.0, 24.0, 13.0, 7.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.2371276617050171, -0.23265095055103302, -0.22817422449588776, -0.2236975133419037, -0.21922078728675842, -0.21474407613277435, -0.21026736497879028, -0.20579063892364502, -0.20131392776966095, -0.19683721661567688, -0.19236049056053162, -0.18788377940654755, -0.18340706825256348, -0.1789303421974182, -0.17445363104343414, -0.16997691988945007, -0.1655001938343048, -0.16102348268032074, -0.15654675662517548, -0.1520700454711914, -0.14759331941604614, -0.14311660826206207, -0.138639897108078, -0.13416317105293274, -0.12968645989894867, -0.1252097487449646, -0.12073302268981934, -0.11625631153583527, -0.1117795929312706, -0.10730287432670593, -0.10282616317272186, -0.0983494445681572, -0.09387273341417313, -0.08939601480960846, -0.08491930365562439, -0.08044258505105972, -0.07596586644649506, -0.07148914784193039, -0.06701242923736572, -0.06253571808338165, -0.058058999478816986, -0.05358228087425232, -0.04910556599497795, -0.04462885111570358, -0.040152132511138916, -0.03567541390657425, -0.03119869902729988, -0.026721984148025513, -0.022245265543460846, -0.01776854880154133, -0.013291832059621811, -0.008815115317702293, -0.004338398575782776, 0.00013831816613674164, 0.004615034908056259, 0.009091749787330627, 0.013568468391895294, 0.01804518513381481, 0.02252190187573433, 0.026998618617653847, 0.031475335359573364, 0.03595205396413803, 0.0404287688434124, 0.04490548372268677, 0.049382202327251434]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 2.0, 5.0, 6.0, 9.0, 8.0, 6.0, 9.0, 9.0, 13.0, 15.0, 13.0, 26.0, 22.0, 22.0, 18.0, 37.0, 45.0, 38.0, 26.0, 32.0, 31.0, 41.0, 43.0, 35.0, 37.0, 46.0, 44.0, 38.0, 30.0, 37.0, 34.0, 21.0, 33.0, 32.0, 18.0, 25.0, 16.0, 14.0, 17.0, 12.0, 10.0, 2.0, 5.0, 4.0, 9.0, 0.0, 9.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.05851620435714722, -0.056768614798784256, -0.055021025240421295, -0.053273435682058334, -0.051525846123695374, -0.04977825656533241, -0.04803066700696945, -0.04628307744860649, -0.04453548789024353, -0.04278789833188057, -0.04104030877351761, -0.03929271921515465, -0.03754512965679169, -0.035797540098428726, -0.034049950540065765, -0.032302360981702805, -0.030554771423339844, -0.028807181864976883, -0.027059592306613922, -0.02531200274825096, -0.023564413189888, -0.02181682363152504, -0.02006923407316208, -0.018321644514799118, -0.016574054956436157, -0.014826465398073196, -0.013078875839710236, -0.011331286281347275, -0.009583696722984314, -0.007836107164621353, -0.006088517606258392, -0.0043409280478954315, -0.0025933384895324707, -0.0008457489311695099, 0.0009018406271934509, 0.0026494301855564117, 0.0043970197439193726, 0.006144609302282333, 0.007892198860645294, 0.009639788419008255, 0.011387377977371216, 0.013134967535734177, 0.014882557094097137, 0.0166301466524601, 0.01837773621082306, 0.02012532576918602, 0.02187291532754898, 0.02362050488591194, 0.025368094444274902, 0.027115684002637863, 0.028863273561000824, 0.030610863119363785, 0.032358452677726746, 0.034106042236089706, 0.03585363179445267, 0.03760122135281563, 0.03934881091117859, 0.04109640046954155, 0.04284399002790451, 0.04459157958626747, 0.04633916914463043, 0.04808675870299339, 0.049834348261356354, 0.051581937819719315, 0.053329527378082275]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 11.0, 11.0, 7.0, 12.0, 22.0, 21.0, 14.0, 23.0, 29.0, 34.0, 26.0, 35.0, 38.0, 35.0, 48.0, 47.0, 39.0, 52.0, 43.0, 41.0, 53.0, 34.0, 42.0, 39.0, 32.0, 40.0, 23.0, 21.0, 26.0, 22.0, 16.0, 18.0, 10.0, 10.0, 11.0, 5.0, 4.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-61.125, -59.4169921875, -57.708984375, -56.0009765625, -54.29296875, -52.5849609375, -50.876953125, -49.1689453125, -47.4609375, -45.7529296875, -44.044921875, -42.3369140625, -40.62890625, -38.9208984375, -37.212890625, -35.5048828125, -33.796875, -32.0888671875, -30.380859375, -28.6728515625, -26.96484375, -25.2568359375, -23.548828125, -21.8408203125, -20.1328125, -18.4248046875, -16.716796875, -15.0087890625, -13.30078125, -11.5927734375, -9.884765625, -8.1767578125, -6.46875, -4.7607421875, -3.052734375, -1.3447265625, 0.36328125, 2.0712890625, 3.779296875, 5.4873046875, 7.1953125, 8.9033203125, 10.611328125, 12.3193359375, 14.02734375, 15.7353515625, 17.443359375, 19.1513671875, 20.859375, 22.5673828125, 24.275390625, 25.9833984375, 27.69140625, 29.3994140625, 31.107421875, 32.8154296875, 34.5234375, 36.2314453125, 37.939453125, 39.6474609375, 41.35546875, 43.0634765625, 44.771484375, 46.4794921875, 48.1875]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 7.0, 9.0, 18.0, 20.0, 38.0, 40.0, 50.0, 83.0, 134.0, 220.0, 324.0, 549.0, 1047.0, 1941.0, 4466.0, 13183.0, 50710.0, 260560.0, 537837.0, 133788.0, 28361.0, 8287.0, 3224.0, 1581.0, 815.0, 452.0, 270.0, 182.0, 113.0, 62.0, 59.0, 32.0, 27.0, 16.0, 14.0, 6.0, 8.0, 6.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-12.5703125, -12.2142333984375, -11.858154296875, -11.5020751953125, -11.14599609375, -10.7899169921875, -10.433837890625, -10.0777587890625, -9.7216796875, -9.3656005859375, -9.009521484375, -8.6534423828125, -8.29736328125, -7.9412841796875, -7.585205078125, -7.2291259765625, -6.873046875, -6.5169677734375, -6.160888671875, -5.8048095703125, -5.44873046875, -5.0926513671875, -4.736572265625, -4.3804931640625, -4.0244140625, -3.6683349609375, -3.312255859375, -2.9561767578125, -2.60009765625, -2.2440185546875, -1.887939453125, -1.5318603515625, -1.17578125, -0.8197021484375, -0.463623046875, -0.1075439453125, 0.24853515625, 0.6046142578125, 0.960693359375, 1.3167724609375, 1.6728515625, 2.0289306640625, 2.385009765625, 2.7410888671875, 3.09716796875, 3.4532470703125, 3.809326171875, 4.1654052734375, 4.521484375, 4.8775634765625, 5.233642578125, 5.5897216796875, 5.94580078125, 6.3018798828125, 6.657958984375, 7.0140380859375, 7.3701171875, 7.7261962890625, 8.082275390625, 8.4383544921875, 8.79443359375, 9.1505126953125, 9.506591796875, 9.8626708984375, 10.21875]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 6.0, 4.0, 10.0, 16.0, 12.0, 20.0, 18.0, 15.0, 28.0, 30.0, 28.0, 38.0, 46.0, 66.0, 41.0, 58.0, 1859.0, 287.0, 61.0, 47.0, 55.0, 33.0, 34.0, 31.0, 38.0, 28.0, 39.0, 29.0, 14.0, 15.0, 9.0, 10.0, 6.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-91.3125, -88.771484375, -86.23046875, -83.689453125, -81.1484375, -78.607421875, -76.06640625, -73.525390625, -70.984375, -68.443359375, -65.90234375, -63.361328125, -60.8203125, -58.279296875, -55.73828125, -53.197265625, -50.65625, -48.115234375, -45.57421875, -43.033203125, -40.4921875, -37.951171875, -35.41015625, -32.869140625, -30.328125, -27.787109375, -25.24609375, -22.705078125, -20.1640625, -17.623046875, -15.08203125, -12.541015625, -10.0, -7.458984375, -4.91796875, -2.376953125, 0.1640625, 2.705078125, 5.24609375, 7.787109375, 10.328125, 12.869140625, 15.41015625, 17.951171875, 20.4921875, 23.033203125, 25.57421875, 28.115234375, 30.65625, 33.197265625, 35.73828125, 38.279296875, 40.8203125, 43.361328125, 45.90234375, 48.443359375, 50.984375, 53.525390625, 56.06640625, 58.607421875, 61.1484375, 63.689453125, 66.23046875, 68.771484375, 71.3125]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 2.0, 1.0, 6.0, 7.0, 12.0, 11.0, 6.0, 10.0, 25.0, 36.0, 42.0, 63.0, 105.0, 146.0, 205.0, 309.0, 494.0, 780.0, 1530.0, 3660.0, 17472.0, 176379.0, 2797838.0, 126440.0, 13628.0, 3075.0, 1307.0, 747.0, 480.0, 273.0, 191.0, 122.0, 89.0, 58.0, 38.0, 32.0, 20.0, 13.0, 22.0, 9.0, 5.0, 4.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-14.328125, -13.8572998046875, -13.386474609375, -12.9156494140625, -12.44482421875, -11.9739990234375, -11.503173828125, -11.0323486328125, -10.5615234375, -10.0906982421875, -9.619873046875, -9.1490478515625, -8.67822265625, -8.2073974609375, -7.736572265625, -7.2657470703125, -6.794921875, -6.3240966796875, -5.853271484375, -5.3824462890625, -4.91162109375, -4.4407958984375, -3.969970703125, -3.4991455078125, -3.0283203125, -2.5574951171875, -2.086669921875, -1.6158447265625, -1.14501953125, -0.6741943359375, -0.203369140625, 0.2674560546875, 0.73828125, 1.2091064453125, 1.679931640625, 2.1507568359375, 2.62158203125, 3.0924072265625, 3.563232421875, 4.0340576171875, 4.5048828125, 4.9757080078125, 5.446533203125, 5.9173583984375, 6.38818359375, 6.8590087890625, 7.329833984375, 7.8006591796875, 8.271484375, 8.7423095703125, 9.213134765625, 9.6839599609375, 10.15478515625, 10.6256103515625, 11.096435546875, 11.5672607421875, 12.0380859375, 12.5089111328125, 12.979736328125, 13.4505615234375, 13.92138671875, 14.3922119140625, 14.863037109375, 15.3338623046875, 15.8046875]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 4.0, 5.0, 8.0, 2.0, 9.0, 23.0, 55.0, 97.0, 199.0, 229.0, 178.0, 99.0, 48.0, 17.0, 14.0, 6.0, 4.0, 6.0, 7.0, 0.0, 2.0, 0.0, 2.0], "bins": [-294.8624267578125, -289.0315246582031, -283.20062255859375, -277.36968994140625, -271.5387878417969, -265.7078857421875, -259.8769836425781, -254.04608154296875, -248.2151641845703, -242.38426208496094, -236.5533447265625, -230.72244262695312, -224.89154052734375, -219.0606231689453, -213.22972106933594, -207.3988037109375, -201.56790161132812, -195.73699951171875, -189.9060821533203, -184.07518005371094, -178.2442626953125, -172.41336059570312, -166.58245849609375, -160.75155639648438, -154.92063903808594, -149.08973693847656, -143.25881958007812, -137.42791748046875, -131.59701538085938, -125.76609802246094, -119.93519592285156, -114.10428619384766, -108.27338409423828, -102.44247436523438, -96.611572265625, -90.7806625366211, -84.94975280761719, -79.11884307861328, -73.28793334960938, -67.45703125, -61.626121520996094, -55.79521179199219, -49.96430587768555, -44.133399963378906, -38.302490234375, -32.471580505371094, -26.640674591064453, -20.809768676757812, -14.978858947753906, -9.147951126098633, -3.3170433044433594, 2.513864517211914, 8.344772338867188, 14.175680160522461, 20.006587982177734, 25.837493896484375, 31.66840362548828, 37.49931335449219, 43.33021926879883, 49.16112518310547, 54.992034912109375, 60.82294464111328, 66.65385437011719, 72.48475646972656, 78.31566619873047]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 5.0, 7.0, 11.0, 11.0, 12.0, 18.0, 20.0, 14.0, 27.0, 35.0, 34.0, 28.0, 39.0, 56.0, 51.0, 33.0, 47.0, 55.0, 53.0, 49.0, 45.0, 38.0, 29.0, 46.0, 43.0, 25.0, 24.0, 25.0, 12.0, 20.0, 16.0, 14.0, 5.0, 11.0, 10.0, 7.0, 3.0, 3.0, 2.0, 2.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-109.88785552978516, -106.7261734008789, -103.56449127197266, -100.4028091430664, -97.24111938476562, -94.07943725585938, -90.91775512695312, -87.75607299804688, -84.59439086914062, -81.43270874023438, -78.27102661132812, -75.10934448242188, -71.94766235351562, -68.78597259521484, -65.6242904663086, -62.462608337402344, -59.300926208496094, -56.139244079589844, -52.977561950683594, -49.81587600708008, -46.65419387817383, -43.49251174926758, -40.33082580566406, -37.16914367675781, -34.00746154785156, -30.845779418945312, -27.68409538269043, -24.522411346435547, -21.360729217529297, -18.199047088623047, -15.037363052368164, -11.875679016113281, -8.7139892578125, -5.552306175231934, -2.390623092651367, 0.7710599899291992, 3.9327430725097656, 7.094426155090332, 10.256109237670898, 13.417793273925781, 16.57947540283203, 19.74115753173828, 22.902841567993164, 26.064525604248047, 29.226207733154297, 32.38788986206055, 35.54957580566406, 38.71125793457031, 41.87294006347656, 45.03462219238281, 48.19630432128906, 51.35799026489258, 54.51967239379883, 57.68135452270508, 60.843040466308594, 64.00472259521484, 67.1664047241211, 70.32808685302734, 73.4897689819336, 76.65145111083984, 79.81314086914062, 82.97482299804688, 86.13650512695312, 89.29818725585938, 92.45986938476562]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 6.0, 7.0, 8.0, 11.0, 15.0, 29.0, 30.0, 33.0, 36.0, 66.0, 89.0, 129.0, 164.0, 277.0, 414.0, 918.0, 2077.0, 5122.0, 1014116.0, 15554.0, 5156.0, 2077.0, 900.0, 445.0, 253.0, 162.0, 137.0, 80.0, 72.0, 58.0, 27.0, 13.0, 22.0, 13.0, 9.0, 3.0, 7.0, 6.0, 10.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0], "bins": [-36.84689712524414, -35.7630729675293, -34.67924880981445, -33.59542465209961, -32.5115966796875, -31.42777442932129, -30.343948364257812, -29.26012420654297, -28.176300048828125, -27.09247589111328, -26.008651733398438, -24.92482566833496, -23.841001510620117, -22.757177352905273, -21.673351287841797, -20.589527130126953, -19.50570297241211, -18.421878814697266, -17.338054656982422, -16.254228591918945, -15.170404434204102, -14.086580276489258, -13.002755165100098, -11.918930053710938, -10.835105895996094, -9.75128173828125, -8.66745662689209, -7.583631992340088, -6.499807357788086, -5.415982723236084, -4.332158088684082, -3.24833345413208, -2.1645050048828125, -1.0806803703308105, 0.0031442642211914062, 1.0869688987731934, 2.1707935333251953, 3.2546181678771973, 4.338442802429199, 5.422267436981201, 6.506092071533203, 7.589916706085205, 8.673741340637207, 9.757566452026367, 10.841390609741211, 11.925214767456055, 13.009039878845215, 14.092864990234375, 15.176689147949219, 16.260513305664062, 17.344337463378906, 18.428163528442383, 19.511987686157227, 20.59581184387207, 21.679637908935547, 22.76346206665039, 23.847286224365234, 24.931110382080078, 26.014934539794922, 27.0987606048584, 28.182584762573242, 29.266408920288086, 30.350234985351562, 31.434059143066406, 32.51788330078125]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 5.0, 10.0, 12.0, 39.0, 56.0, 89.0, 365.0, 51462252.0, 187.0, 61.0, 30.0, 24.0, 13.0, 10.0, 6.0, 4.0, 1.0, 1.0, 3.0, 5.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2202.11865234375, -2067.9267578125, -1933.73486328125, -1799.54296875, -1665.35107421875, -1531.1591796875, -1396.96728515625, -1262.775390625, -1128.58349609375, -994.3916015625, -860.19970703125, -726.0078125, -591.81591796875, -457.6240234375, -323.43212890625, -189.240234375, -55.04833984375, 79.1435546875, 213.33544921875, 347.52734375, 481.71923828125, 615.9111328125, 750.10302734375, 884.294921875, 1018.48681640625, 1152.6787109375, 1286.87060546875, 1421.0625, 1555.25439453125, 1689.4462890625, 1823.63818359375, 1957.830078125, 2092.0224609375, 2226.21435546875, 2360.40625, 2494.59814453125, 2628.7900390625, 2762.98193359375, 2897.173828125, 3031.36572265625, 3165.5576171875, 3299.74951171875, 3433.94140625, 3568.13330078125, 3702.3251953125, 3836.51708984375, 3970.708984375, 4104.90087890625, 4239.0927734375, 4373.28466796875, 4507.4765625, 4641.66845703125, 4775.8603515625, 4910.05224609375, 5044.244140625, 5178.43603515625, 5312.6279296875, 5446.81982421875, 5581.01171875, 5715.20361328125, 5849.3955078125, 5983.58740234375, 6117.779296875, 6251.97119140625, 6386.1630859375]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 4.0, 8.0, 6.0, 13.0, 33.0, 31.0, 37.0, 50.0, 71.0, 109.0, 185.0, 285.0, 500.0, 664.0, 999.0, 1687.0, 2821.0, 4568.0, 7339.0, 12293.0, 20886.0, 35013.0, 59646.0, 104432.0, 180056.0, 309341.0, 550656.0, 3636125.0, 590052.0, 323447.0, 187490.0, 109174.0, 62406.0, 36462.0, 21509.0, 12580.0, 7832.0, 4763.0, 2906.0, 1832.0, 1134.0, 675.0, 478.0, 272.0, 173.0, 140.0, 79.0, 50.0, 50.0, 30.0, 12.0, 8.0, 14.0, 7.0, 4.0, 2.0, 2.0], "bins": [-1.6005859375, -1.5542449951171875, -1.507904052734375, -1.4615631103515625, -1.41522216796875, -1.3688812255859375, -1.322540283203125, -1.2761993408203125, -1.2298583984375, -1.1835174560546875, -1.137176513671875, -1.0908355712890625, -1.04449462890625, -0.9981536865234375, -0.951812744140625, -0.9054718017578125, -0.859130859375, -0.8127899169921875, -0.766448974609375, -0.7201080322265625, -0.67376708984375, -0.6274261474609375, -0.581085205078125, -0.5347442626953125, -0.4884033203125, -0.4420623779296875, -0.395721435546875, -0.3493804931640625, -0.30303955078125, -0.2566986083984375, -0.210357666015625, -0.1640167236328125, -0.11767578125, -0.0713348388671875, -0.024993896484375, 0.0213470458984375, 0.06768798828125, 0.1140289306640625, 0.160369873046875, 0.2067108154296875, 0.2530517578125, 0.2993927001953125, 0.345733642578125, 0.3920745849609375, 0.43841552734375, 0.4847564697265625, 0.531097412109375, 0.5774383544921875, 0.623779296875, 0.6701202392578125, 0.716461181640625, 0.7628021240234375, 0.80914306640625, 0.8554840087890625, 0.901824951171875, 0.9481658935546875, 0.9945068359375, 1.0408477783203125, 1.087188720703125, 1.1335296630859375, 1.17987060546875, 1.2262115478515625, 1.272552490234375, 1.3188934326171875, 1.365234375]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 4.0, 5.0, 10.0, 6.0, 10.0, 11.0, 16.0, 21.0, 21.0, 17.0, 24.0, 20.0, 22.0, 33.0, 26.0, 30.0, 42.0, 27.0, 53.0, 61.0, 392.0, 679.0, 65.0, 36.0, 37.0, 43.0, 33.0, 38.0, 32.0, 26.0, 30.0, 28.0, 11.0, 14.0, 17.0, 15.0, 13.0, 9.0, 9.0, 11.0, 10.0, 3.0, 2.0, 5.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-9.4296875, -9.0941162109375, -8.758544921875, -8.4229736328125, -8.08740234375, -7.7518310546875, -7.416259765625, -7.0806884765625, -6.7451171875, -6.4095458984375, -6.073974609375, -5.7384033203125, -5.40283203125, -5.0672607421875, -4.731689453125, -4.3961181640625, -4.060546875, -3.7249755859375, -3.389404296875, -3.0538330078125, -2.71826171875, -2.3826904296875, -2.047119140625, -1.7115478515625, -1.3759765625, -1.0404052734375, -0.704833984375, -0.3692626953125, -0.03369140625, 0.3018798828125, 0.637451171875, 0.9730224609375, 1.30859375, 1.6441650390625, 1.979736328125, 2.3153076171875, 2.65087890625, 2.9864501953125, 3.322021484375, 3.6575927734375, 3.9931640625, 4.3287353515625, 4.664306640625, 4.9998779296875, 5.33544921875, 5.6710205078125, 6.006591796875, 6.3421630859375, 6.677734375, 7.0133056640625, 7.348876953125, 7.6844482421875, 8.02001953125, 8.3555908203125, 8.691162109375, 9.0267333984375, 9.3623046875, 9.6978759765625, 10.033447265625, 10.3690185546875, 10.70458984375, 11.0401611328125, 11.375732421875, 11.7113037109375, 12.046875]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 7.0, 10.0, 18.0, 20.0, 36.0, 48.0, 88.0, 134.0, 198.0, 275.0, 390.0, 463.0, 762.0, 1192.0, 1933.0, 2998.0, 4356.0, 6547.0, 10674.0, 17729.0, 29457.0, 50312.0, 89577.0, 162407.0, 306129.0, 645190.0, 3731056.0, 583331.0, 288003.0, 152990.0, 83489.0, 47688.0, 27829.0, 16572.0, 10599.0, 6637.0, 4263.0, 2732.0, 1721.0, 1207.0, 789.0, 549.0, 327.0, 259.0, 140.0, 116.0, 68.0, 39.0, 32.0, 22.0, 17.0, 8.0, 3.0, 4.0, 0.0, 3.0, 2.0, 2.0], "bins": [-1.9345703125, -1.8749542236328125, -1.815338134765625, -1.7557220458984375, -1.69610595703125, -1.6364898681640625, -1.576873779296875, -1.5172576904296875, -1.4576416015625, -1.3980255126953125, -1.338409423828125, -1.2787933349609375, -1.21917724609375, -1.1595611572265625, -1.099945068359375, -1.0403289794921875, -0.980712890625, -0.9210968017578125, -0.861480712890625, -0.8018646240234375, -0.74224853515625, -0.6826324462890625, -0.623016357421875, -0.5634002685546875, -0.5037841796875, -0.4441680908203125, -0.384552001953125, -0.3249359130859375, -0.26531982421875, -0.2057037353515625, -0.146087646484375, -0.0864715576171875, -0.02685546875, 0.0327606201171875, 0.092376708984375, 0.1519927978515625, 0.21160888671875, 0.2712249755859375, 0.330841064453125, 0.3904571533203125, 0.4500732421875, 0.5096893310546875, 0.569305419921875, 0.6289215087890625, 0.68853759765625, 0.7481536865234375, 0.807769775390625, 0.8673858642578125, 0.927001953125, 0.9866180419921875, 1.046234130859375, 1.1058502197265625, 1.16546630859375, 1.2250823974609375, 1.284698486328125, 1.3443145751953125, 1.4039306640625, 1.4635467529296875, 1.523162841796875, 1.5827789306640625, 1.64239501953125, 1.7020111083984375, 1.761627197265625, 1.8212432861328125, 1.880859375]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 4.0, 1.0, 3.0, 6.0, 6.0, 11.0, 6.0, 8.0, 9.0, 14.0, 14.0, 23.0, 25.0, 18.0, 28.0, 32.0, 25.0, 36.0, 24.0, 24.0, 38.0, 34.0, 46.0, 54.0, 355.0, 707.0, 69.0, 36.0, 36.0, 34.0, 34.0, 42.0, 24.0, 27.0, 28.0, 20.0, 23.0, 15.0, 15.0, 15.0, 7.0, 8.0, 11.0, 3.0, 5.0, 5.0, 4.0, 3.0, 4.0, 6.0, 4.0, 2.0, 4.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.9453125, -6.70703125, -6.46875, -6.23046875, -5.9921875, -5.75390625, -5.515625, -5.27734375, -5.0390625, -4.80078125, -4.5625, -4.32421875, -4.0859375, -3.84765625, -3.609375, -3.37109375, -3.1328125, -2.89453125, -2.65625, -2.41796875, -2.1796875, -1.94140625, -1.703125, -1.46484375, -1.2265625, -0.98828125, -0.75, -0.51171875, -0.2734375, -0.03515625, 0.203125, 0.44140625, 0.6796875, 0.91796875, 1.15625, 1.39453125, 1.6328125, 1.87109375, 2.109375, 2.34765625, 2.5859375, 2.82421875, 3.0625, 3.30078125, 3.5390625, 3.77734375, 4.015625, 4.25390625, 4.4921875, 4.73046875, 4.96875, 5.20703125, 5.4453125, 5.68359375, 5.921875, 6.16015625, 6.3984375, 6.63671875, 6.875, 7.11328125, 7.3515625, 7.58984375, 7.828125, 8.06640625, 8.3046875]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [6.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 2.0, 3.0, 6.0, 6.0, 9.0, 13.0, 29.0, 24.0, 22.0, 51.0, 61.0, 127.0, 196.0, 236.0, 360.0, 601.0, 972.0, 1664.0, 2961.0, 5898.0, 14801.0, 57543.0, 5849419.0, 296487.0, 38176.0, 10705.0, 4674.0, 2475.0, 1355.0, 833.0, 551.0, 348.0, 264.0, 194.0, 126.0, 75.0, 43.0, 34.0, 21.0, 31.0, 20.0, 6.0, 7.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 3.0], "bins": [-12.1015625, -11.7218017578125, -11.342041015625, -10.9622802734375, -10.58251953125, -10.2027587890625, -9.822998046875, -9.4432373046875, -9.0634765625, -8.6837158203125, -8.303955078125, -7.9241943359375, -7.54443359375, -7.1646728515625, -6.784912109375, -6.4051513671875, -6.025390625, -5.6456298828125, -5.265869140625, -4.8861083984375, -4.50634765625, -4.1265869140625, -3.746826171875, -3.3670654296875, -2.9873046875, -2.6075439453125, -2.227783203125, -1.8480224609375, -1.46826171875, -1.0885009765625, -0.708740234375, -0.3289794921875, 0.05078125, 0.4305419921875, 0.810302734375, 1.1900634765625, 1.56982421875, 1.9495849609375, 2.329345703125, 2.7091064453125, 3.0888671875, 3.4686279296875, 3.848388671875, 4.2281494140625, 4.60791015625, 4.9876708984375, 5.367431640625, 5.7471923828125, 6.126953125, 6.5067138671875, 6.886474609375, 7.2662353515625, 7.64599609375, 8.0257568359375, 8.405517578125, 8.7852783203125, 9.1650390625, 9.5447998046875, 9.924560546875, 10.3043212890625, 10.68408203125, 11.0638427734375, 11.443603515625, 11.8233642578125, 12.203125]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 7.0, 8.0, 10.0, 8.0, 14.0, 19.0, 15.0, 19.0, 31.0, 24.0, 25.0, 43.0, 44.0, 43.0, 54.0, 43.0, 50.0, 157.0, 842.0, 161.0, 45.0, 46.0, 35.0, 51.0, 37.0, 30.0, 28.0, 27.0, 18.0, 28.0, 13.0, 9.0, 8.0, 11.0, 10.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.1953125, -6.95965576171875, -6.7239990234375, -6.48834228515625, -6.252685546875, -6.01702880859375, -5.7813720703125, -5.54571533203125, -5.31005859375, -5.07440185546875, -4.8387451171875, -4.60308837890625, -4.367431640625, -4.13177490234375, -3.8961181640625, -3.66046142578125, -3.4248046875, -3.18914794921875, -2.9534912109375, -2.71783447265625, -2.482177734375, -2.24652099609375, -2.0108642578125, -1.77520751953125, -1.53955078125, -1.30389404296875, -1.0682373046875, -0.83258056640625, -0.596923828125, -0.36126708984375, -0.1256103515625, 0.11004638671875, 0.345703125, 0.58135986328125, 0.8170166015625, 1.05267333984375, 1.288330078125, 1.52398681640625, 1.7596435546875, 1.99530029296875, 2.23095703125, 2.46661376953125, 2.7022705078125, 2.93792724609375, 3.173583984375, 3.40924072265625, 3.6448974609375, 3.88055419921875, 4.1162109375, 4.35186767578125, 4.5875244140625, 4.82318115234375, 5.058837890625, 5.29449462890625, 5.5301513671875, 5.76580810546875, 6.00146484375, 6.23712158203125, 6.4727783203125, 6.70843505859375, 6.944091796875, 7.17974853515625, 7.4154052734375, 7.65106201171875, 7.88671875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 9.0, 23.0, 56.0, 289.0, 484.0, 104.0, 31.0, 9.0, 4.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.24319839477539, -52.928714752197266, -51.614227294921875, -50.29974365234375, -48.98525619506836, -47.670772552490234, -46.356285095214844, -45.04180145263672, -43.72731399536133, -42.4128303527832, -41.09834289550781, -39.78385925292969, -38.4693717956543, -37.15488815307617, -35.84040069580078, -34.525917053222656, -33.21143341064453, -31.896947860717773, -30.582462310791016, -29.267976760864258, -27.9534912109375, -26.639005661010742, -25.324520111083984, -24.01003646850586, -22.69554901123047, -21.38106346130371, -20.066577911376953, -18.752092361450195, -17.437606811523438, -16.12312126159668, -14.808636665344238, -13.49415111541748, -12.179664611816406, -10.865179061889648, -9.55069351196289, -8.236207962036133, -6.921722888946533, -5.607237339019775, -4.292752265930176, -2.978266716003418, -1.6637811660766602, -0.3492957353591919, 0.9651896953582764, 2.279675006866455, 3.594160556793213, 4.908646106719971, 6.22313117980957, 7.537616729736328, 8.852102279663086, 10.166587829589844, 11.481073379516602, 12.79555892944336, 14.110044479370117, 15.424530029296875, 16.739013671875, 18.05350112915039, 19.367984771728516, 20.682470321655273, 21.99695587158203, 23.31144142150879, 24.625926971435547, 25.940412521362305, 27.254898071289062, 28.569381713867188, 29.883869171142578]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 8.0, 11.0, 13.0, 16.0, 26.0, 34.0, 52.0, 62.0, 67.0, 72.0, 68.0, 96.0, 79.0, 79.0, 63.0, 52.0, 62.0, 36.0, 31.0, 29.0, 24.0, 15.0, 5.0, 8.0, 4.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.061434745788574, -10.474538803100586, -9.887642860412598, -9.30074691772461, -8.713851928710938, -8.12695598602295, -7.540060043334961, -6.953164577484131, -6.366268634796143, -5.779372692108154, -5.192477226257324, -4.605581283569336, -4.018685340881348, -3.4317898750305176, -2.8448939323425293, -2.257998466491699, -1.671102523803711, -1.0842068195343018, -0.497310996055603, 0.0895848274230957, 0.6764805316925049, 1.263376235961914, 1.8502721786499023, 2.4371676445007324, 3.0240635871887207, 3.61095929145813, 4.197854995727539, 4.784750938415527, 5.371646881103516, 5.958542346954346, 6.545438289642334, 7.132333755493164, 7.719228744506836, 8.306124687194824, 8.893020629882812, 9.479915618896484, 10.066811561584473, 10.653707504272461, 11.24060344696045, 11.827499389648438, 12.41439437866211, 13.001290321350098, 13.588186264038086, 14.175081253051758, 14.761977195739746, 15.348873138427734, 15.935769081115723, 16.52266502380371, 17.109561920166016, 17.696456909179688, 18.283353805541992, 18.870248794555664, 19.45714569091797, 20.04404067993164, 20.630935668945312, 21.217832565307617, 21.80472755432129, 22.39162254333496, 22.978519439697266, 23.565414428710938, 24.152311325073242, 24.739206314086914, 25.32610321044922, 25.91299819946289, 26.499893188476562]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 3.0, 0.0, 5.0, 6.0, 5.0, 5.0, 13.0, 15.0, 27.0, 38.0, 53.0, 87.0, 111.0, 163.0, 233.0, 460.0, 654.0, 1253.0, 2413.0, 5648.0, 16118.0, 84933.0, 3987982.0, 61842.0, 16921.0, 7196.0, 3335.0, 1770.0, 987.0, 644.0, 413.0, 250.0, 167.0, 121.0, 80.0, 75.0, 53.0, 48.0, 38.0, 23.0, 14.0, 20.0, 20.0, 14.0, 12.0, 7.0, 5.0, 2.0, 3.0, 0.0, 1.0, 2.0, 3.0, 4.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.286376953125, -0.2746391296386719, -0.26290130615234375, -0.2511634826660156, -0.2394256591796875, -0.22768783569335938, -0.21595001220703125, -0.20421218872070312, -0.192474365234375, -0.18073654174804688, -0.16899871826171875, -0.15726089477539062, -0.1455230712890625, -0.13378524780273438, -0.12204742431640625, -0.11030960083007812, -0.09857177734375, -0.08683395385742188, -0.07509613037109375, -0.06335830688476562, -0.0516204833984375, -0.039882659912109375, -0.02814483642578125, -0.016407012939453125, -0.004669189453125, 0.007068634033203125, 0.01880645751953125, 0.030544281005859375, 0.0422821044921875, 0.054019927978515625, 0.06575775146484375, 0.07749557495117188, 0.0892333984375, 0.10097122192382812, 0.11270904541015625, 0.12444686889648438, 0.1361846923828125, 0.14792251586914062, 0.15966033935546875, 0.17139816284179688, 0.183135986328125, 0.19487380981445312, 0.20661163330078125, 0.21834945678710938, 0.2300872802734375, 0.24182510375976562, 0.25356292724609375, 0.2653007507324219, 0.27703857421875, 0.2887763977050781, 0.30051422119140625, 0.3122520446777344, 0.3239898681640625, 0.3357276916503906, 0.34746551513671875, 0.3592033386230469, 0.370941162109375, 0.3826789855957031, 0.39441680908203125, 0.4061546325683594, 0.4178924560546875, 0.4296302795410156, 0.44136810302734375, 0.4531059265136719, 0.46484375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 6.0, 9.0, 17.0, 20.0, 28.0, 602.0, 218.0, 23.0, 16.0, 17.0, 11.0, 9.0, 5.0, 7.0, 5.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06475830078125, -0.06217384338378906, -0.059589385986328125, -0.05700492858886719, -0.05442047119140625, -0.05183601379394531, -0.049251556396484375, -0.04666709899902344, -0.0440826416015625, -0.04149818420410156, -0.038913726806640625, -0.03632926940917969, -0.03374481201171875, -0.031160354614257812, -0.028575897216796875, -0.025991439819335938, -0.023406982421875, -0.020822525024414062, -0.018238067626953125, -0.015653610229492188, -0.01306915283203125, -0.010484695434570312, -0.007900238037109375, -0.0053157806396484375, -0.0027313232421875, -0.0001468658447265625, 0.002437591552734375, 0.0050220489501953125, 0.00760650634765625, 0.010190963745117188, 0.012775421142578125, 0.015359878540039062, 0.0179443359375, 0.020528793334960938, 0.023113250732421875, 0.025697708129882812, 0.02828216552734375, 0.030866622924804688, 0.033451080322265625, 0.03603553771972656, 0.0386199951171875, 0.04120445251464844, 0.043788909912109375, 0.04637336730957031, 0.04895782470703125, 0.05154228210449219, 0.054126739501953125, 0.05671119689941406, 0.059295654296875, 0.06188011169433594, 0.06446456909179688, 0.06704902648925781, 0.06963348388671875, 0.07221794128417969, 0.07480239868164062, 0.07738685607910156, 0.0799713134765625, 0.08255577087402344, 0.08514022827148438, 0.08772468566894531, 0.09030914306640625, 0.09289360046386719, 0.09547805786132812, 0.09806251525878906, 0.10064697265625]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 8.0, 5.0, 7.0, 13.0, 18.0, 35.0, 47.0, 63.0, 128.0, 209.0, 420.0, 727.0, 1576.0, 3320.0, 9076.0, 29877.0, 140144.0, 3086753.0, 816496.0, 77803.0, 17623.0, 5633.0, 2231.0, 965.0, 443.0, 253.0, 140.0, 90.0, 62.0, 42.0, 27.0, 19.0, 15.0, 10.0, 3.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.331787109375, -0.3216896057128906, -0.31159210205078125, -0.3014945983886719, -0.2913970947265625, -0.2812995910644531, -0.27120208740234375, -0.2611045837402344, -0.251007080078125, -0.24090957641601562, -0.23081207275390625, -0.22071456909179688, -0.2106170654296875, -0.20051956176757812, -0.19042205810546875, -0.18032455444335938, -0.17022705078125, -0.16012954711914062, -0.15003204345703125, -0.13993453979492188, -0.1298370361328125, -0.11973953247070312, -0.10964202880859375, -0.09954452514648438, -0.089447021484375, -0.07934951782226562, -0.06925201416015625, -0.059154510498046875, -0.0490570068359375, -0.038959503173828125, -0.02886199951171875, -0.018764495849609375, -0.0086669921875, 0.001430511474609375, 0.01152801513671875, 0.021625518798828125, 0.0317230224609375, 0.041820526123046875, 0.05191802978515625, 0.062015533447265625, 0.072113037109375, 0.08221054077148438, 0.09230804443359375, 0.10240554809570312, 0.1125030517578125, 0.12260055541992188, 0.13269805908203125, 0.14279556274414062, 0.15289306640625, 0.16299057006835938, 0.17308807373046875, 0.18318557739257812, 0.1932830810546875, 0.20338058471679688, 0.21347808837890625, 0.22357559204101562, 0.233673095703125, 0.24377059936523438, 0.25386810302734375, 0.2639656066894531, 0.2740631103515625, 0.2841606140136719, 0.29425811767578125, 0.3043556213378906, 0.314453125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 5.0, 5.0, 5.0, 5.0, 8.0, 6.0, 11.0, 9.0, 10.0, 14.0, 17.0, 44.0, 40.0, 60.0, 53.0, 92.0, 126.0, 151.0, 245.0, 407.0, 1343.0, 565.0, 295.0, 164.0, 120.0, 72.0, 51.0, 44.0, 30.0, 32.0, 16.0, 8.0, 13.0, 6.0, 6.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.1280517578125, -0.1251201629638672, -0.12218856811523438, -0.11925697326660156, -0.11632537841796875, -0.11339378356933594, -0.11046218872070312, -0.10753059387207031, -0.1045989990234375, -0.10166740417480469, -0.09873580932617188, -0.09580421447753906, -0.09287261962890625, -0.08994102478027344, -0.08700942993164062, -0.08407783508300781, -0.081146240234375, -0.07821464538574219, -0.07528305053710938, -0.07235145568847656, -0.06941986083984375, -0.06648826599121094, -0.06355667114257812, -0.06062507629394531, -0.0576934814453125, -0.05476188659667969, -0.051830291748046875, -0.04889869689941406, -0.04596710205078125, -0.04303550720214844, -0.040103912353515625, -0.03717231750488281, -0.03424072265625, -0.03130912780761719, -0.028377532958984375, -0.025445938110351562, -0.02251434326171875, -0.019582748413085938, -0.016651153564453125, -0.013719558715820312, -0.0107879638671875, -0.007856369018554688, -0.004924774169921875, -0.0019931793212890625, 0.00093841552734375, 0.0038700103759765625, 0.006801605224609375, 0.009733200073242188, 0.012664794921875, 0.015596389770507812, 0.018527984619140625, 0.021459579467773438, 0.02439117431640625, 0.027322769165039062, 0.030254364013671875, 0.03318595886230469, 0.0361175537109375, 0.03904914855957031, 0.041980743408203125, 0.04491233825683594, 0.04784393310546875, 0.05077552795410156, 0.053707122802734375, 0.05663871765136719, 0.0595703125]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 7.0, 6.0, 5.0, 12.0, 17.0, 38.0, 62.0, 122.0, 296.0, 283.0, 94.0, 31.0, 16.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 2.0], "bins": [-2.2280988693237305, -2.1861863136291504, -2.1442737579345703, -2.1023612022399902, -2.06044864654541, -2.01853609085083, -1.9766236543655396, -1.9347110986709595, -1.8927985429763794, -1.8508859872817993, -1.8089734315872192, -1.7670608758926392, -1.7251484394073486, -1.6832358837127686, -1.6413233280181885, -1.5994107723236084, -1.5574982166290283, -1.5155856609344482, -1.4736731052398682, -1.431760549545288, -1.389847993850708, -1.3479355573654175, -1.3060230016708374, -1.2641104459762573, -1.2221978902816772, -1.1802853345870972, -1.138372778892517, -1.096460223197937, -1.0545477867126465, -1.0126352310180664, -0.9707226753234863, -0.9288101196289062, -0.886897623538971, -0.8449850678443909, -0.8030725717544556, -0.7611600160598755, -0.7192474603652954, -0.6773349046707153, -0.6354223489761353, -0.5935098528862, -0.5515972971916199, -0.5096847414970398, -0.4677722156047821, -0.4258596897125244, -0.38394713401794434, -0.34203457832336426, -0.30012205243110657, -0.2582095265388489, -0.2162969708442688, -0.17438443005084991, -0.13247188925743103, -0.09055934846401215, -0.04864680767059326, -0.0067342668771743774, 0.03517827391624451, 0.0770907998085022, 0.11900335550308228, 0.16091589629650116, 0.20282843708992004, 0.24474097788333893, 0.2866535186767578, 0.3285660743713379, 0.3704786002635956, 0.41239112615585327, 0.45430368185043335]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 7.0, 3.0, 3.0, 6.0, 11.0, 23.0, 24.0, 31.0, 37.0, 44.0, 49.0, 61.0, 74.0, 66.0, 72.0, 84.0, 79.0, 50.0, 68.0, 52.0, 39.0, 30.0, 30.0, 22.0, 9.0, 12.0, 8.0, 6.0, 5.0, 4.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8968244791030884, -0.8714236617088318, -0.8460227847099304, -0.8206219673156738, -0.7952211499214172, -0.7698203325271606, -0.7444194555282593, -0.7190186381340027, -0.6936178207397461, -0.6682170033454895, -0.6428161263465881, -0.6174153089523315, -0.592014491558075, -0.5666136741638184, -0.541212797164917, -0.5158119797706604, -0.4904111325740814, -0.46501028537750244, -0.43960946798324585, -0.41420862078666687, -0.3888078033924103, -0.3634069561958313, -0.3380061388015747, -0.3126052916049957, -0.28720444440841675, -0.26180359721183777, -0.23640277981758118, -0.2110019326210022, -0.1856011152267456, -0.16020026803016663, -0.13479943573474884, -0.10939860343933105, -0.08399778604507446, -0.05859695374965668, -0.03319611772894859, -0.007795281708240509, 0.017605550587177277, 0.04300639033317566, 0.06840722262859344, 0.09380805492401123, 0.11920888721942902, 0.1446097195148468, 0.1700105518102646, 0.19541138410568237, 0.22081223130226135, 0.24621306359767914, 0.2716138958930969, 0.2970147132873535, 0.3224155604839325, 0.3478164076805115, 0.37321722507476807, 0.39861807227134705, 0.42401888966560364, 0.4494197368621826, 0.4748205542564392, 0.5002213716506958, 0.5256222486495972, 0.5510230660438538, 0.5764239430427551, 0.6018247604370117, 0.6272255778312683, 0.6526263952255249, 0.6780272722244263, 0.7034280896186829, 0.7288289070129395]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 2.0, 10.0, 11.0, 14.0, 7.0, 12.0, 28.0, 36.0, 47.0, 67.0, 86.0, 139.0, 180.0, 251.0, 336.0, 499.0, 796.0, 1303.0, 2620.0, 5433.0, 14475.0, 73301.0, 855618.0, 67476.0, 14005.0, 5377.0, 2526.0, 1389.0, 771.0, 556.0, 328.0, 242.0, 170.0, 122.0, 77.0, 62.0, 55.0, 49.0, 23.0, 22.0, 13.0, 6.0, 3.0, 2.0, 5.0, 6.0, 5.0, 0.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.335205078125, -0.3245582580566406, -0.31391143798828125, -0.3032646179199219, -0.2926177978515625, -0.2819709777832031, -0.27132415771484375, -0.2606773376464844, -0.250030517578125, -0.23938369750976562, -0.22873687744140625, -0.21809005737304688, -0.2074432373046875, -0.19679641723632812, -0.18614959716796875, -0.17550277709960938, -0.16485595703125, -0.15420913696289062, -0.14356231689453125, -0.13291549682617188, -0.1222686767578125, -0.11162185668945312, -0.10097503662109375, -0.09032821655273438, -0.079681396484375, -0.06903457641601562, -0.05838775634765625, -0.047740936279296875, -0.0370941162109375, -0.026447296142578125, -0.01580047607421875, -0.005153656005859375, 0.0054931640625, 0.016139984130859375, 0.02678680419921875, 0.037433624267578125, 0.0480804443359375, 0.058727264404296875, 0.06937408447265625, 0.08002090454101562, 0.090667724609375, 0.10131454467773438, 0.11196136474609375, 0.12260818481445312, 0.1332550048828125, 0.14390182495117188, 0.15454864501953125, 0.16519546508789062, 0.17584228515625, 0.18648910522460938, 0.19713592529296875, 0.20778274536132812, 0.2184295654296875, 0.22907638549804688, 0.23972320556640625, 0.2503700256347656, 0.261016845703125, 0.2716636657714844, 0.28231048583984375, 0.2929573059082031, 0.3036041259765625, 0.3142509460449219, 0.32489776611328125, 0.3355445861816406, 0.34619140625]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 5.0, 2.0, 9.0, 12.0, 26.0, 42.0, 157.0, 287.0, 255.0, 94.0, 49.0, 14.0, 12.0, 7.0, 7.0, 5.0, 6.0, 4.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.06573486328125, -0.06354236602783203, -0.06134986877441406, -0.059157371520996094, -0.056964874267578125, -0.054772377014160156, -0.05257987976074219, -0.05038738250732422, -0.04819488525390625, -0.04600238800048828, -0.04380989074707031, -0.041617393493652344, -0.039424896240234375, -0.037232398986816406, -0.03503990173339844, -0.03284740447998047, -0.0306549072265625, -0.02846240997314453, -0.026269912719726562, -0.024077415466308594, -0.021884918212890625, -0.019692420959472656, -0.017499923706054688, -0.015307426452636719, -0.01311492919921875, -0.010922431945800781, -0.008729934692382812, -0.006537437438964844, -0.004344940185546875, -0.0021524429321289062, 4.00543212890625e-05, 0.0022325515747070312, 0.004425048828125, 0.006617546081542969, 0.008810043334960938, 0.011002540588378906, 0.013195037841796875, 0.015387535095214844, 0.017580032348632812, 0.01977252960205078, 0.02196502685546875, 0.02415752410888672, 0.026350021362304688, 0.028542518615722656, 0.030735015869140625, 0.032927513122558594, 0.03512001037597656, 0.03731250762939453, 0.0395050048828125, 0.04169750213623047, 0.04388999938964844, 0.046082496643066406, 0.048274993896484375, 0.050467491149902344, 0.05265998840332031, 0.05485248565673828, 0.05704498291015625, 0.05923748016357422, 0.06142997741699219, 0.06362247467041016, 0.06581497192382812, 0.0680074691772461, 0.07019996643066406, 0.07239246368408203, 0.0745849609375]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 10.0, 11.0, 6.0, 11.0, 13.0, 14.0, 28.0, 27.0, 55.0, 86.0, 136.0, 164.0, 341.0, 772.0, 1684.0, 5259.0, 28054.0, 340530.0, 616347.0, 43918.0, 7218.0, 2031.0, 847.0, 370.0, 177.0, 121.0, 85.0, 70.0, 43.0, 32.0, 21.0, 13.0, 12.0, 14.0, 8.0, 6.0, 5.0, 2.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5849609375, -0.56781005859375, -0.5506591796875, -0.53350830078125, -0.516357421875, -0.49920654296875, -0.4820556640625, -0.46490478515625, -0.44775390625, -0.43060302734375, -0.4134521484375, -0.39630126953125, -0.379150390625, -0.36199951171875, -0.3448486328125, -0.32769775390625, -0.310546875, -0.29339599609375, -0.2762451171875, -0.25909423828125, -0.241943359375, -0.22479248046875, -0.2076416015625, -0.19049072265625, -0.17333984375, -0.15618896484375, -0.1390380859375, -0.12188720703125, -0.104736328125, -0.08758544921875, -0.0704345703125, -0.05328369140625, -0.0361328125, -0.01898193359375, -0.0018310546875, 0.01531982421875, 0.032470703125, 0.04962158203125, 0.0667724609375, 0.08392333984375, 0.10107421875, 0.11822509765625, 0.1353759765625, 0.15252685546875, 0.169677734375, 0.18682861328125, 0.2039794921875, 0.22113037109375, 0.23828125, 0.25543212890625, 0.2725830078125, 0.28973388671875, 0.306884765625, 0.32403564453125, 0.3411865234375, 0.35833740234375, 0.37548828125, 0.39263916015625, 0.4097900390625, 0.42694091796875, 0.444091796875, 0.46124267578125, 0.4783935546875, 0.49554443359375, 0.5126953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 7.0, 5.0, 7.0, 15.0, 17.0, 14.0, 17.0, 13.0, 22.0, 26.0, 24.0, 31.0, 25.0, 31.0, 32.0, 37.0, 27.0, 31.0, 42.0, 41.0, 30.0, 35.0, 44.0, 31.0, 35.0, 38.0, 43.0, 40.0, 22.0, 28.0, 18.0, 24.0, 21.0, 16.0, 17.0, 17.0, 8.0, 8.0, 7.0, 13.0, 14.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 3.0, 1.0, 1.0], "bins": [-0.20458984375, -0.19791793823242188, -0.19124603271484375, -0.18457412719726562, -0.1779022216796875, -0.17123031616210938, -0.16455841064453125, -0.15788650512695312, -0.151214599609375, -0.14454269409179688, -0.13787078857421875, -0.13119888305664062, -0.1245269775390625, -0.11785507202148438, -0.11118316650390625, -0.10451126098632812, -0.09783935546875, -0.09116744995117188, -0.08449554443359375, -0.07782363891601562, -0.0711517333984375, -0.06447982788085938, -0.05780792236328125, -0.051136016845703125, -0.044464111328125, -0.037792205810546875, -0.03112030029296875, -0.024448394775390625, -0.0177764892578125, -0.011104583740234375, -0.00443267822265625, 0.002239227294921875, 0.0089111328125, 0.015583038330078125, 0.02225494384765625, 0.028926849365234375, 0.0355987548828125, 0.042270660400390625, 0.04894256591796875, 0.055614471435546875, 0.062286376953125, 0.06895828247070312, 0.07563018798828125, 0.08230209350585938, 0.0889739990234375, 0.09564590454101562, 0.10231781005859375, 0.10898971557617188, 0.11566162109375, 0.12233352661132812, 0.12900543212890625, 0.13567733764648438, 0.1423492431640625, 0.14902114868164062, 0.15569305419921875, 0.16236495971679688, 0.169036865234375, 0.17570877075195312, 0.18238067626953125, 0.18905258178710938, 0.1957244873046875, 0.20239639282226562, 0.20906829833984375, 0.21574020385742188, 0.222412109375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 6.0, 7.0, 6.0, 10.0, 7.0, 15.0, 34.0, 41.0, 56.0, 112.0, 206.0, 443.0, 1124.0, 3945.0, 42681.0, 979302.0, 16453.0, 2455.0, 853.0, 339.0, 176.0, 91.0, 57.0, 55.0, 23.0, 19.0, 11.0, 12.0, 10.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.84326171875, -0.8206863403320312, -0.7981109619140625, -0.7755355834960938, -0.752960205078125, -0.7303848266601562, -0.7078094482421875, -0.6852340698242188, -0.66265869140625, -0.6400833129882812, -0.6175079345703125, -0.5949325561523438, -0.572357177734375, -0.5497817993164062, -0.5272064208984375, -0.5046310424804688, -0.4820556640625, -0.45948028564453125, -0.4369049072265625, -0.41432952880859375, -0.391754150390625, -0.36917877197265625, -0.3466033935546875, -0.32402801513671875, -0.30145263671875, -0.27887725830078125, -0.2563018798828125, -0.23372650146484375, -0.211151123046875, -0.18857574462890625, -0.1660003662109375, -0.14342498779296875, -0.120849609375, -0.09827423095703125, -0.0756988525390625, -0.05312347412109375, -0.030548095703125, -0.00797271728515625, 0.0146026611328125, 0.03717803955078125, 0.05975341796875, 0.08232879638671875, 0.1049041748046875, 0.12747955322265625, 0.150054931640625, 0.17263031005859375, 0.1952056884765625, 0.21778106689453125, 0.2403564453125, 0.26293182373046875, 0.2855072021484375, 0.30808258056640625, 0.330657958984375, 0.35323333740234375, 0.3758087158203125, 0.39838409423828125, 0.42095947265625, 0.44353485107421875, 0.4661102294921875, 0.48868560791015625, 0.511260986328125, 0.5338363647460938, 0.5564117431640625, 0.5789871215820312, 0.6015625]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 4.0, 4.0, 10.0, 9.0, 9.0, 8.0, 14.0, 16.0, 17.0, 24.0, 22.0, 36.0, 74.0, 129.0, 296.0, 125.0, 57.0, 24.0, 25.0, 13.0, 20.0, 13.0, 9.0, 8.0, 6.0, 6.0, 7.0, 8.0, 3.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0013647079467773438, -0.001318320631980896, -0.0012719333171844482, -0.0012255460023880005, -0.0011791586875915527, -0.001132771372795105, -0.0010863840579986572, -0.0010399967432022095, -0.0009936094284057617, -0.000947222113609314, -0.0009008347988128662, -0.0008544474840164185, -0.0008080601692199707, -0.000761672854423523, -0.0007152855396270752, -0.0006688982248306274, -0.0006225109100341797, -0.0005761235952377319, -0.0005297362804412842, -0.0004833489656448364, -0.00043696165084838867, -0.0003905743360519409, -0.00034418702125549316, -0.0002977997064590454, -0.00025141239166259766, -0.0002050250768661499, -0.00015863776206970215, -0.0001122504472732544, -6.586313247680664e-05, -1.9475817680358887e-05, 2.6911497116088867e-05, 7.329881191253662e-05, 0.00011968612670898438, 0.00016607344150543213, 0.00021246075630187988, 0.00025884807109832764, 0.0003052353858947754, 0.00035162270069122314, 0.0003980100154876709, 0.00044439733028411865, 0.0004907846450805664, 0.0005371719598770142, 0.0005835592746734619, 0.0006299465894699097, 0.0006763339042663574, 0.0007227212190628052, 0.0007691085338592529, 0.0008154958486557007, 0.0008618831634521484, 0.0009082704782485962, 0.0009546577930450439, 0.0010010451078414917, 0.0010474324226379395, 0.0010938197374343872, 0.001140207052230835, 0.0011865943670272827, 0.0012329816818237305, 0.0012793689966201782, 0.001325756311416626, 0.0013721436262130737, 0.0014185309410095215, 0.0014649182558059692, 0.001511305570602417, 0.0015576928853988647, 0.0016040802001953125]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 5.0, 5.0, 8.0, 12.0, 17.0, 28.0, 37.0, 50.0, 71.0, 129.0, 195.0, 288.0, 558.0, 932.0, 1826.0, 4283.0, 12438.0, 61135.0, 812972.0, 124779.0, 18164.0, 5535.0, 2323.0, 1167.0, 603.0, 362.0, 231.0, 112.0, 94.0, 56.0, 34.0, 32.0, 18.0, 19.0, 7.0, 7.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.379150390625, -0.3682060241699219, -0.35726165771484375, -0.3463172912597656, -0.3353729248046875, -0.3244285583496094, -0.31348419189453125, -0.3025398254394531, -0.291595458984375, -0.2806510925292969, -0.26970672607421875, -0.2587623596191406, -0.2478179931640625, -0.23687362670898438, -0.22592926025390625, -0.21498489379882812, -0.20404052734375, -0.19309616088867188, -0.18215179443359375, -0.17120742797851562, -0.1602630615234375, -0.14931869506835938, -0.13837432861328125, -0.12742996215820312, -0.116485595703125, -0.10554122924804688, -0.09459686279296875, -0.08365249633789062, -0.0727081298828125, -0.061763763427734375, -0.05081939697265625, -0.039875030517578125, -0.0289306640625, -0.017986297607421875, -0.00704193115234375, 0.003902435302734375, 0.0148468017578125, 0.025791168212890625, 0.03673553466796875, 0.047679901123046875, 0.058624267578125, 0.06956863403320312, 0.08051300048828125, 0.09145736694335938, 0.1024017333984375, 0.11334609985351562, 0.12429046630859375, 0.13523483276367188, 0.14617919921875, 0.15712356567382812, 0.16806793212890625, 0.17901229858398438, 0.1899566650390625, 0.20090103149414062, 0.21184539794921875, 0.22278976440429688, 0.233734130859375, 0.24467849731445312, 0.25562286376953125, 0.2665672302246094, 0.2775115966796875, 0.2884559631347656, 0.29940032958984375, 0.3103446960449219, 0.3212890625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 0.0, 2.0, 5.0, 5.0, 8.0, 8.0, 13.0, 16.0, 24.0, 38.0, 51.0, 83.0, 117.0, 176.0, 163.0, 113.0, 61.0, 47.0, 21.0, 11.0, 14.0, 1.0, 7.0, 4.0, 3.0, 7.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.304443359375, -0.2938995361328125, -0.283355712890625, -0.2728118896484375, -0.26226806640625, -0.2517242431640625, -0.241180419921875, -0.2306365966796875, -0.2200927734375, -0.2095489501953125, -0.199005126953125, -0.1884613037109375, -0.17791748046875, -0.1673736572265625, -0.156829833984375, -0.1462860107421875, -0.1357421875, -0.1251983642578125, -0.114654541015625, -0.1041107177734375, -0.09356689453125, -0.0830230712890625, -0.072479248046875, -0.0619354248046875, -0.0513916015625, -0.0408477783203125, -0.030303955078125, -0.0197601318359375, -0.00921630859375, 0.0013275146484375, 0.011871337890625, 0.0224151611328125, 0.032958984375, 0.0435028076171875, 0.054046630859375, 0.0645904541015625, 0.07513427734375, 0.0856781005859375, 0.096221923828125, 0.1067657470703125, 0.1173095703125, 0.1278533935546875, 0.138397216796875, 0.1489410400390625, 0.15948486328125, 0.1700286865234375, 0.180572509765625, 0.1911163330078125, 0.20166015625, 0.2122039794921875, 0.222747802734375, 0.2332916259765625, 0.24383544921875, 0.2543792724609375, 0.264923095703125, 0.2754669189453125, 0.2860107421875, 0.2965545654296875, 0.307098388671875, 0.3176422119140625, 0.32818603515625, 0.3387298583984375, 0.349273681640625, 0.3598175048828125, 0.370361328125]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 4.0, 2.0, 2.0, 4.0, 3.0, 8.0, 17.0, 34.0, 66.0, 148.0, 362.0, 239.0, 62.0, 30.0, 13.0, 4.0, 3.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.241870880126953, -5.09929084777832, -4.9567108154296875, -4.814130783081055, -4.671550750732422, -4.528970718383789, -4.386390686035156, -4.243810653686523, -4.101230621337891, -3.958650588989258, -3.816070556640625, -3.673490524291992, -3.5309104919433594, -3.3883304595947266, -3.2457501888275146, -3.103170156478882, -2.96058988571167, -2.818009853363037, -2.6754298210144043, -2.5328497886657715, -2.3902697563171387, -2.247689723968506, -2.105109453201294, -1.9625294208526611, -1.8199493885040283, -1.6773693561553955, -1.5347893238067627, -1.3922091722488403, -1.2496291399002075, -1.1070491075515747, -0.9644690155982971, -0.8218889236450195, -0.6793093681335449, -0.5367293357849121, -0.3941492438316345, -0.2515691816806793, -0.10898911952972412, 0.03359091281890869, 0.17617100477218628, 0.31875109672546387, 0.4613311290740967, 0.6039111614227295, 0.7464912533760071, 0.8890713453292847, 1.0316513776779175, 1.1742314100265503, 1.3168115615844727, 1.4593915939331055, 1.6019716262817383, 1.744551658630371, 1.887131690979004, 2.0297117233276367, 2.1722917556762695, 2.3148717880249023, 2.4574520587921143, 2.600032091140747, 2.74261212348938, 2.8851921558380127, 3.0277721881866455, 3.1703522205352783, 3.3129324913024902, 3.455512523651123, 3.598092555999756, 3.7406725883483887, 3.8832526206970215]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 3.0, 1.0, 3.0, 1.0, 3.0, 1.0, 9.0, 8.0, 8.0, 13.0, 32.0, 41.0, 60.0, 94.0, 123.0, 126.0, 114.0, 109.0, 69.0, 61.0, 33.0, 24.0, 17.0, 8.0, 15.0, 2.0, 4.0, 2.0, 3.0, 3.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.390454292297363, -4.252532482147217, -4.11461067199707, -3.976688861846924, -3.8387670516967773, -3.700845241546631, -3.5629234313964844, -3.425001621246338, -3.2870798110961914, -3.149158000946045, -3.0112361907958984, -2.873314380645752, -2.7353925704956055, -2.597470760345459, -2.4595489501953125, -2.321627140045166, -2.1837055683135986, -2.045783758163452, -1.9078619480133057, -1.7699401378631592, -1.6320183277130127, -1.4940965175628662, -1.3561748266220093, -1.2182530164718628, -1.0803312063217163, -0.9424093961715698, -0.8044875860214233, -0.6665658354759216, -0.5286440253257751, -0.39072221517562866, -0.25280046463012695, -0.11487865447998047, 0.023043155670166016, 0.1609649509191513, 0.2988867461681366, 0.4368085265159607, 0.5747303366661072, 0.7126521468162537, 0.8505738973617554, 0.9884957075119019, 1.1264175176620483, 1.2643393278121948, 1.4022611379623413, 1.5401828289031982, 1.6781046390533447, 1.8160264492034912, 1.9539482593536377, 2.091870069503784, 2.2297918796539307, 2.367713689804077, 2.5056354999542236, 2.64355731010437, 2.7814791202545166, 2.919400930404663, 3.0573225021362305, 3.195244312286377, 3.3331661224365234, 3.47108793258667, 3.6090097427368164, 3.746931552886963, 3.8848533630371094, 4.022775173187256, 4.160696983337402, 4.298618793487549, 4.436540603637695]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 10.0, 12.0, 15.0, 60.0, 295.0, 5501.0, 4177379.0, 10247.0, 598.0, 94.0, 30.0, 18.0, 17.0, 6.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.021484375, -1.899261474609375, -1.77703857421875, -1.654815673828125, -1.5325927734375, -1.410369873046875, -1.28814697265625, -1.165924072265625, -1.043701171875, -0.921478271484375, -0.79925537109375, -0.677032470703125, -0.5548095703125, -0.432586669921875, -0.31036376953125, -0.188140869140625, -0.06591796875, 0.056304931640625, 0.17852783203125, 0.300750732421875, 0.4229736328125, 0.545196533203125, 0.66741943359375, 0.789642333984375, 0.911865234375, 1.034088134765625, 1.15631103515625, 1.278533935546875, 1.4007568359375, 1.522979736328125, 1.64520263671875, 1.767425537109375, 1.8896484375, 2.011871337890625, 2.13409423828125, 2.256317138671875, 2.3785400390625, 2.500762939453125, 2.62298583984375, 2.745208740234375, 2.867431640625, 2.989654541015625, 3.11187744140625, 3.234100341796875, 3.3563232421875, 3.478546142578125, 3.60076904296875, 3.722991943359375, 3.84521484375, 3.967437744140625, 4.08966064453125, 4.211883544921875, 4.3341064453125, 4.456329345703125, 4.57855224609375, 4.700775146484375, 4.822998046875, 4.945220947265625, 5.06744384765625, 5.189666748046875, 5.3118896484375, 5.434112548828125, 5.55633544921875, 5.678558349609375, 5.80078125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 3.0, 1.0, 7.0, 2.0, 6.0, 8.0, 5.0, 14.0, 10.0, 12.0, 30.0, 33.0, 55.0, 60.0, 101.0, 95.0, 111.0, 100.0, 92.0, 75.0, 46.0, 38.0, 17.0, 22.0, 7.0, 6.0, 8.0, 2.0, 6.0, 4.0, 7.0, 3.0, 1.0, 4.0, 2.0, 1.0, 6.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.035797119140625, -0.034763336181640625, -0.03372955322265625, -0.032695770263671875, -0.0316619873046875, -0.030628204345703125, -0.02959442138671875, -0.028560638427734375, -0.02752685546875, -0.026493072509765625, -0.02545928955078125, -0.024425506591796875, -0.0233917236328125, -0.022357940673828125, -0.02132415771484375, -0.020290374755859375, -0.019256591796875, -0.018222808837890625, -0.01718902587890625, -0.016155242919921875, -0.0151214599609375, -0.014087677001953125, -0.01305389404296875, -0.012020111083984375, -0.010986328125, -0.009952545166015625, -0.00891876220703125, -0.007884979248046875, -0.0068511962890625, -0.005817413330078125, -0.00478363037109375, -0.003749847412109375, -0.002716064453125, -0.001682281494140625, -0.00064849853515625, 0.000385284423828125, 0.0014190673828125, 0.002452850341796875, 0.00348663330078125, 0.004520416259765625, 0.00555419921875, 0.006587982177734375, 0.00762176513671875, 0.008655548095703125, 0.0096893310546875, 0.010723114013671875, 0.01175689697265625, 0.012790679931640625, 0.013824462890625, 0.014858245849609375, 0.01589202880859375, 0.016925811767578125, 0.0179595947265625, 0.018993377685546875, 0.02002716064453125, 0.021060943603515625, 0.0220947265625, 0.023128509521484375, 0.02416229248046875, 0.025196075439453125, 0.0262298583984375, 0.027263641357421875, 0.02829742431640625, 0.029331207275390625, 0.030364990234375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 3.0, 1.0, 3.0, 6.0, 4.0, 13.0, 18.0, 33.0, 51.0, 72.0, 108.0, 186.0, 315.0, 519.0, 1061.0, 2245.0, 5093.0, 14109.0, 53297.0, 1413115.0, 2619738.0, 59335.0, 15119.0, 5399.0, 2226.0, 1080.0, 520.0, 276.0, 147.0, 71.0, 55.0, 17.0, 20.0, 18.0, 3.0, 6.0, 1.0, 4.0, 0.0, 2.0, 2.0], "bins": [-0.70703125, -0.6905975341796875, -0.674163818359375, -0.6577301025390625, -0.64129638671875, -0.6248626708984375, -0.608428955078125, -0.5919952392578125, -0.5755615234375, -0.5591278076171875, -0.542694091796875, -0.5262603759765625, -0.50982666015625, -0.4933929443359375, -0.476959228515625, -0.4605255126953125, -0.444091796875, -0.4276580810546875, -0.411224365234375, -0.3947906494140625, -0.37835693359375, -0.3619232177734375, -0.345489501953125, -0.3290557861328125, -0.3126220703125, -0.2961883544921875, -0.279754638671875, -0.2633209228515625, -0.24688720703125, -0.2304534912109375, -0.214019775390625, -0.1975860595703125, -0.18115234375, -0.1647186279296875, -0.148284912109375, -0.1318511962890625, -0.11541748046875, -0.0989837646484375, -0.082550048828125, -0.0661163330078125, -0.0496826171875, -0.0332489013671875, -0.016815185546875, -0.0003814697265625, 0.01605224609375, 0.0324859619140625, 0.048919677734375, 0.0653533935546875, 0.081787109375, 0.0982208251953125, 0.114654541015625, 0.1310882568359375, 0.14752197265625, 0.1639556884765625, 0.180389404296875, 0.1968231201171875, 0.2132568359375, 0.2296905517578125, 0.246124267578125, 0.2625579833984375, 0.27899169921875, 0.2954254150390625, 0.311859130859375, 0.3282928466796875, 0.3447265625]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 9.0, 5.0, 7.0, 8.0, 11.0, 5.0, 19.0, 27.0, 23.0, 36.0, 50.0, 91.0, 263.0, 1589.0, 1182.0, 293.0, 149.0, 71.0, 63.0, 33.0, 34.0, 19.0, 10.0, 10.0, 16.0, 8.0, 9.0, 6.0, 3.0, 3.0, 0.0, 5.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.0791015625, -0.07683849334716797, -0.07457542419433594, -0.0723123550415039, -0.07004928588867188, -0.06778621673583984, -0.06552314758300781, -0.06326007843017578, -0.06099700927734375, -0.05873394012451172, -0.05647087097167969, -0.054207801818847656, -0.051944732666015625, -0.049681663513183594, -0.04741859436035156, -0.04515552520751953, -0.0428924560546875, -0.04062938690185547, -0.03836631774902344, -0.036103248596191406, -0.033840179443359375, -0.031577110290527344, -0.029314041137695312, -0.02705097198486328, -0.02478790283203125, -0.02252483367919922, -0.020261764526367188, -0.017998695373535156, -0.015735626220703125, -0.013472557067871094, -0.011209487915039062, -0.008946418762207031, -0.006683349609375, -0.004420280456542969, -0.0021572113037109375, 0.00010585784912109375, 0.002368927001953125, 0.004631996154785156, 0.0068950653076171875, 0.009158134460449219, 0.01142120361328125, 0.013684272766113281, 0.015947341918945312, 0.018210411071777344, 0.020473480224609375, 0.022736549377441406, 0.024999618530273438, 0.02726268768310547, 0.0295257568359375, 0.03178882598876953, 0.03405189514160156, 0.036314964294433594, 0.038578033447265625, 0.040841102600097656, 0.04310417175292969, 0.04536724090576172, 0.04763031005859375, 0.04989337921142578, 0.05215644836425781, 0.054419517517089844, 0.056682586669921875, 0.058945655822753906, 0.06120872497558594, 0.06347179412841797, 0.06573486328125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 48.0, 501.0, 343.0, 69.0, 22.0, 7.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5254411697387695, -4.411787509918213, -4.298133850097656, -4.1844801902771, -4.070826530456543, -3.9571726322174072, -3.8435187339782715, -3.729865074157715, -3.616211414337158, -3.5025577545166016, -3.388904094696045, -3.275250196456909, -3.1615965366363525, -3.047942876815796, -2.93428897857666, -2.8206353187561035, -2.706981658935547, -2.5933279991149902, -2.4796743392944336, -2.366020441055298, -2.252366781234741, -2.1387131214141846, -2.025059223175049, -1.9114055633544922, -1.7977519035339355, -1.684098243713379, -1.5704444646835327, -1.4567906856536865, -1.3431370258331299, -1.2294833660125732, -1.115829586982727, -1.0021758079528809, -0.8885223865509033, -0.7748686671257019, -0.6612149477005005, -0.5475612282752991, -0.43390750885009766, -0.32025378942489624, -0.20660006999969482, -0.09294635057449341, 0.020707368850708008, 0.13436108827590942, 0.24801480770111084, 0.36166852712631226, 0.47532224655151367, 0.5889759659767151, 0.7026296854019165, 0.8162834048271179, 0.9299371242523193, 1.043590784072876, 1.1572445631027222, 1.2708983421325684, 1.384552001953125, 1.4982056617736816, 1.6118594408035278, 1.725513219833374, 1.8391668796539307, 1.9528205394744873, 2.066474437713623, 2.1801280975341797, 2.2937817573547363, 2.407435417175293, 2.5210890769958496, 2.6347429752349854, 2.748396635055542]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 7.0, 1.0, 6.0, 10.0, 12.0, 12.0, 19.0, 36.0, 38.0, 41.0, 39.0, 45.0, 71.0, 70.0, 69.0, 79.0, 77.0, 67.0, 62.0, 46.0, 45.0, 27.0, 37.0, 18.0, 27.0, 12.0, 6.0, 6.0, 12.0, 1.0, 3.0, 5.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8437067270278931, -0.8190926313400269, -0.7944785356521606, -0.7698644399642944, -0.745250403881073, -0.7206363081932068, -0.6960222125053406, -0.6714081168174744, -0.6467940211296082, -0.6221799254417419, -0.5975658297538757, -0.5729517936706543, -0.5483376979827881, -0.5237236022949219, -0.49910950660705566, -0.47449541091918945, -0.44988134503364563, -0.4252672493457794, -0.4006531834602356, -0.3760390877723694, -0.3514249920845032, -0.32681089639663696, -0.30219683051109314, -0.27758273482322693, -0.2529686689376831, -0.2283545881509781, -0.20374049246311188, -0.17912641167640686, -0.15451231598854065, -0.12989823520183563, -0.10528415441513062, -0.0806700587272644, -0.05605596303939819, -0.03144187480211258, -0.006827790290117264, 0.017786294221878052, 0.042400382459163666, 0.06701447069644928, 0.0916285514831543, 0.11624264717102051, 0.14085672795772552, 0.16547080874443054, 0.19008490443229675, 0.21469898521900177, 0.2393130660057068, 0.263927161693573, 0.2885412573814392, 0.3131553530693054, 0.33776941895484924, 0.36238351464271545, 0.3869975805282593, 0.4116116762161255, 0.4362257719039917, 0.4608398675918579, 0.48545393347740173, 0.5100680589675903, 0.5346820950508118, 0.559296190738678, 0.5839102864265442, 0.6085243225097656, 0.6331384181976318, 0.657752513885498, 0.6823666095733643, 0.7069807052612305, 0.7315948009490967]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 3.0, 8.0, 4.0, 8.0, 13.0, 17.0, 16.0, 44.0, 50.0, 62.0, 120.0, 181.0, 326.0, 567.0, 996.0, 1882.0, 4059.0, 9436.0, 27008.0, 113029.0, 658325.0, 174193.0, 36814.0, 11792.0, 4759.0, 2156.0, 1102.0, 596.0, 370.0, 193.0, 138.0, 104.0, 59.0, 39.0, 24.0, 24.0, 10.0, 9.0, 9.0, 10.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46435546875, -0.4501190185546875, -0.435882568359375, -0.4216461181640625, -0.40740966796875, -0.3931732177734375, -0.378936767578125, -0.3647003173828125, -0.3504638671875, -0.3362274169921875, -0.321990966796875, -0.3077545166015625, -0.29351806640625, -0.2792816162109375, -0.265045166015625, -0.2508087158203125, -0.236572265625, -0.2223358154296875, -0.208099365234375, -0.1938629150390625, -0.17962646484375, -0.1653900146484375, -0.151153564453125, -0.1369171142578125, -0.1226806640625, -0.1084442138671875, -0.094207763671875, -0.0799713134765625, -0.06573486328125, -0.0514984130859375, -0.037261962890625, -0.0230255126953125, -0.0087890625, 0.0054473876953125, 0.019683837890625, 0.0339202880859375, 0.04815673828125, 0.0623931884765625, 0.076629638671875, 0.0908660888671875, 0.1051025390625, 0.1193389892578125, 0.133575439453125, 0.1478118896484375, 0.16204833984375, 0.1762847900390625, 0.190521240234375, 0.2047576904296875, 0.218994140625, 0.2332305908203125, 0.247467041015625, 0.2617034912109375, 0.27593994140625, 0.2901763916015625, 0.304412841796875, 0.3186492919921875, 0.3328857421875, 0.3471221923828125, 0.361358642578125, 0.3755950927734375, 0.38983154296875, 0.4040679931640625, 0.418304443359375, 0.4325408935546875, 0.44677734375]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 3.0, 3.0, 4.0, 4.0, 4.0, 11.0, 26.0, 29.0, 41.0, 60.0, 53.0, 85.0, 84.0, 102.0, 100.0, 88.0, 91.0, 62.0, 32.0, 38.0, 19.0, 18.0, 15.0, 12.0, 8.0, 7.0, 4.0, 6.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04095458984375, -0.03944110870361328, -0.03792762756347656, -0.036414146423339844, -0.034900665283203125, -0.033387184143066406, -0.03187370300292969, -0.03036022186279297, -0.02884674072265625, -0.02733325958251953, -0.025819778442382812, -0.024306297302246094, -0.022792816162109375, -0.021279335021972656, -0.019765853881835938, -0.01825237274169922, -0.0167388916015625, -0.015225410461425781, -0.013711929321289062, -0.012198448181152344, -0.010684967041015625, -0.009171485900878906, -0.0076580047607421875, -0.006144523620605469, -0.00463104248046875, -0.0031175613403320312, -0.0016040802001953125, -9.059906005859375e-05, 0.001422882080078125, 0.0029363632202148438, 0.0044498443603515625, 0.005963325500488281, 0.007476806640625, 0.008990287780761719, 0.010503768920898438, 0.012017250061035156, 0.013530731201171875, 0.015044212341308594, 0.016557693481445312, 0.01807117462158203, 0.01958465576171875, 0.02109813690185547, 0.022611618041992188, 0.024125099182128906, 0.025638580322265625, 0.027152061462402344, 0.028665542602539062, 0.03017902374267578, 0.0316925048828125, 0.03320598602294922, 0.03471946716308594, 0.036232948303222656, 0.037746429443359375, 0.039259910583496094, 0.04077339172363281, 0.04228687286376953, 0.04380035400390625, 0.04531383514404297, 0.04682731628417969, 0.048340797424316406, 0.049854278564453125, 0.051367759704589844, 0.05288124084472656, 0.05439472198486328, 0.055908203125]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 3.0, 3.0, 6.0, 2.0, 7.0, 8.0, 13.0, 13.0, 12.0, 39.0, 161.0, 1940.0, 862655.0, 182347.0, 1098.0, 132.0, 31.0, 15.0, 17.0, 8.0, 7.0, 5.0, 2.0, 7.0, 7.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.814453125, -1.749420166015625, -1.68438720703125, -1.619354248046875, -1.5543212890625, -1.489288330078125, -1.42425537109375, -1.359222412109375, -1.294189453125, -1.229156494140625, -1.16412353515625, -1.099090576171875, -1.0340576171875, -0.969024658203125, -0.90399169921875, -0.838958740234375, -0.77392578125, -0.708892822265625, -0.64385986328125, -0.578826904296875, -0.5137939453125, -0.448760986328125, -0.38372802734375, -0.318695068359375, -0.253662109375, -0.188629150390625, -0.12359619140625, -0.058563232421875, 0.0064697265625, 0.071502685546875, 0.13653564453125, 0.201568603515625, 0.2666015625, 0.331634521484375, 0.39666748046875, 0.461700439453125, 0.5267333984375, 0.591766357421875, 0.65679931640625, 0.721832275390625, 0.786865234375, 0.851898193359375, 0.91693115234375, 0.981964111328125, 1.0469970703125, 1.112030029296875, 1.17706298828125, 1.242095947265625, 1.30712890625, 1.372161865234375, 1.43719482421875, 1.502227783203125, 1.5672607421875, 1.632293701171875, 1.69732666015625, 1.762359619140625, 1.827392578125, 1.892425537109375, 1.95745849609375, 2.022491455078125, 2.0875244140625, 2.152557373046875, 2.21759033203125, 2.282623291015625, 2.34765625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 7.0, 2.0, 2.0, 0.0, 5.0, 7.0, 14.0, 11.0, 11.0, 15.0, 27.0, 25.0, 34.0, 30.0, 36.0, 50.0, 45.0, 58.0, 46.0, 54.0, 53.0, 56.0, 66.0, 51.0, 42.0, 46.0, 42.0, 35.0, 25.0, 18.0, 14.0, 22.0, 14.0, 16.0, 11.0, 10.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1826171875, -0.176361083984375, -0.17010498046875, -0.163848876953125, -0.1575927734375, -0.151336669921875, -0.14508056640625, -0.138824462890625, -0.132568359375, -0.126312255859375, -0.12005615234375, -0.113800048828125, -0.1075439453125, -0.101287841796875, -0.09503173828125, -0.088775634765625, -0.08251953125, -0.076263427734375, -0.07000732421875, -0.063751220703125, -0.0574951171875, -0.051239013671875, -0.04498291015625, -0.038726806640625, -0.032470703125, -0.026214599609375, -0.01995849609375, -0.013702392578125, -0.0074462890625, -0.001190185546875, 0.00506591796875, 0.011322021484375, 0.017578125, 0.023834228515625, 0.03009033203125, 0.036346435546875, 0.0426025390625, 0.048858642578125, 0.05511474609375, 0.061370849609375, 0.067626953125, 0.073883056640625, 0.08013916015625, 0.086395263671875, 0.0926513671875, 0.098907470703125, 0.10516357421875, 0.111419677734375, 0.11767578125, 0.123931884765625, 0.13018798828125, 0.136444091796875, 0.1427001953125, 0.148956298828125, 0.15521240234375, 0.161468505859375, 0.167724609375, 0.173980712890625, 0.18023681640625, 0.186492919921875, 0.1927490234375, 0.199005126953125, 0.20526123046875, 0.211517333984375, 0.2177734375]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 3.0, 2.0, 4.0, 9.0, 8.0, 8.0, 16.0, 49.0, 244.0, 3201.0, 1042890.0, 1844.0, 203.0, 35.0, 16.0, 9.0, 4.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-12.9921875, -12.6451416015625, -12.298095703125, -11.9510498046875, -11.60400390625, -11.2569580078125, -10.909912109375, -10.5628662109375, -10.2158203125, -9.8687744140625, -9.521728515625, -9.1746826171875, -8.82763671875, -8.4805908203125, -8.133544921875, -7.7864990234375, -7.439453125, -7.0924072265625, -6.745361328125, -6.3983154296875, -6.05126953125, -5.7042236328125, -5.357177734375, -5.0101318359375, -4.6630859375, -4.3160400390625, -3.968994140625, -3.6219482421875, -3.27490234375, -2.9278564453125, -2.580810546875, -2.2337646484375, -1.88671875, -1.5396728515625, -1.192626953125, -0.8455810546875, -0.49853515625, -0.1514892578125, 0.195556640625, 0.5426025390625, 0.8896484375, 1.2366943359375, 1.583740234375, 1.9307861328125, 2.27783203125, 2.6248779296875, 2.971923828125, 3.3189697265625, 3.666015625, 4.0130615234375, 4.360107421875, 4.7071533203125, 5.05419921875, 5.4012451171875, 5.748291015625, 6.0953369140625, 6.4423828125, 6.7894287109375, 7.136474609375, 7.4835205078125, 7.83056640625, 8.1776123046875, 8.524658203125, 8.8717041015625, 9.21875]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 6.0, 6.0, 7.0, 10.0, 10.0, 17.0, 24.0, 32.0, 69.0, 104.0, 134.0, 124.0, 122.0, 90.0, 57.0, 41.0, 32.0, 26.0, 18.0, 15.0, 13.0, 7.0, 2.0, 7.0, 5.0, 4.0, 5.0, 4.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0006198883056640625, -0.0006013959646224976, -0.0005829036235809326, -0.0005644112825393677, -0.0005459189414978027, -0.0005274266004562378, -0.0005089342594146729, -0.0004904419183731079, -0.00047194957733154297, -0.00045345723628997803, -0.0004349648952484131, -0.00041647255420684814, -0.0003979802131652832, -0.00037948787212371826, -0.0003609955310821533, -0.0003425031900405884, -0.00032401084899902344, -0.0003055185079574585, -0.00028702616691589355, -0.0002685338258743286, -0.00025004148483276367, -0.00023154914379119873, -0.0002130568027496338, -0.00019456446170806885, -0.0001760721206665039, -0.00015757977962493896, -0.00013908743858337402, -0.00012059509754180908, -0.00010210275650024414, -8.36104154586792e-05, -6.511807441711426e-05, -4.6625733375549316e-05, -2.8133392333984375e-05, -9.641051292419434e-06, 8.851289749145508e-06, 2.734363079071045e-05, 4.583597183227539e-05, 6.432831287384033e-05, 8.282065391540527e-05, 0.00010131299495697021, 0.00011980533599853516, 0.0001382976770401001, 0.00015679001808166504, 0.00017528235912322998, 0.00019377470016479492, 0.00021226704120635986, 0.0002307593822479248, 0.00024925172328948975, 0.0002677440643310547, 0.00028623640537261963, 0.00030472874641418457, 0.0003232210874557495, 0.00034171342849731445, 0.0003602057695388794, 0.00037869811058044434, 0.0003971904516220093, 0.0004156827926635742, 0.00043417513370513916, 0.0004526674747467041, 0.00047115981578826904, 0.000489652156829834, 0.0005081444978713989, 0.0005266368389129639, 0.0005451291799545288, 0.0005636215209960938]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 4.0, 9.0, 7.0, 11.0, 13.0, 18.0, 32.0, 41.0, 60.0, 86.0, 185.0, 361.0, 726.0, 1782.0, 5001.0, 21885.0, 968666.0, 38758.0, 6856.0, 2167.0, 883.0, 435.0, 210.0, 107.0, 76.0, 58.0, 34.0, 26.0, 13.0, 13.0, 15.0, 8.0, 4.0, 6.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.5234375, -1.4702301025390625, -1.417022705078125, -1.3638153076171875, -1.31060791015625, -1.2574005126953125, -1.204193115234375, -1.1509857177734375, -1.0977783203125, -1.0445709228515625, -0.991363525390625, -0.9381561279296875, -0.88494873046875, -0.8317413330078125, -0.778533935546875, -0.7253265380859375, -0.672119140625, -0.6189117431640625, -0.565704345703125, -0.5124969482421875, -0.45928955078125, -0.4060821533203125, -0.352874755859375, -0.2996673583984375, -0.2464599609375, -0.1932525634765625, -0.140045166015625, -0.0868377685546875, -0.03363037109375, 0.0195770263671875, 0.072784423828125, 0.1259918212890625, 0.17919921875, 0.2324066162109375, 0.285614013671875, 0.3388214111328125, 0.39202880859375, 0.4452362060546875, 0.498443603515625, 0.5516510009765625, 0.6048583984375, 0.6580657958984375, 0.711273193359375, 0.7644805908203125, 0.81768798828125, 0.8708953857421875, 0.924102783203125, 0.9773101806640625, 1.030517578125, 1.0837249755859375, 1.136932373046875, 1.1901397705078125, 1.24334716796875, 1.2965545654296875, 1.349761962890625, 1.4029693603515625, 1.4561767578125, 1.5093841552734375, 1.562591552734375, 1.6157989501953125, 1.66900634765625, 1.7222137451171875, 1.775421142578125, 1.8286285400390625, 1.8818359375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 8.0, 4.0, 11.0, 7.0, 9.0, 18.0, 41.0, 345.0, 447.0, 47.0, 22.0, 10.0, 9.0, 7.0, 4.0, 3.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.93115234375, -0.8907699584960938, -0.8503875732421875, -0.8100051879882812, -0.769622802734375, -0.7292404174804688, -0.6888580322265625, -0.6484756469726562, -0.60809326171875, -0.5677108764648438, -0.5273284912109375, -0.48694610595703125, -0.446563720703125, -0.40618133544921875, -0.3657989501953125, -0.32541656494140625, -0.2850341796875, -0.24465179443359375, -0.2042694091796875, -0.16388702392578125, -0.123504638671875, -0.08312225341796875, -0.0427398681640625, -0.00235748291015625, 0.03802490234375, 0.07840728759765625, 0.1187896728515625, 0.15917205810546875, 0.199554443359375, 0.23993682861328125, 0.2803192138671875, 0.32070159912109375, 0.361083984375, 0.40146636962890625, 0.4418487548828125, 0.48223114013671875, 0.522613525390625, 0.5629959106445312, 0.6033782958984375, 0.6437606811523438, 0.68414306640625, 0.7245254516601562, 0.7649078369140625, 0.8052902221679688, 0.845672607421875, 0.8860549926757812, 0.9264373779296875, 0.9668197631835938, 1.0072021484375, 1.0475845336914062, 1.0879669189453125, 1.1283493041992188, 1.168731689453125, 1.2091140747070312, 1.2494964599609375, 1.2898788452148438, 1.33026123046875, 1.3706436157226562, 1.4110260009765625, 1.4514083862304688, 1.491790771484375, 1.5321731567382812, 1.5725555419921875, 1.6129379272460938, 1.6533203125]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 4.0, 9.0, 12.0, 28.0, 117.0, 329.0, 275.0, 123.0, 52.0, 30.0, 11.0, 9.0, 3.0, 3.0, 4.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.880826950073242, -4.732195854187012, -4.583564758300781, -4.434933662414551, -4.28630256652832, -4.13767147064209, -3.9890406131744385, -3.840409517288208, -3.6917784214019775, -3.543147325515747, -3.3945162296295166, -3.245885133743286, -3.0972542762756348, -2.9486231803894043, -2.799992084503174, -2.6513609886169434, -2.502729892730713, -2.3540987968444824, -2.205467700958252, -2.0568366050720215, -1.9082056283950806, -1.75957453250885, -1.6109435558319092, -1.4623124599456787, -1.3136813640594482, -1.1650502681732178, -1.0164191722869873, -0.8677881956100464, -0.7191570997238159, -0.5705260038375854, -0.42189496755599976, -0.27326393127441406, -0.12463235855102539, 0.02399870753288269, 0.17262977361679077, 0.32126083970069885, 0.46989190578460693, 0.6185230016708374, 0.7671540379524231, 0.9157850742340088, 1.0644161701202393, 1.2130472660064697, 1.3616783618927002, 1.5103093385696411, 1.6589404344558716, 1.807571530342102, 1.956202507019043, 2.1048336029052734, 2.253464698791504, 2.4020957946777344, 2.550726890563965, 2.6993579864501953, 2.847989082336426, 2.9966201782226562, 3.1452510356903076, 3.293882131576538, 3.4425132274627686, 3.591144323348999, 3.7397754192352295, 3.88840651512146, 4.037037372589111, 4.185668468475342, 4.334299564361572, 4.482930660247803, 4.631561756134033]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 5.0, 3.0, 4.0, 5.0, 8.0, 13.0, 7.0, 20.0, 24.0, 28.0, 32.0, 45.0, 54.0, 44.0, 47.0, 62.0, 71.0, 86.0, 85.0, 61.0, 59.0, 44.0, 43.0, 32.0, 31.0, 18.0, 19.0, 19.0, 11.0, 6.0, 6.0, 3.0, 6.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.32629132270813, -2.261723518371582, -2.197155714035034, -2.1325879096984863, -2.0680201053619385, -2.0034523010253906, -1.9388844966888428, -1.874316692352295, -1.809748888015747, -1.7451810836791992, -1.6806132793426514, -1.6160454750061035, -1.5514776706695557, -1.4869098663330078, -1.42234206199646, -1.357774257659912, -1.2932063341140747, -1.2286385297775269, -1.164070725440979, -1.0995029211044312, -1.0349351167678833, -0.9703673124313354, -0.9057994484901428, -0.841231644153595, -0.7766638398170471, -0.7120960354804993, -0.6475282311439514, -0.5829603672027588, -0.5183925628662109, -0.4538247883319855, -0.38925695419311523, -0.3246891498565674, -0.26012134552001953, -0.19555354118347168, -0.13098572194576263, -0.06641790270805359, -0.0018500983715057373, 0.06271770596504211, 0.12728554010391235, 0.1918533444404602, 0.25642114877700806, 0.3209889531135559, 0.38555675745010376, 0.450124591588974, 0.5146924257278442, 0.5792602300643921, 0.6438280344009399, 0.7083958387374878, 0.7729636430740356, 0.8375314474105835, 0.9020992517471313, 0.9666670560836792, 1.031234860420227, 1.095802664756775, 1.1603705883026123, 1.2249383926391602, 1.289506196975708, 1.3540740013122559, 1.4186418056488037, 1.4832096099853516, 1.5477774143218994, 1.6123452186584473, 1.6769130229949951, 1.741480827331543, 1.8060486316680908]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 3.0, 1.0, 4.0, 1.0, 14.0, 6.0, 10.0, 19.0, 13.0, 26.0, 39.0, 39.0, 78.0, 93.0, 160.0, 269.0, 424.0, 700.0, 1251.0, 2786.0, 6707.0, 19103.0, 134778.0, 3938602.0, 64810.0, 13685.0, 5194.0, 2331.0, 1269.0, 678.0, 397.0, 257.0, 185.0, 110.0, 75.0, 47.0, 35.0, 23.0, 6.0, 18.0, 8.0, 6.0, 7.0, 4.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.96337890625, -0.9345016479492188, -0.9056243896484375, -0.8767471313476562, -0.847869873046875, -0.8189926147460938, -0.7901153564453125, -0.7612380981445312, -0.73236083984375, -0.7034835815429688, -0.6746063232421875, -0.6457290649414062, -0.616851806640625, -0.5879745483398438, -0.5590972900390625, -0.5302200317382812, -0.5013427734375, -0.47246551513671875, -0.4435882568359375, -0.41471099853515625, -0.385833740234375, -0.35695648193359375, -0.3280792236328125, -0.29920196533203125, -0.27032470703125, -0.24144744873046875, -0.2125701904296875, -0.18369293212890625, -0.154815673828125, -0.12593841552734375, -0.0970611572265625, -0.06818389892578125, -0.039306640625, -0.01042938232421875, 0.0184478759765625, 0.04732513427734375, 0.076202392578125, 0.10507965087890625, 0.1339569091796875, 0.16283416748046875, 0.19171142578125, 0.22058868408203125, 0.2494659423828125, 0.27834320068359375, 0.307220458984375, 0.33609771728515625, 0.3649749755859375, 0.39385223388671875, 0.4227294921875, 0.45160675048828125, 0.4804840087890625, 0.5093612670898438, 0.538238525390625, 0.5671157836914062, 0.5959930419921875, 0.6248703002929688, 0.65374755859375, 0.6826248168945312, 0.7115020751953125, 0.7403793334960938, 0.769256591796875, 0.7981338500976562, 0.8270111083984375, 0.8558883666992188, 0.884765625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 1.0, 4.0, 2.0, 2.0, 5.0, 6.0, 6.0, 9.0, 22.0, 26.0, 32.0, 39.0, 46.0, 51.0, 65.0, 71.0, 93.0, 99.0, 80.0, 75.0, 50.0, 51.0, 39.0, 30.0, 23.0, 17.0, 12.0, 14.0, 5.0, 9.0, 8.0, 3.0, 3.0, 2.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0408935546875, -0.03976702690124512, -0.038640499114990234, -0.03751397132873535, -0.03638744354248047, -0.035260915756225586, -0.0341343879699707, -0.03300786018371582, -0.03188133239746094, -0.030754804611206055, -0.029628276824951172, -0.02850174903869629, -0.027375221252441406, -0.026248693466186523, -0.02512216567993164, -0.023995637893676758, -0.022869110107421875, -0.021742582321166992, -0.02061605453491211, -0.019489526748657227, -0.018362998962402344, -0.01723647117614746, -0.016109943389892578, -0.014983415603637695, -0.013856887817382812, -0.01273036003112793, -0.011603832244873047, -0.010477304458618164, -0.009350776672363281, -0.008224248886108398, -0.007097721099853516, -0.005971193313598633, -0.00484466552734375, -0.003718137741088867, -0.0025916099548339844, -0.0014650821685791016, -0.00033855438232421875, 0.0007879734039306641, 0.0019145011901855469, 0.0030410289764404297, 0.0041675567626953125, 0.005294084548950195, 0.006420612335205078, 0.007547140121459961, 0.008673667907714844, 0.009800195693969727, 0.01092672348022461, 0.012053251266479492, 0.013179779052734375, 0.014306306838989258, 0.01543283462524414, 0.016559362411499023, 0.017685890197753906, 0.01881241798400879, 0.019938945770263672, 0.021065473556518555, 0.022192001342773438, 0.02331852912902832, 0.024445056915283203, 0.025571584701538086, 0.02669811248779297, 0.02782464027404785, 0.028951168060302734, 0.030077695846557617, 0.0312042236328125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0, 6.0, 4.0, 7.0, 11.0, 22.0, 20.0, 25.0, 66.0, 112.0, 519.0, 4719.0, 2638836.0, 1544818.0, 4438.0, 408.0, 129.0, 53.0, 25.0, 18.0, 7.0, 11.0, 6.0, 4.0, 4.0, 8.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.4150390625, -1.3535003662109375, -1.291961669921875, -1.2304229736328125, -1.16888427734375, -1.1073455810546875, -1.045806884765625, -0.9842681884765625, -0.9227294921875, -0.8611907958984375, -0.799652099609375, -0.7381134033203125, -0.67657470703125, -0.6150360107421875, -0.553497314453125, -0.4919586181640625, -0.430419921875, -0.3688812255859375, -0.307342529296875, -0.2458038330078125, -0.18426513671875, -0.1227264404296875, -0.061187744140625, 0.0003509521484375, 0.0618896484375, 0.1234283447265625, 0.184967041015625, 0.2465057373046875, 0.30804443359375, 0.3695831298828125, 0.431121826171875, 0.4926605224609375, 0.55419921875, 0.6157379150390625, 0.677276611328125, 0.7388153076171875, 0.80035400390625, 0.8618927001953125, 0.923431396484375, 0.9849700927734375, 1.0465087890625, 1.1080474853515625, 1.169586181640625, 1.2311248779296875, 1.29266357421875, 1.3542022705078125, 1.415740966796875, 1.4772796630859375, 1.538818359375, 1.6003570556640625, 1.661895751953125, 1.7234344482421875, 1.78497314453125, 1.8465118408203125, 1.908050537109375, 1.9695892333984375, 2.0311279296875, 2.0926666259765625, 2.154205322265625, 2.2157440185546875, 2.27728271484375, 2.3388214111328125, 2.400360107421875, 2.4618988037109375, 2.5234375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 2.0, 3.0, 4.0, 5.0, 5.0, 4.0, 5.0, 4.0, 4.0, 15.0, 20.0, 35.0, 44.0, 54.0, 116.0, 270.0, 1357.0, 1538.0, 266.0, 127.0, 58.0, 34.0, 41.0, 16.0, 14.0, 12.0, 12.0, 4.0, 8.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1168212890625, -0.11374855041503906, -0.11067581176757812, -0.10760307312011719, -0.10453033447265625, -0.10145759582519531, -0.09838485717773438, -0.09531211853027344, -0.0922393798828125, -0.08916664123535156, -0.08609390258789062, -0.08302116394042969, -0.07994842529296875, -0.07687568664550781, -0.07380294799804688, -0.07073020935058594, -0.067657470703125, -0.06458473205566406, -0.061511993408203125, -0.05843925476074219, -0.05536651611328125, -0.05229377746582031, -0.049221038818359375, -0.04614830017089844, -0.0430755615234375, -0.04000282287597656, -0.036930084228515625, -0.03385734558105469, -0.03078460693359375, -0.027711868286132812, -0.024639129638671875, -0.021566390991210938, -0.01849365234375, -0.015420913696289062, -0.012348175048828125, -0.009275436401367188, -0.00620269775390625, -0.0031299591064453125, -5.7220458984375e-05, 0.0030155181884765625, 0.0060882568359375, 0.009160995483398438, 0.012233734130859375, 0.015306472778320312, 0.01837921142578125, 0.021451950073242188, 0.024524688720703125, 0.027597427368164062, 0.030670166015625, 0.03374290466308594, 0.036815643310546875, 0.03988838195800781, 0.04296112060546875, 0.04603385925292969, 0.049106597900390625, 0.05217933654785156, 0.0552520751953125, 0.05832481384277344, 0.061397552490234375, 0.06447029113769531, 0.06754302978515625, 0.07061576843261719, 0.07368850708007812, 0.07676124572753906, 0.079833984375]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 18.0, 170.0, 795.0, 26.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5699529647827148, -0.4626213312149048, -0.3552897274494171, -0.24795812368392944, -0.14062649011611938, -0.033294856548309326, 0.07403671741485596, 0.18136835098266602, 0.2886999845504761, 0.39603161811828613, 0.5033632516860962, 0.6106948256492615, 0.7180264592170715, 0.8253580927848816, 0.9326896667480469, 1.040021300315857, 1.147352933883667, 1.254684567451477, 1.362016201019287, 1.4693477153778076, 1.5766794681549072, 1.6840109825134277, 1.7913426160812378, 1.8986742496490479, 2.0060057640075684, 2.113337278366089, 2.2206690311431885, 2.328000545501709, 2.4353322982788086, 2.542663812637329, 2.6499953269958496, 2.757327079772949, 2.864658832550049, 2.9719903469085693, 3.079322099685669, 3.1866536140441895, 3.293985366821289, 3.4013168811798096, 3.50864839553833, 3.6159801483154297, 3.7233119010925293, 3.83064341545105, 3.9379751682281494, 4.04530668258667, 4.1526384353637695, 4.259970188140869, 4.3673014640808105, 4.47463321685791, 4.581964492797852, 4.689296245574951, 4.796627521514893, 4.903959274291992, 5.011291027069092, 5.118622779846191, 5.225954055786133, 5.333285808563232, 5.440617561340332, 5.547949314117432, 5.655280590057373, 5.762612342834473, 5.869944095611572, 5.977275848388672, 6.084607124328613, 6.191938877105713, 6.2992706298828125]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 1.0, 4.0, 4.0, 8.0, 12.0, 17.0, 21.0, 33.0, 31.0, 43.0, 51.0, 49.0, 66.0, 71.0, 77.0, 76.0, 75.0, 60.0, 54.0, 56.0, 51.0, 28.0, 32.0, 21.0, 8.0, 16.0, 11.0, 7.0, 4.0, 2.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.3770429491996765, -0.3650261163711548, -0.35300931334495544, -0.3409924805164337, -0.3289756774902344, -0.31695884466171265, -0.3049420118331909, -0.2929252088069916, -0.28090837597846985, -0.2688915431499481, -0.2568747401237488, -0.24485790729522705, -0.23284108936786652, -0.22082427144050598, -0.20880745351314545, -0.1967906355857849, -0.18477381765842438, -0.17275699973106384, -0.1607401818037033, -0.14872336387634277, -0.13670653104782104, -0.12468971312046051, -0.11267289519309998, -0.10065606981515884, -0.08863925188779831, -0.07662243396043777, -0.06460560858249664, -0.05258879065513611, -0.040571969002485275, -0.028555147349834442, -0.016538329422473907, -0.004521504044532776, 0.007495313882827759, 0.019512135535478592, 0.031528957188129425, 0.04354577511548996, 0.05556259676814079, 0.06757941842079163, 0.07959623634815216, 0.09161306172609329, 0.10362987965345383, 0.11564669758081436, 0.1276635229587555, 0.13968034088611603, 0.15169715881347656, 0.1637139916419983, 0.17573079466819763, 0.18774762749671936, 0.1997644454240799, 0.21178126335144043, 0.22379808127880096, 0.2358148992061615, 0.24783173203468323, 0.25984853506088257, 0.2718653678894043, 0.283882200717926, 0.29589900374412537, 0.3079158365726471, 0.31993263959884644, 0.33194947242736816, 0.3439662754535675, 0.35598310828208923, 0.3679999113082886, 0.3800167441368103, 0.39203357696533203]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 5.0, 7.0, 13.0, 15.0, 17.0, 23.0, 22.0, 30.0, 33.0, 36.0, 42.0, 48.0, 72.0, 576.0, 62839.0, 978477.0, 5724.0, 210.0, 62.0, 53.0, 44.0, 48.0, 25.0, 23.0, 20.0, 21.0, 7.0, 10.0, 3.0, 11.0, 10.0, 5.0, 3.0, 8.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.98486328125, -0.9425735473632812, -0.9002838134765625, -0.8579940795898438, -0.815704345703125, -0.7734146118164062, -0.7311248779296875, -0.6888351440429688, -0.64654541015625, -0.6042556762695312, -0.5619659423828125, -0.5196762084960938, -0.477386474609375, -0.43509674072265625, -0.3928070068359375, -0.35051727294921875, -0.3082275390625, -0.26593780517578125, -0.2236480712890625, -0.18135833740234375, -0.139068603515625, -0.09677886962890625, -0.0544891357421875, -0.01219940185546875, 0.03009033203125, 0.07238006591796875, 0.1146697998046875, 0.15695953369140625, 0.199249267578125, 0.24153900146484375, 0.2838287353515625, 0.32611846923828125, 0.368408203125, 0.41069793701171875, 0.4529876708984375, 0.49527740478515625, 0.537567138671875, 0.5798568725585938, 0.6221466064453125, 0.6644363403320312, 0.70672607421875, 0.7490158081054688, 0.7913055419921875, 0.8335952758789062, 0.875885009765625, 0.9181747436523438, 0.9604644775390625, 1.0027542114257812, 1.0450439453125, 1.0873336791992188, 1.1296234130859375, 1.1719131469726562, 1.214202880859375, 1.2564926147460938, 1.2987823486328125, 1.3410720825195312, 1.38336181640625, 1.4256515502929688, 1.4679412841796875, 1.5102310180664062, 1.552520751953125, 1.5948104858398438, 1.6371002197265625, 1.6793899536132812, 1.7216796875]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 4.0, 14.0, 13.0, 25.0, 16.0, 27.0, 28.0, 43.0, 47.0, 34.0, 50.0, 52.0, 58.0, 65.0, 64.0, 59.0, 59.0, 41.0, 55.0, 36.0, 42.0, 28.0, 26.0, 19.0, 25.0, 14.0, 11.0, 13.0, 5.0, 9.0, 6.0, 7.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.02447509765625, -0.023670434951782227, -0.022865772247314453, -0.02206110954284668, -0.021256446838378906, -0.020451784133911133, -0.01964712142944336, -0.018842458724975586, -0.018037796020507812, -0.01723313331604004, -0.016428470611572266, -0.015623807907104492, -0.014819145202636719, -0.014014482498168945, -0.013209819793701172, -0.012405157089233398, -0.011600494384765625, -0.010795831680297852, -0.009991168975830078, -0.009186506271362305, -0.008381843566894531, -0.007577180862426758, -0.006772518157958984, -0.005967855453491211, -0.0051631927490234375, -0.004358530044555664, -0.0035538673400878906, -0.002749204635620117, -0.0019445419311523438, -0.0011398792266845703, -0.0003352165222167969, 0.00046944618225097656, 0.00127410888671875, 0.0020787715911865234, 0.002883434295654297, 0.0036880970001220703, 0.004492759704589844, 0.005297422409057617, 0.006102085113525391, 0.006906747817993164, 0.0077114105224609375, 0.008516073226928711, 0.009320735931396484, 0.010125398635864258, 0.010930061340332031, 0.011734724044799805, 0.012539386749267578, 0.013344049453735352, 0.014148712158203125, 0.014953374862670898, 0.015758037567138672, 0.016562700271606445, 0.01736736297607422, 0.018172025680541992, 0.018976688385009766, 0.01978135108947754, 0.020586013793945312, 0.021390676498413086, 0.02219533920288086, 0.023000001907348633, 0.023804664611816406, 0.02460932731628418, 0.025413990020751953, 0.026218652725219727, 0.0270233154296875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 3.0, 9.0, 9.0, 15.0, 15.0, 35.0, 43.0, 68.0, 103.0, 163.0, 276.0, 622.0, 1718.0, 6297.0, 34697.0, 282135.0, 606050.0, 96891.0, 14208.0, 3136.0, 1049.0, 454.0, 206.0, 137.0, 68.0, 56.0, 21.0, 15.0, 11.0, 12.0, 10.0, 7.0, 7.0, 4.0, 3.0, 5.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4384765625, -0.42348480224609375, -0.4084930419921875, -0.39350128173828125, -0.378509521484375, -0.36351776123046875, -0.3485260009765625, -0.33353424072265625, -0.31854248046875, -0.30355072021484375, -0.2885589599609375, -0.27356719970703125, -0.258575439453125, -0.24358367919921875, -0.2285919189453125, -0.21360015869140625, -0.1986083984375, -0.18361663818359375, -0.1686248779296875, -0.15363311767578125, -0.138641357421875, -0.12364959716796875, -0.1086578369140625, -0.09366607666015625, -0.07867431640625, -0.06368255615234375, -0.0486907958984375, -0.03369903564453125, -0.018707275390625, -0.00371551513671875, 0.0112762451171875, 0.02626800537109375, 0.041259765625, 0.05625152587890625, 0.0712432861328125, 0.08623504638671875, 0.101226806640625, 0.11621856689453125, 0.1312103271484375, 0.14620208740234375, 0.16119384765625, 0.17618560791015625, 0.1911773681640625, 0.20616912841796875, 0.221160888671875, 0.23615264892578125, 0.2511444091796875, 0.26613616943359375, 0.2811279296875, 0.29611968994140625, 0.3111114501953125, 0.32610321044921875, 0.341094970703125, 0.35608673095703125, 0.3710784912109375, 0.38607025146484375, 0.40106201171875, 0.41605377197265625, 0.4310455322265625, 0.44603729248046875, 0.461029052734375, 0.47602081298828125, 0.4910125732421875, 0.5060043334960938, 0.52099609375]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 4.0, 4.0, 4.0, 4.0, 5.0, 8.0, 4.0, 9.0, 11.0, 16.0, 15.0, 20.0, 27.0, 21.0, 28.0, 32.0, 40.0, 41.0, 40.0, 38.0, 42.0, 43.0, 49.0, 44.0, 27.0, 32.0, 39.0, 31.0, 24.0, 30.0, 39.0, 30.0, 28.0, 27.0, 17.0, 21.0, 23.0, 18.0, 12.0, 7.0, 10.0, 10.0, 13.0, 5.0, 4.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.1429443359375, -0.1386260986328125, -0.134307861328125, -0.1299896240234375, -0.12567138671875, -0.1213531494140625, -0.117034912109375, -0.1127166748046875, -0.1083984375, -0.1040802001953125, -0.099761962890625, -0.0954437255859375, -0.09112548828125, -0.0868072509765625, -0.082489013671875, -0.0781707763671875, -0.0738525390625, -0.0695343017578125, -0.065216064453125, -0.0608978271484375, -0.05657958984375, -0.0522613525390625, -0.047943115234375, -0.0436248779296875, -0.039306640625, -0.0349884033203125, -0.030670166015625, -0.0263519287109375, -0.02203369140625, -0.0177154541015625, -0.013397216796875, -0.0090789794921875, -0.0047607421875, -0.0004425048828125, 0.003875732421875, 0.0081939697265625, 0.01251220703125, 0.0168304443359375, 0.021148681640625, 0.0254669189453125, 0.02978515625, 0.0341033935546875, 0.038421630859375, 0.0427398681640625, 0.04705810546875, 0.0513763427734375, 0.055694580078125, 0.0600128173828125, 0.0643310546875, 0.0686492919921875, 0.072967529296875, 0.0772857666015625, 0.08160400390625, 0.0859222412109375, 0.090240478515625, 0.0945587158203125, 0.098876953125, 0.1031951904296875, 0.107513427734375, 0.1118316650390625, 0.11614990234375, 0.1204681396484375, 0.124786376953125, 0.1291046142578125, 0.1334228515625]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 10.0, 7.0, 15.0, 21.0, 28.0, 32.0, 48.0, 97.0, 147.0, 340.0, 883.0, 3765.0, 34529.0, 936522.0, 65251.0, 4967.0, 1059.0, 387.0, 173.0, 94.0, 54.0, 43.0, 23.0, 23.0, 11.0, 10.0, 5.0, 9.0, 1.0, 5.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.744140625, -0.7111968994140625, -0.678253173828125, -0.6453094482421875, -0.61236572265625, -0.5794219970703125, -0.546478271484375, -0.5135345458984375, -0.4805908203125, -0.4476470947265625, -0.414703369140625, -0.3817596435546875, -0.34881591796875, -0.3158721923828125, -0.282928466796875, -0.2499847412109375, -0.217041015625, -0.1840972900390625, -0.151153564453125, -0.1182098388671875, -0.08526611328125, -0.0523223876953125, -0.019378662109375, 0.0135650634765625, 0.0465087890625, 0.0794525146484375, 0.112396240234375, 0.1453399658203125, 0.17828369140625, 0.2112274169921875, 0.244171142578125, 0.2771148681640625, 0.31005859375, 0.3430023193359375, 0.375946044921875, 0.4088897705078125, 0.44183349609375, 0.4747772216796875, 0.507720947265625, 0.5406646728515625, 0.5736083984375, 0.6065521240234375, 0.639495849609375, 0.6724395751953125, 0.70538330078125, 0.7383270263671875, 0.771270751953125, 0.8042144775390625, 0.837158203125, 0.8701019287109375, 0.903045654296875, 0.9359893798828125, 0.96893310546875, 1.0018768310546875, 1.034820556640625, 1.0677642822265625, 1.1007080078125, 1.1336517333984375, 1.166595458984375, 1.1995391845703125, 1.23248291015625, 1.2654266357421875, 1.298370361328125, 1.3313140869140625, 1.3642578125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 4.0, 3.0, 4.0, 5.0, 4.0, 1.0, 11.0, 10.0, 13.0, 14.0, 21.0, 30.0, 35.0, 63.0, 81.0, 161.0, 169.0, 119.0, 82.0, 45.0, 33.0, 26.0, 13.0, 11.0, 10.0, 5.0, 7.0, 6.0, 3.0, 3.0, 4.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00042629241943359375, -0.0004106462001800537, -0.00039499998092651367, -0.00037935376167297363, -0.0003637075424194336, -0.00034806132316589355, -0.0003324151039123535, -0.0003167688846588135, -0.00030112266540527344, -0.0002854764461517334, -0.00026983022689819336, -0.0002541840076446533, -0.00023853778839111328, -0.00022289156913757324, -0.0002072453498840332, -0.00019159913063049316, -0.00017595291137695312, -0.00016030669212341309, -0.00014466047286987305, -0.000129014253616333, -0.00011336803436279297, -9.772181510925293e-05, -8.207559585571289e-05, -6.642937660217285e-05, -5.078315734863281e-05, -3.5136938095092773e-05, -1.9490718841552734e-05, -3.844499588012695e-06, 1.1801719665527344e-05, 2.7447938919067383e-05, 4.309415817260742e-05, 5.874037742614746e-05, 7.43865966796875e-05, 9.003281593322754e-05, 0.00010567903518676758, 0.00012132525444030762, 0.00013697147369384766, 0.0001526176929473877, 0.00016826391220092773, 0.00018391013145446777, 0.0001995563507080078, 0.00021520256996154785, 0.0002308487892150879, 0.00024649500846862793, 0.00026214122772216797, 0.000277787446975708, 0.00029343366622924805, 0.0003090798854827881, 0.0003247261047363281, 0.00034037232398986816, 0.0003560185432434082, 0.00037166476249694824, 0.0003873109817504883, 0.0004029572010040283, 0.00041860342025756836, 0.0004342496395111084, 0.00044989585876464844, 0.0004655420780181885, 0.0004811882972717285, 0.0004968345165252686, 0.0005124807357788086, 0.0005281269550323486, 0.0005437731742858887, 0.0005594193935394287, 0.0005750656127929688]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 5.0, 2.0, 5.0, 2.0, 6.0, 8.0, 1.0, 12.0, 6.0, 30.0, 46.0, 76.0, 197.0, 436.0, 1291.0, 4942.0, 43731.0, 976962.0, 16152.0, 3179.0, 872.0, 331.0, 120.0, 49.0, 41.0, 21.0, 7.0, 16.0, 2.0, 4.0, 1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0], "bins": [-3.048828125, -2.9713134765625, -2.893798828125, -2.8162841796875, -2.73876953125, -2.6612548828125, -2.583740234375, -2.5062255859375, -2.4287109375, -2.3511962890625, -2.273681640625, -2.1961669921875, -2.11865234375, -2.0411376953125, -1.963623046875, -1.8861083984375, -1.80859375, -1.7310791015625, -1.653564453125, -1.5760498046875, -1.49853515625, -1.4210205078125, -1.343505859375, -1.2659912109375, -1.1884765625, -1.1109619140625, -1.033447265625, -0.9559326171875, -0.87841796875, -0.8009033203125, -0.723388671875, -0.6458740234375, -0.568359375, -0.4908447265625, -0.413330078125, -0.3358154296875, -0.25830078125, -0.1807861328125, -0.103271484375, -0.0257568359375, 0.0517578125, 0.1292724609375, 0.206787109375, 0.2843017578125, 0.36181640625, 0.4393310546875, 0.516845703125, 0.5943603515625, 0.671875, 0.7493896484375, 0.826904296875, 0.9044189453125, 0.98193359375, 1.0594482421875, 1.136962890625, 1.2144775390625, 1.2919921875, 1.3695068359375, 1.447021484375, 1.5245361328125, 1.60205078125, 1.6795654296875, 1.757080078125, 1.8345947265625, 1.912109375]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 2.0, 2.0, 7.0, 4.0, 3.0, 4.0, 7.0, 10.0, 5.0, 17.0, 21.0, 26.0, 48.0, 116.0, 151.0, 183.0, 132.0, 83.0, 53.0, 33.0, 24.0, 13.0, 11.0, 11.0, 4.0, 2.0, 4.0, 2.0, 3.0, 2.0, 6.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.27197265625, -0.263031005859375, -0.25408935546875, -0.245147705078125, -0.2362060546875, -0.227264404296875, -0.21832275390625, -0.209381103515625, -0.200439453125, -0.191497802734375, -0.18255615234375, -0.173614501953125, -0.1646728515625, -0.155731201171875, -0.14678955078125, -0.137847900390625, -0.12890625, -0.119964599609375, -0.11102294921875, -0.102081298828125, -0.0931396484375, -0.084197998046875, -0.07525634765625, -0.066314697265625, -0.057373046875, -0.048431396484375, -0.03948974609375, -0.030548095703125, -0.0216064453125, -0.012664794921875, -0.00372314453125, 0.005218505859375, 0.01416015625, 0.023101806640625, 0.03204345703125, 0.040985107421875, 0.0499267578125, 0.058868408203125, 0.06781005859375, 0.076751708984375, 0.085693359375, 0.094635009765625, 0.10357666015625, 0.112518310546875, 0.1214599609375, 0.130401611328125, 0.13934326171875, 0.148284912109375, 0.1572265625, 0.166168212890625, 0.17510986328125, 0.184051513671875, 0.1929931640625, 0.201934814453125, 0.21087646484375, 0.219818115234375, 0.228759765625, 0.237701416015625, 0.24664306640625, 0.255584716796875, 0.2645263671875, 0.273468017578125, 0.28240966796875, 0.291351318359375, 0.30029296875]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [2.0, 4.0, 34.0, 856.0, 118.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.135040760040283, -2.2754461765289307, -1.4158515930175781, -0.5562570095062256, 0.30333757400512695, 1.1629319190979004, 2.022526741027832, 2.8821215629577637, 3.741715908050537, 4.601310729980469, 5.460905075073242, 6.320499420166016, 7.180094242095947, 8.039688110351562, 8.899283409118652, 9.758878707885742, 10.618473052978516, 11.478067398071289, 12.337661743164062, 13.197257041931152, 14.056851387023926, 14.9164457321167, 15.776041030883789, 16.635635375976562, 17.495229721069336, 18.35482406616211, 19.214418411254883, 20.074012756347656, 20.933609008789062, 21.793201446533203, 22.65279769897461, 23.512392044067383, 24.371986389160156, 25.23158073425293, 26.091175079345703, 26.950769424438477, 27.81036376953125, 28.669960021972656, 29.52955436706543, 30.389148712158203, 31.248743057250977, 32.10833740234375, 32.967933654785156, 33.8275260925293, 34.6871223449707, 35.546714782714844, 36.40631103515625, 37.265907287597656, 38.1254997253418, 38.9850959777832, 39.844688415527344, 40.70428466796875, 41.56387710571289, 42.4234733581543, 43.28306579589844, 44.142662048339844, 45.00225830078125, 45.861854553222656, 46.7214469909668, 47.5810432434082, 48.440635681152344, 49.30023193359375, 50.15982437133789, 51.0194206237793, 51.87901306152344]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 6.0, 7.0, 11.0, 19.0, 16.0, 21.0, 23.0, 32.0, 40.0, 58.0, 51.0, 58.0, 72.0, 66.0, 64.0, 60.0, 51.0, 65.0, 61.0, 49.0, 39.0, 40.0, 25.0, 17.0, 14.0, 15.0, 8.0, 3.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7439658641815186, -1.6912264823913574, -1.6384871006011963, -1.5857477188110352, -1.5330082178115845, -1.4802688360214233, -1.4275294542312622, -1.374790072441101, -1.3220505714416504, -1.2693111896514893, -1.2165718078613281, -1.163832426071167, -1.1110929250717163, -1.0583535432815552, -1.005614161491394, -0.9528747797012329, -0.9001353979110718, -0.8473960161209106, -0.7946565747261047, -0.7419171929359436, -0.6891777515411377, -0.6364383697509766, -0.5836989879608154, -0.5309596061706543, -0.4782201647758484, -0.42548075318336487, -0.37274134159088135, -0.3200019598007202, -0.2672625482082367, -0.21452313661575317, -0.16178375482559204, -0.10904434323310852, -0.05630481243133545, -0.0035654082894325256, 0.0491739958524704, 0.10191339254379272, 0.15465280413627625, 0.20739221572875977, 0.2601315975189209, 0.3128710091114044, 0.36561042070388794, 0.41834983229637146, 0.471089243888855, 0.5238286256790161, 0.5765680074691772, 0.6293074488639832, 0.6820468306541443, 0.7347862720489502, 0.7875256538391113, 0.8402650356292725, 0.8930044770240784, 0.9457438588142395, 0.9984833002090454, 1.0512226819992065, 1.1039620637893677, 1.1567014455795288, 1.2094409465789795, 1.2621803283691406, 1.3149197101593018, 1.367659091949463, 1.4203985929489136, 1.4731379747390747, 1.5258773565292358, 1.578616738319397, 1.631356120109558]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 4.0, 6.0, 0.0, 3.0, 6.0, 8.0, 12.0, 13.0, 22.0, 14.0, 28.0, 40.0, 65.0, 59.0, 100.0, 211.0, 416.0, 1253.0, 10239.0, 3996493.0, 180615.0, 3468.0, 524.0, 217.0, 140.0, 105.0, 59.0, 53.0, 33.0, 20.0, 17.0, 10.0, 12.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.5606689453125, -2.482666015625, -2.4046630859375, -2.32666015625, -2.2486572265625, -2.170654296875, -2.0926513671875, -2.0146484375, -1.9366455078125, -1.858642578125, -1.7806396484375, -1.70263671875, -1.6246337890625, -1.546630859375, -1.4686279296875, -1.390625, -1.3126220703125, -1.234619140625, -1.1566162109375, -1.07861328125, -1.0006103515625, -0.922607421875, -0.8446044921875, -0.7666015625, -0.6885986328125, -0.610595703125, -0.5325927734375, -0.45458984375, -0.3765869140625, -0.298583984375, -0.2205810546875, -0.142578125, -0.0645751953125, 0.013427734375, 0.0914306640625, 0.16943359375, 0.2474365234375, 0.325439453125, 0.4034423828125, 0.4814453125, 0.5594482421875, 0.637451171875, 0.7154541015625, 0.79345703125, 0.8714599609375, 0.949462890625, 1.0274658203125, 1.10546875, 1.1834716796875, 1.261474609375, 1.3394775390625, 1.41748046875, 1.4954833984375, 1.573486328125, 1.6514892578125, 1.7294921875, 1.8074951171875, 1.885498046875, 1.9635009765625, 2.04150390625, 2.1195068359375, 2.197509765625, 2.2755126953125, 2.353515625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 8.0, 22.0, 23.0, 18.0, 25.0, 38.0, 53.0, 54.0, 68.0, 79.0, 84.0, 80.0, 83.0, 76.0, 56.0, 54.0, 52.0, 25.0, 27.0, 20.0, 14.0, 12.0, 3.0, 9.0, 1.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0634765625, -0.06192779541015625, -0.0603790283203125, -0.05883026123046875, -0.057281494140625, -0.05573272705078125, -0.0541839599609375, -0.05263519287109375, -0.05108642578125, -0.04953765869140625, -0.0479888916015625, -0.04644012451171875, -0.044891357421875, -0.04334259033203125, -0.0417938232421875, -0.04024505615234375, -0.0386962890625, -0.03714752197265625, -0.0355987548828125, -0.03404998779296875, -0.032501220703125, -0.03095245361328125, -0.0294036865234375, -0.02785491943359375, -0.02630615234375, -0.02475738525390625, -0.0232086181640625, -0.02165985107421875, -0.020111083984375, -0.01856231689453125, -0.0170135498046875, -0.01546478271484375, -0.013916015625, -0.01236724853515625, -0.0108184814453125, -0.00926971435546875, -0.007720947265625, -0.00617218017578125, -0.0046234130859375, -0.00307464599609375, -0.00152587890625, 2.288818359375e-05, 0.0015716552734375, 0.00312042236328125, 0.004669189453125, 0.00621795654296875, 0.0077667236328125, 0.00931549072265625, 0.0108642578125, 0.01241302490234375, 0.0139617919921875, 0.01551055908203125, 0.017059326171875, 0.01860809326171875, 0.0201568603515625, 0.02170562744140625, 0.02325439453125, 0.02480316162109375, 0.0263519287109375, 0.02790069580078125, 0.029449462890625, 0.03099822998046875, 0.0325469970703125, 0.03409576416015625, 0.03564453125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 12.0, 21.0, 45.0, 88.0, 131.0, 328.0, 1983.0, 4175479.0, 15144.0, 479.0, 228.0, 136.0, 77.0, 64.0, 34.0, 13.0, 12.0, 3.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.751953125, -3.551239013671875, -3.35052490234375, -3.149810791015625, -2.9490966796875, -2.748382568359375, -2.54766845703125, -2.346954345703125, -2.146240234375, -1.945526123046875, -1.74481201171875, -1.544097900390625, -1.3433837890625, -1.142669677734375, -0.94195556640625, -0.741241455078125, -0.54052734375, -0.339813232421875, -0.13909912109375, 0.061614990234375, 0.2623291015625, 0.463043212890625, 0.66375732421875, 0.864471435546875, 1.065185546875, 1.265899658203125, 1.46661376953125, 1.667327880859375, 1.8680419921875, 2.068756103515625, 2.26947021484375, 2.470184326171875, 2.6708984375, 2.871612548828125, 3.07232666015625, 3.273040771484375, 3.4737548828125, 3.674468994140625, 3.87518310546875, 4.075897216796875, 4.276611328125, 4.477325439453125, 4.67803955078125, 4.878753662109375, 5.0794677734375, 5.280181884765625, 5.48089599609375, 5.681610107421875, 5.88232421875, 6.083038330078125, 6.28375244140625, 6.484466552734375, 6.6851806640625, 6.885894775390625, 7.08660888671875, 7.287322998046875, 7.488037109375, 7.688751220703125, 7.88946533203125, 8.090179443359375, 8.2908935546875, 8.491607666015625, 8.69232177734375, 8.893035888671875, 9.09375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 4.0, 10.0, 13.0, 69.0, 344.0, 3247.0, 316.0, 60.0, 20.0, 4.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1407470703125, -0.12418937683105469, -0.10763168334960938, -0.09107398986816406, -0.07451629638671875, -0.05795860290527344, -0.041400909423828125, -0.024843215942382812, -0.0082855224609375, 0.008272171020507812, 0.024829864501953125, 0.04138755798339844, 0.05794525146484375, 0.07450294494628906, 0.09106063842773438, 0.10761833190917969, 0.124176025390625, 0.1407337188720703, 0.15729141235351562, 0.17384910583496094, 0.19040679931640625, 0.20696449279785156, 0.22352218627929688, 0.2400798797607422, 0.2566375732421875, 0.2731952667236328, 0.2897529602050781, 0.30631065368652344, 0.32286834716796875, 0.33942604064941406, 0.3559837341308594, 0.3725414276123047, 0.38909912109375, 0.4056568145751953, 0.4222145080566406, 0.43877220153808594, 0.45532989501953125, 0.47188758850097656, 0.4884452819824219, 0.5050029754638672, 0.5215606689453125, 0.5381183624267578, 0.5546760559082031, 0.5712337493896484, 0.5877914428710938, 0.6043491363525391, 0.6209068298339844, 0.6374645233154297, 0.654022216796875, 0.6705799102783203, 0.6871376037597656, 0.7036952972412109, 0.7202529907226562, 0.7368106842041016, 0.7533683776855469, 0.7699260711669922, 0.7864837646484375, 0.8030414581298828, 0.8195991516113281, 0.8361568450927734, 0.8527145385742188, 0.8692722320556641, 0.8858299255371094, 0.9023876190185547, 0.9189453125]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 2.0, 11.0, 27.0, 256.0, 595.0, 103.0, 12.0, 2.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1594884395599365, -2.952620029449463, -2.7457518577575684, -2.5388834476470947, -2.332015037536621, -2.1251468658447266, -1.918278455734253, -1.7114101648330688, -1.5045418739318848, -1.2976735830307007, -1.0908052921295166, -0.883936882019043, -0.6770685911178589, -0.4702003002166748, -0.26333189010620117, -0.05646359920501709, 0.150404691696167, 0.35727301239967346, 0.5641413331031799, 0.7710096836090088, 0.9778779745101929, 1.184746265411377, 1.3916146755218506, 1.5984829664230347, 1.8053512573242188, 2.0122196674346924, 2.219087839126587, 2.4259562492370605, 2.632824420928955, 2.8396928310394287, 3.0465612411499023, 3.253429412841797, 3.4602975845336914, 3.667165994644165, 3.8740341663360596, 4.080902576446533, 4.287770748138428, 4.4946393966674805, 4.701507568359375, 4.9083757400512695, 5.115243911743164, 5.322112083435059, 5.528980731964111, 5.735848903656006, 5.9427170753479, 6.149585723876953, 6.356453895568848, 6.563322067260742, 6.770190715789795, 6.9770588874816895, 7.183927536010742, 7.390795707702637, 7.597663879394531, 7.804532051086426, 8.01140022277832, 8.218269348144531, 8.425137519836426, 8.63200569152832, 8.838873863220215, 9.04574203491211, 9.25261116027832, 9.459479331970215, 9.66634750366211, 9.873215675354004, 10.080083847045898]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 6.0, 13.0, 18.0, 29.0, 53.0, 90.0, 121.0, 137.0, 156.0, 112.0, 102.0, 70.0, 43.0, 23.0, 19.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.392868757247925, -2.3183772563934326, -2.2438859939575195, -2.1693944931030273, -2.094902992248535, -2.020411491394043, -1.9459201097488403, -1.8714287281036377, -1.7969372272491455, -1.7224457263946533, -1.6479543447494507, -1.573462963104248, -1.4989714622497559, -1.4244799613952637, -1.349988579750061, -1.2754971981048584, -1.2010056972503662, -1.126514196395874, -1.0520228147506714, -0.977531373500824, -0.9030399322509766, -0.8285484910011292, -0.7540570497512817, -0.6795656085014343, -0.6050741672515869, -0.5305827260017395, -0.4560912847518921, -0.3815998435020447, -0.30710840225219727, -0.23261696100234985, -0.15812551975250244, -0.08363407850265503, -0.009142875671386719, 0.0653485655784607, 0.1398400068283081, 0.21433144807815552, 0.28882288932800293, 0.36331433057785034, 0.43780577182769775, 0.5122972130775452, 0.5867886543273926, 0.66128009557724, 0.7357715368270874, 0.8102629780769348, 0.8847544193267822, 0.9592458605766296, 1.033737301826477, 1.1082286834716797, 1.1827201843261719, 1.257211685180664, 1.3317030668258667, 1.4061944484710693, 1.4806859493255615, 1.5551774501800537, 1.6296688318252563, 1.704160213470459, 1.7786517143249512, 1.8531432151794434, 1.927634596824646, 2.0021259784698486, 2.076617479324341, 2.151108980178833, 2.225600242614746, 2.3000917434692383, 2.3745832443237305]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 3.0, 4.0, 3.0, 5.0, 8.0, 7.0, 9.0, 18.0, 17.0, 18.0, 24.0, 38.0, 62.0, 77.0, 173.0, 439.0, 1688.0, 15767.0, 794130.0, 228193.0, 6126.0, 1041.0, 342.0, 122.0, 73.0, 43.0, 34.0, 25.0, 15.0, 13.0, 8.0, 13.0, 8.0, 5.0, 3.0, 1.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.630859375, -1.570068359375, -1.50927734375, -1.448486328125, -1.3876953125, -1.326904296875, -1.26611328125, -1.205322265625, -1.14453125, -1.083740234375, -1.02294921875, -0.962158203125, -0.9013671875, -0.840576171875, -0.77978515625, -0.718994140625, -0.658203125, -0.597412109375, -0.53662109375, -0.475830078125, -0.4150390625, -0.354248046875, -0.29345703125, -0.232666015625, -0.171875, -0.111083984375, -0.05029296875, 0.010498046875, 0.0712890625, 0.132080078125, 0.19287109375, 0.253662109375, 0.314453125, 0.375244140625, 0.43603515625, 0.496826171875, 0.5576171875, 0.618408203125, 0.67919921875, 0.739990234375, 0.80078125, 0.861572265625, 0.92236328125, 0.983154296875, 1.0439453125, 1.104736328125, 1.16552734375, 1.226318359375, 1.287109375, 1.347900390625, 1.40869140625, 1.469482421875, 1.5302734375, 1.591064453125, 1.65185546875, 1.712646484375, 1.7734375, 1.834228515625, 1.89501953125, 1.955810546875, 2.0166015625, 2.077392578125, 2.13818359375, 2.198974609375, 2.259765625]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 3.0, 4.0, 10.0, 16.0, 19.0, 26.0, 35.0, 44.0, 57.0, 94.0, 84.0, 105.0, 92.0, 97.0, 90.0, 64.0, 55.0, 38.0, 26.0, 16.0, 13.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08587646484375, -0.08290958404541016, -0.07994270324707031, -0.07697582244873047, -0.07400894165039062, -0.07104206085205078, -0.06807518005371094, -0.0651082992553711, -0.06214141845703125, -0.059174537658691406, -0.05620765686035156, -0.05324077606201172, -0.050273895263671875, -0.04730701446533203, -0.04434013366699219, -0.041373252868652344, -0.0384063720703125, -0.035439491271972656, -0.03247261047363281, -0.02950572967529297, -0.026538848876953125, -0.02357196807861328, -0.020605087280273438, -0.017638206481933594, -0.01467132568359375, -0.011704444885253906, -0.008737564086914062, -0.005770683288574219, -0.002803802490234375, 0.00016307830810546875, 0.0031299591064453125, 0.006096839904785156, 0.009063720703125, 0.012030601501464844, 0.014997482299804688, 0.01796436309814453, 0.020931243896484375, 0.02389812469482422, 0.026865005493164062, 0.029831886291503906, 0.03279876708984375, 0.035765647888183594, 0.03873252868652344, 0.04169940948486328, 0.044666290283203125, 0.04763317108154297, 0.05060005187988281, 0.053566932678222656, 0.0565338134765625, 0.059500694274902344, 0.06246757507324219, 0.06543445587158203, 0.06840133666992188, 0.07136821746826172, 0.07433509826660156, 0.0773019790649414, 0.08026885986328125, 0.0832357406616211, 0.08620262145996094, 0.08916950225830078, 0.09213638305664062, 0.09510326385498047, 0.09807014465332031, 0.10103702545166016, 0.10400390625]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 3.0, 3.0, 7.0, 6.0, 10.0, 22.0, 22.0, 32.0, 42.0, 58.0, 85.0, 130.0, 225.0, 379.0, 732.0, 1624.0, 4703.0, 20968.0, 159228.0, 663728.0, 165937.0, 21999.0, 5180.0, 1651.0, 761.0, 368.0, 202.0, 147.0, 95.0, 54.0, 49.0, 23.0, 23.0, 11.0, 13.0, 10.0, 9.0, 4.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.5244140625, -0.5060195922851562, -0.4876251220703125, -0.46923065185546875, -0.450836181640625, -0.43244171142578125, -0.4140472412109375, -0.39565277099609375, -0.37725830078125, -0.35886383056640625, -0.3404693603515625, -0.32207489013671875, -0.303680419921875, -0.28528594970703125, -0.2668914794921875, -0.24849700927734375, -0.2301025390625, -0.21170806884765625, -0.1933135986328125, -0.17491912841796875, -0.156524658203125, -0.13813018798828125, -0.1197357177734375, -0.10134124755859375, -0.08294677734375, -0.06455230712890625, -0.0461578369140625, -0.02776336669921875, -0.009368896484375, 0.00902557373046875, 0.0274200439453125, 0.04581451416015625, 0.064208984375, 0.08260345458984375, 0.1009979248046875, 0.11939239501953125, 0.137786865234375, 0.15618133544921875, 0.1745758056640625, 0.19297027587890625, 0.21136474609375, 0.22975921630859375, 0.2481536865234375, 0.26654815673828125, 0.284942626953125, 0.30333709716796875, 0.3217315673828125, 0.34012603759765625, 0.3585205078125, 0.37691497802734375, 0.3953094482421875, 0.41370391845703125, 0.432098388671875, 0.45049285888671875, 0.4688873291015625, 0.48728179931640625, 0.50567626953125, 0.5240707397460938, 0.5424652099609375, 0.5608596801757812, 0.579254150390625, 0.5976486206054688, 0.6160430908203125, 0.6344375610351562, 0.65283203125]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 3.0, 5.0, 7.0, 8.0, 9.0, 10.0, 12.0, 12.0, 25.0, 29.0, 33.0, 41.0, 44.0, 49.0, 45.0, 53.0, 51.0, 42.0, 47.0, 58.0, 59.0, 54.0, 39.0, 54.0, 41.0, 25.0, 22.0, 22.0, 14.0, 19.0, 18.0, 8.0, 9.0, 10.0, 5.0, 4.0, 5.0, 0.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.257568359375, -0.24903106689453125, -0.2404937744140625, -0.23195648193359375, -0.223419189453125, -0.21488189697265625, -0.2063446044921875, -0.19780731201171875, -0.18927001953125, -0.18073272705078125, -0.1721954345703125, -0.16365814208984375, -0.155120849609375, -0.14658355712890625, -0.1380462646484375, -0.12950897216796875, -0.1209716796875, -0.11243438720703125, -0.1038970947265625, -0.09535980224609375, -0.086822509765625, -0.07828521728515625, -0.0697479248046875, -0.06121063232421875, -0.05267333984375, -0.04413604736328125, -0.0355987548828125, -0.02706146240234375, -0.018524169921875, -0.00998687744140625, -0.0014495849609375, 0.00708770751953125, 0.015625, 0.02416229248046875, 0.0326995849609375, 0.04123687744140625, 0.049774169921875, 0.05831146240234375, 0.0668487548828125, 0.07538604736328125, 0.08392333984375, 0.09246063232421875, 0.1009979248046875, 0.10953521728515625, 0.118072509765625, 0.12660980224609375, 0.1351470947265625, 0.14368438720703125, 0.1522216796875, 0.16075897216796875, 0.1692962646484375, 0.17783355712890625, 0.186370849609375, 0.19490814208984375, 0.2034454345703125, 0.21198272705078125, 0.22052001953125, 0.22905731201171875, 0.2375946044921875, 0.24613189697265625, 0.254669189453125, 0.26320648193359375, 0.2717437744140625, 0.28028106689453125, 0.288818359375]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 4.0, 6.0, 7.0, 5.0, 25.0, 36.0, 61.0, 147.0, 351.0, 1057.0, 6756.0, 266657.0, 759347.0, 11785.0, 1526.0, 437.0, 177.0, 81.0, 45.0, 19.0, 15.0, 8.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.73486328125, -0.6983261108398438, -0.6617889404296875, -0.6252517700195312, -0.588714599609375, -0.5521774291992188, -0.5156402587890625, -0.47910308837890625, -0.44256591796875, -0.40602874755859375, -0.3694915771484375, -0.33295440673828125, -0.296417236328125, -0.25988006591796875, -0.2233428955078125, -0.18680572509765625, -0.1502685546875, -0.11373138427734375, -0.0771942138671875, -0.04065704345703125, -0.004119873046875, 0.03241729736328125, 0.0689544677734375, 0.10549163818359375, 0.14202880859375, 0.17856597900390625, 0.2151031494140625, 0.25164031982421875, 0.288177490234375, 0.32471466064453125, 0.3612518310546875, 0.39778900146484375, 0.434326171875, 0.47086334228515625, 0.5074005126953125, 0.5439376831054688, 0.580474853515625, 0.6170120239257812, 0.6535491943359375, 0.6900863647460938, 0.72662353515625, 0.7631607055664062, 0.7996978759765625, 0.8362350463867188, 0.872772216796875, 0.9093093872070312, 0.9458465576171875, 0.9823837280273438, 1.0189208984375, 1.0554580688476562, 1.0919952392578125, 1.1285324096679688, 1.165069580078125, 1.2016067504882812, 1.2381439208984375, 1.2746810913085938, 1.31121826171875, 1.3477554321289062, 1.3842926025390625, 1.4208297729492188, 1.457366943359375, 1.4939041137695312, 1.5304412841796875, 1.5669784545898438, 1.603515625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 2.0, 3.0, 1.0, 2.0, 11.0, 11.0, 11.0, 12.0, 22.0, 17.0, 30.0, 38.0, 68.0, 83.0, 155.0, 159.0, 122.0, 72.0, 49.0, 34.0, 32.0, 15.0, 11.0, 11.0, 3.0, 5.0, 4.0, 7.0, 1.0, 5.0, 4.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003390312194824219, -0.0003260672092437744, -0.00031310319900512695, -0.0003001391887664795, -0.00028717517852783203, -0.00027421116828918457, -0.0002612471580505371, -0.00024828314781188965, -0.0002353191375732422, -0.00022235512733459473, -0.00020939111709594727, -0.0001964271068572998, -0.00018346309661865234, -0.00017049908638000488, -0.00015753507614135742, -0.00014457106590270996, -0.0001316070556640625, -0.00011864304542541504, -0.00010567903518676758, -9.271502494812012e-05, -7.975101470947266e-05, -6.67870044708252e-05, -5.3822994232177734e-05, -4.0858983993530273e-05, -2.7894973754882812e-05, -1.4930963516235352e-05, -1.9669532775878906e-06, 1.099705696105957e-05, 2.396106719970703e-05, 3.692507743835449e-05, 4.988908767700195e-05, 6.285309791564941e-05, 7.581710815429688e-05, 8.878111839294434e-05, 0.0001017451286315918, 0.00011470913887023926, 0.00012767314910888672, 0.00014063715934753418, 0.00015360116958618164, 0.0001665651798248291, 0.00017952919006347656, 0.00019249320030212402, 0.00020545721054077148, 0.00021842122077941895, 0.0002313852310180664, 0.00024434924125671387, 0.00025731325149536133, 0.0002702772617340088, 0.00028324127197265625, 0.0002962052822113037, 0.00030916929244995117, 0.00032213330268859863, 0.0003350973129272461, 0.00034806132316589355, 0.000361025333404541, 0.0003739893436431885, 0.00038695335388183594, 0.0003999173641204834, 0.00041288137435913086, 0.0004258453845977783, 0.0004388093948364258, 0.00045177340507507324, 0.0004647374153137207, 0.00047770142555236816, 0.0004906654357910156]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 0.0, 4.0, 3.0, 1.0, 4.0, 11.0, 9.0, 30.0, 27.0, 40.0, 57.0, 82.0, 154.0, 243.0, 472.0, 1097.0, 2681.0, 7930.0, 31454.0, 267713.0, 638609.0, 75966.0, 14295.0, 4354.0, 1680.0, 719.0, 369.0, 190.0, 129.0, 64.0, 43.0, 38.0, 18.0, 17.0, 11.0, 9.0, 9.0, 7.0, 4.0, 6.0, 2.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.484375, -0.468353271484375, -0.45233154296875, -0.436309814453125, -0.4202880859375, -0.404266357421875, -0.38824462890625, -0.372222900390625, -0.356201171875, -0.340179443359375, -0.32415771484375, -0.308135986328125, -0.2921142578125, -0.276092529296875, -0.26007080078125, -0.244049072265625, -0.22802734375, -0.212005615234375, -0.19598388671875, -0.179962158203125, -0.1639404296875, -0.147918701171875, -0.13189697265625, -0.115875244140625, -0.099853515625, -0.083831787109375, -0.06781005859375, -0.051788330078125, -0.0357666015625, -0.019744873046875, -0.00372314453125, 0.012298583984375, 0.0283203125, 0.044342041015625, 0.06036376953125, 0.076385498046875, 0.0924072265625, 0.108428955078125, 0.12445068359375, 0.140472412109375, 0.156494140625, 0.172515869140625, 0.18853759765625, 0.204559326171875, 0.2205810546875, 0.236602783203125, 0.25262451171875, 0.268646240234375, 0.28466796875, 0.300689697265625, 0.31671142578125, 0.332733154296875, 0.3487548828125, 0.364776611328125, 0.38079833984375, 0.396820068359375, 0.412841796875, 0.428863525390625, 0.44488525390625, 0.460906982421875, 0.4769287109375, 0.492950439453125, 0.50897216796875, 0.524993896484375, 0.541015625]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 4.0, 0.0, 4.0, 0.0, 6.0, 5.0, 4.0, 6.0, 10.0, 11.0, 13.0, 23.0, 34.0, 40.0, 55.0, 70.0, 90.0, 100.0, 83.0, 93.0, 78.0, 72.0, 64.0, 36.0, 32.0, 17.0, 10.0, 8.0, 8.0, 11.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 5.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.1864013671875, -0.17926597595214844, -0.17213058471679688, -0.1649951934814453, -0.15785980224609375, -0.1507244110107422, -0.14358901977539062, -0.13645362854003906, -0.1293182373046875, -0.12218284606933594, -0.11504745483398438, -0.10791206359863281, -0.10077667236328125, -0.09364128112792969, -0.08650588989257812, -0.07937049865722656, -0.072235107421875, -0.06509971618652344, -0.057964324951171875, -0.05082893371582031, -0.04369354248046875, -0.03655815124511719, -0.029422760009765625, -0.022287368774414062, -0.0151519775390625, -0.008016586303710938, -0.000881195068359375, 0.0062541961669921875, 0.01338958740234375, 0.020524978637695312, 0.027660369873046875, 0.03479576110839844, 0.04193115234375, 0.04906654357910156, 0.056201934814453125, 0.06333732604980469, 0.07047271728515625, 0.07760810852050781, 0.08474349975585938, 0.09187889099121094, 0.0990142822265625, 0.10614967346191406, 0.11328506469726562, 0.12042045593261719, 0.12755584716796875, 0.1346912384033203, 0.14182662963867188, 0.14896202087402344, 0.156097412109375, 0.16323280334472656, 0.17036819458007812, 0.1775035858154297, 0.18463897705078125, 0.1917743682861328, 0.19890975952148438, 0.20604515075683594, 0.2131805419921875, 0.22031593322753906, 0.22745132446289062, 0.2345867156982422, 0.24172210693359375, 0.2488574981689453, 0.2559928894042969, 0.26312828063964844, 0.270263671875]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 8.0, 17.0, 21.0, 79.0, 165.0, 304.0, 263.0, 96.0, 34.0, 9.0, 5.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.8867506980896, -4.724406719207764, -4.562062740325928, -4.399718761444092, -4.237374305725098, -4.075030326843262, -3.912686347961426, -3.75034236907959, -3.587998390197754, -3.425654411315918, -3.263310432434082, -3.100966215133667, -2.938622236251831, -2.776278257369995, -2.61393404006958, -2.451590061187744, -2.289246082305908, -2.1269021034240723, -1.9645580053329468, -1.8022139072418213, -1.6398699283599854, -1.4775259494781494, -1.315181851387024, -1.1528377532958984, -0.9904937744140625, -0.8281497359275818, -0.6658056974411011, -0.5034616589546204, -0.34111762046813965, -0.17877358198165894, -0.016429543495178223, 0.14591455459594727, 0.308258056640625, 0.4706020951271057, 0.6329461336135864, 0.7952901721000671, 0.9576342105865479, 1.1199781894683838, 1.2823222875595093, 1.4446663856506348, 1.6070103645324707, 1.7693543434143066, 1.9316984415054321, 2.0940425395965576, 2.2563865184783936, 2.4187304973602295, 2.5810747146606445, 2.7434186935424805, 2.9057626724243164, 3.0681066513061523, 3.2304506301879883, 3.3927948474884033, 3.5551388263702393, 3.717482805252075, 3.8798270225524902, 4.042171001434326, 4.204514980316162, 4.366858959197998, 4.529202938079834, 4.69154691696167, 4.853891372680664, 5.0162353515625, 5.178579330444336, 5.340923309326172, 5.503267288208008]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 1.0, 6.0, 6.0, 7.0, 13.0, 12.0, 18.0, 28.0, 36.0, 22.0, 50.0, 52.0, 46.0, 70.0, 71.0, 83.0, 67.0, 76.0, 57.0, 62.0, 37.0, 46.0, 35.0, 27.0, 25.0, 15.0, 11.0, 9.0, 9.0, 4.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.827380418777466, -2.745095729827881, -2.662811279296875, -2.58052659034729, -2.498241901397705, -2.415957450866699, -2.3336727619171143, -2.2513880729675293, -2.1691036224365234, -2.0868189334869385, -2.0045344829559326, -1.9222497940063477, -1.8399652242660522, -1.7576806545257568, -1.6753959655761719, -1.5931113958358765, -1.510826826095581, -1.4285422563552856, -1.3462576866149902, -1.2639729976654053, -1.1816884279251099, -1.0994038581848145, -1.0171191692352295, -0.9348345994949341, -0.8525500297546387, -0.7702654600143433, -0.6879808306694031, -0.6056962013244629, -0.5234116315841675, -0.4411270320415497, -0.3588424324989319, -0.2765578031539917, -0.1942729949951172, -0.11198839545249939, -0.029703795909881592, 0.052580803632736206, 0.134865403175354, 0.2171500027179718, 0.2994346022605896, 0.3817192316055298, 0.4640038013458252, 0.5462883710861206, 0.6285730004310608, 0.710857629776001, 0.7931421995162964, 0.8754267692565918, 0.957711398601532, 1.0399960279464722, 1.1222805976867676, 1.204565167427063, 1.2868497371673584, 1.3691344261169434, 1.4514189958572388, 1.5337035655975342, 1.6159882545471191, 1.6982728242874146, 1.78055739402771, 1.8628419637680054, 1.9451265335083008, 2.0274112224578857, 2.1096959114074707, 2.1919803619384766, 2.2742650508880615, 2.3565497398376465, 2.4388341903686523]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 6.0, 3.0, 8.0, 11.0, 6.0, 17.0, 14.0, 20.0, 25.0, 40.0, 66.0, 171.0, 588.0, 3974.0, 90047.0, 4045082.0, 49787.0, 3116.0, 652.0, 268.0, 149.0, 79.0, 51.0, 33.0, 20.0, 19.0, 6.0, 8.0, 9.0, 4.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 1.0], "bins": [-3.068359375, -2.99603271484375, -2.9237060546875, -2.85137939453125, -2.779052734375, -2.70672607421875, -2.6343994140625, -2.56207275390625, -2.48974609375, -2.41741943359375, -2.3450927734375, -2.27276611328125, -2.200439453125, -2.12811279296875, -2.0557861328125, -1.98345947265625, -1.9111328125, -1.83880615234375, -1.7664794921875, -1.69415283203125, -1.621826171875, -1.54949951171875, -1.4771728515625, -1.40484619140625, -1.33251953125, -1.26019287109375, -1.1878662109375, -1.11553955078125, -1.043212890625, -0.97088623046875, -0.8985595703125, -0.82623291015625, -0.75390625, -0.68157958984375, -0.6092529296875, -0.53692626953125, -0.464599609375, -0.39227294921875, -0.3199462890625, -0.24761962890625, -0.17529296875, -0.10296630859375, -0.0306396484375, 0.04168701171875, 0.114013671875, 0.18634033203125, 0.2586669921875, 0.33099365234375, 0.4033203125, 0.47564697265625, 0.5479736328125, 0.62030029296875, 0.692626953125, 0.76495361328125, 0.8372802734375, 0.90960693359375, 0.98193359375, 1.05426025390625, 1.1265869140625, 1.19891357421875, 1.271240234375, 1.34356689453125, 1.4158935546875, 1.48822021484375, 1.560546875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 7.0, 7.0, 8.0, 13.0, 19.0, 22.0, 31.0, 36.0, 68.0, 51.0, 65.0, 78.0, 92.0, 79.0, 68.0, 69.0, 55.0, 67.0, 50.0, 27.0, 30.0, 19.0, 12.0, 15.0, 7.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0723876953125, -0.06962966918945312, -0.06687164306640625, -0.06411361694335938, -0.0613555908203125, -0.058597564697265625, -0.05583953857421875, -0.053081512451171875, -0.050323486328125, -0.047565460205078125, -0.04480743408203125, -0.042049407958984375, -0.0392913818359375, -0.036533355712890625, -0.03377532958984375, -0.031017303466796875, -0.02825927734375, -0.025501251220703125, -0.02274322509765625, -0.019985198974609375, -0.0172271728515625, -0.014469146728515625, -0.01171112060546875, -0.008953094482421875, -0.006195068359375, -0.003437042236328125, -0.00067901611328125, 0.002079010009765625, 0.0048370361328125, 0.007595062255859375, 0.01035308837890625, 0.013111114501953125, 0.015869140625, 0.018627166748046875, 0.02138519287109375, 0.024143218994140625, 0.0269012451171875, 0.029659271240234375, 0.03241729736328125, 0.035175323486328125, 0.037933349609375, 0.040691375732421875, 0.04344940185546875, 0.046207427978515625, 0.0489654541015625, 0.051723480224609375, 0.05448150634765625, 0.057239532470703125, 0.05999755859375, 0.06275558471679688, 0.06551361083984375, 0.06827163696289062, 0.0710296630859375, 0.07378768920898438, 0.07654571533203125, 0.07930374145507812, 0.082061767578125, 0.08481979370117188, 0.08757781982421875, 0.09033584594726562, 0.0930938720703125, 0.09585189819335938, 0.09860992431640625, 0.10136795043945312, 0.1041259765625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 5.0, 3.0, 15.0, 76.0, 285.0, 1703.0, 4127128.0, 63430.0, 1261.0, 261.0, 78.0, 22.0, 7.0, 8.0, 6.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.494140625, -3.273895263671875, -3.05364990234375, -2.833404541015625, -2.6131591796875, -2.392913818359375, -2.17266845703125, -1.952423095703125, -1.732177734375, -1.511932373046875, -1.29168701171875, -1.071441650390625, -0.8511962890625, -0.630950927734375, -0.41070556640625, -0.190460205078125, 0.02978515625, 0.250030517578125, 0.47027587890625, 0.690521240234375, 0.9107666015625, 1.131011962890625, 1.35125732421875, 1.571502685546875, 1.791748046875, 2.011993408203125, 2.23223876953125, 2.452484130859375, 2.6727294921875, 2.892974853515625, 3.11322021484375, 3.333465576171875, 3.5537109375, 3.773956298828125, 3.99420166015625, 4.214447021484375, 4.4346923828125, 4.654937744140625, 4.87518310546875, 5.095428466796875, 5.315673828125, 5.535919189453125, 5.75616455078125, 5.976409912109375, 6.1966552734375, 6.416900634765625, 6.63714599609375, 6.857391357421875, 7.07763671875, 7.297882080078125, 7.51812744140625, 7.738372802734375, 7.9586181640625, 8.178863525390625, 8.39910888671875, 8.619354248046875, 8.839599609375, 9.059844970703125, 9.28009033203125, 9.500335693359375, 9.7205810546875, 9.940826416015625, 10.16107177734375, 10.381317138671875, 10.6015625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 11.0, 23.0, 58.0, 214.0, 2574.0, 993.0, 139.0, 38.0, 11.0, 8.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.179443359375, -0.16286087036132812, -0.14627838134765625, -0.12969589233398438, -0.1131134033203125, -0.09653091430664062, -0.07994842529296875, -0.06336593627929688, -0.046783447265625, -0.030200958251953125, -0.01361846923828125, 0.002964019775390625, 0.0195465087890625, 0.036128997802734375, 0.05271148681640625, 0.06929397583007812, 0.08587646484375, 0.10245895385742188, 0.11904144287109375, 0.13562393188476562, 0.1522064208984375, 0.16878890991210938, 0.18537139892578125, 0.20195388793945312, 0.218536376953125, 0.23511886596679688, 0.25170135498046875, 0.2682838439941406, 0.2848663330078125, 0.3014488220214844, 0.31803131103515625, 0.3346138000488281, 0.3511962890625, 0.3677787780761719, 0.38436126708984375, 0.4009437561035156, 0.4175262451171875, 0.4341087341308594, 0.45069122314453125, 0.4672737121582031, 0.483856201171875, 0.5004386901855469, 0.5170211791992188, 0.5336036682128906, 0.5501861572265625, 0.5667686462402344, 0.5833511352539062, 0.5999336242675781, 0.61651611328125, 0.6330986022949219, 0.6496810913085938, 0.6662635803222656, 0.6828460693359375, 0.6994285583496094, 0.7160110473632812, 0.7325935363769531, 0.749176025390625, 0.7657585144042969, 0.7823410034179688, 0.7989234924316406, 0.8155059814453125, 0.8320884704589844, 0.8486709594726562, 0.8652534484863281, 0.8818359375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 16.0, 43.0, 212.0, 491.0, 175.0, 45.0, 11.0, 5.0, 3.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.293306350708008, -2.152834415435791, -2.012362241744995, -1.8718903064727783, -1.731418251991272, -1.5909461975097656, -1.4504742622375488, -1.3100022077560425, -1.1695301532745361, -1.0290580987930298, -0.8885861039161682, -0.7481141090393066, -0.6076420545578003, -0.46717000007629395, -0.3266980051994324, -0.1862260103225708, -0.04575395584106445, 0.0947180688381195, 0.23519009351730347, 0.3756621181964874, 0.5161341428756714, 0.6566061973571777, 0.7970781922340393, 0.9375501871109009, 1.0780222415924072, 1.2184942960739136, 1.35896635055542, 1.4994382858276367, 1.639910340309143, 1.7803823947906494, 1.9208543300628662, 2.061326503753662, 2.201798439025879, 2.3422703742980957, 2.4827425479888916, 2.6232144832611084, 2.7636866569519043, 2.904158592224121, 3.044630527496338, 3.1851024627685547, 3.3255746364593506, 3.4660465717315674, 3.6065187454223633, 3.74699068069458, 3.887462615966797, 4.027935028076172, 4.168406963348389, 4.3088788986206055, 4.449350833892822, 4.589822769165039, 4.730294704437256, 4.870767116546631, 5.011239051818848, 5.1517109870910645, 5.292182922363281, 5.432654857635498, 5.573126792907715, 5.713598728179932, 5.854070663452148, 5.994543075561523, 6.13501501083374, 6.275486946105957, 6.415958881378174, 6.556430816650391, 6.696903228759766]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 4.0, 7.0, 9.0, 18.0, 22.0, 35.0, 33.0, 53.0, 68.0, 81.0, 94.0, 96.0, 90.0, 80.0, 83.0, 59.0, 49.0, 40.0, 24.0, 12.0, 20.0, 13.0, 7.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.547823190689087, -1.4959408044815063, -1.4440584182739258, -1.3921759128570557, -1.340293526649475, -1.2884111404418945, -1.236528754234314, -1.1846463680267334, -1.1327638626098633, -1.0808814764022827, -1.0289990901947021, -0.9771166443824768, -0.9252341985702515, -0.8733518123626709, -0.8214694261550903, -0.7695870399475098, -0.7177046537399292, -0.6658222675323486, -0.6139398217201233, -0.5620574355125427, -0.5101749897003174, -0.4582926034927368, -0.40641021728515625, -0.3545278012752533, -0.30264538526535034, -0.2507629692554474, -0.19888056814670563, -0.14699816703796387, -0.09511575102806091, -0.04323333501815796, 0.008649051189422607, 0.06053146719932556, 0.11241400241851807, 0.16429641842842102, 0.21617881953716278, 0.26806122064590454, 0.3199436366558075, 0.37182605266571045, 0.423708438873291, 0.47559085488319397, 0.5274732708930969, 0.5793556571006775, 0.6312381029129028, 0.6831204891204834, 0.735002875328064, 0.7868853211402893, 0.8387677073478699, 0.8906501531600952, 0.9425325393676758, 0.9944149255752563, 1.046297311782837, 1.098179817199707, 1.1500622034072876, 1.2019445896148682, 1.2538269758224487, 1.3057093620300293, 1.3575918674468994, 1.40947425365448, 1.4613566398620605, 1.5132391452789307, 1.5651215314865112, 1.6170039176940918, 1.6688863039016724, 1.720768690109253, 1.7726510763168335]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 5.0, 3.0, 7.0, 5.0, 10.0, 16.0, 21.0, 31.0, 32.0, 54.0, 91.0, 144.0, 219.0, 415.0, 1111.0, 4044.0, 26255.0, 448757.0, 529688.0, 30879.0, 4494.0, 1115.0, 488.0, 252.0, 138.0, 92.0, 52.0, 37.0, 25.0, 20.0, 20.0, 10.0, 11.0, 4.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.0947265625, -1.0570220947265625, -1.019317626953125, -0.9816131591796875, -0.94390869140625, -0.9062042236328125, -0.868499755859375, -0.8307952880859375, -0.7930908203125, -0.7553863525390625, -0.717681884765625, -0.6799774169921875, -0.64227294921875, -0.6045684814453125, -0.566864013671875, -0.5291595458984375, -0.491455078125, -0.4537506103515625, -0.416046142578125, -0.3783416748046875, -0.34063720703125, -0.3029327392578125, -0.265228271484375, -0.2275238037109375, -0.1898193359375, -0.1521148681640625, -0.114410400390625, -0.0767059326171875, -0.03900146484375, -0.0012969970703125, 0.036407470703125, 0.0741119384765625, 0.11181640625, 0.1495208740234375, 0.187225341796875, 0.2249298095703125, 0.26263427734375, 0.3003387451171875, 0.338043212890625, 0.3757476806640625, 0.4134521484375, 0.4511566162109375, 0.488861083984375, 0.5265655517578125, 0.56427001953125, 0.6019744873046875, 0.639678955078125, 0.6773834228515625, 0.715087890625, 0.7527923583984375, 0.790496826171875, 0.8282012939453125, 0.86590576171875, 0.9036102294921875, 0.941314697265625, 0.9790191650390625, 1.0167236328125, 1.0544281005859375, 1.092132568359375, 1.1298370361328125, 1.16754150390625, 1.2052459716796875, 1.242950439453125, 1.2806549072265625, 1.318359375]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 4.0, 4.0, 8.0, 8.0, 18.0, 28.0, 32.0, 60.0, 75.0, 75.0, 91.0, 82.0, 83.0, 104.0, 79.0, 69.0, 47.0, 50.0, 22.0, 19.0, 18.0, 10.0, 16.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.12384033203125, -0.11945629119873047, -0.11507225036621094, -0.1106882095336914, -0.10630416870117188, -0.10192012786865234, -0.09753608703613281, -0.09315204620361328, -0.08876800537109375, -0.08438396453857422, -0.07999992370605469, -0.07561588287353516, -0.07123184204101562, -0.0668478012084961, -0.06246376037597656, -0.05807971954345703, -0.0536956787109375, -0.04931163787841797, -0.04492759704589844, -0.040543556213378906, -0.036159515380859375, -0.031775474548339844, -0.027391433715820312, -0.02300739288330078, -0.01862335205078125, -0.014239311218261719, -0.009855270385742188, -0.005471229553222656, -0.001087188720703125, 0.0032968521118164062, 0.0076808929443359375, 0.012064933776855469, 0.016448974609375, 0.02083301544189453, 0.025217056274414062, 0.029601097106933594, 0.033985137939453125, 0.038369178771972656, 0.04275321960449219, 0.04713726043701172, 0.05152130126953125, 0.05590534210205078, 0.06028938293457031, 0.06467342376708984, 0.06905746459960938, 0.0734415054321289, 0.07782554626464844, 0.08220958709716797, 0.0865936279296875, 0.09097766876220703, 0.09536170959472656, 0.0997457504272461, 0.10412979125976562, 0.10851383209228516, 0.11289787292480469, 0.11728191375732422, 0.12166595458984375, 0.12604999542236328, 0.1304340362548828, 0.13481807708740234, 0.13920211791992188, 0.1435861587524414, 0.14797019958496094, 0.15235424041748047, 0.15673828125]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 6.0, 3.0, 3.0, 8.0, 12.0, 13.0, 20.0, 18.0, 28.0, 37.0, 29.0, 53.0, 98.0, 144.0, 239.0, 396.0, 896.0, 1971.0, 5499.0, 20779.0, 126406.0, 605819.0, 238256.0, 34501.0, 8034.0, 2758.0, 1125.0, 555.0, 302.0, 187.0, 108.0, 76.0, 42.0, 35.0, 30.0, 20.0, 14.0, 11.0, 9.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.5615234375, -0.5437850952148438, -0.5260467529296875, -0.5083084106445312, -0.490570068359375, -0.47283172607421875, -0.4550933837890625, -0.43735504150390625, -0.41961669921875, -0.40187835693359375, -0.3841400146484375, -0.36640167236328125, -0.348663330078125, -0.33092498779296875, -0.3131866455078125, -0.29544830322265625, -0.2777099609375, -0.25997161865234375, -0.2422332763671875, -0.22449493408203125, -0.206756591796875, -0.18901824951171875, -0.1712799072265625, -0.15354156494140625, -0.13580322265625, -0.11806488037109375, -0.1003265380859375, -0.08258819580078125, -0.064849853515625, -0.04711151123046875, -0.0293731689453125, -0.01163482666015625, 0.006103515625, 0.02384185791015625, 0.0415802001953125, 0.05931854248046875, 0.077056884765625, 0.09479522705078125, 0.1125335693359375, 0.13027191162109375, 0.14801025390625, 0.16574859619140625, 0.1834869384765625, 0.20122528076171875, 0.218963623046875, 0.23670196533203125, 0.2544403076171875, 0.27217864990234375, 0.2899169921875, 0.30765533447265625, 0.3253936767578125, 0.34313201904296875, 0.360870361328125, 0.37860870361328125, 0.3963470458984375, 0.41408538818359375, 0.43182373046875, 0.44956207275390625, 0.4673004150390625, 0.48503875732421875, 0.502777099609375, 0.5205154418945312, 0.5382537841796875, 0.5559921264648438, 0.57373046875]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 3.0, 3.0, 4.0, 2.0, 4.0, 5.0, 4.0, 11.0, 15.0, 14.0, 14.0, 11.0, 22.0, 28.0, 39.0, 32.0, 38.0, 54.0, 67.0, 51.0, 54.0, 47.0, 69.0, 59.0, 57.0, 43.0, 42.0, 37.0, 42.0, 39.0, 18.0, 14.0, 10.0, 14.0, 8.0, 7.0, 7.0, 5.0, 4.0, 4.0, 0.0, 3.0, 3.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.406494140625, -0.3946380615234375, -0.382781982421875, -0.3709259033203125, -0.35906982421875, -0.3472137451171875, -0.335357666015625, -0.3235015869140625, -0.3116455078125, -0.2997894287109375, -0.287933349609375, -0.2760772705078125, -0.26422119140625, -0.2523651123046875, -0.240509033203125, -0.2286529541015625, -0.216796875, -0.2049407958984375, -0.193084716796875, -0.1812286376953125, -0.16937255859375, -0.1575164794921875, -0.145660400390625, -0.1338043212890625, -0.1219482421875, -0.1100921630859375, -0.098236083984375, -0.0863800048828125, -0.07452392578125, -0.0626678466796875, -0.050811767578125, -0.0389556884765625, -0.027099609375, -0.0152435302734375, -0.003387451171875, 0.0084686279296875, 0.02032470703125, 0.0321807861328125, 0.044036865234375, 0.0558929443359375, 0.0677490234375, 0.0796051025390625, 0.091461181640625, 0.1033172607421875, 0.11517333984375, 0.1270294189453125, 0.138885498046875, 0.1507415771484375, 0.16259765625, 0.1744537353515625, 0.186309814453125, 0.1981658935546875, 0.21002197265625, 0.2218780517578125, 0.233734130859375, 0.2455902099609375, 0.2574462890625, 0.2693023681640625, 0.281158447265625, 0.2930145263671875, 0.30487060546875, 0.3167266845703125, 0.328582763671875, 0.3404388427734375, 0.352294921875]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 7.0, 7.0, 10.0, 11.0, 14.0, 15.0, 25.0, 24.0, 51.0, 75.0, 133.0, 210.0, 321.0, 626.0, 1179.0, 2401.0, 5101.0, 15579.0, 272453.0, 708240.0, 28894.0, 6977.0, 2937.0, 1447.0, 739.0, 385.0, 245.0, 147.0, 92.0, 64.0, 46.0, 28.0, 22.0, 18.0, 8.0, 7.0, 9.0, 5.0, 2.0, 0.0, 1.0, 0.0, 2.0, 5.0, 1.0], "bins": [-0.65625, -0.6390533447265625, -0.621856689453125, -0.6046600341796875, -0.58746337890625, -0.5702667236328125, -0.553070068359375, -0.5358734130859375, -0.5186767578125, -0.5014801025390625, -0.484283447265625, -0.4670867919921875, -0.44989013671875, -0.4326934814453125, -0.415496826171875, -0.3983001708984375, -0.381103515625, -0.3639068603515625, -0.346710205078125, -0.3295135498046875, -0.31231689453125, -0.2951202392578125, -0.277923583984375, -0.2607269287109375, -0.2435302734375, -0.2263336181640625, -0.209136962890625, -0.1919403076171875, -0.17474365234375, -0.1575469970703125, -0.140350341796875, -0.1231536865234375, -0.10595703125, -0.0887603759765625, -0.071563720703125, -0.0543670654296875, -0.03717041015625, -0.0199737548828125, -0.002777099609375, 0.0144195556640625, 0.0316162109375, 0.0488128662109375, 0.066009521484375, 0.0832061767578125, 0.10040283203125, 0.1175994873046875, 0.134796142578125, 0.1519927978515625, 0.169189453125, 0.1863861083984375, 0.203582763671875, 0.2207794189453125, 0.23797607421875, 0.2551727294921875, 0.272369384765625, 0.2895660400390625, 0.3067626953125, 0.3239593505859375, 0.341156005859375, 0.3583526611328125, 0.37554931640625, 0.3927459716796875, 0.409942626953125, 0.4271392822265625, 0.4443359375]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 3.0, 0.0, 3.0, 3.0, 8.0, 6.0, 13.0, 12.0, 18.0, 38.0, 52.0, 60.0, 84.0, 81.0, 115.0, 101.0, 115.0, 89.0, 52.0, 39.0, 30.0, 28.0, 17.0, 17.0, 4.0, 6.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00020194053649902344, -0.00019613467156887054, -0.00019032880663871765, -0.00018452294170856476, -0.00017871707677841187, -0.00017291121184825897, -0.00016710534691810608, -0.00016129948198795319, -0.0001554936170578003, -0.0001496877521276474, -0.0001438818871974945, -0.00013807602226734161, -0.00013227015733718872, -0.00012646429240703583, -0.00012065842747688293, -0.00011485256254673004, -0.00010904669761657715, -0.00010324083268642426, -9.743496775627136e-05, -9.162910282611847e-05, -8.582323789596558e-05, -8.001737296581268e-05, -7.421150803565979e-05, -6.84056431055069e-05, -6.2599778175354e-05, -5.679391324520111e-05, -5.098804831504822e-05, -4.5182183384895325e-05, -3.937631845474243e-05, -3.357045352458954e-05, -2.7764588594436646e-05, -2.1958723664283752e-05, -1.615285873413086e-05, -1.0346993803977966e-05, -4.541128873825073e-06, 1.2647360563278198e-06, 7.070600986480713e-06, 1.2876465916633606e-05, 1.86823308467865e-05, 2.4488195776939392e-05, 3.0294060707092285e-05, 3.609992563724518e-05, 4.190579056739807e-05, 4.7711655497550964e-05, 5.351752042770386e-05, 5.932338535785675e-05, 6.512925028800964e-05, 7.093511521816254e-05, 7.674098014831543e-05, 8.254684507846832e-05, 8.835271000862122e-05, 9.415857493877411e-05, 9.9964439868927e-05, 0.0001057703047990799, 0.00011157616972923279, 0.00011738203465938568, 0.00012318789958953857, 0.00012899376451969147, 0.00013479962944984436, 0.00014060549437999725, 0.00014641135931015015, 0.00015221722424030304, 0.00015802308917045593, 0.00016382895410060883, 0.00016963481903076172]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 12.0, 7.0, 7.0, 6.0, 22.0, 19.0, 39.0, 61.0, 73.0, 153.0, 350.0, 783.0, 1966.0, 4966.0, 19327.0, 907121.0, 100200.0, 8311.0, 2865.0, 1191.0, 515.0, 241.0, 122.0, 71.0, 40.0, 26.0, 15.0, 7.0, 11.0, 5.0, 4.0, 4.0, 4.0, 5.0, 2.0, 2.0, 0.0, 0.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75146484375, -0.724365234375, -0.697265625, -0.670166015625, -0.64306640625, -0.615966796875, -0.5888671875, -0.561767578125, -0.53466796875, -0.507568359375, -0.48046875, -0.453369140625, -0.42626953125, -0.399169921875, -0.3720703125, -0.344970703125, -0.31787109375, -0.290771484375, -0.263671875, -0.236572265625, -0.20947265625, -0.182373046875, -0.1552734375, -0.128173828125, -0.10107421875, -0.073974609375, -0.046875, -0.019775390625, 0.00732421875, 0.034423828125, 0.0615234375, 0.088623046875, 0.11572265625, 0.142822265625, 0.169921875, 0.197021484375, 0.22412109375, 0.251220703125, 0.2783203125, 0.305419921875, 0.33251953125, 0.359619140625, 0.38671875, 0.413818359375, 0.44091796875, 0.468017578125, 0.4951171875, 0.522216796875, 0.54931640625, 0.576416015625, 0.603515625, 0.630615234375, 0.65771484375, 0.684814453125, 0.7119140625, 0.739013671875, 0.76611328125, 0.793212890625, 0.8203125, 0.847412109375, 0.87451171875, 0.901611328125, 0.9287109375, 0.955810546875, 0.98291015625]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 11.0, 11.0, 16.0, 54.0, 91.0, 125.0, 174.0, 207.0, 124.0, 88.0, 33.0, 20.0, 13.0, 5.0, 2.0, 1.0, 9.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.364990234375, -0.3538856506347656, -0.34278106689453125, -0.3316764831542969, -0.3205718994140625, -0.3094673156738281, -0.29836273193359375, -0.2872581481933594, -0.276153564453125, -0.2650489807128906, -0.25394439697265625, -0.24283981323242188, -0.2317352294921875, -0.22063064575195312, -0.20952606201171875, -0.19842147827148438, -0.18731689453125, -0.17621231079101562, -0.16510772705078125, -0.15400314331054688, -0.1428985595703125, -0.13179397583007812, -0.12068939208984375, -0.10958480834960938, -0.098480224609375, -0.08737564086914062, -0.07627105712890625, -0.06516647338867188, -0.0540618896484375, -0.042957305908203125, -0.03185272216796875, -0.020748138427734375, -0.0096435546875, 0.001461029052734375, 0.01256561279296875, 0.023670196533203125, 0.0347747802734375, 0.045879364013671875, 0.05698394775390625, 0.06808853149414062, 0.079193115234375, 0.09029769897460938, 0.10140228271484375, 0.11250686645507812, 0.1236114501953125, 0.13471603393554688, 0.14582061767578125, 0.15692520141601562, 0.16802978515625, 0.17913436889648438, 0.19023895263671875, 0.20134353637695312, 0.2124481201171875, 0.22355270385742188, 0.23465728759765625, 0.24576187133789062, 0.256866455078125, 0.2679710388183594, 0.27907562255859375, 0.2901802062988281, 0.3012847900390625, 0.3123893737792969, 0.32349395751953125, 0.3345985412597656, 0.345703125]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 8.0, 6.0, 51.0, 481.0, 394.0, 53.0, 13.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.600482940673828, -15.210250854492188, -14.820018768310547, -14.42978572845459, -14.03955364227295, -13.649321556091309, -13.259089469909668, -12.868856430053711, -12.47862434387207, -12.08839225769043, -11.698160171508789, -11.307927131652832, -10.917695045471191, -10.52746295928955, -10.13723087310791, -9.746997833251953, -9.356765747070312, -8.966533660888672, -8.576301574707031, -8.186068534851074, -7.795836448669434, -7.405604362487793, -7.015372276306152, -6.6251397132873535, -6.234908103942871, -5.8446760177612305, -5.454443454742432, -5.064211368560791, -4.673978805541992, -4.283746719360352, -3.893514394760132, -3.503282070159912, -3.1130495071411133, -2.7228171825408936, -2.332584857940674, -1.9423526525497437, -1.552120327949524, -1.1618880033493042, -0.771655797958374, -0.3814234733581543, 0.00880885124206543, 0.39904114603996277, 0.7892734408378601, 1.179505705833435, 1.5697380304336548, 1.9599703550338745, 2.3502025604248047, 2.7404348850250244, 3.130667209625244, 3.520899534225464, 3.9111318588256836, 4.301363945007324, 4.691596508026123, 5.081828594207764, 5.4720611572265625, 5.862293243408203, 6.252525329589844, 6.642757415771484, 7.032989978790283, 7.423222064971924, 7.813454627990723, 8.203686714172363, 8.593918800354004, 8.984151840209961, 9.374383926391602]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 5.0, 2.0, 6.0, 3.0, 4.0, 7.0, 5.0, 8.0, 8.0, 24.0, 16.0, 33.0, 28.0, 46.0, 48.0, 37.0, 40.0, 48.0, 39.0, 61.0, 52.0, 62.0, 61.0, 43.0, 48.0, 59.0, 39.0, 45.0, 22.0, 18.0, 17.0, 16.0, 18.0, 11.0, 10.0, 8.0, 5.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.280726432800293, -2.2077527046203613, -2.1347789764404297, -2.061805486679077, -1.9888317584991455, -1.9158580303192139, -1.8428844213485718, -1.7699108123779297, -1.696937084197998, -1.6239633560180664, -1.5509897470474243, -1.4780161380767822, -1.4050424098968506, -1.332068681716919, -1.2590950727462769, -1.1861214637756348, -1.1131477355957031, -1.0401740074157715, -0.9672003984451294, -0.8942267298698425, -0.8212530612945557, -0.7482793927192688, -0.6753057241439819, -0.6023320555686951, -0.5293583869934082, -0.45638471841812134, -0.3834110498428345, -0.3104373812675476, -0.23746371269226074, -0.16449004411697388, -0.09151637554168701, -0.018542706966400146, 0.05443120002746582, 0.12740486860275269, 0.20037853717803955, 0.2733522057533264, 0.3463258743286133, 0.41929954290390015, 0.492273211479187, 0.5652468800544739, 0.6382205486297607, 0.7111942172050476, 0.7841678857803345, 0.8571415543556213, 0.9301152229309082, 1.0030889511108398, 1.076062560081482, 1.149036169052124, 1.2220098972320557, 1.2949836254119873, 1.3679572343826294, 1.4409308433532715, 1.5139045715332031, 1.5868782997131348, 1.6598519086837769, 1.732825517654419, 1.8057992458343506, 1.8787729740142822, 1.9517465829849243, 2.0247201919555664, 2.097693920135498, 2.1706676483154297, 2.2436413764953613, 2.316614866256714, 2.3895885944366455]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 4.0, 7.0, 11.0, 9.0, 19.0, 27.0, 25.0, 64.0, 126.0, 374.0, 1151.0, 6441.0, 181468.0, 3971835.0, 28434.0, 2890.0, 761.0, 292.0, 169.0, 74.0, 52.0, 22.0, 10.0, 7.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.630859375, -2.5686187744140625, -2.506378173828125, -2.4441375732421875, -2.38189697265625, -2.3196563720703125, -2.257415771484375, -2.1951751708984375, -2.1329345703125, -2.0706939697265625, -2.008453369140625, -1.9462127685546875, -1.88397216796875, -1.8217315673828125, -1.759490966796875, -1.6972503662109375, -1.635009765625, -1.5727691650390625, -1.510528564453125, -1.4482879638671875, -1.38604736328125, -1.3238067626953125, -1.261566162109375, -1.1993255615234375, -1.1370849609375, -1.0748443603515625, -1.012603759765625, -0.9503631591796875, -0.88812255859375, -0.8258819580078125, -0.763641357421875, -0.7014007568359375, -0.63916015625, -0.5769195556640625, -0.514678955078125, -0.4524383544921875, -0.39019775390625, -0.3279571533203125, -0.265716552734375, -0.2034759521484375, -0.1412353515625, -0.0789947509765625, -0.016754150390625, 0.0454864501953125, 0.10772705078125, 0.1699676513671875, 0.232208251953125, 0.2944488525390625, 0.356689453125, 0.4189300537109375, 0.481170654296875, 0.5434112548828125, 0.60565185546875, 0.6678924560546875, 0.730133056640625, 0.7923736572265625, 0.8546142578125, 0.9168548583984375, 0.979095458984375, 1.0413360595703125, 1.10357666015625, 1.1658172607421875, 1.228057861328125, 1.2902984619140625, 1.3525390625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 4.0, 7.0, 9.0, 18.0, 32.0, 32.0, 51.0, 49.0, 58.0, 81.0, 73.0, 100.0, 72.0, 76.0, 66.0, 73.0, 61.0, 39.0, 28.0, 28.0, 13.0, 12.0, 10.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1015625, -0.09732818603515625, -0.0930938720703125, -0.08885955810546875, -0.084625244140625, -0.08039093017578125, -0.0761566162109375, -0.07192230224609375, -0.06768798828125, -0.06345367431640625, -0.0592193603515625, -0.05498504638671875, -0.050750732421875, -0.04651641845703125, -0.0422821044921875, -0.03804779052734375, -0.0338134765625, -0.02957916259765625, -0.0253448486328125, -0.02111053466796875, -0.016876220703125, -0.01264190673828125, -0.0084075927734375, -0.00417327880859375, 6.103515625e-05, 0.00429534912109375, 0.0085296630859375, 0.01276397705078125, 0.016998291015625, 0.02123260498046875, 0.0254669189453125, 0.02970123291015625, 0.033935546875, 0.03816986083984375, 0.0424041748046875, 0.04663848876953125, 0.050872802734375, 0.05510711669921875, 0.0593414306640625, 0.06357574462890625, 0.06781005859375, 0.07204437255859375, 0.0762786865234375, 0.08051300048828125, 0.084747314453125, 0.08898162841796875, 0.0932159423828125, 0.09745025634765625, 0.1016845703125, 0.10591888427734375, 0.1101531982421875, 0.11438751220703125, 0.118621826171875, 0.12285614013671875, 0.1270904541015625, 0.13132476806640625, 0.13555908203125, 0.13979339599609375, 0.1440277099609375, 0.14826202392578125, 0.152496337890625, 0.15673065185546875, 0.1609649658203125, 0.16519927978515625, 0.16943359375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 6.0, 7.0, 7.0, 13.0, 26.0, 47.0, 74.0, 122.0, 327.0, 2511.0, 4183697.0, 6834.0, 423.0, 98.0, 51.0, 26.0, 9.0, 11.0, 4.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-9.0859375, -8.90643310546875, -8.7269287109375, -8.54742431640625, -8.367919921875, -8.18841552734375, -8.0089111328125, -7.82940673828125, -7.64990234375, -7.47039794921875, -7.2908935546875, -7.11138916015625, -6.931884765625, -6.75238037109375, -6.5728759765625, -6.39337158203125, -6.2138671875, -6.03436279296875, -5.8548583984375, -5.67535400390625, -5.495849609375, -5.31634521484375, -5.1368408203125, -4.95733642578125, -4.77783203125, -4.59832763671875, -4.4188232421875, -4.23931884765625, -4.059814453125, -3.88031005859375, -3.7008056640625, -3.52130126953125, -3.341796875, -3.16229248046875, -2.9827880859375, -2.80328369140625, -2.623779296875, -2.44427490234375, -2.2647705078125, -2.08526611328125, -1.90576171875, -1.72625732421875, -1.5467529296875, -1.36724853515625, -1.187744140625, -1.00823974609375, -0.8287353515625, -0.64923095703125, -0.4697265625, -0.29022216796875, -0.1107177734375, 0.06878662109375, 0.248291015625, 0.42779541015625, 0.6072998046875, 0.78680419921875, 0.96630859375, 1.14581298828125, 1.3253173828125, 1.50482177734375, 1.684326171875, 1.86383056640625, 2.0433349609375, 2.22283935546875, 2.40234375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 5.0, 17.0, 89.0, 2342.0, 1547.0, 76.0, 11.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.515625, -1.4870109558105469, -1.4583969116210938, -1.4297828674316406, -1.4011688232421875, -1.3725547790527344, -1.3439407348632812, -1.3153266906738281, -1.286712646484375, -1.2580986022949219, -1.2294845581054688, -1.2008705139160156, -1.1722564697265625, -1.1436424255371094, -1.1150283813476562, -1.0864143371582031, -1.05780029296875, -1.0291862487792969, -1.0005722045898438, -0.9719581604003906, -0.9433441162109375, -0.9147300720214844, -0.8861160278320312, -0.8575019836425781, -0.828887939453125, -0.8002738952636719, -0.7716598510742188, -0.7430458068847656, -0.7144317626953125, -0.6858177185058594, -0.6572036743164062, -0.6285896301269531, -0.5999755859375, -0.5713615417480469, -0.5427474975585938, -0.5141334533691406, -0.4855194091796875, -0.4569053649902344, -0.42829132080078125, -0.3996772766113281, -0.371063232421875, -0.3424491882324219, -0.31383514404296875, -0.2852210998535156, -0.2566070556640625, -0.22799301147460938, -0.19937896728515625, -0.17076492309570312, -0.14215087890625, -0.11353683471679688, -0.08492279052734375, -0.056308746337890625, -0.0276947021484375, 0.000919342041015625, 0.02953338623046875, 0.058147430419921875, 0.086761474609375, 0.11537551879882812, 0.14398956298828125, 0.17260360717773438, 0.2012176513671875, 0.22983169555664062, 0.25844573974609375, 0.2870597839355469, 0.315673828125]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 30.0, 569.0, 385.0, 18.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.532149791717529, -7.2884416580200195, -7.044733047485352, -6.801024436950684, -6.557316303253174, -6.313608169555664, -6.069899559020996, -5.826190948486328, -5.582482814788818, -5.338774681091309, -5.095066070556641, -4.851357460021973, -4.607649326324463, -4.363941192626953, -4.120232582092285, -3.8765242099761963, -3.6328158378601074, -3.3891074657440186, -3.1453990936279297, -2.901690721511841, -2.657982349395752, -2.414273977279663, -2.170565605163574, -1.9268572330474854, -1.6831488609313965, -1.4394404888153076, -1.1957321166992188, -0.9520237445831299, -0.708315372467041, -0.46460700035095215, -0.22089862823486328, 0.022809743881225586, 0.26651859283447266, 0.5102269649505615, 0.7539353370666504, 0.9976437091827393, 1.2413520812988281, 1.485060453414917, 1.7287688255310059, 1.9724771976470947, 2.2161855697631836, 2.4598939418792725, 2.7036023139953613, 2.94731068611145, 3.191019058227539, 3.434727430343628, 3.678435802459717, 3.9221441745758057, 4.1658525466918945, 4.4095611572265625, 4.653269290924072, 4.896977424621582, 5.14068603515625, 5.384394645690918, 5.628102779388428, 5.8718109130859375, 6.1155195236206055, 6.359228134155273, 6.602936267852783, 6.846644401550293, 7.090353012084961, 7.334061622619629, 7.577769756317139, 7.821477890014648, 8.065186500549316]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 6.0, 9.0, 15.0, 30.0, 63.0, 88.0, 137.0, 165.0, 161.0, 129.0, 94.0, 51.0, 37.0, 11.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.628159761428833, -1.559004783630371, -1.4898496866226196, -1.4206947088241577, -1.3515396118164062, -1.2823846340179443, -1.2132296562194824, -1.1440746784210205, -1.074919581413269, -1.0057646036148071, -0.9366095066070557, -0.8674545288085938, -0.7982994914054871, -0.7291444540023804, -0.6599894762039185, -0.5908344388008118, -0.5216794013977051, -0.4525243639945984, -0.3833693563938141, -0.3142143487930298, -0.2450593113899231, -0.1759042739868164, -0.1067492663860321, -0.0375942587852478, 0.03156077861785889, 0.10071580111980438, 0.16987082362174988, 0.23902584612369537, 0.30818086862564087, 0.37733590602874756, 0.44649091362953186, 0.5156459212303162, 0.5848007202148438, 0.6539557576179504, 0.7231107950210571, 0.792265772819519, 0.8614208102226257, 0.9305758476257324, 0.9997308254241943, 1.0688858032226562, 1.1380409002304077, 1.2071958780288696, 1.276350975036621, 1.345505952835083, 1.414660930633545, 1.4838160276412964, 1.5529710054397583, 1.6221261024475098, 1.6912810802459717, 1.7604360580444336, 1.829591155052185, 1.898746132850647, 1.9679012298583984, 2.0370562076568604, 2.1062111854553223, 2.175366163253784, 2.244521141052246, 2.313676118850708, 2.38283109664917, 2.451986312866211, 2.521141290664673, 2.5902962684631348, 2.6594512462615967, 2.7286062240600586, 2.7977614402770996]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 4.0, 5.0, 2.0, 13.0, 12.0, 28.0, 38.0, 62.0, 102.0, 194.0, 443.0, 1167.0, 4424.0, 47299.0, 808524.0, 174257.0, 9004.0, 1828.0, 616.0, 266.0, 98.0, 57.0, 35.0, 26.0, 15.0, 16.0, 6.0, 5.0, 2.0, 2.0, 5.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.689453125, -1.644622802734375, -1.59979248046875, -1.554962158203125, -1.5101318359375, -1.465301513671875, -1.42047119140625, -1.375640869140625, -1.330810546875, -1.285980224609375, -1.24114990234375, -1.196319580078125, -1.1514892578125, -1.106658935546875, -1.06182861328125, -1.016998291015625, -0.97216796875, -0.927337646484375, -0.88250732421875, -0.837677001953125, -0.7928466796875, -0.748016357421875, -0.70318603515625, -0.658355712890625, -0.613525390625, -0.568695068359375, -0.52386474609375, -0.479034423828125, -0.4342041015625, -0.389373779296875, -0.34454345703125, -0.299713134765625, -0.2548828125, -0.210052490234375, -0.16522216796875, -0.120391845703125, -0.0755615234375, -0.030731201171875, 0.01409912109375, 0.058929443359375, 0.103759765625, 0.148590087890625, 0.19342041015625, 0.238250732421875, 0.2830810546875, 0.327911376953125, 0.37274169921875, 0.417572021484375, 0.46240234375, 0.507232666015625, 0.55206298828125, 0.596893310546875, 0.6417236328125, 0.686553955078125, 0.73138427734375, 0.776214599609375, 0.821044921875, 0.865875244140625, 0.91070556640625, 0.955535888671875, 1.0003662109375, 1.045196533203125, 1.09002685546875, 1.134857177734375, 1.1796875]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 8.0, 7.0, 5.0, 13.0, 8.0, 31.0, 34.0, 28.0, 48.0, 38.0, 40.0, 54.0, 78.0, 64.0, 68.0, 57.0, 60.0, 62.0, 53.0, 51.0, 35.0, 41.0, 26.0, 26.0, 19.0, 14.0, 15.0, 8.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.09991455078125, -0.09666919708251953, -0.09342384338378906, -0.0901784896850586, -0.08693313598632812, -0.08368778228759766, -0.08044242858886719, -0.07719707489013672, -0.07395172119140625, -0.07070636749267578, -0.06746101379394531, -0.06421566009521484, -0.060970306396484375, -0.057724952697753906, -0.05447959899902344, -0.05123424530029297, -0.0479888916015625, -0.04474353790283203, -0.04149818420410156, -0.038252830505371094, -0.035007476806640625, -0.031762123107910156, -0.028516769409179688, -0.02527141571044922, -0.02202606201171875, -0.01878070831298828, -0.015535354614257812, -0.012290000915527344, -0.009044647216796875, -0.005799293518066406, -0.0025539398193359375, 0.0006914138793945312, 0.003936767578125, 0.007182121276855469, 0.010427474975585938, 0.013672828674316406, 0.016918182373046875, 0.020163536071777344, 0.023408889770507812, 0.02665424346923828, 0.02989959716796875, 0.03314495086669922, 0.03639030456542969, 0.039635658264160156, 0.042881011962890625, 0.046126365661621094, 0.04937171936035156, 0.05261707305908203, 0.0558624267578125, 0.05910778045654297, 0.06235313415527344, 0.0655984878540039, 0.06884384155273438, 0.07208919525146484, 0.07533454895019531, 0.07857990264892578, 0.08182525634765625, 0.08507061004638672, 0.08831596374511719, 0.09156131744384766, 0.09480667114257812, 0.0980520248413086, 0.10129737854003906, 0.10454273223876953, 0.1077880859375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 4.0, 3.0, 3.0, 6.0, 5.0, 7.0, 10.0, 4.0, 8.0, 11.0, 20.0, 19.0, 23.0, 21.0, 25.0, 56.0, 72.0, 70.0, 120.0, 179.0, 312.0, 527.0, 963.0, 1976.0, 4449.0, 12542.0, 50806.0, 280973.0, 528031.0, 127922.0, 25566.0, 7427.0, 3031.0, 1356.0, 755.0, 409.0, 230.0, 164.0, 113.0, 77.0, 54.0, 53.0, 37.0, 21.0, 20.0, 13.0, 13.0, 7.0, 6.0, 12.0, 7.0, 4.0, 6.0, 2.0, 10.0, 1.0, 6.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.50048828125, -0.48339080810546875, -0.4662933349609375, -0.44919586181640625, -0.432098388671875, -0.41500091552734375, -0.3979034423828125, -0.38080596923828125, -0.36370849609375, -0.34661102294921875, -0.3295135498046875, -0.31241607666015625, -0.295318603515625, -0.27822113037109375, -0.2611236572265625, -0.24402618408203125, -0.2269287109375, -0.20983123779296875, -0.1927337646484375, -0.17563629150390625, -0.158538818359375, -0.14144134521484375, -0.1243438720703125, -0.10724639892578125, -0.09014892578125, -0.07305145263671875, -0.0559539794921875, -0.03885650634765625, -0.021759033203125, -0.00466156005859375, 0.0124359130859375, 0.02953338623046875, 0.046630859375, 0.06372833251953125, 0.0808258056640625, 0.09792327880859375, 0.115020751953125, 0.13211822509765625, 0.1492156982421875, 0.16631317138671875, 0.18341064453125, 0.20050811767578125, 0.2176055908203125, 0.23470306396484375, 0.251800537109375, 0.26889801025390625, 0.2859954833984375, 0.30309295654296875, 0.3201904296875, 0.33728790283203125, 0.3543853759765625, 0.37148284912109375, 0.388580322265625, 0.40567779541015625, 0.4227752685546875, 0.43987274169921875, 0.45697021484375, 0.47406768798828125, 0.4911651611328125, 0.5082626342773438, 0.525360107421875, 0.5424575805664062, 0.5595550537109375, 0.5766525268554688, 0.59375]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 0.0, 5.0, 3.0, 5.0, 11.0, 4.0, 6.0, 8.0, 14.0, 8.0, 19.0, 21.0, 25.0, 31.0, 44.0, 36.0, 52.0, 46.0, 51.0, 50.0, 54.0, 49.0, 53.0, 40.0, 39.0, 36.0, 47.0, 32.0, 32.0, 31.0, 31.0, 23.0, 19.0, 13.0, 18.0, 8.0, 8.0, 7.0, 2.0, 8.0, 7.0, 3.0, 1.0, 1.0, 4.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.375, -0.3632011413574219, -0.35140228271484375, -0.3396034240722656, -0.3278045654296875, -0.3160057067871094, -0.30420684814453125, -0.2924079895019531, -0.280609130859375, -0.2688102722167969, -0.25701141357421875, -0.24521255493164062, -0.2334136962890625, -0.22161483764648438, -0.20981597900390625, -0.19801712036132812, -0.18621826171875, -0.17441940307617188, -0.16262054443359375, -0.15082168579101562, -0.1390228271484375, -0.12722396850585938, -0.11542510986328125, -0.10362625122070312, -0.091827392578125, -0.08002853393554688, -0.06822967529296875, -0.056430816650390625, -0.0446319580078125, -0.032833099365234375, -0.02103424072265625, -0.009235382080078125, 0.0025634765625, 0.014362335205078125, 0.02616119384765625, 0.037960052490234375, 0.0497589111328125, 0.061557769775390625, 0.07335662841796875, 0.08515548706054688, 0.096954345703125, 0.10875320434570312, 0.12055206298828125, 0.13235092163085938, 0.1441497802734375, 0.15594863891601562, 0.16774749755859375, 0.17954635620117188, 0.19134521484375, 0.20314407348632812, 0.21494293212890625, 0.22674179077148438, 0.2385406494140625, 0.2503395080566406, 0.26213836669921875, 0.2739372253417969, 0.285736083984375, 0.2975349426269531, 0.30933380126953125, 0.3211326599121094, 0.3329315185546875, 0.3447303771972656, 0.35652923583984375, 0.3683280944824219, 0.380126953125]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 6.0, 7.0, 7.0, 6.0, 10.0, 8.0, 15.0, 22.0, 38.0, 56.0, 78.0, 109.0, 225.0, 348.0, 724.0, 1530.0, 3466.0, 10272.0, 41962.0, 275382.0, 572303.0, 110664.0, 20616.0, 5967.0, 2281.0, 1048.0, 569.0, 340.0, 169.0, 111.0, 66.0, 45.0, 32.0, 23.0, 10.0, 8.0, 6.0, 8.0, 6.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.30419921875, -0.2955741882324219, -0.28694915771484375, -0.2783241271972656, -0.2696990966796875, -0.2610740661621094, -0.25244903564453125, -0.24382400512695312, -0.235198974609375, -0.22657394409179688, -0.21794891357421875, -0.20932388305664062, -0.2006988525390625, -0.19207382202148438, -0.18344879150390625, -0.17482376098632812, -0.16619873046875, -0.15757369995117188, -0.14894866943359375, -0.14032363891601562, -0.1316986083984375, -0.12307357788085938, -0.11444854736328125, -0.10582351684570312, -0.097198486328125, -0.08857345581054688, -0.07994842529296875, -0.07132339477539062, -0.0626983642578125, -0.054073333740234375, -0.04544830322265625, -0.036823272705078125, -0.0281982421875, -0.019573211669921875, -0.01094818115234375, -0.002323150634765625, 0.0063018798828125, 0.014926910400390625, 0.02355194091796875, 0.032176971435546875, 0.040802001953125, 0.049427032470703125, 0.05805206298828125, 0.06667709350585938, 0.0753021240234375, 0.08392715454101562, 0.09255218505859375, 0.10117721557617188, 0.10980224609375, 0.11842727661132812, 0.12705230712890625, 0.13567733764648438, 0.1443023681640625, 0.15292739868164062, 0.16155242919921875, 0.17017745971679688, 0.178802490234375, 0.18742752075195312, 0.19605255126953125, 0.20467758178710938, 0.2133026123046875, 0.22192764282226562, 0.23055267333984375, 0.23917770385742188, 0.247802734375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 2.0, 0.0, 4.0, 6.0, 9.0, 7.0, 13.0, 13.0, 19.0, 21.0, 19.0, 36.0, 52.0, 83.0, 94.0, 124.0, 130.0, 103.0, 71.0, 49.0, 38.0, 35.0, 23.0, 13.0, 17.0, 4.0, 7.0, 5.0, 4.0, 4.0, 4.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00013303756713867188, -0.00012812763452529907, -0.00012321770191192627, -0.00011830776929855347, -0.00011339783668518066, -0.00010848790407180786, -0.00010357797145843506, -9.866803884506226e-05, -9.375810623168945e-05, -8.884817361831665e-05, -8.393824100494385e-05, -7.902830839157104e-05, -7.411837577819824e-05, -6.920844316482544e-05, -6.429851055145264e-05, -5.9388577938079834e-05, -5.447864532470703e-05, -4.956871271133423e-05, -4.4658780097961426e-05, -3.974884748458862e-05, -3.483891487121582e-05, -2.9928982257843018e-05, -2.5019049644470215e-05, -2.0109117031097412e-05, -1.519918441772461e-05, -1.0289251804351807e-05, -5.379319190979004e-06, -4.6938657760620117e-07, 4.4405460357666016e-06, 9.350478649139404e-06, 1.4260411262512207e-05, 1.917034387588501e-05, 2.4080276489257812e-05, 2.8990209102630615e-05, 3.390014171600342e-05, 3.881007432937622e-05, 4.3720006942749023e-05, 4.8629939556121826e-05, 5.353987216949463e-05, 5.844980478286743e-05, 6.335973739624023e-05, 6.826967000961304e-05, 7.317960262298584e-05, 7.808953523635864e-05, 8.299946784973145e-05, 8.790940046310425e-05, 9.281933307647705e-05, 9.772926568984985e-05, 0.00010263919830322266, 0.00010754913091659546, 0.00011245906352996826, 0.00011736899614334106, 0.00012227892875671387, 0.00012718886137008667, 0.00013209879398345947, 0.00013700872659683228, 0.00014191865921020508, 0.00014682859182357788, 0.00015173852443695068, 0.00015664845705032349, 0.0001615583896636963, 0.0001664683222770691, 0.0001713782548904419, 0.0001762881875038147, 0.0001811981201171875]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 5.0, 4.0, 8.0, 10.0, 11.0, 13.0, 23.0, 31.0, 71.0, 111.0, 169.0, 277.0, 557.0, 1219.0, 2975.0, 9200.0, 43965.0, 389595.0, 521637.0, 60852.0, 11527.0, 3525.0, 1303.0, 631.0, 321.0, 203.0, 105.0, 62.0, 38.0, 33.0, 24.0, 21.0, 7.0, 6.0, 4.0, 1.0, 5.0, 7.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3427734375, -0.3324127197265625, -0.322052001953125, -0.3116912841796875, -0.30133056640625, -0.2909698486328125, -0.280609130859375, -0.2702484130859375, -0.2598876953125, -0.2495269775390625, -0.239166259765625, -0.2288055419921875, -0.21844482421875, -0.2080841064453125, -0.197723388671875, -0.1873626708984375, -0.177001953125, -0.1666412353515625, -0.156280517578125, -0.1459197998046875, -0.13555908203125, -0.1251983642578125, -0.114837646484375, -0.1044769287109375, -0.0941162109375, -0.0837554931640625, -0.073394775390625, -0.0630340576171875, -0.05267333984375, -0.0423126220703125, -0.031951904296875, -0.0215911865234375, -0.01123046875, -0.0008697509765625, 0.009490966796875, 0.0198516845703125, 0.03021240234375, 0.0405731201171875, 0.050933837890625, 0.0612945556640625, 0.0716552734375, 0.0820159912109375, 0.092376708984375, 0.1027374267578125, 0.11309814453125, 0.1234588623046875, 0.133819580078125, 0.1441802978515625, 0.154541015625, 0.1649017333984375, 0.175262451171875, 0.1856231689453125, 0.19598388671875, 0.2063446044921875, 0.216705322265625, 0.2270660400390625, 0.2374267578125, 0.2477874755859375, 0.258148193359375, 0.2685089111328125, 0.27886962890625, 0.2892303466796875, 0.299591064453125, 0.3099517822265625, 0.3203125]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 6.0, 3.0, 2.0, 8.0, 9.0, 10.0, 13.0, 22.0, 42.0, 41.0, 63.0, 77.0, 97.0, 142.0, 122.0, 107.0, 73.0, 64.0, 33.0, 15.0, 25.0, 10.0, 3.0, 6.0, 3.0, 6.0, 2.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.224609375, -0.2168426513671875, -0.209075927734375, -0.2013092041015625, -0.19354248046875, -0.1857757568359375, -0.178009033203125, -0.1702423095703125, -0.1624755859375, -0.1547088623046875, -0.146942138671875, -0.1391754150390625, -0.13140869140625, -0.1236419677734375, -0.115875244140625, -0.1081085205078125, -0.100341796875, -0.0925750732421875, -0.084808349609375, -0.0770416259765625, -0.06927490234375, -0.0615081787109375, -0.053741455078125, -0.0459747314453125, -0.0382080078125, -0.0304412841796875, -0.022674560546875, -0.0149078369140625, -0.00714111328125, 0.0006256103515625, 0.008392333984375, 0.0161590576171875, 0.02392578125, 0.0316925048828125, 0.039459228515625, 0.0472259521484375, 0.05499267578125, 0.0627593994140625, 0.070526123046875, 0.0782928466796875, 0.0860595703125, 0.0938262939453125, 0.101593017578125, 0.1093597412109375, 0.11712646484375, 0.1248931884765625, 0.132659912109375, 0.1404266357421875, 0.148193359375, 0.1559600830078125, 0.163726806640625, 0.1714935302734375, 0.17926025390625, 0.1870269775390625, 0.194793701171875, 0.2025604248046875, 0.2103271484375, 0.2180938720703125, 0.225860595703125, 0.2336273193359375, 0.24139404296875, 0.2491607666015625, 0.256927490234375, 0.2646942138671875, 0.2724609375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 7.0, 8.0, 26.0, 36.0, 81.0, 126.0, 193.0, 196.0, 155.0, 76.0, 51.0, 17.0, 9.0, 10.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6697518825531006, -2.5362534523010254, -2.402754783630371, -2.269256353378296, -2.1357579231262207, -2.0022592544555664, -1.8687608242034912, -1.735262393951416, -1.6017638444900513, -1.4682652950286865, -1.3347668647766113, -1.2012683153152466, -1.0677697658538818, -0.9342713356018066, -0.8007727861404419, -0.6672742962837219, -0.533775806427002, -0.400277316570282, -0.2667787969112396, -0.13328027725219727, 0.00021821260452270508, 0.13371670246124268, 0.2672152519226074, 0.4007137417793274, 0.5342122316360474, 0.6677107214927673, 0.8012092113494873, 0.934707760810852, 1.0682063102722168, 1.201704740524292, 1.3352032899856567, 1.4687018394470215, 1.6022000312805176, 1.7356985807418823, 1.8691970109939575, 2.0026955604553223, 2.1361939907073975, 2.2696924209594727, 2.403191089630127, 2.536689519882202, 2.6701879501342773, 2.8036863803863525, 2.937185049057007, 3.070683479309082, 3.2041819095611572, 3.3376803398132324, 3.4711790084838867, 3.604677438735962, 3.738176107406616, 3.8716745376586914, 4.005173206329346, 4.138671875, 4.272170066833496, 4.40566873550415, 4.539167404174805, 4.672665596008301, 4.806164264678955, 4.939662933349609, 5.0731611251831055, 5.20665979385376, 5.340158462524414, 5.47365665435791, 5.6071553230285645, 5.740653991699219, 5.874152183532715]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 4.0, 14.0, 17.0, 10.0, 16.0, 22.0, 15.0, 25.0, 29.0, 35.0, 34.0, 43.0, 38.0, 44.0, 31.0, 43.0, 59.0, 49.0, 52.0, 42.0, 44.0, 37.0, 39.0, 41.0, 33.0, 30.0, 24.0, 22.0, 18.0, 10.0, 14.0, 12.0, 11.0, 15.0, 1.0, 7.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.1113431453704834, -2.045388698577881, -1.9794343709945679, -1.9134800434112549, -1.8475255966186523, -1.7815712690353394, -1.7156169414520264, -1.6496624946594238, -1.5837081670761108, -1.5177538394927979, -1.4517993927001953, -1.3858450651168823, -1.3198907375335693, -1.2539362907409668, -1.1879819631576538, -1.1220276355743408, -1.0560731887817383, -0.9901188015937805, -0.9241644144058228, -0.8582100868225098, -0.792255699634552, -0.7263013124465942, -0.6603469848632812, -0.5943925976753235, -0.5284382104873657, -0.46248382329940796, -0.3965294659137726, -0.3305751085281372, -0.26462072134017944, -0.19866633415222168, -0.1327119767665863, -0.06675761938095093, -0.0008032321929931641, 0.0651511400938034, 0.13110551238059998, 0.19705988466739655, 0.2630142569541931, 0.3289686441421509, 0.39492300152778625, 0.46087735891342163, 0.5268317461013794, 0.5927861332893372, 0.6587405204772949, 0.7246948480606079, 0.7906492352485657, 0.8566036224365234, 0.9225579500198364, 0.9885123372077942, 1.054466724395752, 1.120421051979065, 1.1863754987716675, 1.2523298263549805, 1.318284273147583, 1.384238600730896, 1.450192928314209, 1.5161473751068115, 1.5821017026901245, 1.6480560302734375, 1.71401047706604, 1.779964804649353, 1.845919132232666, 1.9118735790252686, 1.9778279066085815, 2.0437822341918945, 2.109736680984497]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 5.0, 4.0, 2.0, 1.0, 4.0, 6.0, 6.0, 12.0, 11.0, 15.0, 20.0, 37.0, 39.0, 61.0, 88.0, 171.0, 289.0, 613.0, 1229.0, 3356.0, 11133.0, 66751.0, 3425804.0, 637364.0, 35536.0, 7367.0, 2308.0, 956.0, 473.0, 238.0, 142.0, 78.0, 56.0, 38.0, 25.0, 17.0, 10.0, 8.0, 7.0, 3.0, 4.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.416015625, -1.3753814697265625, -1.334747314453125, -1.2941131591796875, -1.25347900390625, -1.2128448486328125, -1.172210693359375, -1.1315765380859375, -1.0909423828125, -1.0503082275390625, -1.009674072265625, -0.9690399169921875, -0.92840576171875, -0.8877716064453125, -0.847137451171875, -0.8065032958984375, -0.765869140625, -0.7252349853515625, -0.684600830078125, -0.6439666748046875, -0.60333251953125, -0.5626983642578125, -0.522064208984375, -0.4814300537109375, -0.4407958984375, -0.4001617431640625, -0.359527587890625, -0.3188934326171875, -0.27825927734375, -0.2376251220703125, -0.196990966796875, -0.1563568115234375, -0.11572265625, -0.0750885009765625, -0.034454345703125, 0.0061798095703125, 0.04681396484375, 0.0874481201171875, 0.128082275390625, 0.1687164306640625, 0.2093505859375, 0.2499847412109375, 0.290618896484375, 0.3312530517578125, 0.37188720703125, 0.4125213623046875, 0.453155517578125, 0.4937896728515625, 0.534423828125, 0.5750579833984375, 0.615692138671875, 0.6563262939453125, 0.69696044921875, 0.7375946044921875, 0.778228759765625, 0.8188629150390625, 0.8594970703125, 0.9001312255859375, 0.940765380859375, 0.9813995361328125, 1.02203369140625, 1.0626678466796875, 1.103302001953125, 1.1439361572265625, 1.1845703125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 5.0, 8.0, 6.0, 4.0, 8.0, 15.0, 22.0, 20.0, 19.0, 27.0, 43.0, 58.0, 53.0, 55.0, 64.0, 63.0, 61.0, 69.0, 69.0, 67.0, 57.0, 46.0, 40.0, 35.0, 26.0, 23.0, 11.0, 13.0, 8.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.130859375, -0.12725448608398438, -0.12364959716796875, -0.12004470825195312, -0.1164398193359375, -0.11283493041992188, -0.10923004150390625, -0.10562515258789062, -0.102020263671875, -0.09841537475585938, -0.09481048583984375, -0.09120559692382812, -0.0876007080078125, -0.08399581909179688, -0.08039093017578125, -0.07678604125976562, -0.07318115234375, -0.06957626342773438, -0.06597137451171875, -0.062366485595703125, -0.0587615966796875, -0.055156707763671875, -0.05155181884765625, -0.047946929931640625, -0.044342041015625, -0.040737152099609375, -0.03713226318359375, -0.033527374267578125, -0.0299224853515625, -0.026317596435546875, -0.02271270751953125, -0.019107818603515625, -0.0155029296875, -0.011898040771484375, -0.00829315185546875, -0.004688262939453125, -0.0010833740234375, 0.002521514892578125, 0.00612640380859375, 0.009731292724609375, 0.013336181640625, 0.016941070556640625, 0.02054595947265625, 0.024150848388671875, 0.0277557373046875, 0.031360626220703125, 0.03496551513671875, 0.038570404052734375, 0.04217529296875, 0.045780181884765625, 0.04938507080078125, 0.052989959716796875, 0.0565948486328125, 0.060199737548828125, 0.06380462646484375, 0.06740951538085938, 0.071014404296875, 0.07461929321289062, 0.07822418212890625, 0.08182907104492188, 0.0854339599609375, 0.08903884887695312, 0.09264373779296875, 0.09624862670898438, 0.099853515625]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 11.0, 11.0, 17.0, 37.0, 61.0, 128.0, 310.0, 1076.0, 4962.0, 65742.0, 4100118.0, 18169.0, 2445.0, 666.0, 249.0, 121.0, 63.0, 35.0, 22.0, 14.0, 5.0, 6.0, 10.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9423828125, -1.8419036865234375, -1.741424560546875, -1.6409454345703125, -1.54046630859375, -1.4399871826171875, -1.339508056640625, -1.2390289306640625, -1.1385498046875, -1.0380706787109375, -0.937591552734375, -0.8371124267578125, -0.73663330078125, -0.6361541748046875, -0.535675048828125, -0.4351959228515625, -0.334716796875, -0.2342376708984375, -0.133758544921875, -0.0332794189453125, 0.06719970703125, 0.1676788330078125, 0.268157958984375, 0.3686370849609375, 0.4691162109375, 0.5695953369140625, 0.670074462890625, 0.7705535888671875, 0.87103271484375, 0.9715118408203125, 1.071990966796875, 1.1724700927734375, 1.27294921875, 1.3734283447265625, 1.473907470703125, 1.5743865966796875, 1.67486572265625, 1.7753448486328125, 1.875823974609375, 1.9763031005859375, 2.0767822265625, 2.1772613525390625, 2.277740478515625, 2.3782196044921875, 2.47869873046875, 2.5791778564453125, 2.679656982421875, 2.7801361083984375, 2.880615234375, 2.9810943603515625, 3.081573486328125, 3.1820526123046875, 3.28253173828125, 3.3830108642578125, 3.483489990234375, 3.5839691162109375, 3.6844482421875, 3.7849273681640625, 3.885406494140625, 3.9858856201171875, 4.08636474609375, 4.1868438720703125, 4.287322998046875, 4.3878021240234375, 4.48828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 5.0, 5.0, 5.0, 4.0, 5.0, 9.0, 8.0, 5.0, 21.0, 13.0, 23.0, 62.0, 93.0, 239.0, 587.0, 1843.0, 658.0, 220.0, 116.0, 66.0, 25.0, 21.0, 11.0, 2.0, 12.0, 5.0, 5.0, 1.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.358642578125, -0.3465156555175781, -0.33438873291015625, -0.3222618103027344, -0.3101348876953125, -0.2980079650878906, -0.28588104248046875, -0.2737541198730469, -0.261627197265625, -0.24950027465820312, -0.23737335205078125, -0.22524642944335938, -0.2131195068359375, -0.20099258422851562, -0.18886566162109375, -0.17673873901367188, -0.16461181640625, -0.15248489379882812, -0.14035797119140625, -0.12823104858398438, -0.1161041259765625, -0.10397720336914062, -0.09185028076171875, -0.07972335815429688, -0.067596435546875, -0.055469512939453125, -0.04334259033203125, -0.031215667724609375, -0.0190887451171875, -0.006961822509765625, 0.00516510009765625, 0.017292022705078125, 0.0294189453125, 0.041545867919921875, 0.05367279052734375, 0.06579971313476562, 0.0779266357421875, 0.09005355834960938, 0.10218048095703125, 0.11430740356445312, 0.126434326171875, 0.13856124877929688, 0.15068817138671875, 0.16281509399414062, 0.1749420166015625, 0.18706893920898438, 0.19919586181640625, 0.21132278442382812, 0.22344970703125, 0.23557662963867188, 0.24770355224609375, 0.2598304748535156, 0.2719573974609375, 0.2840843200683594, 0.29621124267578125, 0.3083381652832031, 0.320465087890625, 0.3325920104980469, 0.34471893310546875, 0.3568458557128906, 0.3689727783203125, 0.3810997009277344, 0.39322662353515625, 0.4053535461425781, 0.41748046875]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 7.0, 29.0, 100.0, 474.0, 292.0, 71.0, 20.0, 9.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.53142261505127, -8.287139892578125, -8.042856216430664, -7.7985734939575195, -7.554290294647217, -7.310007095336914, -7.0657243728637695, -6.821441173553467, -6.577157974243164, -6.332874774932861, -6.088591575622559, -5.844308853149414, -5.600025653839111, -5.355742454528809, -5.111459732055664, -4.867176532745361, -4.622893333435059, -4.378610134124756, -4.134326934814453, -3.8900442123413086, -3.645761013031006, -3.401477813720703, -3.1571948528289795, -2.912911891937256, -2.668628692626953, -2.4243454933166504, -2.1800625324249268, -1.9357794523239136, -1.6914963722229004, -1.4472132921218872, -1.202930212020874, -0.9586471319198608, -0.7143640518188477, -0.4700809717178345, -0.2257978916168213, 0.018485188484191895, 0.2627682685852051, 0.5070513486862183, 0.7513344287872314, 0.9956175088882446, 1.2399005889892578, 1.484183669090271, 1.7284667491912842, 1.9727498292922974, 2.2170329093933105, 2.4613161087036133, 2.705599069595337, 2.9498820304870605, 3.1941652297973633, 3.438448429107666, 3.6827313899993896, 3.9270143508911133, 4.171297550201416, 4.415580749511719, 4.659863471984863, 4.904146671295166, 5.148429870605469, 5.3927130699157715, 5.636996269226074, 5.881278991699219, 6.1255621910095215, 6.369845390319824, 6.614128112792969, 6.8584113121032715, 7.102694511413574]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 4.0, 7.0, 5.0, 13.0, 18.0, 20.0, 19.0, 39.0, 62.0, 60.0, 85.0, 87.0, 74.0, 93.0, 73.0, 65.0, 61.0, 52.0, 48.0, 34.0, 32.0, 13.0, 17.0, 7.0, 5.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9084796905517578, -1.8494879007339478, -1.7904961109161377, -1.7315044403076172, -1.6725126504898071, -1.613520860671997, -1.5545291900634766, -1.4955374002456665, -1.4365456104278564, -1.3775538206100464, -1.3185620307922363, -1.2595703601837158, -1.2005785703659058, -1.1415867805480957, -1.0825951099395752, -1.0236033201217651, -0.9646115303039551, -0.905619740486145, -0.8466280102729797, -0.7876362800598145, -0.7286444902420044, -0.6696527004241943, -0.610660970211029, -0.5516692399978638, -0.4926774501800537, -0.43368569016456604, -0.37469393014907837, -0.3157021701335907, -0.256710410118103, -0.19771865010261536, -0.13872689008712769, -0.07973513007164001, -0.020743489265441895, 0.038248270750045776, 0.09724003076553345, 0.15623179078102112, 0.2152235507965088, 0.27421531081199646, 0.33320707082748413, 0.3921988308429718, 0.4511905908584595, 0.5101823806762695, 0.5691741108894348, 0.6281658411026001, 0.6871576309204102, 0.7461494207382202, 0.8051411509513855, 0.8641328811645508, 0.9231246709823608, 0.9821164608001709, 1.0411081314086914, 1.1000999212265015, 1.1590917110443115, 1.2180835008621216, 1.2770752906799316, 1.3360669612884521, 1.3950587511062622, 1.4540505409240723, 1.5130422115325928, 1.5720340013504028, 1.631025791168213, 1.690017580986023, 1.749009370803833, 1.8080010414123535, 1.8669928312301636]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 2.0, 7.0, 1.0, 4.0, 8.0, 7.0, 18.0, 22.0, 24.0, 36.0, 54.0, 84.0, 133.0, 205.0, 330.0, 602.0, 1183.0, 3170.0, 13086.0, 116555.0, 724726.0, 165276.0, 16458.0, 3625.0, 1254.0, 676.0, 340.0, 207.0, 145.0, 91.0, 71.0, 42.0, 20.0, 29.0, 16.0, 18.0, 10.0, 6.0, 3.0, 5.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0888671875, -1.056427001953125, -1.02398681640625, -0.991546630859375, -0.9591064453125, -0.926666259765625, -0.89422607421875, -0.861785888671875, -0.829345703125, -0.796905517578125, -0.76446533203125, -0.732025146484375, -0.6995849609375, -0.667144775390625, -0.63470458984375, -0.602264404296875, -0.56982421875, -0.537384033203125, -0.50494384765625, -0.472503662109375, -0.4400634765625, -0.407623291015625, -0.37518310546875, -0.342742919921875, -0.310302734375, -0.277862548828125, -0.24542236328125, -0.212982177734375, -0.1805419921875, -0.148101806640625, -0.11566162109375, -0.083221435546875, -0.05078125, -0.018341064453125, 0.01409912109375, 0.046539306640625, 0.0789794921875, 0.111419677734375, 0.14385986328125, 0.176300048828125, 0.208740234375, 0.241180419921875, 0.27362060546875, 0.306060791015625, 0.3385009765625, 0.370941162109375, 0.40338134765625, 0.435821533203125, 0.46826171875, 0.500701904296875, 0.53314208984375, 0.565582275390625, 0.5980224609375, 0.630462646484375, 0.66290283203125, 0.695343017578125, 0.727783203125, 0.760223388671875, 0.79266357421875, 0.825103759765625, 0.8575439453125, 0.889984130859375, 0.92242431640625, 0.954864501953125, 0.9873046875]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 4.0, 9.0, 12.0, 27.0, 35.0, 33.0, 61.0, 64.0, 78.0, 98.0, 103.0, 91.0, 88.0, 73.0, 67.0, 39.0, 45.0, 27.0, 15.0, 15.0, 4.0, 4.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.18994140625, -0.1846141815185547, -0.17928695678710938, -0.17395973205566406, -0.16863250732421875, -0.16330528259277344, -0.15797805786132812, -0.1526508331298828, -0.1473236083984375, -0.1419963836669922, -0.13666915893554688, -0.13134193420410156, -0.12601470947265625, -0.12068748474121094, -0.11536026000976562, -0.11003303527832031, -0.104705810546875, -0.09937858581542969, -0.09405136108398438, -0.08872413635253906, -0.08339691162109375, -0.07806968688964844, -0.07274246215820312, -0.06741523742675781, -0.0620880126953125, -0.05676078796386719, -0.051433563232421875, -0.04610633850097656, -0.04077911376953125, -0.03545188903808594, -0.030124664306640625, -0.024797439575195312, -0.01947021484375, -0.014142990112304688, -0.008815765380859375, -0.0034885406494140625, 0.00183868408203125, 0.0071659088134765625, 0.012493133544921875, 0.017820358276367188, 0.0231475830078125, 0.028474807739257812, 0.033802032470703125, 0.03912925720214844, 0.04445648193359375, 0.04978370666503906, 0.055110931396484375, 0.06043815612792969, 0.065765380859375, 0.07109260559082031, 0.07641983032226562, 0.08174705505371094, 0.08707427978515625, 0.09240150451660156, 0.09772872924804688, 0.10305595397949219, 0.1083831787109375, 0.11371040344238281, 0.11903762817382812, 0.12436485290527344, 0.12969207763671875, 0.13501930236816406, 0.14034652709960938, 0.1456737518310547, 0.1510009765625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 3.0, 11.0, 4.0, 20.0, 18.0, 17.0, 33.0, 41.0, 42.0, 91.0, 83.0, 175.0, 274.0, 368.0, 794.0, 1664.0, 3933.0, 10324.0, 29665.0, 95490.0, 288754.0, 383338.0, 158176.0, 48419.0, 16037.0, 5831.0, 2396.0, 1096.0, 568.0, 296.0, 189.0, 112.0, 92.0, 55.0, 39.0, 29.0, 20.0, 14.0, 10.0, 11.0, 9.0, 7.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0], "bins": [-0.369873046875, -0.35906219482421875, -0.3482513427734375, -0.33744049072265625, -0.326629638671875, -0.31581878662109375, -0.3050079345703125, -0.29419708251953125, -0.28338623046875, -0.27257537841796875, -0.2617645263671875, -0.25095367431640625, -0.240142822265625, -0.22933197021484375, -0.2185211181640625, -0.20771026611328125, -0.1968994140625, -0.18608856201171875, -0.1752777099609375, -0.16446685791015625, -0.153656005859375, -0.14284515380859375, -0.1320343017578125, -0.12122344970703125, -0.11041259765625, -0.09960174560546875, -0.0887908935546875, -0.07798004150390625, -0.067169189453125, -0.05635833740234375, -0.0455474853515625, -0.03473663330078125, -0.02392578125, -0.01311492919921875, -0.0023040771484375, 0.00850677490234375, 0.019317626953125, 0.03012847900390625, 0.0409393310546875, 0.05175018310546875, 0.06256103515625, 0.07337188720703125, 0.0841827392578125, 0.09499359130859375, 0.105804443359375, 0.11661529541015625, 0.1274261474609375, 0.13823699951171875, 0.1490478515625, 0.15985870361328125, 0.1706695556640625, 0.18148040771484375, 0.192291259765625, 0.20310211181640625, 0.2139129638671875, 0.22472381591796875, 0.23553466796875, 0.24634552001953125, 0.2571563720703125, 0.26796722412109375, 0.278778076171875, 0.28958892822265625, 0.3003997802734375, 0.31121063232421875, 0.322021484375]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 4.0, 6.0, 2.0, 3.0, 2.0, 10.0, 7.0, 10.0, 11.0, 20.0, 13.0, 12.0, 19.0, 27.0, 21.0, 27.0, 23.0, 31.0, 45.0, 46.0, 48.0, 42.0, 46.0, 35.0, 32.0, 34.0, 45.0, 47.0, 44.0, 29.0, 36.0, 25.0, 26.0, 28.0, 24.0, 24.0, 21.0, 17.0, 6.0, 14.0, 10.0, 11.0, 5.0, 6.0, 5.0, 2.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.35888671875, -0.3480644226074219, -0.33724212646484375, -0.3264198303222656, -0.3155975341796875, -0.3047752380371094, -0.29395294189453125, -0.2831306457519531, -0.272308349609375, -0.2614860534667969, -0.25066375732421875, -0.23984146118164062, -0.2290191650390625, -0.21819686889648438, -0.20737457275390625, -0.19655227661132812, -0.18572998046875, -0.17490768432617188, -0.16408538818359375, -0.15326309204101562, -0.1424407958984375, -0.13161849975585938, -0.12079620361328125, -0.10997390747070312, -0.099151611328125, -0.08832931518554688, -0.07750701904296875, -0.06668472290039062, -0.0558624267578125, -0.045040130615234375, -0.03421783447265625, -0.023395538330078125, -0.0125732421875, -0.001750946044921875, 0.00907135009765625, 0.019893646240234375, 0.0307159423828125, 0.041538238525390625, 0.05236053466796875, 0.06318283081054688, 0.074005126953125, 0.08482742309570312, 0.09564971923828125, 0.10647201538085938, 0.1172943115234375, 0.12811660766601562, 0.13893890380859375, 0.14976119995117188, 0.16058349609375, 0.17140579223632812, 0.18222808837890625, 0.19305038452148438, 0.2038726806640625, 0.21469497680664062, 0.22551727294921875, 0.23633956909179688, 0.247161865234375, 0.2579841613769531, 0.26880645751953125, 0.2796287536621094, 0.2904510498046875, 0.3012733459472656, 0.31209564208984375, 0.3229179382324219, 0.333740234375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 7.0, 5.0, 15.0, 22.0, 18.0, 25.0, 31.0, 38.0, 70.0, 100.0, 156.0, 305.0, 566.0, 1486.0, 4732.0, 25380.0, 242082.0, 642150.0, 112406.0, 13720.0, 3042.0, 1099.0, 445.0, 248.0, 120.0, 82.0, 41.0, 49.0, 30.0, 19.0, 24.0, 14.0, 10.0, 10.0, 6.0, 2.0, 1.0, 1.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.301513671875, -0.2924690246582031, -0.28342437744140625, -0.2743797302246094, -0.2653350830078125, -0.2562904357910156, -0.24724578857421875, -0.23820114135742188, -0.229156494140625, -0.22011184692382812, -0.21106719970703125, -0.20202255249023438, -0.1929779052734375, -0.18393325805664062, -0.17488861083984375, -0.16584396362304688, -0.15679931640625, -0.14775466918945312, -0.13871002197265625, -0.12966537475585938, -0.1206207275390625, -0.11157608032226562, -0.10253143310546875, -0.09348678588867188, -0.084442138671875, -0.07539749145507812, -0.06635284423828125, -0.057308197021484375, -0.0482635498046875, -0.039218902587890625, -0.03017425537109375, -0.021129608154296875, -0.0120849609375, -0.003040313720703125, 0.00600433349609375, 0.015048980712890625, 0.0240936279296875, 0.033138275146484375, 0.04218292236328125, 0.051227569580078125, 0.060272216796875, 0.06931686401367188, 0.07836151123046875, 0.08740615844726562, 0.0964508056640625, 0.10549545288085938, 0.11454010009765625, 0.12358474731445312, 0.13262939453125, 0.14167404174804688, 0.15071868896484375, 0.15976333618164062, 0.1688079833984375, 0.17785263061523438, 0.18689727783203125, 0.19594192504882812, 0.204986572265625, 0.21403121948242188, 0.22307586669921875, 0.23212051391601562, 0.2411651611328125, 0.2502098083496094, 0.25925445556640625, 0.2682991027832031, 0.27734375]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 8.0, 9.0, 12.0, 46.0, 99.0, 311.0, 340.0, 108.0, 32.0, 18.0, 17.0, 4.0, 2.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00014901161193847656, -0.00013557448983192444, -0.00012213736772537231, -0.00010870024561882019, -9.526312351226807e-05, -8.182600140571594e-05, -6.838887929916382e-05, -5.4951757192611694e-05, -4.151463508605957e-05, -2.8077512979507446e-05, -1.4640390872955322e-05, -1.2032687664031982e-06, 1.2233853340148926e-05, 2.567097544670105e-05, 3.9108097553253174e-05, 5.25452196598053e-05, 6.598234176635742e-05, 7.941946387290955e-05, 9.285658597946167e-05, 0.0001062937080860138, 0.00011973083019256592, 0.00013316795229911804, 0.00014660507440567017, 0.0001600421965122223, 0.00017347931861877441, 0.00018691644072532654, 0.00020035356283187866, 0.00021379068493843079, 0.0002272278070449829, 0.00024066492915153503, 0.00025410205125808716, 0.0002675391733646393, 0.0002809762954711914, 0.00029441341757774353, 0.00030785053968429565, 0.0003212876617908478, 0.0003347247838973999, 0.000348161906003952, 0.00036159902811050415, 0.0003750361502170563, 0.0003884732723236084, 0.0004019103944301605, 0.00041534751653671265, 0.00042878463864326477, 0.0004422217607498169, 0.000455658882856369, 0.00046909600496292114, 0.00048253312706947327, 0.0004959702491760254, 0.0005094073712825775, 0.0005228444933891296, 0.0005362816154956818, 0.0005497187376022339, 0.000563155859708786, 0.0005765929818153381, 0.0005900301039218903, 0.0006034672260284424, 0.0006169043481349945, 0.0006303414702415466, 0.0006437785923480988, 0.0006572157144546509, 0.000670652836561203, 0.0006840899586677551, 0.0006975270807743073, 0.0007109642028808594]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 4.0, 3.0, 7.0, 6.0, 7.0, 21.0, 22.0, 19.0, 65.0, 79.0, 134.0, 251.0, 480.0, 1093.0, 2903.0, 9373.0, 46103.0, 358394.0, 526919.0, 82207.0, 13967.0, 3883.0, 1377.0, 566.0, 266.0, 142.0, 94.0, 52.0, 39.0, 23.0, 19.0, 11.0, 10.0, 5.0, 7.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2420654296875, -0.23375892639160156, -0.22545242309570312, -0.2171459197998047, -0.20883941650390625, -0.2005329132080078, -0.19222640991210938, -0.18391990661621094, -0.1756134033203125, -0.16730690002441406, -0.15900039672851562, -0.1506938934326172, -0.14238739013671875, -0.1340808868408203, -0.12577438354492188, -0.11746788024902344, -0.109161376953125, -0.10085487365722656, -0.09254837036132812, -0.08424186706542969, -0.07593536376953125, -0.06762886047363281, -0.059322357177734375, -0.05101585388183594, -0.0427093505859375, -0.03440284729003906, -0.026096343994140625, -0.017789840698242188, -0.00948333740234375, -0.0011768341064453125, 0.007129669189453125, 0.015436172485351562, 0.02374267578125, 0.03204917907714844, 0.040355682373046875, 0.04866218566894531, 0.05696868896484375, 0.06527519226074219, 0.07358169555664062, 0.08188819885253906, 0.0901947021484375, 0.09850120544433594, 0.10680770874023438, 0.11511421203613281, 0.12342071533203125, 0.1317272186279297, 0.14003372192382812, 0.14834022521972656, 0.156646728515625, 0.16495323181152344, 0.17325973510742188, 0.1815662384033203, 0.18987274169921875, 0.1981792449951172, 0.20648574829101562, 0.21479225158691406, 0.2230987548828125, 0.23140525817871094, 0.23971176147460938, 0.2480182647705078, 0.25632476806640625, 0.2646312713623047, 0.2729377746582031, 0.28124427795410156, 0.28955078125]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 3.0, 7.0, 5.0, 18.0, 11.0, 17.0, 25.0, 20.0, 27.0, 40.0, 48.0, 70.0, 81.0, 58.0, 71.0, 68.0, 73.0, 46.0, 73.0, 48.0, 42.0, 23.0, 30.0, 16.0, 19.0, 9.0, 7.0, 6.0, 9.0, 5.0, 2.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.160400390625, -0.15581321716308594, -0.15122604370117188, -0.1466388702392578, -0.14205169677734375, -0.1374645233154297, -0.13287734985351562, -0.12829017639160156, -0.1237030029296875, -0.11911582946777344, -0.11452865600585938, -0.10994148254394531, -0.10535430908203125, -0.10076713562011719, -0.09617996215820312, -0.09159278869628906, -0.087005615234375, -0.08241844177246094, -0.07783126831054688, -0.07324409484863281, -0.06865692138671875, -0.06406974792480469, -0.059482574462890625, -0.05489540100097656, -0.0503082275390625, -0.04572105407714844, -0.041133880615234375, -0.03654670715332031, -0.03195953369140625, -0.027372360229492188, -0.022785186767578125, -0.018198013305664062, -0.01361083984375, -0.009023666381835938, -0.004436492919921875, 0.0001506805419921875, 0.00473785400390625, 0.009325027465820312, 0.013912200927734375, 0.018499374389648438, 0.0230865478515625, 0.027673721313476562, 0.032260894775390625, 0.03684806823730469, 0.04143524169921875, 0.04602241516113281, 0.050609588623046875, 0.05519676208496094, 0.059783935546875, 0.06437110900878906, 0.06895828247070312, 0.07354545593261719, 0.07813262939453125, 0.08271980285644531, 0.08730697631835938, 0.09189414978027344, 0.0964813232421875, 0.10106849670410156, 0.10565567016601562, 0.11024284362792969, 0.11483001708984375, 0.11941719055175781, 0.12400436401367188, 0.12859153747558594, 0.1331787109375]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 8.0, 19.0, 30.0, 58.0, 122.0, 231.0, 223.0, 159.0, 88.0, 39.0, 9.0, 12.0, 5.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.126567840576172, -1.9855422973632812, -1.8445167541503906, -1.7034913301467896, -1.562465786933899, -1.4214402437210083, -1.2804148197174072, -1.1393892765045166, -0.998363733291626, -0.8573381900787354, -0.7163127064704895, -0.5752872228622437, -0.434261679649353, -0.2932361364364624, -0.15221065282821655, -0.011185169219970703, 0.12984037399291992, 0.27086588740348816, 0.4118914008140564, 0.5529168844223022, 0.6939424276351929, 0.8349679708480835, 0.9759934544563293, 1.1170189380645752, 1.2580444812774658, 1.3990700244903564, 1.540095567703247, 1.6811209917068481, 1.8221465349197388, 1.9631720781326294, 2.1041975021362305, 2.245223045349121, 2.3862485885620117, 2.5272741317749023, 2.668299674987793, 2.8093252182006836, 2.950350761413574, 3.091376304626465, 3.2324016094207764, 3.373427152633667, 3.5144526958465576, 3.6554782390594482, 3.796503782272339, 3.9375293254852295, 4.078554630279541, 4.219580173492432, 4.360605716705322, 4.501631259918213, 4.6426568031311035, 4.783682346343994, 4.924707889556885, 5.065733432769775, 5.206758975982666, 5.347784519195557, 5.488810062408447, 5.62983512878418, 5.77086067199707, 5.911886215209961, 6.052911758422852, 6.193937301635742, 6.334962844848633, 6.475988388061523, 6.617013931274414, 6.758039474487305, 6.899065017700195]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 7.0, 12.0, 3.0, 9.0, 6.0, 17.0, 20.0, 25.0, 23.0, 23.0, 33.0, 26.0, 34.0, 42.0, 46.0, 57.0, 42.0, 52.0, 57.0, 45.0, 49.0, 36.0, 46.0, 34.0, 38.0, 43.0, 28.0, 23.0, 27.0, 29.0, 17.0, 12.0, 4.0, 7.0, 9.0, 8.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.192502021789551, -2.119662284851074, -2.0468225479125977, -1.9739826917648315, -1.9011428356170654, -1.8283030986785889, -1.7554633617401123, -1.6826235055923462, -1.60978364944458, -1.5369439125061035, -1.4641040563583374, -1.3912643194198608, -1.3184244632720947, -1.2455847263336182, -1.1727449893951416, -1.0999051332473755, -1.027065396308899, -0.9542255997657776, -0.8813858032226562, -0.8085460662841797, -0.7357062101364136, -0.662866473197937, -0.5900266766548157, -0.5171868801116943, -0.444347083568573, -0.37150728702545166, -0.2986674904823303, -0.22582772374153137, -0.15298792719841003, -0.0801481306552887, -0.007308363914489746, 0.06553143262863159, 0.13837122917175293, 0.21121102571487427, 0.2840508222579956, 0.35689058899879456, 0.4297303855419159, 0.5025701522827148, 0.5754099488258362, 0.6482497453689575, 0.7210895419120789, 0.7939293384552002, 0.8667691349983215, 0.9396089315414429, 1.0124486684799194, 1.0852885246276855, 1.158128261566162, 1.2309679985046387, 1.3038078546524048, 1.3766475915908813, 1.4494874477386475, 1.522327184677124, 1.5951670408248901, 1.6680067777633667, 1.7408466339111328, 1.8136863708496094, 1.886526107788086, 1.9593658447265625, 2.032205581665039, 2.1050455570220947, 2.1778852939605713, 2.250725030899048, 2.3235647678375244, 2.39640474319458, 2.4692444801330566]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 5.0, 8.0, 8.0, 11.0, 12.0, 27.0, 46.0, 54.0, 102.0, 189.0, 426.0, 1352.0, 7761.0, 446726.0, 3721463.0, 13294.0, 1810.0, 591.0, 204.0, 83.0, 47.0, 24.0, 12.0, 11.0, 2.0, 4.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.953125, -1.8941192626953125, -1.835113525390625, -1.7761077880859375, -1.71710205078125, -1.6580963134765625, -1.599090576171875, -1.5400848388671875, -1.4810791015625, -1.4220733642578125, -1.363067626953125, -1.3040618896484375, -1.24505615234375, -1.1860504150390625, -1.127044677734375, -1.0680389404296875, -1.009033203125, -0.9500274658203125, -0.891021728515625, -0.8320159912109375, -0.77301025390625, -0.7140045166015625, -0.654998779296875, -0.5959930419921875, -0.5369873046875, -0.4779815673828125, -0.418975830078125, -0.3599700927734375, -0.30096435546875, -0.2419586181640625, -0.182952880859375, -0.1239471435546875, -0.06494140625, -0.0059356689453125, 0.053070068359375, 0.1120758056640625, 0.17108154296875, 0.2300872802734375, 0.289093017578125, 0.3480987548828125, 0.4071044921875, 0.4661102294921875, 0.525115966796875, 0.5841217041015625, 0.64312744140625, 0.7021331787109375, 0.761138916015625, 0.8201446533203125, 0.879150390625, 0.9381561279296875, 0.997161865234375, 1.0561676025390625, 1.11517333984375, 1.1741790771484375, 1.233184814453125, 1.2921905517578125, 1.3511962890625, 1.4102020263671875, 1.469207763671875, 1.5282135009765625, 1.58721923828125, 1.6462249755859375, 1.705230712890625, 1.7642364501953125, 1.8232421875]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 3.0, 11.0, 9.0, 18.0, 28.0, 29.0, 40.0, 47.0, 53.0, 51.0, 89.0, 73.0, 79.0, 98.0, 66.0, 51.0, 48.0, 46.0, 37.0, 37.0, 21.0, 14.0, 14.0, 11.0, 6.0, 2.0, 5.0, 4.0, 2.0, 0.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1571044921875, -0.15253829956054688, -0.14797210693359375, -0.14340591430664062, -0.1388397216796875, -0.13427352905273438, -0.12970733642578125, -0.12514114379882812, -0.120574951171875, -0.11600875854492188, -0.11144256591796875, -0.10687637329101562, -0.1023101806640625, -0.09774398803710938, -0.09317779541015625, -0.08861160278320312, -0.08404541015625, -0.07947921752929688, -0.07491302490234375, -0.07034683227539062, -0.0657806396484375, -0.061214447021484375, -0.05664825439453125, -0.052082061767578125, -0.047515869140625, -0.042949676513671875, -0.03838348388671875, -0.033817291259765625, -0.0292510986328125, -0.024684906005859375, -0.02011871337890625, -0.015552520751953125, -0.010986328125, -0.006420135498046875, -0.00185394287109375, 0.002712249755859375, 0.0072784423828125, 0.011844635009765625, 0.01641082763671875, 0.020977020263671875, 0.025543212890625, 0.030109405517578125, 0.03467559814453125, 0.039241790771484375, 0.0438079833984375, 0.048374176025390625, 0.05294036865234375, 0.057506561279296875, 0.06207275390625, 0.06663894653320312, 0.07120513916015625, 0.07577133178710938, 0.0803375244140625, 0.08490371704101562, 0.08946990966796875, 0.09403610229492188, 0.098602294921875, 0.10316848754882812, 0.10773468017578125, 0.11230087280273438, 0.1168670654296875, 0.12143325805664062, 0.12599945068359375, 0.13056564331054688, 0.1351318359375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 6.0, 4.0, 2.0, 7.0, 12.0, 11.0, 15.0, 25.0, 46.0, 43.0, 83.0, 123.0, 260.0, 520.0, 1251.0, 4063.0, 18520.0, 168708.0, 3812525.0, 163130.0, 18354.0, 4191.0, 1278.0, 528.0, 243.0, 127.0, 71.0, 47.0, 23.0, 24.0, 15.0, 11.0, 8.0, 12.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57275390625, -0.5483779907226562, -0.5240020751953125, -0.49962615966796875, -0.475250244140625, -0.45087432861328125, -0.4264984130859375, -0.40212249755859375, -0.37774658203125, -0.35337066650390625, -0.3289947509765625, -0.30461883544921875, -0.280242919921875, -0.25586700439453125, -0.2314910888671875, -0.20711517333984375, -0.1827392578125, -0.15836334228515625, -0.1339874267578125, -0.10961151123046875, -0.085235595703125, -0.06085968017578125, -0.0364837646484375, -0.01210784912109375, 0.01226806640625, 0.03664398193359375, 0.0610198974609375, 0.08539581298828125, 0.109771728515625, 0.13414764404296875, 0.1585235595703125, 0.18289947509765625, 0.207275390625, 0.23165130615234375, 0.2560272216796875, 0.28040313720703125, 0.304779052734375, 0.32915496826171875, 0.3535308837890625, 0.37790679931640625, 0.40228271484375, 0.42665863037109375, 0.4510345458984375, 0.47541046142578125, 0.499786376953125, 0.5241622924804688, 0.5485382080078125, 0.5729141235351562, 0.5972900390625, 0.6216659545898438, 0.6460418701171875, 0.6704177856445312, 0.694793701171875, 0.7191696166992188, 0.7435455322265625, 0.7679214477539062, 0.79229736328125, 0.8166732788085938, 0.8410491943359375, 0.8654251098632812, 0.889801025390625, 0.9141769409179688, 0.9385528564453125, 0.9629287719726562, 0.9873046875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 8.0, 8.0, 20.0, 29.0, 63.0, 106.0, 289.0, 1162.0, 1814.0, 321.0, 124.0, 50.0, 31.0, 17.0, 13.0, 5.0, 5.0, 5.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.3984375, -0.3879890441894531, -0.37754058837890625, -0.3670921325683594, -0.3566436767578125, -0.3461952209472656, -0.33574676513671875, -0.3252983093261719, -0.314849853515625, -0.3044013977050781, -0.29395294189453125, -0.2835044860839844, -0.2730560302734375, -0.2626075744628906, -0.25215911865234375, -0.24171066284179688, -0.23126220703125, -0.22081375122070312, -0.21036529541015625, -0.19991683959960938, -0.1894683837890625, -0.17901992797851562, -0.16857147216796875, -0.15812301635742188, -0.147674560546875, -0.13722610473632812, -0.12677764892578125, -0.11632919311523438, -0.1058807373046875, -0.09543228149414062, -0.08498382568359375, -0.07453536987304688, -0.0640869140625, -0.053638458251953125, -0.04319000244140625, -0.032741546630859375, -0.0222930908203125, -0.011844635009765625, -0.00139617919921875, 0.009052276611328125, 0.019500732421875, 0.029949188232421875, 0.04039764404296875, 0.050846099853515625, 0.0612945556640625, 0.07174301147460938, 0.08219146728515625, 0.09263992309570312, 0.10308837890625, 0.11353683471679688, 0.12398529052734375, 0.13443374633789062, 0.1448822021484375, 0.15533065795898438, 0.16577911376953125, 0.17622756958007812, 0.186676025390625, 0.19712448120117188, 0.20757293701171875, 0.21802139282226562, 0.2284698486328125, 0.23891830444335938, 0.24936676025390625, 0.2598152160644531, 0.270263671875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 7.0, 6.0, 8.0, 15.0, 47.0, 149.0, 245.0, 290.0, 157.0, 56.0, 14.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.86898136138916, -2.7941884994506836, -2.719395875930786, -2.6446030139923096, -2.569810390472412, -2.4950175285339355, -2.420224666595459, -2.3454318046569824, -2.270639181137085, -2.1958463191986084, -2.121053695678711, -2.0462608337402344, -1.9714680910110474, -1.8966753482818604, -1.8218824863433838, -1.7470897436141968, -1.6722970008850098, -1.5975042581558228, -1.5227115154266357, -1.4479186534881592, -1.3731259107589722, -1.2983331680297852, -1.2235403060913086, -1.1487475633621216, -1.0739548206329346, -0.9991620779037476, -0.9243692755699158, -0.849576473236084, -0.774783730506897, -0.69999098777771, -0.6251981854438782, -0.5504053831100464, -0.4756128787994385, -0.4008201062679291, -0.3260273337364197, -0.2512345612049103, -0.17644178867340088, -0.10164901614189148, -0.02685624361038208, 0.04793655872344971, 0.12272930145263672, 0.19752207398414612, 0.2723148465156555, 0.3471076190471649, 0.4219003915786743, 0.4966931641101837, 0.5714859366416931, 0.6462787389755249, 0.7210714817047119, 0.7958642244338989, 0.8706570267677307, 0.9454498291015625, 1.0202425718307495, 1.0950353145599365, 1.169828176498413, 1.2446209192276, 1.319413661956787, 1.3942064046859741, 1.4689991474151611, 1.5437920093536377, 1.6185847520828247, 1.6933774948120117, 1.7681703567504883, 1.8429630994796753, 1.9177558422088623]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 8.0, 13.0, 17.0, 24.0, 34.0, 33.0, 34.0, 40.0, 49.0, 49.0, 70.0, 62.0, 59.0, 59.0, 67.0, 55.0, 59.0, 56.0, 40.0, 38.0, 37.0, 31.0, 14.0, 8.0, 12.0, 9.0, 7.0, 7.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0], "bins": [-1.1935267448425293, -1.1634591817855835, -1.1333916187286377, -1.1033239364624023, -1.0732563734054565, -1.0431888103485107, -1.0131211280822754, -0.9830535650253296, -0.9529860019683838, -0.922918438911438, -0.8928508162498474, -0.8627831935882568, -0.832715630531311, -0.8026480674743652, -0.7725804448127747, -0.7425128221511841, -0.7124452590942383, -0.6823776960372925, -0.6523100733757019, -0.6222424507141113, -0.5921748876571655, -0.5621073246002197, -0.5320397019386292, -0.5019720792770386, -0.4719045162200928, -0.4418369233608246, -0.4117693305015564, -0.3817017376422882, -0.35163414478302, -0.32156655192375183, -0.29149895906448364, -0.26143136620521545, -0.2313637137413025, -0.2012961208820343, -0.1712285280227661, -0.14116093516349792, -0.11109334230422974, -0.08102574944496155, -0.05095815658569336, -0.02089056372642517, 0.009177029132843018, 0.039244621992111206, 0.0693122148513794, 0.09937980771064758, 0.12944740056991577, 0.15951499342918396, 0.18958258628845215, 0.21965017914772034, 0.24971777200698853, 0.2797853648662567, 0.3098529577255249, 0.3399205505847931, 0.3699881434440613, 0.40005573630332947, 0.43012332916259766, 0.46019092202186584, 0.49025851488113403, 0.5203261375427246, 0.5503937005996704, 0.5804612636566162, 0.6105288863182068, 0.6405965089797974, 0.6706640720367432, 0.700731635093689, 0.7307992577552795]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 13.0, 16.0, 7.0, 21.0, 43.0, 43.0, 89.0, 146.0, 225.0, 439.0, 990.0, 2852.0, 17281.0, 270256.0, 691291.0, 56095.0, 5893.0, 1535.0, 611.0, 282.0, 174.0, 97.0, 48.0, 30.0, 26.0, 17.0, 13.0, 5.0, 4.0, 6.0, 3.0, 3.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.90673828125, -0.8721694946289062, -0.8376007080078125, -0.8030319213867188, -0.768463134765625, -0.7338943481445312, -0.6993255615234375, -0.6647567749023438, -0.63018798828125, -0.5956192016601562, -0.5610504150390625, -0.5264816284179688, -0.491912841796875, -0.45734405517578125, -0.4227752685546875, -0.38820648193359375, -0.3536376953125, -0.31906890869140625, -0.2845001220703125, -0.24993133544921875, -0.215362548828125, -0.18079376220703125, -0.1462249755859375, -0.11165618896484375, -0.07708740234375, -0.04251861572265625, -0.0079498291015625, 0.02661895751953125, 0.061187744140625, 0.09575653076171875, 0.1303253173828125, 0.16489410400390625, 0.199462890625, 0.23403167724609375, 0.2686004638671875, 0.30316925048828125, 0.337738037109375, 0.37230682373046875, 0.4068756103515625, 0.44144439697265625, 0.47601318359375, 0.5105819702148438, 0.5451507568359375, 0.5797195434570312, 0.614288330078125, 0.6488571166992188, 0.6834259033203125, 0.7179946899414062, 0.7525634765625, 0.7871322631835938, 0.8217010498046875, 0.8562698364257812, 0.890838623046875, 0.9254074096679688, 0.9599761962890625, 0.9945449829101562, 1.02911376953125, 1.0636825561523438, 1.0982513427734375, 1.1328201293945312, 1.167388916015625, 1.2019577026367188, 1.2365264892578125, 1.2710952758789062, 1.3056640625]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 7.0, 3.0, 4.0, 15.0, 11.0, 25.0, 20.0, 33.0, 55.0, 44.0, 58.0, 75.0, 87.0, 66.0, 71.0, 82.0, 62.0, 62.0, 50.0, 45.0, 39.0, 23.0, 21.0, 15.0, 6.0, 6.0, 5.0, 5.0, 4.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1522216796875, -0.14744949340820312, -0.14267730712890625, -0.13790512084960938, -0.1331329345703125, -0.12836074829101562, -0.12358856201171875, -0.11881637573242188, -0.114044189453125, -0.10927200317382812, -0.10449981689453125, -0.09972763061523438, -0.0949554443359375, -0.09018325805664062, -0.08541107177734375, -0.08063888549804688, -0.07586669921875, -0.07109451293945312, -0.06632232666015625, -0.061550140380859375, -0.0567779541015625, -0.052005767822265625, -0.04723358154296875, -0.042461395263671875, -0.037689208984375, -0.032917022705078125, -0.02814483642578125, -0.023372650146484375, -0.0186004638671875, -0.013828277587890625, -0.00905609130859375, -0.004283905029296875, 0.00048828125, 0.005260467529296875, 0.01003265380859375, 0.014804840087890625, 0.0195770263671875, 0.024349212646484375, 0.02912139892578125, 0.033893585205078125, 0.038665771484375, 0.043437957763671875, 0.04821014404296875, 0.052982330322265625, 0.0577545166015625, 0.06252670288085938, 0.06729888916015625, 0.07207107543945312, 0.07684326171875, 0.08161544799804688, 0.08638763427734375, 0.09115982055664062, 0.0959320068359375, 0.10070419311523438, 0.10547637939453125, 0.11024856567382812, 0.115020751953125, 0.11979293823242188, 0.12456512451171875, 0.12933731079101562, 0.1341094970703125, 0.13888168334960938, 0.14365386962890625, 0.14842605590820312, 0.1531982421875]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 5.0, 6.0, 3.0, 9.0, 13.0, 16.0, 17.0, 31.0, 32.0, 39.0, 45.0, 69.0, 114.0, 143.0, 196.0, 233.0, 370.0, 561.0, 903.0, 1648.0, 3272.0, 7037.0, 16770.0, 42162.0, 111857.0, 271627.0, 329613.0, 159083.0, 60297.0, 23195.0, 9554.0, 4229.0, 2060.0, 1145.0, 687.0, 432.0, 309.0, 181.0, 152.0, 113.0, 81.0, 68.0, 44.0, 46.0, 18.0, 31.0, 13.0, 9.0, 9.0, 3.0, 4.0, 4.0, 2.0, 4.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.279052734375, -0.2703819274902344, -0.26171112060546875, -0.2530403137207031, -0.2443695068359375, -0.23569869995117188, -0.22702789306640625, -0.21835708618164062, -0.209686279296875, -0.20101547241210938, -0.19234466552734375, -0.18367385864257812, -0.1750030517578125, -0.16633224487304688, -0.15766143798828125, -0.14899063110351562, -0.14031982421875, -0.13164901733398438, -0.12297821044921875, -0.11430740356445312, -0.1056365966796875, -0.09696578979492188, -0.08829498291015625, -0.07962417602539062, -0.070953369140625, -0.062282562255859375, -0.05361175537109375, -0.044940948486328125, -0.0362701416015625, -0.027599334716796875, -0.01892852783203125, -0.010257720947265625, -0.0015869140625, 0.007083892822265625, 0.01575469970703125, 0.024425506591796875, 0.0330963134765625, 0.041767120361328125, 0.05043792724609375, 0.059108734130859375, 0.067779541015625, 0.07645034790039062, 0.08512115478515625, 0.09379196166992188, 0.1024627685546875, 0.11113357543945312, 0.11980438232421875, 0.12847518920898438, 0.13714599609375, 0.14581680297851562, 0.15448760986328125, 0.16315841674804688, 0.1718292236328125, 0.18050003051757812, 0.18917083740234375, 0.19784164428710938, 0.206512451171875, 0.21518325805664062, 0.22385406494140625, 0.23252487182617188, 0.2411956787109375, 0.24986648559570312, 0.25853729248046875, 0.2672080993652344, 0.27587890625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 3.0, 4.0, 6.0, 1.0, 4.0, 7.0, 12.0, 5.0, 8.0, 5.0, 14.0, 11.0, 29.0, 22.0, 29.0, 22.0, 24.0, 16.0, 27.0, 31.0, 32.0, 35.0, 24.0, 36.0, 32.0, 39.0, 42.0, 29.0, 37.0, 48.0, 42.0, 41.0, 42.0, 27.0, 29.0, 25.0, 17.0, 23.0, 23.0, 13.0, 13.0, 10.0, 13.0, 13.0, 5.0, 11.0, 8.0, 3.0, 8.0, 3.0, 3.0, 0.0, 3.0, 2.0, 3.0, 2.0], "bins": [-0.334228515625, -0.32444000244140625, -0.3146514892578125, -0.30486297607421875, -0.295074462890625, -0.28528594970703125, -0.2754974365234375, -0.26570892333984375, -0.25592041015625, -0.24613189697265625, -0.2363433837890625, -0.22655487060546875, -0.216766357421875, -0.20697784423828125, -0.1971893310546875, -0.18740081787109375, -0.1776123046875, -0.16782379150390625, -0.1580352783203125, -0.14824676513671875, -0.138458251953125, -0.12866973876953125, -0.1188812255859375, -0.10909271240234375, -0.09930419921875, -0.08951568603515625, -0.0797271728515625, -0.06993865966796875, -0.060150146484375, -0.05036163330078125, -0.0405731201171875, -0.03078460693359375, -0.02099609375, -0.01120758056640625, -0.0014190673828125, 0.00836944580078125, 0.018157958984375, 0.02794647216796875, 0.0377349853515625, 0.04752349853515625, 0.05731201171875, 0.06710052490234375, 0.0768890380859375, 0.08667755126953125, 0.096466064453125, 0.10625457763671875, 0.1160430908203125, 0.12583160400390625, 0.1356201171875, 0.14540863037109375, 0.1551971435546875, 0.16498565673828125, 0.174774169921875, 0.18456268310546875, 0.1943511962890625, 0.20413970947265625, 0.21392822265625, 0.22371673583984375, 0.2335052490234375, 0.24329376220703125, 0.253082275390625, 0.26287078857421875, 0.2726593017578125, 0.28244781494140625, 0.292236328125]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 6.0, 3.0, 7.0, 9.0, 20.0, 29.0, 59.0, 85.0, 180.0, 373.0, 831.0, 2133.0, 8342.0, 60335.0, 537677.0, 391434.0, 37795.0, 6159.0, 1785.0, 624.0, 301.0, 149.0, 83.0, 47.0, 34.0, 18.0, 12.0, 12.0, 3.0, 2.0, 4.0, 2.0, 0.0, 4.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.314697265625, -0.30593109130859375, -0.2971649169921875, -0.28839874267578125, -0.279632568359375, -0.27086639404296875, -0.2621002197265625, -0.25333404541015625, -0.24456787109375, -0.23580169677734375, -0.2270355224609375, -0.21826934814453125, -0.209503173828125, -0.20073699951171875, -0.1919708251953125, -0.18320465087890625, -0.1744384765625, -0.16567230224609375, -0.1569061279296875, -0.14813995361328125, -0.139373779296875, -0.13060760498046875, -0.1218414306640625, -0.11307525634765625, -0.10430908203125, -0.09554290771484375, -0.0867767333984375, -0.07801055908203125, -0.069244384765625, -0.06047821044921875, -0.0517120361328125, -0.04294586181640625, -0.0341796875, -0.02541351318359375, -0.0166473388671875, -0.00788116455078125, 0.000885009765625, 0.00965118408203125, 0.0184173583984375, 0.02718353271484375, 0.03594970703125, 0.04471588134765625, 0.0534820556640625, 0.06224822998046875, 0.071014404296875, 0.07978057861328125, 0.0885467529296875, 0.09731292724609375, 0.1060791015625, 0.11484527587890625, 0.1236114501953125, 0.13237762451171875, 0.141143798828125, 0.14990997314453125, 0.1586761474609375, 0.16744232177734375, 0.17620849609375, 0.18497467041015625, 0.1937408447265625, 0.20250701904296875, 0.211273193359375, 0.22003936767578125, 0.2288055419921875, 0.23757171630859375, 0.246337890625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 4.0, 4.0, 8.0, 5.0, 14.0, 12.0, 30.0, 31.0, 47.0, 59.0, 86.0, 105.0, 138.0, 161.0, 109.0, 53.0, 49.0, 31.0, 19.0, 16.0, 12.0, 8.0, 6.0, 3.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001499652862548828, -0.00014523044228553772, -0.00014049559831619263, -0.00013576075434684753, -0.00013102591037750244, -0.00012629106640815735, -0.00012155622243881226, -0.00011682137846946716, -0.00011208653450012207, -0.00010735169053077698, -0.00010261684656143188, -9.788200259208679e-05, -9.31471586227417e-05, -8.84123146533966e-05, -8.367747068405151e-05, -7.894262671470642e-05, -7.420778274536133e-05, -6.947293877601624e-05, -6.473809480667114e-05, -6.000325083732605e-05, -5.526840686798096e-05, -5.0533562898635864e-05, -4.579871892929077e-05, -4.106387495994568e-05, -3.6329030990600586e-05, -3.159418702125549e-05, -2.68593430519104e-05, -2.2124499082565308e-05, -1.7389655113220215e-05, -1.2654811143875122e-05, -7.91996717453003e-06, -3.1851232051849365e-06, 1.5497207641601562e-06, 6.284564733505249e-06, 1.1019408702850342e-05, 1.5754252672195435e-05, 2.0489096641540527e-05, 2.522394061088562e-05, 2.9958784580230713e-05, 3.4693628549575806e-05, 3.94284725189209e-05, 4.416331648826599e-05, 4.8898160457611084e-05, 5.363300442695618e-05, 5.836784839630127e-05, 6.310269236564636e-05, 6.783753633499146e-05, 7.257238030433655e-05, 7.730722427368164e-05, 8.204206824302673e-05, 8.677691221237183e-05, 9.151175618171692e-05, 9.624660015106201e-05, 0.0001009814441204071, 0.0001057162880897522, 0.00011045113205909729, 0.00011518597602844238, 0.00011992081999778748, 0.00012465566396713257, 0.00012939050793647766, 0.00013412535190582275, 0.00013886019587516785, 0.00014359503984451294, 0.00014832988381385803, 0.00015306472778320312]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 6.0, 3.0, 6.0, 10.0, 11.0, 18.0, 32.0, 28.0, 57.0, 111.0, 177.0, 344.0, 690.0, 1537.0, 4069.0, 15003.0, 84713.0, 502766.0, 369091.0, 53511.0, 10685.0, 3172.0, 1223.0, 565.0, 306.0, 164.0, 91.0, 52.0, 42.0, 29.0, 12.0, 13.0, 7.0, 3.0, 5.0, 1.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.22607421875, -0.2182464599609375, -0.210418701171875, -0.2025909423828125, -0.19476318359375, -0.1869354248046875, -0.179107666015625, -0.1712799072265625, -0.1634521484375, -0.1556243896484375, -0.147796630859375, -0.1399688720703125, -0.13214111328125, -0.1243133544921875, -0.116485595703125, -0.1086578369140625, -0.100830078125, -0.0930023193359375, -0.085174560546875, -0.0773468017578125, -0.06951904296875, -0.0616912841796875, -0.053863525390625, -0.0460357666015625, -0.0382080078125, -0.0303802490234375, -0.022552490234375, -0.0147247314453125, -0.00689697265625, 0.0009307861328125, 0.008758544921875, 0.0165863037109375, 0.0244140625, 0.0322418212890625, 0.040069580078125, 0.0478973388671875, 0.05572509765625, 0.0635528564453125, 0.071380615234375, 0.0792083740234375, 0.0870361328125, 0.0948638916015625, 0.102691650390625, 0.1105194091796875, 0.11834716796875, 0.1261749267578125, 0.134002685546875, 0.1418304443359375, 0.149658203125, 0.1574859619140625, 0.165313720703125, 0.1731414794921875, 0.18096923828125, 0.1887969970703125, 0.196624755859375, 0.2044525146484375, 0.2122802734375, 0.2201080322265625, 0.227935791015625, 0.2357635498046875, 0.24359130859375, 0.2514190673828125, 0.259246826171875, 0.2670745849609375, 0.27490234375]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 6.0, 3.0, 6.0, 9.0, 12.0, 18.0, 23.0, 40.0, 32.0, 68.0, 71.0, 88.0, 90.0, 101.0, 96.0, 97.0, 68.0, 50.0, 35.0, 28.0, 19.0, 9.0, 9.0, 9.0, 6.0, 4.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1790771484375, -0.17206764221191406, -0.16505813598632812, -0.1580486297607422, -0.15103912353515625, -0.1440296173095703, -0.13702011108398438, -0.13001060485839844, -0.1230010986328125, -0.11599159240722656, -0.10898208618164062, -0.10197257995605469, -0.09496307373046875, -0.08795356750488281, -0.08094406127929688, -0.07393455505371094, -0.066925048828125, -0.05991554260253906, -0.052906036376953125, -0.04589653015136719, -0.03888702392578125, -0.03187751770019531, -0.024868011474609375, -0.017858505249023438, -0.0108489990234375, -0.0038394927978515625, 0.003170013427734375, 0.010179519653320312, 0.01718902587890625, 0.024198532104492188, 0.031208038330078125, 0.03821754455566406, 0.04522705078125, 0.05223655700683594, 0.059246063232421875, 0.06625556945800781, 0.07326507568359375, 0.08027458190917969, 0.08728408813476562, 0.09429359436035156, 0.1013031005859375, 0.10831260681152344, 0.11532211303710938, 0.12233161926269531, 0.12934112548828125, 0.1363506317138672, 0.14336013793945312, 0.15036964416503906, 0.157379150390625, 0.16438865661621094, 0.17139816284179688, 0.1784076690673828, 0.18541717529296875, 0.1924266815185547, 0.19943618774414062, 0.20644569396972656, 0.2134552001953125, 0.22046470642089844, 0.22747421264648438, 0.2344837188720703, 0.24149322509765625, 0.2485027313232422, 0.2555122375488281, 0.26252174377441406, 0.26953125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 7.0, 11.0, 15.0, 26.0, 57.0, 119.0, 183.0, 232.0, 160.0, 108.0, 42.0, 21.0, 12.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.433022499084473, -4.301145076751709, -4.169267177581787, -4.037389755249023, -3.9055123329162598, -3.773634672164917, -3.641757011413574, -3.5098795890808105, -3.3780019283294678, -3.246124267578125, -3.1142468452453613, -2.9823691844940186, -2.850491523742676, -2.718614101409912, -2.5867364406585693, -2.4548587799072266, -2.322981357574463, -2.19110369682312, -2.0592262744903564, -1.9273486137390137, -1.7954710721969604, -1.6635935306549072, -1.5317158699035645, -1.3998383283615112, -1.267960786819458, -1.1360832452774048, -1.0042057037353516, -0.8723280429840088, -0.7404505014419556, -0.6085729598999023, -0.47669535875320435, -0.34481775760650635, -0.21294021606445312, -0.08106264472007751, 0.050814926624298096, 0.1826924979686737, 0.3145700693130493, 0.44644761085510254, 0.5783252120018005, 0.7102028131484985, 0.8420803546905518, 0.973957896232605, 1.1058354377746582, 1.237713098526001, 1.3695906400680542, 1.5014681816101074, 1.6333458423614502, 1.7652233839035034, 1.8971009254455566, 2.0289785861968994, 2.160856008529663, 2.292733669281006, 2.4246110916137695, 2.5564887523651123, 2.688366413116455, 2.8202438354492188, 2.9521214962005615, 3.0839991569519043, 3.215876579284668, 3.3477542400360107, 3.4796319007873535, 3.611509323120117, 3.74338698387146, 3.8752646446228027, 4.007142066955566]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 3.0, 7.0, 12.0, 10.0, 7.0, 15.0, 17.0, 25.0, 9.0, 19.0, 30.0, 31.0, 36.0, 40.0, 34.0, 41.0, 59.0, 41.0, 36.0, 51.0, 49.0, 36.0, 36.0, 32.0, 28.0, 30.0, 35.0, 27.0, 26.0, 30.0, 25.0, 16.0, 23.0, 12.0, 15.0, 12.0, 11.0, 10.0, 7.0, 3.0, 3.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 3.0, 1.0, 1.0], "bins": [-2.1684422492980957, -2.104820728302002, -2.0411994457244873, -1.9775779247283936, -1.9139564037322998, -1.8503350019454956, -1.7867136001586914, -1.7230920791625977, -1.659470558166504, -1.5958491563796997, -1.532227635383606, -1.4686062335968018, -1.404984712600708, -1.3413633108139038, -1.2777419090270996, -1.2141203880310059, -1.1504989862442017, -1.0868775844573975, -1.0232560634613037, -0.9596346616744995, -0.8960131406784058, -0.8323917388916016, -0.7687702775001526, -0.7051488161087036, -0.6415273547172546, -0.5779058933258057, -0.5142844319343567, -0.4506630003452301, -0.38704153895378113, -0.32342007756233215, -0.25979864597320557, -0.1961771845817566, -0.13255560398101807, -0.06893415004014969, -0.005312696099281311, 0.05830875039100647, 0.12193021178245544, 0.18555167317390442, 0.249173104763031, 0.31279456615448, 0.37641602754592896, 0.44003748893737793, 0.5036589503288269, 0.5672804117202759, 0.6309018135070801, 0.6945233345031738, 0.758144736289978, 0.821766197681427, 0.885387659072876, 0.949009120464325, 1.012630581855774, 1.0762519836425781, 1.1398735046386719, 1.203494906425476, 1.2671163082122803, 1.330737829208374, 1.3943593502044678, 1.457980751991272, 1.5216022729873657, 1.58522367477417, 1.6488451957702637, 1.7124665975570679, 1.776087999343872, 1.8397095203399658, 1.90333092212677]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 3.0, 4.0, 8.0, 7.0, 5.0, 12.0, 24.0, 18.0, 21.0, 34.0, 50.0, 77.0, 97.0, 140.0, 266.0, 529.0, 1482.0, 5318.0, 37078.0, 3720169.0, 406052.0, 17541.0, 3427.0, 1025.0, 410.0, 211.0, 111.0, 55.0, 31.0, 22.0, 13.0, 12.0, 9.0, 8.0, 5.0, 5.0, 6.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3740234375, -1.333404541015625, -1.29278564453125, -1.252166748046875, -1.2115478515625, -1.170928955078125, -1.13031005859375, -1.089691162109375, -1.049072265625, -1.008453369140625, -0.96783447265625, -0.927215576171875, -0.8865966796875, -0.845977783203125, -0.80535888671875, -0.764739990234375, -0.72412109375, -0.683502197265625, -0.64288330078125, -0.602264404296875, -0.5616455078125, -0.521026611328125, -0.48040771484375, -0.439788818359375, -0.399169921875, -0.358551025390625, -0.31793212890625, -0.277313232421875, -0.2366943359375, -0.196075439453125, -0.15545654296875, -0.114837646484375, -0.07421875, -0.033599853515625, 0.00701904296875, 0.047637939453125, 0.0882568359375, 0.128875732421875, 0.16949462890625, 0.210113525390625, 0.250732421875, 0.291351318359375, 0.33197021484375, 0.372589111328125, 0.4132080078125, 0.453826904296875, 0.49444580078125, 0.535064697265625, 0.57568359375, 0.616302490234375, 0.65692138671875, 0.697540283203125, 0.7381591796875, 0.778778076171875, 0.81939697265625, 0.860015869140625, 0.900634765625, 0.941253662109375, 0.98187255859375, 1.022491455078125, 1.0631103515625, 1.103729248046875, 1.14434814453125, 1.184967041015625, 1.2255859375]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 5.0, 6.0, 8.0, 10.0, 17.0, 19.0, 24.0, 28.0, 33.0, 54.0, 48.0, 62.0, 58.0, 64.0, 55.0, 76.0, 59.0, 51.0, 65.0, 50.0, 46.0, 40.0, 34.0, 24.0, 9.0, 13.0, 11.0, 7.0, 15.0, 4.0, 4.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.153076171875, -0.14856338500976562, -0.14405059814453125, -0.13953781127929688, -0.1350250244140625, -0.13051223754882812, -0.12599945068359375, -0.12148666381835938, -0.116973876953125, -0.11246109008789062, -0.10794830322265625, -0.10343551635742188, -0.0989227294921875, -0.09440994262695312, -0.08989715576171875, -0.08538436889648438, -0.08087158203125, -0.07635879516601562, -0.07184600830078125, -0.06733322143554688, -0.0628204345703125, -0.058307647705078125, -0.05379486083984375, -0.049282073974609375, -0.044769287109375, -0.040256500244140625, -0.03574371337890625, -0.031230926513671875, -0.0267181396484375, -0.022205352783203125, -0.01769256591796875, -0.013179779052734375, -0.0086669921875, -0.004154205322265625, 0.00035858154296875, 0.004871368408203125, 0.0093841552734375, 0.013896942138671875, 0.01840972900390625, 0.022922515869140625, 0.027435302734375, 0.031948089599609375, 0.03646087646484375, 0.040973663330078125, 0.0454864501953125, 0.049999237060546875, 0.05451202392578125, 0.059024810791015625, 0.06353759765625, 0.06805038452148438, 0.07256317138671875, 0.07707595825195312, 0.0815887451171875, 0.08610153198242188, 0.09061431884765625, 0.09512710571289062, 0.099639892578125, 0.10415267944335938, 0.10866546630859375, 0.11317825317382812, 0.1176910400390625, 0.12220382690429688, 0.12671661376953125, 0.13122940063476562, 0.1357421875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 1.0, 4.0, 8.0, 5.0, 7.0, 11.0, 25.0, 22.0, 41.0, 68.0, 109.0, 178.0, 256.0, 379.0, 688.0, 1271.0, 2904.0, 8756.0, 37387.0, 358946.0, 3584282.0, 163576.0, 24095.0, 6498.0, 2371.0, 1039.0, 534.0, 331.0, 191.0, 112.0, 71.0, 37.0, 27.0, 17.0, 6.0, 8.0, 7.0, 3.0, 1.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.69873046875, -0.6789703369140625, -0.659210205078125, -0.6394500732421875, -0.61968994140625, -0.5999298095703125, -0.580169677734375, -0.5604095458984375, -0.5406494140625, -0.5208892822265625, -0.501129150390625, -0.4813690185546875, -0.46160888671875, -0.4418487548828125, -0.422088623046875, -0.4023284912109375, -0.382568359375, -0.3628082275390625, -0.343048095703125, -0.3232879638671875, -0.30352783203125, -0.2837677001953125, -0.264007568359375, -0.2442474365234375, -0.2244873046875, -0.2047271728515625, -0.184967041015625, -0.1652069091796875, -0.14544677734375, -0.1256866455078125, -0.105926513671875, -0.0861663818359375, -0.06640625, -0.0466461181640625, -0.026885986328125, -0.0071258544921875, 0.01263427734375, 0.0323944091796875, 0.052154541015625, 0.0719146728515625, 0.0916748046875, 0.1114349365234375, 0.131195068359375, 0.1509552001953125, 0.17071533203125, 0.1904754638671875, 0.210235595703125, 0.2299957275390625, 0.249755859375, 0.2695159912109375, 0.289276123046875, 0.3090362548828125, 0.32879638671875, 0.3485565185546875, 0.368316650390625, 0.3880767822265625, 0.4078369140625, 0.4275970458984375, 0.447357177734375, 0.4671173095703125, 0.48687744140625, 0.5066375732421875, 0.526397705078125, 0.5461578369140625, 0.56591796875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 1.0, 2.0, 9.0, 16.0, 15.0, 31.0, 60.0, 84.0, 148.0, 377.0, 1278.0, 1265.0, 395.0, 171.0, 78.0, 42.0, 32.0, 22.0, 15.0, 13.0, 8.0, 2.0, 7.0, 3.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.399658203125, -0.38966941833496094, -0.3796806335449219, -0.3696918487548828, -0.35970306396484375, -0.3497142791748047, -0.3397254943847656, -0.32973670959472656, -0.3197479248046875, -0.30975914001464844, -0.2997703552246094, -0.2897815704345703, -0.27979278564453125, -0.2698040008544922, -0.2598152160644531, -0.24982643127441406, -0.239837646484375, -0.22984886169433594, -0.21986007690429688, -0.2098712921142578, -0.19988250732421875, -0.1898937225341797, -0.17990493774414062, -0.16991615295410156, -0.1599273681640625, -0.14993858337402344, -0.13994979858398438, -0.1299610137939453, -0.11997222900390625, -0.10998344421386719, -0.09999465942382812, -0.09000587463378906, -0.08001708984375, -0.07002830505371094, -0.060039520263671875, -0.05005073547363281, -0.04006195068359375, -0.030073165893554688, -0.020084381103515625, -0.010095596313476562, -0.0001068115234375, 0.009881973266601562, 0.019870758056640625, 0.029859542846679688, 0.03984832763671875, 0.04983711242675781, 0.059825897216796875, 0.06981468200683594, 0.079803466796875, 0.08979225158691406, 0.09978103637695312, 0.10976982116699219, 0.11975860595703125, 0.1297473907470703, 0.13973617553710938, 0.14972496032714844, 0.1597137451171875, 0.16970252990722656, 0.17969131469726562, 0.1896800994873047, 0.19966888427734375, 0.2096576690673828, 0.21964645385742188, 0.22963523864746094, 0.2396240234375]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 11.0, 24.0, 78.0, 157.0, 251.0, 225.0, 142.0, 70.0, 19.0, 9.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3143388032913208, -1.2312127351760864, -1.148086667060852, -1.0649605989456177, -0.9818344712257385, -0.8987084031105042, -0.815582275390625, -0.7324562072753906, -0.6493301391601562, -0.5662040710449219, -0.4830779731273651, -0.39995187520980835, -0.316825807094574, -0.2336997389793396, -0.15057364106178284, -0.06744754314422607, 0.0156785249710083, 0.09880460798740387, 0.18193069100379944, 0.2650567889213562, 0.3481828570365906, 0.43130892515182495, 0.5144350528717041, 0.5975611209869385, 0.6806871891021729, 0.7638132572174072, 0.8469393253326416, 0.9300654530525208, 1.0131914615631104, 1.0963175296783447, 1.1794437170028687, 1.262569785118103, 1.345695972442627, 1.4288220405578613, 1.5119481086730957, 1.59507417678833, 1.6782002449035645, 1.7613263130187988, 1.8444525003433228, 1.9275785684585571, 2.010704517364502, 2.0938305854797363, 2.1769566535949707, 2.260082721710205, 2.3432087898254395, 2.426334857940674, 2.509460926055908, 2.5925869941711426, 2.675713300704956, 2.7588393688201904, 2.841965436935425, 2.925091505050659, 3.0082175731658936, 3.091343641281128, 3.1744697093963623, 3.257596015930176, 3.34072208404541, 3.4238481521606445, 3.506974220275879, 3.5901002883911133, 3.6732263565063477, 3.756352424621582, 3.8394784927368164, 3.922604560852051, 4.005730628967285]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 3.0, 5.0, 2.0, 8.0, 5.0, 13.0, 16.0, 16.0, 18.0, 28.0, 43.0, 45.0, 55.0, 61.0, 44.0, 64.0, 71.0, 64.0, 63.0, 62.0, 47.0, 48.0, 32.0, 40.0, 27.0, 26.0, 28.0, 17.0, 21.0, 9.0, 9.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.2003357410430908, -1.1675477027893066, -1.134759545326233, -1.1019715070724487, -1.069183349609375, -1.0363953113555908, -1.003607153892517, -0.9708191156387329, -0.938031017780304, -0.905242919921875, -0.872454822063446, -0.8396667242050171, -0.8068786859512329, -0.7740905284881592, -0.741302490234375, -0.708514392375946, -0.6757262945175171, -0.6429381966590881, -0.6101500988006592, -0.5773620009422302, -0.5445739030838013, -0.5117858648300171, -0.47899776697158813, -0.4462096691131592, -0.4134215712547302, -0.38063347339630127, -0.3478453755378723, -0.31505730748176575, -0.2822692096233368, -0.24948111176490784, -0.21669302880764008, -0.18390494585037231, -0.1511167287826538, -0.11832863837480545, -0.08554054796695709, -0.052752457559108734, -0.019964367151260376, 0.012823730707168579, 0.04561181366443634, 0.0783998966217041, 0.11118799448013306, 0.143976092338562, 0.17676417529582977, 0.20955225825309753, 0.2423403561115265, 0.27512845396995544, 0.307916522026062, 0.34070461988449097, 0.3734927177429199, 0.4062808156013489, 0.43906891345977783, 0.4718569815158844, 0.5046451091766357, 0.5374331474304199, 0.5702212452888489, 0.6030093431472778, 0.6357974410057068, 0.6685855388641357, 0.7013736367225647, 0.7341617345809937, 0.7669497728347778, 0.7997379302978516, 0.8325259685516357, 0.8653140664100647, 0.8981021642684937]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 5.0, 1.0, 6.0, 4.0, 9.0, 12.0, 22.0, 42.0, 75.0, 145.0, 322.0, 866.0, 3832.0, 36161.0, 852499.0, 144229.0, 7931.0, 1548.0, 466.0, 180.0, 89.0, 54.0, 28.0, 13.0, 6.0, 4.0, 3.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.7587890625, -1.7095184326171875, -1.660247802734375, -1.6109771728515625, -1.56170654296875, -1.5124359130859375, -1.463165283203125, -1.4138946533203125, -1.3646240234375, -1.3153533935546875, -1.266082763671875, -1.2168121337890625, -1.16754150390625, -1.1182708740234375, -1.069000244140625, -1.0197296142578125, -0.970458984375, -0.9211883544921875, -0.871917724609375, -0.8226470947265625, -0.77337646484375, -0.7241058349609375, -0.674835205078125, -0.6255645751953125, -0.5762939453125, -0.5270233154296875, -0.477752685546875, -0.4284820556640625, -0.37921142578125, -0.3299407958984375, -0.280670166015625, -0.2313995361328125, -0.18212890625, -0.1328582763671875, -0.083587646484375, -0.0343170166015625, 0.01495361328125, 0.0642242431640625, 0.113494873046875, 0.1627655029296875, 0.2120361328125, 0.2613067626953125, 0.310577392578125, 0.3598480224609375, 0.40911865234375, 0.4583892822265625, 0.507659912109375, 0.5569305419921875, 0.606201171875, 0.6554718017578125, 0.704742431640625, 0.7540130615234375, 0.80328369140625, 0.8525543212890625, 0.901824951171875, 0.9510955810546875, 1.0003662109375, 1.0496368408203125, 1.098907470703125, 1.1481781005859375, 1.19744873046875, 1.2467193603515625, 1.295989990234375, 1.3452606201171875, 1.39453125]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 5.0, 1.0, 5.0, 4.0, 4.0, 7.0, 13.0, 14.0, 26.0, 33.0, 47.0, 48.0, 54.0, 79.0, 61.0, 74.0, 79.0, 46.0, 48.0, 70.0, 58.0, 49.0, 38.0, 38.0, 29.0, 23.0, 11.0, 15.0, 6.0, 9.0, 1.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17236328125, -0.16737937927246094, -0.16239547729492188, -0.1574115753173828, -0.15242767333984375, -0.1474437713623047, -0.14245986938476562, -0.13747596740722656, -0.1324920654296875, -0.12750816345214844, -0.12252426147460938, -0.11754035949707031, -0.11255645751953125, -0.10757255554199219, -0.10258865356445312, -0.09760475158691406, -0.092620849609375, -0.08763694763183594, -0.08265304565429688, -0.07766914367675781, -0.07268524169921875, -0.06770133972167969, -0.06271743774414062, -0.05773353576660156, -0.0527496337890625, -0.04776573181152344, -0.042781829833984375, -0.03779792785644531, -0.03281402587890625, -0.027830123901367188, -0.022846221923828125, -0.017862319946289062, -0.01287841796875, -0.007894515991210938, -0.002910614013671875, 0.0020732879638671875, 0.00705718994140625, 0.012041091918945312, 0.017024993896484375, 0.022008895874023438, 0.0269927978515625, 0.03197669982910156, 0.036960601806640625, 0.04194450378417969, 0.04692840576171875, 0.05191230773925781, 0.056896209716796875, 0.06188011169433594, 0.066864013671875, 0.07184791564941406, 0.07683181762695312, 0.08181571960449219, 0.08679962158203125, 0.09178352355957031, 0.09676742553710938, 0.10175132751464844, 0.1067352294921875, 0.11171913146972656, 0.11670303344726562, 0.12168693542480469, 0.12667083740234375, 0.1316547393798828, 0.13663864135742188, 0.14162254333496094, 0.1466064453125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 2.0, 9.0, 12.0, 15.0, 21.0, 25.0, 40.0, 55.0, 77.0, 124.0, 189.0, 341.0, 699.0, 1604.0, 4013.0, 12892.0, 59272.0, 345813.0, 501026.0, 94567.0, 18543.0, 5324.0, 1973.0, 895.0, 415.0, 246.0, 140.0, 65.0, 43.0, 34.0, 25.0, 13.0, 11.0, 6.0, 8.0, 4.0, 4.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0], "bins": [-0.59423828125, -0.5777931213378906, -0.5613479614257812, -0.5449028015136719, -0.5284576416015625, -0.5120124816894531, -0.49556732177734375, -0.4791221618652344, -0.462677001953125, -0.4462318420410156, -0.42978668212890625, -0.4133415222167969, -0.3968963623046875, -0.3804512023925781, -0.36400604248046875, -0.3475608825683594, -0.33111572265625, -0.3146705627441406, -0.29822540283203125, -0.2817802429199219, -0.2653350830078125, -0.24888992309570312, -0.23244476318359375, -0.21599960327148438, -0.199554443359375, -0.18310928344726562, -0.16666412353515625, -0.15021896362304688, -0.1337738037109375, -0.11732864379882812, -0.10088348388671875, -0.08443832397460938, -0.0679931640625, -0.051548004150390625, -0.03510284423828125, -0.018657684326171875, -0.0022125244140625, 0.014232635498046875, 0.03067779541015625, 0.047122955322265625, 0.063568115234375, 0.08001327514648438, 0.09645843505859375, 0.11290359497070312, 0.1293487548828125, 0.14579391479492188, 0.16223907470703125, 0.17868423461914062, 0.19512939453125, 0.21157455444335938, 0.22801971435546875, 0.24446487426757812, 0.2609100341796875, 0.2773551940917969, 0.29380035400390625, 0.3102455139160156, 0.326690673828125, 0.3431358337402344, 0.35958099365234375, 0.3760261535644531, 0.3924713134765625, 0.4089164733886719, 0.42536163330078125, 0.4418067932128906, 0.458251953125]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 5.0, 5.0, 8.0, 5.0, 7.0, 5.0, 10.0, 7.0, 10.0, 11.0, 17.0, 18.0, 20.0, 25.0, 24.0, 30.0, 28.0, 33.0, 36.0, 42.0, 40.0, 44.0, 31.0, 40.0, 43.0, 46.0, 44.0, 39.0, 41.0, 37.0, 36.0, 44.0, 31.0, 21.0, 21.0, 12.0, 10.0, 9.0, 10.0, 11.0, 9.0, 6.0, 5.0, 9.0, 4.0, 8.0, 5.0, 3.0, 4.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4013671875, -0.3892097473144531, -0.37705230712890625, -0.3648948669433594, -0.3527374267578125, -0.3405799865722656, -0.32842254638671875, -0.3162651062011719, -0.304107666015625, -0.2919502258300781, -0.27979278564453125, -0.2676353454589844, -0.2554779052734375, -0.24332046508789062, -0.23116302490234375, -0.21900558471679688, -0.20684814453125, -0.19469070434570312, -0.18253326416015625, -0.17037582397460938, -0.1582183837890625, -0.14606094360351562, -0.13390350341796875, -0.12174606323242188, -0.109588623046875, -0.09743118286132812, -0.08527374267578125, -0.07311630249023438, -0.0609588623046875, -0.048801422119140625, -0.03664398193359375, -0.024486541748046875, -0.0123291015625, -0.000171661376953125, 0.01198577880859375, 0.024143218994140625, 0.0363006591796875, 0.048458099365234375, 0.06061553955078125, 0.07277297973632812, 0.084930419921875, 0.09708786010742188, 0.10924530029296875, 0.12140274047851562, 0.1335601806640625, 0.14571762084960938, 0.15787506103515625, 0.17003250122070312, 0.18218994140625, 0.19434738159179688, 0.20650482177734375, 0.21866226196289062, 0.2308197021484375, 0.24297714233398438, 0.25513458251953125, 0.2672920227050781, 0.279449462890625, 0.2916069030761719, 0.30376434326171875, 0.3159217834472656, 0.3280792236328125, 0.3402366638183594, 0.35239410400390625, 0.3645515441894531, 0.376708984375]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 6.0, 10.0, 11.0, 19.0, 23.0, 50.0, 128.0, 229.0, 417.0, 1038.0, 3150.0, 27613.0, 713677.0, 287924.0, 10745.0, 2037.0, 782.0, 350.0, 164.0, 78.0, 42.0, 27.0, 20.0, 6.0, 6.0, 2.0, 5.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.398681640625, -0.3875541687011719, -0.37642669677734375, -0.3652992248535156, -0.3541717529296875, -0.3430442810058594, -0.33191680908203125, -0.3207893371582031, -0.309661865234375, -0.2985343933105469, -0.28740692138671875, -0.2762794494628906, -0.2651519775390625, -0.2540245056152344, -0.24289703369140625, -0.23176956176757812, -0.22064208984375, -0.20951461791992188, -0.19838714599609375, -0.18725967407226562, -0.1761322021484375, -0.16500473022460938, -0.15387725830078125, -0.14274978637695312, -0.131622314453125, -0.12049484252929688, -0.10936737060546875, -0.09823989868164062, -0.0871124267578125, -0.07598495483398438, -0.06485748291015625, -0.053730010986328125, -0.0426025390625, -0.031475067138671875, -0.02034759521484375, -0.009220123291015625, 0.0019073486328125, 0.013034820556640625, 0.02416229248046875, 0.035289764404296875, 0.046417236328125, 0.057544708251953125, 0.06867218017578125, 0.07979965209960938, 0.0909271240234375, 0.10205459594726562, 0.11318206787109375, 0.12430953979492188, 0.13543701171875, 0.14656448364257812, 0.15769195556640625, 0.16881942749023438, 0.1799468994140625, 0.19107437133789062, 0.20220184326171875, 0.21332931518554688, 0.224456787109375, 0.23558425903320312, 0.24671173095703125, 0.2578392028808594, 0.2689666748046875, 0.2800941467285156, 0.29122161865234375, 0.3023490905761719, 0.3134765625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 0.0, 5.0, 10.0, 16.0, 35.0, 76.0, 153.0, 238.0, 204.0, 144.0, 53.0, 32.0, 22.0, 6.0, 5.0, 6.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00019598007202148438, -0.00018896162509918213, -0.00018194317817687988, -0.00017492473125457764, -0.0001679062843322754, -0.00016088783740997314, -0.0001538693904876709, -0.00014685094356536865, -0.0001398324966430664, -0.00013281404972076416, -0.00012579560279846191, -0.00011877715587615967, -0.00011175870895385742, -0.00010474026203155518, -9.772181510925293e-05, -9.070336818695068e-05, -8.368492126464844e-05, -7.666647434234619e-05, -6.964802742004395e-05, -6.26295804977417e-05, -5.561113357543945e-05, -4.859268665313721e-05, -4.157423973083496e-05, -3.4555792808532715e-05, -2.753734588623047e-05, -2.0518898963928223e-05, -1.3500452041625977e-05, -6.4820051193237305e-06, 5.364418029785156e-07, 7.554888725280762e-06, 1.4573335647583008e-05, 2.1591782569885254e-05, 2.86102294921875e-05, 3.5628676414489746e-05, 4.264712333679199e-05, 4.966557025909424e-05, 5.6684017181396484e-05, 6.370246410369873e-05, 7.072091102600098e-05, 7.773935794830322e-05, 8.475780487060547e-05, 9.177625179290771e-05, 9.879469871520996e-05, 0.00010581314563751221, 0.00011283159255981445, 0.0001198500394821167, 0.00012686848640441895, 0.0001338869333267212, 0.00014090538024902344, 0.00014792382717132568, 0.00015494227409362793, 0.00016196072101593018, 0.00016897916793823242, 0.00017599761486053467, 0.00018301606178283691, 0.00019003450870513916, 0.0001970529556274414, 0.00020407140254974365, 0.0002110898494720459, 0.00021810829639434814, 0.0002251267433166504, 0.00023214519023895264, 0.00023916363716125488, 0.00024618208408355713, 0.0002532005310058594]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 0.0, 6.0, 5.0, 6.0, 5.0, 20.0, 24.0, 31.0, 45.0, 72.0, 154.0, 239.0, 533.0, 1719.0, 9348.0, 146489.0, 828981.0, 53823.0, 4999.0, 1142.0, 426.0, 187.0, 92.0, 59.0, 50.0, 35.0, 24.0, 16.0, 9.0, 4.0, 3.0, 1.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.344482421875, -0.3331298828125, -0.32177734375, -0.3104248046875, -0.299072265625, -0.2877197265625, -0.2763671875, -0.2650146484375, -0.253662109375, -0.2423095703125, -0.23095703125, -0.2196044921875, -0.208251953125, -0.1968994140625, -0.185546875, -0.1741943359375, -0.162841796875, -0.1514892578125, -0.14013671875, -0.1287841796875, -0.117431640625, -0.1060791015625, -0.0947265625, -0.0833740234375, -0.072021484375, -0.0606689453125, -0.04931640625, -0.0379638671875, -0.026611328125, -0.0152587890625, -0.00390625, 0.0074462890625, 0.018798828125, 0.0301513671875, 0.04150390625, 0.0528564453125, 0.064208984375, 0.0755615234375, 0.0869140625, 0.0982666015625, 0.109619140625, 0.1209716796875, 0.13232421875, 0.1436767578125, 0.155029296875, 0.1663818359375, 0.177734375, 0.1890869140625, 0.200439453125, 0.2117919921875, 0.22314453125, 0.2344970703125, 0.245849609375, 0.2572021484375, 0.2685546875, 0.2799072265625, 0.291259765625, 0.3026123046875, 0.31396484375, 0.3253173828125, 0.336669921875, 0.3480224609375, 0.359375, 0.3707275390625, 0.382080078125]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 4.0, 7.0, 5.0, 21.0, 29.0, 36.0, 52.0, 80.0, 121.0, 123.0, 126.0, 133.0, 84.0, 75.0, 50.0, 22.0, 18.0, 11.0, 7.0, 5.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.20849609375, -0.20026779174804688, -0.19203948974609375, -0.18381118774414062, -0.1755828857421875, -0.16735458374023438, -0.15912628173828125, -0.15089797973632812, -0.142669677734375, -0.13444137573242188, -0.12621307373046875, -0.11798477172851562, -0.1097564697265625, -0.10152816772460938, -0.09329986572265625, -0.08507156372070312, -0.07684326171875, -0.06861495971679688, -0.06038665771484375, -0.052158355712890625, -0.0439300537109375, -0.035701751708984375, -0.02747344970703125, -0.019245147705078125, -0.011016845703125, -0.002788543701171875, 0.00543975830078125, 0.013668060302734375, 0.0218963623046875, 0.030124664306640625, 0.03835296630859375, 0.046581268310546875, 0.0548095703125, 0.06303787231445312, 0.07126617431640625, 0.07949447631835938, 0.0877227783203125, 0.09595108032226562, 0.10417938232421875, 0.11240768432617188, 0.120635986328125, 0.12886428833007812, 0.13709259033203125, 0.14532089233398438, 0.1535491943359375, 0.16177749633789062, 0.17000579833984375, 0.17823410034179688, 0.18646240234375, 0.19469070434570312, 0.20291900634765625, 0.21114730834960938, 0.2193756103515625, 0.22760391235351562, 0.23583221435546875, 0.24406051635742188, 0.252288818359375, 0.2605171203613281, 0.26874542236328125, 0.2769737243652344, 0.2852020263671875, 0.2934303283691406, 0.30165863037109375, 0.3098869323730469, 0.318115234375]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [3.0, 5.0, 8.0, 19.0, 38.0, 79.0, 157.0, 218.0, 214.0, 150.0, 65.0, 26.0, 15.0, 9.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2401728630065918, -1.08524751663208, -0.9303220510482788, -0.7753966450691223, -0.6204712390899658, -0.4655458331108093, -0.31062042713165283, -0.15569496154785156, -0.0007696151733398438, 0.15415579080581665, 0.30908119678497314, 0.46400660276412964, 0.6189320087432861, 0.7738574147224426, 0.9287828207015991, 1.0837082862854004, 1.238633632659912, 1.3935589790344238, 1.548484444618225, 1.7034099102020264, 1.858335256576538, 2.01326060295105, 2.1681861877441406, 2.3231115341186523, 2.478036880493164, 2.632962226867676, 2.7878875732421875, 2.9428131580352783, 3.09773850440979, 3.2526638507843018, 3.4075894355773926, 3.5625147819519043, 3.717439651489258, 3.8723649978637695, 4.027290344238281, 4.182215690612793, 4.337141036987305, 4.492066860198975, 4.646992206573486, 4.801917552947998, 4.95684289932251, 5.1117682456970215, 5.266693592071533, 5.421618938446045, 5.576544761657715, 5.731470108032227, 5.886395454406738, 6.04132080078125, 6.196246147155762, 6.351171493530273, 6.506096839904785, 6.661022186279297, 6.815947532653809, 6.9708733558654785, 7.12579870223999, 7.280724048614502, 7.435649394989014, 7.590574741363525, 7.745500087738037, 7.900425434112549, 8.055351257324219, 8.21027660369873, 8.365201950073242, 8.520127296447754, 8.675052642822266]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 3.0, 7.0, 7.0, 7.0, 10.0, 8.0, 14.0, 13.0, 13.0, 13.0, 18.0, 14.0, 26.0, 21.0, 23.0, 28.0, 20.0, 29.0, 36.0, 22.0, 29.0, 36.0, 34.0, 35.0, 32.0, 41.0, 38.0, 34.0, 36.0, 37.0, 28.0, 27.0, 26.0, 31.0, 32.0, 28.0, 27.0, 13.0, 17.0, 17.0, 14.0, 12.0, 9.0, 7.0, 11.0, 8.0, 1.0, 0.0, 4.0, 6.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.6670024394989014, -1.6125273704528809, -1.5580523014068604, -1.5035772323608398, -1.4491021633148193, -1.3946270942687988, -1.3401521444320679, -1.2856770753860474, -1.2312020063400269, -1.1767269372940063, -1.1222518682479858, -1.0677767992019653, -1.0133018493652344, -0.9588267207145691, -0.9043517112731934, -0.8498766422271729, -0.7954015731811523, -0.7409265041351318, -0.6864514350891113, -0.6319764256477356, -0.5775013566017151, -0.5230262875556946, -0.46855124831199646, -0.41407620906829834, -0.35960114002227783, -0.3051260709762573, -0.2506510317325592, -0.1961759775876999, -0.14170092344284058, -0.08722585439682007, -0.03275081515312195, 0.021724224090576172, 0.07619941234588623, 0.13067446649074554, 0.18514952063560486, 0.23962457478046417, 0.2940996289253235, 0.348574697971344, 0.4030497372150421, 0.45752477645874023, 0.5119998455047607, 0.5664749145507812, 0.6209499835968018, 0.6754249930381775, 0.729900062084198, 0.7843751311302185, 0.8388501405715942, 0.8933252096176147, 0.9478002786636353, 1.0022753477096558, 1.0567504167556763, 1.1112254858016968, 1.1657004356384277, 1.2201755046844482, 1.2746505737304688, 1.3291256427764893, 1.3836007118225098, 1.4380757808685303, 1.4925508499145508, 1.5470259189605713, 1.6015009880065918, 1.6559760570526123, 1.7104510068893433, 1.7649260759353638, 1.8194011449813843]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 3.0, 3.0, 5.0, 3.0, 4.0, 6.0, 8.0, 8.0, 9.0, 18.0, 13.0, 26.0, 29.0, 36.0, 33.0, 61.0, 116.0, 153.0, 269.0, 598.0, 1394.0, 4382.0, 20109.0, 212662.0, 3845796.0, 90990.0, 12451.0, 3062.0, 1061.0, 443.0, 191.0, 125.0, 88.0, 45.0, 24.0, 23.0, 10.0, 9.0, 9.0, 4.0, 3.0, 2.0, 2.0, 0.0, 4.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.05078125, -1.0201950073242188, -0.9896087646484375, -0.9590225219726562, -0.928436279296875, -0.8978500366210938, -0.8672637939453125, -0.8366775512695312, -0.80609130859375, -0.7755050659179688, -0.7449188232421875, -0.7143325805664062, -0.683746337890625, -0.6531600952148438, -0.6225738525390625, -0.5919876098632812, -0.5614013671875, -0.5308151245117188, -0.5002288818359375, -0.46964263916015625, -0.439056396484375, -0.40847015380859375, -0.3778839111328125, -0.34729766845703125, -0.31671142578125, -0.28612518310546875, -0.2555389404296875, -0.22495269775390625, -0.194366455078125, -0.16378021240234375, -0.1331939697265625, -0.10260772705078125, -0.072021484375, -0.04143524169921875, -0.0108489990234375, 0.01973724365234375, 0.050323486328125, 0.08090972900390625, 0.1114959716796875, 0.14208221435546875, 0.17266845703125, 0.20325469970703125, 0.2338409423828125, 0.26442718505859375, 0.295013427734375, 0.32559967041015625, 0.3561859130859375, 0.38677215576171875, 0.4173583984375, 0.44794464111328125, 0.4785308837890625, 0.5091171264648438, 0.539703369140625, 0.5702896118164062, 0.6008758544921875, 0.6314620971679688, 0.66204833984375, 0.6926345825195312, 0.7232208251953125, 0.7538070678710938, 0.784393310546875, 0.8149795532226562, 0.8455657958984375, 0.8761520385742188, 0.90673828125]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 5.0, 9.0, 11.0, 19.0, 10.0, 15.0, 37.0, 33.0, 41.0, 54.0, 56.0, 63.0, 67.0, 75.0, 69.0, 68.0, 49.0, 46.0, 38.0, 60.0, 30.0, 31.0, 25.0, 23.0, 18.0, 12.0, 12.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1690673828125, -0.16409873962402344, -0.15913009643554688, -0.1541614532470703, -0.14919281005859375, -0.1442241668701172, -0.13925552368164062, -0.13428688049316406, -0.1293182373046875, -0.12434959411621094, -0.11938095092773438, -0.11441230773925781, -0.10944366455078125, -0.10447502136230469, -0.09950637817382812, -0.09453773498535156, -0.089569091796875, -0.08460044860839844, -0.07963180541992188, -0.07466316223144531, -0.06969451904296875, -0.06472587585449219, -0.059757232666015625, -0.05478858947753906, -0.0498199462890625, -0.04485130310058594, -0.039882659912109375, -0.03491401672363281, -0.02994537353515625, -0.024976730346679688, -0.020008087158203125, -0.015039443969726562, -0.01007080078125, -0.0051021575927734375, -0.000133514404296875, 0.0048351287841796875, 0.00980377197265625, 0.014772415161132812, 0.019741058349609375, 0.024709701538085938, 0.0296783447265625, 0.03464698791503906, 0.039615631103515625, 0.04458427429199219, 0.04955291748046875, 0.05452156066894531, 0.059490203857421875, 0.06445884704589844, 0.069427490234375, 0.07439613342285156, 0.07936477661132812, 0.08433341979980469, 0.08930206298828125, 0.09427070617675781, 0.09923934936523438, 0.10420799255371094, 0.1091766357421875, 0.11414527893066406, 0.11911392211914062, 0.12408256530761719, 0.12905120849609375, 0.1340198516845703, 0.13898849487304688, 0.14395713806152344, 0.14892578125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 2.0, 2.0, 2.0, 1.0, 2.0, 5.0, 5.0, 12.0, 20.0, 25.0, 33.0, 44.0, 83.0, 120.0, 202.0, 417.0, 987.0, 2856.0, 11016.0, 71712.0, 3769814.0, 305477.0, 23543.0, 5072.0, 1562.0, 584.0, 293.0, 145.0, 95.0, 63.0, 37.0, 18.0, 20.0, 1.0, 10.0, 3.0, 2.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0048828125, -0.9750900268554688, -0.9452972412109375, -0.9155044555664062, -0.885711669921875, -0.8559188842773438, -0.8261260986328125, -0.7963333129882812, -0.76654052734375, -0.7367477416992188, -0.7069549560546875, -0.6771621704101562, -0.647369384765625, -0.6175765991210938, -0.5877838134765625, -0.5579910278320312, -0.5281982421875, -0.49840545654296875, -0.4686126708984375, -0.43881988525390625, -0.409027099609375, -0.37923431396484375, -0.3494415283203125, -0.31964874267578125, -0.28985595703125, -0.26006317138671875, -0.2302703857421875, -0.20047760009765625, -0.170684814453125, -0.14089202880859375, -0.1110992431640625, -0.08130645751953125, -0.051513671875, -0.02172088623046875, 0.0080718994140625, 0.03786468505859375, 0.067657470703125, 0.09745025634765625, 0.1272430419921875, 0.15703582763671875, 0.18682861328125, 0.21662139892578125, 0.2464141845703125, 0.27620697021484375, 0.305999755859375, 0.33579254150390625, 0.3655853271484375, 0.39537811279296875, 0.4251708984375, 0.45496368408203125, 0.4847564697265625, 0.5145492553710938, 0.544342041015625, 0.5741348266601562, 0.6039276123046875, 0.6337203979492188, 0.66351318359375, 0.6933059692382812, 0.7230987548828125, 0.7528915405273438, 0.782684326171875, 0.8124771118164062, 0.8422698974609375, 0.8720626831054688, 0.90185546875]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 4.0, 6.0, 10.0, 12.0, 22.0, 44.0, 66.0, 141.0, 440.0, 2217.0, 729.0, 196.0, 86.0, 41.0, 25.0, 19.0, 8.0, 7.0, 3.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.55029296875, -0.5382347106933594, -0.5261764526367188, -0.5141181945800781, -0.5020599365234375, -0.4900016784667969, -0.47794342041015625, -0.4658851623535156, -0.453826904296875, -0.4417686462402344, -0.42971038818359375, -0.4176521301269531, -0.4055938720703125, -0.3935356140136719, -0.38147735595703125, -0.3694190979003906, -0.35736083984375, -0.3453025817871094, -0.33324432373046875, -0.3211860656738281, -0.3091278076171875, -0.2970695495605469, -0.28501129150390625, -0.2729530334472656, -0.260894775390625, -0.24883651733398438, -0.23677825927734375, -0.22472000122070312, -0.2126617431640625, -0.20060348510742188, -0.18854522705078125, -0.17648696899414062, -0.1644287109375, -0.15237045288085938, -0.14031219482421875, -0.12825393676757812, -0.1161956787109375, -0.10413742065429688, -0.09207916259765625, -0.08002090454101562, -0.067962646484375, -0.055904388427734375, -0.04384613037109375, -0.031787872314453125, -0.0197296142578125, -0.007671356201171875, 0.00438690185546875, 0.016445159912109375, 0.02850341796875, 0.040561676025390625, 0.05261993408203125, 0.06467819213867188, 0.0767364501953125, 0.08879470825195312, 0.10085296630859375, 0.11291122436523438, 0.124969482421875, 0.13702774047851562, 0.14908599853515625, 0.16114425659179688, 0.1732025146484375, 0.18526077270507812, 0.19731903076171875, 0.20937728881835938, 0.221435546875]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 3.0, 3.0, 7.0, 7.0, 13.0, 29.0, 73.0, 94.0, 160.0, 176.0, 167.0, 104.0, 82.0, 47.0, 14.0, 12.0, 3.0, 5.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2688374519348145, -2.2154757976531982, -2.162114143371582, -2.108752489089966, -2.0553908348083496, -2.0020289421081543, -1.948667287826538, -1.8953056335449219, -1.8419439792633057, -1.7885823249816895, -1.7352206707000732, -1.6818588972091675, -1.6284972429275513, -1.575135588645935, -1.5217738151550293, -1.468412160873413, -1.4150505065917969, -1.3616888523101807, -1.3083271980285645, -1.2549654245376587, -1.2016037702560425, -1.1482421159744263, -1.0948803424835205, -1.0415186882019043, -0.9881570339202881, -0.9347953796386719, -0.8814336657524109, -0.8280719518661499, -0.7747102975845337, -0.7213486433029175, -0.6679869294166565, -0.6146252155303955, -0.5612634420394897, -0.5079017877578735, -0.45454007387161255, -0.40117838978767395, -0.34781670570373535, -0.29445502161979675, -0.24109333753585815, -0.18773165345191956, -0.13436996936798096, -0.08100828528404236, -0.02764660120010376, 0.02571508288383484, 0.07907676696777344, 0.13243845105171204, 0.18580013513565063, 0.23916181921958923, 0.29252350330352783, 0.34588518738746643, 0.39924687147140503, 0.45260855555534363, 0.5059702396392822, 0.5593318939208984, 0.6126936078071594, 0.6660553216934204, 0.7194169759750366, 0.7727786302566528, 0.8261403441429138, 0.8795020580291748, 0.932863712310791, 0.9862253665924072, 1.0395870208740234, 1.0929487943649292, 1.1463104486465454]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 9.0, 5.0, 16.0, 32.0, 36.0, 47.0, 73.0, 74.0, 84.0, 78.0, 93.0, 76.0, 82.0, 63.0, 83.0, 43.0, 26.0, 28.0, 16.0, 14.0, 8.0, 7.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1397440433502197, -1.0986794233322144, -1.057614803314209, -1.016550064086914, -0.9754854440689087, -0.9344208240509033, -0.893356204032898, -0.8522915244102478, -0.8112268447875977, -0.7701622247695923, -0.7290975451469421, -0.6880329251289368, -0.6469682455062866, -0.6059036254882812, -0.5648390054702759, -0.5237743258476257, -0.48270970582962036, -0.4416450560092926, -0.40058040618896484, -0.3595157861709595, -0.3184511065483093, -0.27738648653030396, -0.2363218367099762, -0.19525718688964844, -0.15419253706932068, -0.11312788724899292, -0.07206324487924576, -0.030998602509498596, 0.010066047310829163, 0.05113069713115692, 0.09219533205032349, 0.13325998187065125, 0.174324631690979, 0.21538928151130676, 0.2564539313316345, 0.2975185513496399, 0.33858323097229004, 0.3796478509902954, 0.42071250081062317, 0.4617771506309509, 0.5028418302536011, 0.5439064502716064, 0.5849711298942566, 0.626035749912262, 0.6671004295349121, 0.7081650495529175, 0.7492296695709229, 0.790294349193573, 0.8313589692115784, 0.8724235892295837, 0.9134882688522339, 0.9545528888702393, 0.9956175684928894, 1.0366822481155396, 1.077746868133545, 1.1188114881515503, 1.1598761081695557, 1.200940728187561, 1.2420053482055664, 1.2830700874328613, 1.3241347074508667, 1.365199327468872, 1.4062639474868774, 1.4473285675048828, 1.4883933067321777]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 0.0, 3.0, 3.0, 9.0, 5.0, 10.0, 10.0, 19.0, 19.0, 26.0, 40.0, 69.0, 84.0, 138.0, 229.0, 412.0, 873.0, 2323.0, 7964.0, 43836.0, 376107.0, 533912.0, 66448.0, 10903.0, 2907.0, 1073.0, 465.0, 237.0, 142.0, 96.0, 51.0, 45.0, 22.0, 17.0, 11.0, 17.0, 7.0, 8.0, 3.0, 7.0, 1.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.88720703125, -0.8604049682617188, -0.8336029052734375, -0.8068008422851562, -0.779998779296875, -0.7531967163085938, -0.7263946533203125, -0.6995925903320312, -0.67279052734375, -0.6459884643554688, -0.6191864013671875, -0.5923843383789062, -0.565582275390625, -0.5387802124023438, -0.5119781494140625, -0.48517608642578125, -0.4583740234375, -0.43157196044921875, -0.4047698974609375, -0.37796783447265625, -0.351165771484375, -0.32436370849609375, -0.2975616455078125, -0.27075958251953125, -0.24395751953125, -0.21715545654296875, -0.1903533935546875, -0.16355133056640625, -0.136749267578125, -0.10994720458984375, -0.0831451416015625, -0.05634307861328125, -0.029541015625, -0.00273895263671875, 0.0240631103515625, 0.05086517333984375, 0.077667236328125, 0.10446929931640625, 0.1312713623046875, 0.15807342529296875, 0.18487548828125, 0.21167755126953125, 0.2384796142578125, 0.26528167724609375, 0.292083740234375, 0.31888580322265625, 0.3456878662109375, 0.37248992919921875, 0.3992919921875, 0.42609405517578125, 0.4528961181640625, 0.47969818115234375, 0.506500244140625, 0.5333023071289062, 0.5601043701171875, 0.5869064331054688, 0.61370849609375, 0.6405105590820312, 0.6673126220703125, 0.6941146850585938, 0.720916748046875, 0.7477188110351562, 0.7745208740234375, 0.8013229370117188, 0.828125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 4.0, 2.0, 4.0, 4.0, 8.0, 8.0, 10.0, 17.0, 25.0, 28.0, 34.0, 38.0, 51.0, 49.0, 73.0, 78.0, 74.0, 49.0, 71.0, 59.0, 53.0, 42.0, 51.0, 35.0, 35.0, 24.0, 17.0, 14.0, 12.0, 12.0, 7.0, 6.0, 2.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.19287109375, -0.18738555908203125, -0.1819000244140625, -0.17641448974609375, -0.170928955078125, -0.16544342041015625, -0.1599578857421875, -0.15447235107421875, -0.14898681640625, -0.14350128173828125, -0.1380157470703125, -0.13253021240234375, -0.127044677734375, -0.12155914306640625, -0.1160736083984375, -0.11058807373046875, -0.1051025390625, -0.09961700439453125, -0.0941314697265625, -0.08864593505859375, -0.083160400390625, -0.07767486572265625, -0.0721893310546875, -0.06670379638671875, -0.06121826171875, -0.05573272705078125, -0.0502471923828125, -0.04476165771484375, -0.039276123046875, -0.03379058837890625, -0.0283050537109375, -0.02281951904296875, -0.017333984375, -0.01184844970703125, -0.0063629150390625, -0.00087738037109375, 0.004608154296875, 0.01009368896484375, 0.0155792236328125, 0.02106475830078125, 0.02655029296875, 0.03203582763671875, 0.0375213623046875, 0.04300689697265625, 0.048492431640625, 0.05397796630859375, 0.0594635009765625, 0.06494903564453125, 0.0704345703125, 0.07592010498046875, 0.0814056396484375, 0.08689117431640625, 0.092376708984375, 0.09786224365234375, 0.1033477783203125, 0.10883331298828125, 0.11431884765625, 0.11980438232421875, 0.1252899169921875, 0.13077545166015625, 0.136260986328125, 0.14174652099609375, 0.1472320556640625, 0.15271759033203125, 0.158203125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 3.0, 3.0, 5.0, 3.0, 3.0, 12.0, 10.0, 14.0, 19.0, 34.0, 58.0, 71.0, 134.0, 261.0, 493.0, 994.0, 2558.0, 7297.0, 23196.0, 84799.0, 306579.0, 428237.0, 139179.0, 37139.0, 10947.0, 3653.0, 1473.0, 596.0, 290.0, 178.0, 111.0, 67.0, 38.0, 31.0, 19.0, 17.0, 10.0, 5.0, 12.0, 3.0, 0.0, 5.0, 0.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44140625, -0.4276924133300781, -0.41397857666015625, -0.4002647399902344, -0.3865509033203125, -0.3728370666503906, -0.35912322998046875, -0.3454093933105469, -0.331695556640625, -0.3179817199707031, -0.30426788330078125, -0.2905540466308594, -0.2768402099609375, -0.2631263732910156, -0.24941253662109375, -0.23569869995117188, -0.22198486328125, -0.20827102661132812, -0.19455718994140625, -0.18084335327148438, -0.1671295166015625, -0.15341567993164062, -0.13970184326171875, -0.12598800659179688, -0.112274169921875, -0.09856033325195312, -0.08484649658203125, -0.07113265991210938, -0.0574188232421875, -0.043704986572265625, -0.02999114990234375, -0.016277313232421875, -0.0025634765625, 0.011150360107421875, 0.02486419677734375, 0.038578033447265625, 0.0522918701171875, 0.06600570678710938, 0.07971954345703125, 0.09343338012695312, 0.107147216796875, 0.12086105346679688, 0.13457489013671875, 0.14828872680664062, 0.1620025634765625, 0.17571640014648438, 0.18943023681640625, 0.20314407348632812, 0.21685791015625, 0.23057174682617188, 0.24428558349609375, 0.2579994201660156, 0.2717132568359375, 0.2854270935058594, 0.29914093017578125, 0.3128547668457031, 0.326568603515625, 0.3402824401855469, 0.35399627685546875, 0.3677101135253906, 0.3814239501953125, 0.3951377868652344, 0.40885162353515625, 0.4225654602050781, 0.436279296875]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 3.0, 4.0, 3.0, 7.0, 8.0, 6.0, 18.0, 13.0, 23.0, 18.0, 25.0, 26.0, 28.0, 28.0, 37.0, 50.0, 42.0, 49.0, 42.0, 44.0, 50.0, 45.0, 46.0, 40.0, 41.0, 41.0, 34.0, 26.0, 32.0, 22.0, 23.0, 17.0, 21.0, 16.0, 18.0, 18.0, 16.0, 6.0, 9.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.5712890625, -0.5552406311035156, -0.5391921997070312, -0.5231437683105469, -0.5070953369140625, -0.4910469055175781, -0.47499847412109375, -0.4589500427246094, -0.442901611328125, -0.4268531799316406, -0.41080474853515625, -0.3947563171386719, -0.3787078857421875, -0.3626594543457031, -0.34661102294921875, -0.3305625915527344, -0.31451416015625, -0.2984657287597656, -0.28241729736328125, -0.2663688659667969, -0.2503204345703125, -0.23427200317382812, -0.21822357177734375, -0.20217514038085938, -0.186126708984375, -0.17007827758789062, -0.15402984619140625, -0.13798141479492188, -0.1219329833984375, -0.10588455200195312, -0.08983612060546875, -0.07378768920898438, -0.0577392578125, -0.041690826416015625, -0.02564239501953125, -0.009593963623046875, 0.0064544677734375, 0.022502899169921875, 0.03855133056640625, 0.054599761962890625, 0.070648193359375, 0.08669662475585938, 0.10274505615234375, 0.11879348754882812, 0.1348419189453125, 0.15089035034179688, 0.16693878173828125, 0.18298721313476562, 0.19903564453125, 0.21508407592773438, 0.23113250732421875, 0.24718093872070312, 0.2632293701171875, 0.2792778015136719, 0.29532623291015625, 0.3113746643066406, 0.327423095703125, 0.3434715270996094, 0.35951995849609375, 0.3755683898925781, 0.3916168212890625, 0.4076652526855469, 0.42371368408203125, 0.4397621154785156, 0.455810546875]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 9.0, 4.0, 10.0, 12.0, 15.0, 19.0, 41.0, 92.0, 161.0, 287.0, 593.0, 1379.0, 3972.0, 17036.0, 158414.0, 711031.0, 133915.0, 15343.0, 3773.0, 1311.0, 533.0, 267.0, 138.0, 63.0, 48.0, 39.0, 22.0, 14.0, 4.0, 6.0, 2.0, 4.0, 1.0, 1.0, 1.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-0.328369140625, -0.3200492858886719, -0.31172943115234375, -0.3034095764160156, -0.2950897216796875, -0.2867698669433594, -0.27845001220703125, -0.2701301574707031, -0.261810302734375, -0.2534904479980469, -0.24517059326171875, -0.23685073852539062, -0.2285308837890625, -0.22021102905273438, -0.21189117431640625, -0.20357131958007812, -0.19525146484375, -0.18693161010742188, -0.17861175537109375, -0.17029190063476562, -0.1619720458984375, -0.15365219116210938, -0.14533233642578125, -0.13701248168945312, -0.128692626953125, -0.12037277221679688, -0.11205291748046875, -0.10373306274414062, -0.0954132080078125, -0.08709335327148438, -0.07877349853515625, -0.07045364379882812, -0.0621337890625, -0.053813934326171875, -0.04549407958984375, -0.037174224853515625, -0.0288543701171875, -0.020534515380859375, -0.01221466064453125, -0.003894805908203125, 0.004425048828125, 0.012744903564453125, 0.02106475830078125, 0.029384613037109375, 0.0377044677734375, 0.046024322509765625, 0.05434417724609375, 0.06266403198242188, 0.07098388671875, 0.07930374145507812, 0.08762359619140625, 0.09594345092773438, 0.1042633056640625, 0.11258316040039062, 0.12090301513671875, 0.12922286987304688, 0.137542724609375, 0.14586257934570312, 0.15418243408203125, 0.16250228881835938, 0.1708221435546875, 0.17914199829101562, 0.18746185302734375, 0.19578170776367188, 0.2041015625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 9.0, 12.0, 21.0, 23.0, 49.0, 93.0, 225.0, 290.0, 144.0, 64.0, 31.0, 17.0, 11.0, 8.0, 7.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00017142295837402344, -0.00016513094305992126, -0.0001588389277458191, -0.00015254691243171692, -0.00014625489711761475, -0.00013996288180351257, -0.0001336708664894104, -0.00012737885117530823, -0.00012108683586120605, -0.00011479482054710388, -0.00010850280523300171, -0.00010221078991889954, -9.591877460479736e-05, -8.962675929069519e-05, -8.333474397659302e-05, -7.704272866249084e-05, -7.075071334838867e-05, -6.44586980342865e-05, -5.8166682720184326e-05, -5.187466740608215e-05, -4.558265209197998e-05, -3.929063677787781e-05, -3.2998621463775635e-05, -2.6706606149673462e-05, -2.041459083557129e-05, -1.4122575521469116e-05, -7.830560207366943e-06, -1.5385448932647705e-06, 4.753470420837402e-06, 1.1045485734939575e-05, 1.7337501049041748e-05, 2.362951636314392e-05, 2.9921531677246094e-05, 3.6213546991348267e-05, 4.250556230545044e-05, 4.879757761955261e-05, 5.5089592933654785e-05, 6.138160824775696e-05, 6.767362356185913e-05, 7.39656388759613e-05, 8.025765419006348e-05, 8.654966950416565e-05, 9.284168481826782e-05, 9.913370013237e-05, 0.00010542571544647217, 0.00011171773076057434, 0.00011800974607467651, 0.0001243017613887787, 0.00013059377670288086, 0.00013688579201698303, 0.0001431778073310852, 0.00014946982264518738, 0.00015576183795928955, 0.00016205385327339172, 0.0001683458685874939, 0.00017463788390159607, 0.00018092989921569824, 0.00018722191452980042, 0.0001935139298439026, 0.00019980594515800476, 0.00020609796047210693, 0.0002123899757862091, 0.00021868199110031128, 0.00022497400641441345, 0.00023126602172851562]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 4.0, 8.0, 5.0, 17.0, 26.0, 37.0, 51.0, 95.0, 202.0, 360.0, 800.0, 1876.0, 6105.0, 29458.0, 234154.0, 637376.0, 114519.0, 16761.0, 4111.0, 1365.0, 603.0, 270.0, 173.0, 69.0, 48.0, 22.0, 15.0, 9.0, 4.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.264404296875, -0.25692176818847656, -0.24943923950195312, -0.2419567108154297, -0.23447418212890625, -0.2269916534423828, -0.21950912475585938, -0.21202659606933594, -0.2045440673828125, -0.19706153869628906, -0.18957901000976562, -0.1820964813232422, -0.17461395263671875, -0.1671314239501953, -0.15964889526367188, -0.15216636657714844, -0.144683837890625, -0.13720130920410156, -0.12971878051757812, -0.12223625183105469, -0.11475372314453125, -0.10727119445800781, -0.09978866577148438, -0.09230613708496094, -0.0848236083984375, -0.07734107971191406, -0.06985855102539062, -0.06237602233886719, -0.05489349365234375, -0.04741096496582031, -0.039928436279296875, -0.03244590759277344, -0.02496337890625, -0.017480850219726562, -0.009998321533203125, -0.0025157928466796875, 0.00496673583984375, 0.012449264526367188, 0.019931793212890625, 0.027414321899414062, 0.0348968505859375, 0.04237937927246094, 0.049861907958984375, 0.05734443664550781, 0.06482696533203125, 0.07230949401855469, 0.07979202270507812, 0.08727455139160156, 0.094757080078125, 0.10223960876464844, 0.10972213745117188, 0.11720466613769531, 0.12468719482421875, 0.1321697235107422, 0.13965225219726562, 0.14713478088378906, 0.1546173095703125, 0.16209983825683594, 0.16958236694335938, 0.1770648956298828, 0.18454742431640625, 0.1920299530029297, 0.19951248168945312, 0.20699501037597656, 0.2144775390625]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 4.0, 4.0, 3.0, 13.0, 9.0, 19.0, 26.0, 26.0, 49.0, 73.0, 58.0, 96.0, 108.0, 99.0, 95.0, 72.0, 90.0, 50.0, 42.0, 21.0, 14.0, 12.0, 7.0, 5.0, 5.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.220458984375, -0.21381759643554688, -0.20717620849609375, -0.20053482055664062, -0.1938934326171875, -0.18725204467773438, -0.18061065673828125, -0.17396926879882812, -0.167327880859375, -0.16068649291992188, -0.15404510498046875, -0.14740371704101562, -0.1407623291015625, -0.13412094116210938, -0.12747955322265625, -0.12083816528320312, -0.11419677734375, -0.10755538940429688, -0.10091400146484375, -0.09427261352539062, -0.0876312255859375, -0.08098983764648438, -0.07434844970703125, -0.06770706176757812, -0.061065673828125, -0.054424285888671875, -0.04778289794921875, -0.041141510009765625, -0.0345001220703125, -0.027858734130859375, -0.02121734619140625, -0.014575958251953125, -0.0079345703125, -0.001293182373046875, 0.00534820556640625, 0.011989593505859375, 0.0186309814453125, 0.025272369384765625, 0.03191375732421875, 0.038555145263671875, 0.045196533203125, 0.051837921142578125, 0.05847930908203125, 0.06512069702148438, 0.0717620849609375, 0.07840347290039062, 0.08504486083984375, 0.09168624877929688, 0.09832763671875, 0.10496902465820312, 0.11161041259765625, 0.11825180053710938, 0.1248931884765625, 0.13153457641601562, 0.13817596435546875, 0.14481735229492188, 0.151458740234375, 0.15810012817382812, 0.16474151611328125, 0.17138290405273438, 0.1780242919921875, 0.18466567993164062, 0.19130706787109375, 0.19794845581054688, 0.20458984375]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 10.0, 30.0, 67.0, 155.0, 276.0, 251.0, 149.0, 52.0, 10.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.942337989807129, -7.721164226531982, -7.499990463256836, -7.278817176818848, -7.057643413543701, -6.836469650268555, -6.615295886993408, -6.394122123718262, -6.172948837280273, -5.951775074005127, -5.7306013107299805, -5.509428024291992, -5.288254261016846, -5.067080497741699, -4.845906734466553, -4.624732971191406, -4.403559684753418, -4.1823859214782715, -3.961212396621704, -3.7400386333465576, -3.5188651084899902, -3.2976913452148438, -3.0765175819396973, -2.85534405708313, -2.6341700553894043, -2.412996292114258, -2.1918227672576904, -1.970649003982544, -1.7494754791259766, -1.52830171585083, -1.3071280717849731, -1.0859544277191162, -0.8647809028625488, -0.6436072587966919, -0.4224335849285126, -0.20125991106033325, 0.01991373300552368, 0.2410874366760254, 0.4622610807418823, 0.6834347248077393, 0.9046083688735962, 1.1257820129394531, 1.34695565700531, 1.568129301071167, 1.7893030643463135, 2.010476589202881, 2.2316503524780273, 2.452824115753174, 2.673997640609741, 2.8951714038848877, 3.116344928741455, 3.3375186920166016, 3.558692216873169, 3.7798659801483154, 4.001039505004883, 4.222213268280029, 4.443387031555176, 4.664560794830322, 4.885734558105469, 5.106907844543457, 5.3280816078186035, 5.54925537109375, 5.7704291343688965, 5.991602897644043, 6.212776184082031]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 9.0, 5.0, 7.0, 11.0, 8.0, 10.0, 11.0, 13.0, 17.0, 26.0, 22.0, 20.0, 28.0, 35.0, 27.0, 28.0, 50.0, 46.0, 40.0, 52.0, 34.0, 43.0, 38.0, 42.0, 45.0, 40.0, 29.0, 36.0, 34.0, 25.0, 33.0, 18.0, 21.0, 18.0, 18.0, 12.0, 14.0, 14.0, 14.0, 6.0, 3.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.559624195098877, -2.482694387435913, -2.405764579772949, -2.3288350105285645, -2.2519052028656006, -2.1749753952026367, -2.098045587539673, -2.021115779876709, -1.9441860914230347, -1.8672562837600708, -1.7903265953063965, -1.7133967876434326, -1.6364669799804688, -1.5595372915267944, -1.4826074838638306, -1.4056777954101562, -1.3287479877471924, -1.2518181800842285, -1.1748884916305542, -1.0979586839675903, -1.021028995513916, -0.9440991878509521, -0.8671693801879883, -0.7902396321296692, -0.7133098840713501, -0.636380136013031, -0.5594503879547119, -0.48252058029174805, -0.40559083223342896, -0.32866108417510986, -0.2517313063144684, -0.1748015284538269, -0.09787154197692871, -0.020941779017448425, 0.05598798394203186, 0.13291774690151215, 0.20984750986099243, 0.2867772579193115, 0.363707035779953, 0.4406368136405945, 0.5175665616989136, 0.5944963097572327, 0.6714260578155518, 0.7483558654785156, 0.8252856135368347, 0.9022153615951538, 0.9791451692581177, 1.056074857711792, 1.1330046653747559, 1.2099344730377197, 1.286864161491394, 1.363793969154358, 1.4407236576080322, 1.517653465270996, 1.59458327293396, 1.6715130805969238, 1.7484427690505981, 1.825372576713562, 1.9023022651672363, 1.9792320728302002, 2.056161880493164, 2.133091449737549, 2.2100212574005127, 2.2869510650634766, 2.3638808727264404]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 6.0, 5.0, 3.0, 6.0, 16.0, 13.0, 16.0, 23.0, 62.0, 71.0, 144.0, 291.0, 677.0, 2080.0, 9102.0, 90481.0, 4015742.0, 65038.0, 7738.0, 1754.0, 590.0, 212.0, 94.0, 57.0, 25.0, 15.0, 13.0, 9.0, 3.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.611328125, -1.564544677734375, -1.51776123046875, -1.470977783203125, -1.4241943359375, -1.377410888671875, -1.33062744140625, -1.283843994140625, -1.237060546875, -1.190277099609375, -1.14349365234375, -1.096710205078125, -1.0499267578125, -1.003143310546875, -0.95635986328125, -0.909576416015625, -0.86279296875, -0.816009521484375, -0.76922607421875, -0.722442626953125, -0.6756591796875, -0.628875732421875, -0.58209228515625, -0.535308837890625, -0.488525390625, -0.441741943359375, -0.39495849609375, -0.348175048828125, -0.3013916015625, -0.254608154296875, -0.20782470703125, -0.161041259765625, -0.1142578125, -0.067474365234375, -0.02069091796875, 0.026092529296875, 0.0728759765625, 0.119659423828125, 0.16644287109375, 0.213226318359375, 0.260009765625, 0.306793212890625, 0.35357666015625, 0.400360107421875, 0.4471435546875, 0.493927001953125, 0.54071044921875, 0.587493896484375, 0.63427734375, 0.681060791015625, 0.72784423828125, 0.774627685546875, 0.8214111328125, 0.868194580078125, 0.91497802734375, 0.961761474609375, 1.008544921875, 1.055328369140625, 1.10211181640625, 1.148895263671875, 1.1956787109375, 1.242462158203125, 1.28924560546875, 1.336029052734375, 1.3828125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 11.0, 12.0, 13.0, 13.0, 15.0, 29.0, 39.0, 43.0, 51.0, 50.0, 62.0, 77.0, 52.0, 58.0, 51.0, 55.0, 60.0, 45.0, 60.0, 37.0, 21.0, 23.0, 21.0, 23.0, 20.0, 11.0, 11.0, 11.0, 8.0, 4.0, 4.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.189208984375, -0.183746337890625, -0.17828369140625, -0.172821044921875, -0.1673583984375, -0.161895751953125, -0.15643310546875, -0.150970458984375, -0.1455078125, -0.140045166015625, -0.13458251953125, -0.129119873046875, -0.1236572265625, -0.118194580078125, -0.11273193359375, -0.107269287109375, -0.101806640625, -0.096343994140625, -0.09088134765625, -0.085418701171875, -0.0799560546875, -0.074493408203125, -0.06903076171875, -0.063568115234375, -0.05810546875, -0.052642822265625, -0.04718017578125, -0.041717529296875, -0.0362548828125, -0.030792236328125, -0.02532958984375, -0.019866943359375, -0.014404296875, -0.008941650390625, -0.00347900390625, 0.001983642578125, 0.0074462890625, 0.012908935546875, 0.01837158203125, 0.023834228515625, 0.029296875, 0.034759521484375, 0.04022216796875, 0.045684814453125, 0.0511474609375, 0.056610107421875, 0.06207275390625, 0.067535400390625, 0.072998046875, 0.078460693359375, 0.08392333984375, 0.089385986328125, 0.0948486328125, 0.100311279296875, 0.10577392578125, 0.111236572265625, 0.11669921875, 0.122161865234375, 0.12762451171875, 0.133087158203125, 0.1385498046875, 0.144012451171875, 0.14947509765625, 0.154937744140625, 0.160400390625]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 3.0, 2.0, 5.0, 6.0, 16.0, 21.0, 31.0, 42.0, 55.0, 98.0, 140.0, 192.0, 321.0, 469.0, 705.0, 1187.0, 1948.0, 3527.0, 6864.0, 15060.0, 40305.0, 182903.0, 3570273.0, 284060.0, 50634.0, 17757.0, 7970.0, 3910.0, 2219.0, 1275.0, 796.0, 479.0, 331.0, 226.0, 134.0, 95.0, 62.0, 49.0, 30.0, 28.0, 13.0, 11.0, 12.0, 8.0, 5.0, 4.0, 1.0, 1.0, 0.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.4462890625, -0.43170166015625, -0.4171142578125, -0.40252685546875, -0.387939453125, -0.37335205078125, -0.3587646484375, -0.34417724609375, -0.32958984375, -0.31500244140625, -0.3004150390625, -0.28582763671875, -0.271240234375, -0.25665283203125, -0.2420654296875, -0.22747802734375, -0.212890625, -0.19830322265625, -0.1837158203125, -0.16912841796875, -0.154541015625, -0.13995361328125, -0.1253662109375, -0.11077880859375, -0.09619140625, -0.08160400390625, -0.0670166015625, -0.05242919921875, -0.037841796875, -0.02325439453125, -0.0086669921875, 0.00592041015625, 0.0205078125, 0.03509521484375, 0.0496826171875, 0.06427001953125, 0.078857421875, 0.09344482421875, 0.1080322265625, 0.12261962890625, 0.13720703125, 0.15179443359375, 0.1663818359375, 0.18096923828125, 0.195556640625, 0.21014404296875, 0.2247314453125, 0.23931884765625, 0.25390625, 0.26849365234375, 0.2830810546875, 0.29766845703125, 0.312255859375, 0.32684326171875, 0.3414306640625, 0.35601806640625, 0.37060546875, 0.38519287109375, 0.3997802734375, 0.41436767578125, 0.428955078125, 0.44354248046875, 0.4581298828125, 0.47271728515625, 0.4873046875]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 7.0, 2.0, 8.0, 10.0, 12.0, 25.0, 33.0, 54.0, 73.0, 124.0, 400.0, 2249.0, 632.0, 190.0, 80.0, 36.0, 34.0, 21.0, 14.0, 12.0, 7.0, 6.0, 7.0, 2.0, 6.0, 3.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.276611328125, -0.2683887481689453, -0.2601661682128906, -0.25194358825683594, -0.24372100830078125, -0.23549842834472656, -0.22727584838867188, -0.2190532684326172, -0.2108306884765625, -0.2026081085205078, -0.19438552856445312, -0.18616294860839844, -0.17794036865234375, -0.16971778869628906, -0.16149520874023438, -0.1532726287841797, -0.145050048828125, -0.1368274688720703, -0.12860488891601562, -0.12038230895996094, -0.11215972900390625, -0.10393714904785156, -0.09571456909179688, -0.08749198913574219, -0.0792694091796875, -0.07104682922363281, -0.06282424926757812, -0.05460166931152344, -0.04637908935546875, -0.03815650939941406, -0.029933929443359375, -0.021711349487304688, -0.01348876953125, -0.0052661895751953125, 0.002956390380859375, 0.011178970336914062, 0.01940155029296875, 0.027624130249023438, 0.035846710205078125, 0.04406929016113281, 0.0522918701171875, 0.06051445007324219, 0.06873703002929688, 0.07695960998535156, 0.08518218994140625, 0.09340476989746094, 0.10162734985351562, 0.10984992980957031, 0.118072509765625, 0.1262950897216797, 0.13451766967773438, 0.14274024963378906, 0.15096282958984375, 0.15918540954589844, 0.16740798950195312, 0.1756305694580078, 0.1838531494140625, 0.1920757293701172, 0.20029830932617188, 0.20852088928222656, 0.21674346923828125, 0.22496604919433594, 0.23318862915039062, 0.2414112091064453, 0.2496337890625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 11.0, 29.0, 131.0, 386.0, 318.0, 94.0, 23.0, 11.0, 2.0, 1.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7130770683288574, -2.6084702014923096, -2.503863573074341, -2.399256706237793, -2.294649839401245, -2.1900429725646973, -2.0854363441467285, -1.9808294773101807, -1.8762227296829224, -1.771615982055664, -1.6670091152191162, -1.562402367591858, -1.4577956199645996, -1.3531887531280518, -1.2485820055007935, -1.1439752578735352, -1.0393683910369873, -0.9347615838050842, -0.8301547765731812, -0.7255480289459229, -0.6209412217140198, -0.5163344144821167, -0.4117276668548584, -0.3071208596229553, -0.20251405239105225, -0.09790726006031036, 0.0066995322704315186, 0.11130630970001221, 0.21591311693191528, 0.32051992416381836, 0.42512667179107666, 0.5297334790229797, 0.6343400478363037, 0.7389468550682068, 0.8435536623001099, 0.9481604099273682, 1.052767276763916, 1.1573740243911743, 1.2619807720184326, 1.3665876388549805, 1.4711943864822388, 1.575801134109497, 1.680408000946045, 1.7850147485733032, 1.8896214962005615, 1.9942283630371094, 2.098834991455078, 2.203441858291626, 2.308048725128174, 2.4126555919647217, 2.5172622203826904, 2.6218690872192383, 2.726475954055786, 2.831082820892334, 2.9356894493103027, 3.0402963161468506, 3.1449031829833984, 3.2495100498199463, 3.354116678237915, 3.458723545074463, 3.5633304119110107, 3.6679372787475586, 3.7725439071655273, 3.877150774002075, 3.981757402420044]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 4.0, 4.0, 6.0, 10.0, 17.0, 18.0, 19.0, 33.0, 39.0, 49.0, 67.0, 73.0, 79.0, 80.0, 74.0, 83.0, 77.0, 58.0, 53.0, 37.0, 30.0, 32.0, 17.0, 13.0, 13.0, 3.0, 11.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3814382553100586, -1.345882534980774, -1.3103266954421997, -1.274770975112915, -1.2392152547836304, -1.2036594152450562, -1.1681036949157715, -1.1325479745864868, -1.0969921350479126, -1.061436414718628, -1.0258805751800537, -0.990324854850769, -0.9547690749168396, -0.9192132949829102, -0.8836575746536255, -0.848101794719696, -0.8125460743904114, -0.7769902944564819, -0.7414345741271973, -0.7058787941932678, -0.6703230142593384, -0.6347672939300537, -0.5992115139961243, -0.5636557340621948, -0.5281000137329102, -0.4925442636013031, -0.45698848366737366, -0.4214327335357666, -0.38587695360183716, -0.3503212034702301, -0.31476545333862305, -0.2792096734046936, -0.24365395307540894, -0.20809818804264069, -0.17254242300987244, -0.13698667287826538, -0.10143090784549713, -0.06587514281272888, -0.030319392681121826, 0.005236372351646423, 0.04079213738441467, 0.07634790241718292, 0.11190365999937057, 0.14745941758155823, 0.18301518261432648, 0.21857094764709473, 0.2541266977787018, 0.28968244791030884, 0.3252382278442383, 0.36079397797584534, 0.3963497579097748, 0.43190550804138184, 0.4674612879753113, 0.5030170679092407, 0.5385727882385254, 0.5741285681724548, 0.6096843481063843, 0.6452401280403137, 0.6807958483695984, 0.7163516283035278, 0.7519074082374573, 0.7874631881713867, 0.8230189085006714, 0.8585746884346008, 0.8941304087638855]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 2.0, 3.0, 5.0, 6.0, 13.0, 15.0, 14.0, 30.0, 35.0, 43.0, 65.0, 111.0, 194.0, 293.0, 583.0, 1101.0, 2583.0, 6741.0, 23216.0, 97060.0, 370257.0, 398093.0, 109474.0, 25769.0, 7473.0, 2679.0, 1192.0, 627.0, 330.0, 172.0, 121.0, 69.0, 52.0, 27.0, 22.0, 18.0, 21.0, 10.0, 8.0, 10.0, 6.0, 3.0, 3.0, 6.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.58447265625, -0.5662307739257812, -0.5479888916015625, -0.5297470092773438, -0.511505126953125, -0.49326324462890625, -0.4750213623046875, -0.45677947998046875, -0.43853759765625, -0.42029571533203125, -0.4020538330078125, -0.38381195068359375, -0.365570068359375, -0.34732818603515625, -0.3290863037109375, -0.31084442138671875, -0.2926025390625, -0.27436065673828125, -0.2561187744140625, -0.23787689208984375, -0.219635009765625, -0.20139312744140625, -0.1831512451171875, -0.16490936279296875, -0.14666748046875, -0.12842559814453125, -0.1101837158203125, -0.09194183349609375, -0.073699951171875, -0.05545806884765625, -0.0372161865234375, -0.01897430419921875, -0.000732421875, 0.01750946044921875, 0.0357513427734375, 0.05399322509765625, 0.072235107421875, 0.09047698974609375, 0.1087188720703125, 0.12696075439453125, 0.14520263671875, 0.16344451904296875, 0.1816864013671875, 0.19992828369140625, 0.218170166015625, 0.23641204833984375, 0.2546539306640625, 0.27289581298828125, 0.2911376953125, 0.30937957763671875, 0.3276214599609375, 0.34586334228515625, 0.364105224609375, 0.38234710693359375, 0.4005889892578125, 0.41883087158203125, 0.43707275390625, 0.45531463623046875, 0.4735565185546875, 0.49179840087890625, 0.510040283203125, 0.5282821655273438, 0.5465240478515625, 0.5647659301757812, 0.5830078125]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 4.0, 15.0, 17.0, 15.0, 14.0, 29.0, 39.0, 33.0, 47.0, 49.0, 66.0, 71.0, 58.0, 63.0, 59.0, 59.0, 55.0, 64.0, 45.0, 35.0, 27.0, 37.0, 19.0, 10.0, 24.0, 16.0, 5.0, 8.0, 4.0, 0.0, 6.0, 4.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.2103271484375, -0.2042560577392578, -0.19818496704101562, -0.19211387634277344, -0.18604278564453125, -0.17997169494628906, -0.17390060424804688, -0.1678295135498047, -0.1617584228515625, -0.1556873321533203, -0.14961624145507812, -0.14354515075683594, -0.13747406005859375, -0.13140296936035156, -0.12533187866210938, -0.11926078796386719, -0.113189697265625, -0.10711860656738281, -0.10104751586914062, -0.09497642517089844, -0.08890533447265625, -0.08283424377441406, -0.07676315307617188, -0.07069206237792969, -0.0646209716796875, -0.05854988098144531, -0.052478790283203125, -0.04640769958496094, -0.04033660888671875, -0.03426551818847656, -0.028194427490234375, -0.022123336791992188, -0.01605224609375, -0.009981155395507812, -0.003910064697265625, 0.0021610260009765625, 0.00823211669921875, 0.014303207397460938, 0.020374298095703125, 0.026445388793945312, 0.0325164794921875, 0.03858757019042969, 0.044658660888671875, 0.05072975158691406, 0.05680084228515625, 0.06287193298339844, 0.06894302368164062, 0.07501411437988281, 0.081085205078125, 0.08715629577636719, 0.09322738647460938, 0.09929847717285156, 0.10536956787109375, 0.11144065856933594, 0.11751174926757812, 0.12358283996582031, 0.1296539306640625, 0.1357250213623047, 0.14179611206054688, 0.14786720275878906, 0.15393829345703125, 0.16000938415527344, 0.16608047485351562, 0.1721515655517578, 0.17822265625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 5.0, 1.0, 14.0, 15.0, 19.0, 21.0, 36.0, 36.0, 62.0, 88.0, 124.0, 225.0, 333.0, 551.0, 1146.0, 2689.0, 7426.0, 26670.0, 120275.0, 446607.0, 337611.0, 76723.0, 17984.0, 5614.0, 2095.0, 899.0, 506.0, 260.0, 153.0, 95.0, 77.0, 49.0, 40.0, 33.0, 17.0, 13.0, 9.0, 10.0, 6.0, 10.0, 5.0, 8.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.57275390625, -0.5572128295898438, -0.5416717529296875, -0.5261306762695312, -0.510589599609375, -0.49504852294921875, -0.4795074462890625, -0.46396636962890625, -0.44842529296875, -0.43288421630859375, -0.4173431396484375, -0.40180206298828125, -0.386260986328125, -0.37071990966796875, -0.3551788330078125, -0.33963775634765625, -0.3240966796875, -0.30855560302734375, -0.2930145263671875, -0.27747344970703125, -0.261932373046875, -0.24639129638671875, -0.2308502197265625, -0.21530914306640625, -0.19976806640625, -0.18422698974609375, -0.1686859130859375, -0.15314483642578125, -0.137603759765625, -0.12206268310546875, -0.1065216064453125, -0.09098052978515625, -0.075439453125, -0.05989837646484375, -0.0443572998046875, -0.02881622314453125, -0.013275146484375, 0.00226593017578125, 0.0178070068359375, 0.03334808349609375, 0.04888916015625, 0.06443023681640625, 0.0799713134765625, 0.09551239013671875, 0.111053466796875, 0.12659454345703125, 0.1421356201171875, 0.15767669677734375, 0.1732177734375, 0.18875885009765625, 0.2042999267578125, 0.21984100341796875, 0.235382080078125, 0.25092315673828125, 0.2664642333984375, 0.28200531005859375, 0.29754638671875, 0.31308746337890625, 0.3286285400390625, 0.34416961669921875, 0.359710693359375, 0.37525177001953125, 0.3907928466796875, 0.40633392333984375, 0.421875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 5.0, 4.0, 11.0, 6.0, 10.0, 11.0, 20.0, 10.0, 23.0, 25.0, 23.0, 24.0, 24.0, 39.0, 29.0, 34.0, 42.0, 51.0, 43.0, 51.0, 41.0, 43.0, 45.0, 37.0, 50.0, 31.0, 28.0, 50.0, 22.0, 20.0, 17.0, 22.0, 26.0, 11.0, 13.0, 15.0, 9.0, 11.0, 11.0, 4.0, 9.0, 2.0, 1.0, 2.0, 3.0, 2.0], "bins": [-0.7333984375, -0.7141799926757812, -0.6949615478515625, -0.6757431030273438, -0.656524658203125, -0.6373062133789062, -0.6180877685546875, -0.5988693237304688, -0.57965087890625, -0.5604324340820312, -0.5412139892578125, -0.5219955444335938, -0.502777099609375, -0.48355865478515625, -0.4643402099609375, -0.44512176513671875, -0.4259033203125, -0.40668487548828125, -0.3874664306640625, -0.36824798583984375, -0.349029541015625, -0.32981109619140625, -0.3105926513671875, -0.29137420654296875, -0.27215576171875, -0.25293731689453125, -0.2337188720703125, -0.21450042724609375, -0.195281982421875, -0.17606353759765625, -0.1568450927734375, -0.13762664794921875, -0.118408203125, -0.09918975830078125, -0.0799713134765625, -0.06075286865234375, -0.041534423828125, -0.02231597900390625, -0.0030975341796875, 0.01612091064453125, 0.03533935546875, 0.05455780029296875, 0.0737762451171875, 0.09299468994140625, 0.112213134765625, 0.13143157958984375, 0.1506500244140625, 0.16986846923828125, 0.1890869140625, 0.20830535888671875, 0.2275238037109375, 0.24674224853515625, 0.265960693359375, 0.28517913818359375, 0.3043975830078125, 0.32361602783203125, 0.34283447265625, 0.36205291748046875, 0.3812713623046875, 0.40048980712890625, 0.419708251953125, 0.43892669677734375, 0.4581451416015625, 0.47736358642578125, 0.49658203125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 3.0, 4.0, 5.0, 15.0, 18.0, 22.0, 58.0, 125.0, 276.0, 818.0, 3385.0, 39539.0, 792846.0, 200816.0, 8449.0, 1428.0, 436.0, 158.0, 76.0, 30.0, 21.0, 10.0, 7.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.44970703125, -0.4355316162109375, -0.421356201171875, -0.4071807861328125, -0.39300537109375, -0.3788299560546875, -0.364654541015625, -0.3504791259765625, -0.3363037109375, -0.3221282958984375, -0.307952880859375, -0.2937774658203125, -0.27960205078125, -0.2654266357421875, -0.251251220703125, -0.2370758056640625, -0.222900390625, -0.2087249755859375, -0.194549560546875, -0.1803741455078125, -0.16619873046875, -0.1520233154296875, -0.137847900390625, -0.1236724853515625, -0.1094970703125, -0.0953216552734375, -0.081146240234375, -0.0669708251953125, -0.05279541015625, -0.0386199951171875, -0.024444580078125, -0.0102691650390625, 0.00390625, 0.0180816650390625, 0.032257080078125, 0.0464324951171875, 0.06060791015625, 0.0747833251953125, 0.088958740234375, 0.1031341552734375, 0.1173095703125, 0.1314849853515625, 0.145660400390625, 0.1598358154296875, 0.17401123046875, 0.1881866455078125, 0.202362060546875, 0.2165374755859375, 0.230712890625, 0.2448883056640625, 0.259063720703125, 0.2732391357421875, 0.28741455078125, 0.3015899658203125, 0.315765380859375, 0.3299407958984375, 0.3441162109375, 0.3582916259765625, 0.372467041015625, 0.3866424560546875, 0.40081787109375, 0.4149932861328125, 0.429168701171875, 0.4433441162109375, 0.45751953125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 9.0, 13.0, 22.0, 28.0, 23.0, 29.0, 55.0, 111.0, 145.0, 162.0, 116.0, 81.0, 57.0, 32.0, 26.0, 23.0, 15.0, 24.0, 6.0, 3.0, 5.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001556873321533203, -0.00015189312398433685, -0.0001480989158153534, -0.00014430470764636993, -0.00014051049947738647, -0.00013671629130840302, -0.00013292208313941956, -0.0001291278749704361, -0.00012533366680145264, -0.00012153945863246918, -0.00011774525046348572, -0.00011395104229450226, -0.0001101568341255188, -0.00010636262595653534, -0.00010256841778755188, -9.877420961856842e-05, -9.498000144958496e-05, -9.11857932806015e-05, -8.739158511161804e-05, -8.359737694263458e-05, -7.980316877365112e-05, -7.600896060466766e-05, -7.22147524356842e-05, -6.842054426670074e-05, -6.462633609771729e-05, -6.0832127928733826e-05, -5.7037919759750366e-05, -5.324371159076691e-05, -4.944950342178345e-05, -4.565529525279999e-05, -4.186108708381653e-05, -3.806687891483307e-05, -3.427267074584961e-05, -3.047846257686615e-05, -2.668425440788269e-05, -2.289004623889923e-05, -1.909583806991577e-05, -1.5301629900932312e-05, -1.1507421731948853e-05, -7.713213562965393e-06, -3.919005393981934e-06, -1.2479722499847412e-07, 3.6694109439849854e-06, 7.463619112968445e-06, 1.1257827281951904e-05, 1.5052035450935364e-05, 1.8846243619918823e-05, 2.2640451788902283e-05, 2.6434659957885742e-05, 3.02288681268692e-05, 3.402307629585266e-05, 3.781728446483612e-05, 4.161149263381958e-05, 4.540570080280304e-05, 4.91999089717865e-05, 5.299411714076996e-05, 5.678832530975342e-05, 6.058253347873688e-05, 6.437674164772034e-05, 6.81709498167038e-05, 7.196515798568726e-05, 7.575936615467072e-05, 7.955357432365417e-05, 8.334778249263763e-05, 8.71419906616211e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 5.0, 10.0, 15.0, 19.0, 36.0, 45.0, 94.0, 164.0, 396.0, 899.0, 3006.0, 15743.0, 151143.0, 696869.0, 158938.0, 16344.0, 3099.0, 940.0, 359.0, 192.0, 98.0, 54.0, 28.0, 29.0, 16.0, 8.0, 5.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.389404296875, -0.3787384033203125, -0.368072509765625, -0.3574066162109375, -0.34674072265625, -0.3360748291015625, -0.325408935546875, -0.3147430419921875, -0.3040771484375, -0.2934112548828125, -0.282745361328125, -0.2720794677734375, -0.26141357421875, -0.2507476806640625, -0.240081787109375, -0.2294158935546875, -0.21875, -0.2080841064453125, -0.197418212890625, -0.1867523193359375, -0.17608642578125, -0.1654205322265625, -0.154754638671875, -0.1440887451171875, -0.1334228515625, -0.1227569580078125, -0.112091064453125, -0.1014251708984375, -0.09075927734375, -0.0800933837890625, -0.069427490234375, -0.0587615966796875, -0.048095703125, -0.0374298095703125, -0.026763916015625, -0.0160980224609375, -0.00543212890625, 0.0052337646484375, 0.015899658203125, 0.0265655517578125, 0.0372314453125, 0.0478973388671875, 0.058563232421875, 0.0692291259765625, 0.07989501953125, 0.0905609130859375, 0.101226806640625, 0.1118927001953125, 0.12255859375, 0.1332244873046875, 0.143890380859375, 0.1545562744140625, 0.16522216796875, 0.1758880615234375, 0.186553955078125, 0.1972198486328125, 0.2078857421875, 0.2185516357421875, 0.229217529296875, 0.2398834228515625, 0.25054931640625, 0.2612152099609375, 0.271881103515625, 0.2825469970703125, 0.293212890625]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 2.0, 9.0, 8.0, 13.0, 24.0, 28.0, 32.0, 52.0, 71.0, 98.0, 93.0, 112.0, 101.0, 102.0, 81.0, 54.0, 37.0, 24.0, 21.0, 12.0, 8.0, 12.0, 5.0, 6.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.269775390625, -0.259979248046875, -0.25018310546875, -0.240386962890625, -0.2305908203125, -0.220794677734375, -0.21099853515625, -0.201202392578125, -0.19140625, -0.181610107421875, -0.17181396484375, -0.162017822265625, -0.1522216796875, -0.142425537109375, -0.13262939453125, -0.122833251953125, -0.113037109375, -0.103240966796875, -0.09344482421875, -0.083648681640625, -0.0738525390625, -0.064056396484375, -0.05426025390625, -0.044464111328125, -0.03466796875, -0.024871826171875, -0.01507568359375, -0.005279541015625, 0.0045166015625, 0.014312744140625, 0.02410888671875, 0.033905029296875, 0.043701171875, 0.053497314453125, 0.06329345703125, 0.073089599609375, 0.0828857421875, 0.092681884765625, 0.10247802734375, 0.112274169921875, 0.1220703125, 0.131866455078125, 0.14166259765625, 0.151458740234375, 0.1612548828125, 0.171051025390625, 0.18084716796875, 0.190643310546875, 0.200439453125, 0.210235595703125, 0.22003173828125, 0.229827880859375, 0.2396240234375, 0.249420166015625, 0.25921630859375, 0.269012451171875, 0.27880859375, 0.288604736328125, 0.29840087890625, 0.308197021484375, 0.3179931640625, 0.327789306640625, 0.33758544921875, 0.347381591796875, 0.357177734375]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 6.0, 15.0, 39.0, 146.0, 325.0, 283.0, 144.0, 35.0, 10.0, 5.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7703189849853516, -3.454355478286743, -3.138392210006714, -2.8224287033081055, -2.506465435028076, -2.1905019283294678, -1.8745384216308594, -1.55857515335083, -1.2426116466522217, -0.9266482591629028, -0.6106848120689392, -0.2947213649749756, 0.02124202251434326, 0.3372054100036621, 0.6531689167022705, 0.9691321849822998, 1.2850956916809082, 1.601059079170227, 1.917022466659546, 2.2329859733581543, 2.5489492416381836, 2.864912748336792, 3.1808762550354004, 3.4968395233154297, 3.812803030014038, 4.1287665367126465, 4.444729804992676, 4.760693550109863, 5.076656818389893, 5.392620086669922, 5.708583831787109, 6.0245466232299805, 6.340510368347168, 6.656473636627197, 6.972437381744385, 7.288400650024414, 7.604363918304443, 7.920327186584473, 8.23629093170166, 8.552253723144531, 8.868217468261719, 9.184181213378906, 9.500144004821777, 9.816107749938965, 10.132071495056152, 10.448034286499023, 10.763998031616211, 11.079961776733398, 11.395925521850586, 11.711889266967773, 12.027852058410645, 12.343815803527832, 12.65977954864502, 12.97574234008789, 13.291706085205078, 13.607669830322266, 13.923632621765137, 14.239596366882324, 14.555559158325195, 14.871522903442383, 15.18748664855957, 15.503449440002441, 15.819413185119629, 16.1353759765625, 16.451339721679688]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 3.0, 4.0, 2.0, 3.0, 6.0, 9.0, 10.0, 13.0, 12.0, 9.0, 19.0, 18.0, 14.0, 21.0, 24.0, 23.0, 28.0, 31.0, 30.0, 33.0, 45.0, 39.0, 44.0, 39.0, 33.0, 38.0, 43.0, 44.0, 39.0, 28.0, 34.0, 39.0, 24.0, 33.0, 32.0, 32.0, 18.0, 18.0, 16.0, 14.0, 7.0, 16.0, 9.0, 2.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-3.2427821159362793, -3.1435275077819824, -3.0442728996276855, -2.9450182914733887, -2.845763921737671, -2.746509313583374, -2.647254705429077, -2.5480000972747803, -2.4487457275390625, -2.3494911193847656, -2.2502365112304688, -2.150981903076172, -2.051727533340454, -1.9524729251861572, -1.8532183170318604, -1.7539637088775635, -1.6547091007232666, -1.5554544925689697, -1.4562000036239624, -1.3569453954696655, -1.2576909065246582, -1.1584362983703613, -1.0591816902160645, -0.9599271416664124, -0.8606725931167603, -0.7614180445671082, -0.662163496017456, -0.5629088878631592, -0.4636543393135071, -0.364399790763855, -0.2651451826095581, -0.165890634059906, -0.06663632392883301, 0.032618239521980286, 0.13187280297279358, 0.23112738132476807, 0.33038192987442017, 0.42963647842407227, 0.5288910865783691, 0.6281456351280212, 0.7274001836776733, 0.8266547322273254, 0.9259092807769775, 1.0251638889312744, 1.1244184970855713, 1.2236729860305786, 1.3229275941848755, 1.4221820831298828, 1.5214366912841797, 1.6206912994384766, 1.7199457883834839, 1.8192003965377808, 1.918454885482788, 2.017709493637085, 2.116964101791382, 2.2162187099456787, 2.3154730796813965, 2.4147276878356934, 2.5139822959899902, 2.613236904144287, 2.712491273880005, 2.8117458820343018, 2.9110004901885986, 3.0102550983428955, 3.1095097064971924]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 4.0, 4.0, 5.0, 9.0, 9.0, 21.0, 17.0, 20.0, 36.0, 77.0, 114.0, 197.0, 328.0, 602.0, 1330.0, 2988.0, 7741.0, 29043.0, 373089.0, 3698357.0, 59913.0, 12620.0, 4251.0, 1861.0, 818.0, 389.0, 189.0, 108.0, 51.0, 38.0, 21.0, 18.0, 10.0, 6.0, 2.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0556640625, -1.0264968872070312, -0.9973297119140625, -0.9681625366210938, -0.938995361328125, -0.9098281860351562, -0.8806610107421875, -0.8514938354492188, -0.82232666015625, -0.7931594848632812, -0.7639923095703125, -0.7348251342773438, -0.705657958984375, -0.6764907836914062, -0.6473236083984375, -0.6181564331054688, -0.5889892578125, -0.5598220825195312, -0.5306549072265625, -0.5014877319335938, -0.472320556640625, -0.44315338134765625, -0.4139862060546875, -0.38481903076171875, -0.35565185546875, -0.32648468017578125, -0.2973175048828125, -0.26815032958984375, -0.238983154296875, -0.20981597900390625, -0.1806488037109375, -0.15148162841796875, -0.122314453125, -0.09314727783203125, -0.0639801025390625, -0.03481292724609375, -0.005645751953125, 0.02352142333984375, 0.0526885986328125, 0.08185577392578125, 0.11102294921875, 0.14019012451171875, 0.1693572998046875, 0.19852447509765625, 0.227691650390625, 0.25685882568359375, 0.2860260009765625, 0.31519317626953125, 0.3443603515625, 0.37352752685546875, 0.4026947021484375, 0.43186187744140625, 0.461029052734375, 0.49019622802734375, 0.5193634033203125, 0.5485305786132812, 0.57769775390625, 0.6068649291992188, 0.6360321044921875, 0.6651992797851562, 0.694366455078125, 0.7235336303710938, 0.7527008056640625, 0.7818679809570312, 0.81103515625]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 6.0, 16.0, 12.0, 15.0, 23.0, 33.0, 31.0, 32.0, 54.0, 51.0, 52.0, 66.0, 58.0, 53.0, 39.0, 71.0, 53.0, 55.0, 35.0, 42.0, 43.0, 25.0, 34.0, 16.0, 23.0, 15.0, 6.0, 11.0, 3.0, 9.0, 4.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2215576171875, -0.2152080535888672, -0.20885848999023438, -0.20250892639160156, -0.19615936279296875, -0.18980979919433594, -0.18346023559570312, -0.1771106719970703, -0.1707611083984375, -0.1644115447998047, -0.15806198120117188, -0.15171241760253906, -0.14536285400390625, -0.13901329040527344, -0.13266372680664062, -0.1263141632080078, -0.119964599609375, -0.11361503601074219, -0.10726547241210938, -0.10091590881347656, -0.09456634521484375, -0.08821678161621094, -0.08186721801757812, -0.07551765441894531, -0.0691680908203125, -0.06281852722167969, -0.056468963623046875, -0.05011940002441406, -0.04376983642578125, -0.03742027282714844, -0.031070709228515625, -0.024721145629882812, -0.01837158203125, -0.012022018432617188, -0.005672454833984375, 0.0006771087646484375, 0.00702667236328125, 0.013376235961914062, 0.019725799560546875, 0.026075363159179688, 0.0324249267578125, 0.03877449035644531, 0.045124053955078125, 0.05147361755371094, 0.05782318115234375, 0.06417274475097656, 0.07052230834960938, 0.07687187194824219, 0.083221435546875, 0.08957099914550781, 0.09592056274414062, 0.10227012634277344, 0.10861968994140625, 0.11496925354003906, 0.12131881713867188, 0.1276683807373047, 0.1340179443359375, 0.1403675079345703, 0.14671707153320312, 0.15306663513183594, 0.15941619873046875, 0.16576576232910156, 0.17211532592773438, 0.1784648895263672, 0.184814453125]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 8.0, 9.0, 20.0, 13.0, 34.0, 55.0, 58.0, 98.0, 126.0, 192.0, 319.0, 591.0, 1096.0, 2439.0, 5900.0, 18751.0, 119459.0, 3825572.0, 183649.0, 23380.0, 6804.0, 2760.0, 1288.0, 642.0, 346.0, 203.0, 152.0, 97.0, 45.0, 42.0, 35.0, 23.0, 26.0, 17.0, 13.0, 3.0, 5.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.76025390625, -0.7369155883789062, -0.7135772705078125, -0.6902389526367188, -0.666900634765625, -0.6435623168945312, -0.6202239990234375, -0.5968856811523438, -0.57354736328125, -0.5502090454101562, -0.5268707275390625, -0.5035324096679688, -0.480194091796875, -0.45685577392578125, -0.4335174560546875, -0.41017913818359375, -0.3868408203125, -0.36350250244140625, -0.3401641845703125, -0.31682586669921875, -0.293487548828125, -0.27014923095703125, -0.2468109130859375, -0.22347259521484375, -0.20013427734375, -0.17679595947265625, -0.1534576416015625, -0.13011932373046875, -0.106781005859375, -0.08344268798828125, -0.0601043701171875, -0.03676605224609375, -0.013427734375, 0.00991058349609375, 0.0332489013671875, 0.05658721923828125, 0.079925537109375, 0.10326385498046875, 0.1266021728515625, 0.14994049072265625, 0.17327880859375, 0.19661712646484375, 0.2199554443359375, 0.24329376220703125, 0.266632080078125, 0.28997039794921875, 0.3133087158203125, 0.33664703369140625, 0.3599853515625, 0.38332366943359375, 0.4066619873046875, 0.43000030517578125, 0.453338623046875, 0.47667694091796875, 0.5000152587890625, 0.5233535766601562, 0.54669189453125, 0.5700302124023438, 0.5933685302734375, 0.6167068481445312, 0.640045166015625, 0.6633834838867188, 0.6867218017578125, 0.7100601196289062, 0.7333984375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 5.0, 5.0, 9.0, 8.0, 15.0, 22.0, 44.0, 84.0, 262.0, 2546.0, 777.0, 143.0, 69.0, 25.0, 23.0, 13.0, 13.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.64013671875, -0.62274169921875, -0.6053466796875, -0.58795166015625, -0.570556640625, -0.55316162109375, -0.5357666015625, -0.51837158203125, -0.5009765625, -0.48358154296875, -0.4661865234375, -0.44879150390625, -0.431396484375, -0.41400146484375, -0.3966064453125, -0.37921142578125, -0.36181640625, -0.34442138671875, -0.3270263671875, -0.30963134765625, -0.292236328125, -0.27484130859375, -0.2574462890625, -0.24005126953125, -0.22265625, -0.20526123046875, -0.1878662109375, -0.17047119140625, -0.153076171875, -0.13568115234375, -0.1182861328125, -0.10089111328125, -0.08349609375, -0.06610107421875, -0.0487060546875, -0.03131103515625, -0.013916015625, 0.00347900390625, 0.0208740234375, 0.03826904296875, 0.0556640625, 0.07305908203125, 0.0904541015625, 0.10784912109375, 0.125244140625, 0.14263916015625, 0.1600341796875, 0.17742919921875, 0.19482421875, 0.21221923828125, 0.2296142578125, 0.24700927734375, 0.264404296875, 0.28179931640625, 0.2991943359375, 0.31658935546875, 0.333984375, 0.35137939453125, 0.3687744140625, 0.38616943359375, 0.403564453125, 0.42095947265625, 0.4383544921875, 0.45574951171875, 0.47314453125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 4.0, 2.0, 10.0, 37.0, 143.0, 373.0, 287.0, 121.0, 21.0, 10.0, 2.0, 6.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.682599067687988, -5.543712615966797, -5.404825687408447, -5.265938758850098, -5.127052307128906, -4.988165855407715, -4.849278926849365, -4.710391998291016, -4.571505546569824, -4.432619094848633, -4.293732166290283, -4.154845237731934, -4.015958786010742, -3.8770720958709717, -3.738185405731201, -3.5992987155914307, -3.46041202545166, -3.3215253353118896, -3.182638645172119, -3.0437519550323486, -2.904865264892578, -2.7659785747528076, -2.627091884613037, -2.4882051944732666, -2.349318504333496, -2.2104318141937256, -2.071545124053955, -1.9326584339141846, -1.793771743774414, -1.6548850536346436, -1.515998363494873, -1.3771116733551025, -1.2382252216339111, -1.0993385314941406, -0.9604518413543701, -0.8215651512145996, -0.6826784610748291, -0.5437917709350586, -0.4049050807952881, -0.2660183906555176, -0.12713170051574707, 0.011754989624023438, 0.15064167976379395, 0.28952836990356445, 0.42841506004333496, 0.5673017501831055, 0.706188440322876, 0.8450751304626465, 0.983961820602417, 1.1228485107421875, 1.261735200881958, 1.4006218910217285, 1.539508581161499, 1.6783952713012695, 1.81728196144104, 1.9561686515808105, 2.095055341720581, 2.2339420318603516, 2.372828722000122, 2.5117154121398926, 2.650602102279663, 2.7894887924194336, 2.928375482559204, 3.0672621726989746, 3.206148862838745]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 12.0, 14.0, 20.0, 25.0, 26.0, 26.0, 37.0, 51.0, 68.0, 69.0, 55.0, 70.0, 70.0, 72.0, 74.0, 60.0, 56.0, 39.0, 34.0, 34.0, 31.0, 20.0, 14.0, 10.0, 4.0, 5.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2542277574539185, -1.2096582651138306, -1.1650887727737427, -1.1205192804336548, -1.075949788093567, -1.031380295753479, -0.9868108034133911, -0.9422413110733032, -0.8976718187332153, -0.8531023263931274, -0.8085328340530396, -0.7639633417129517, -0.7193938493728638, -0.6748243570327759, -0.630254864692688, -0.5856853723526001, -0.5411158800125122, -0.4965463876724243, -0.4519768953323364, -0.40740740299224854, -0.36283791065216064, -0.31826841831207275, -0.27369892597198486, -0.22912943363189697, -0.18455994129180908, -0.1399904489517212, -0.0954209566116333, -0.05085146427154541, -0.0062819719314575195, 0.03828752040863037, 0.08285701274871826, 0.12742650508880615, 0.1719958782196045, 0.21656537055969238, 0.2611348628997803, 0.30570435523986816, 0.35027384757995605, 0.39484333992004395, 0.43941283226013184, 0.4839823246002197, 0.5285518169403076, 0.5731213092803955, 0.6176908016204834, 0.6622602939605713, 0.7068297863006592, 0.7513992786407471, 0.795968770980835, 0.8405382633209229, 0.8851077556610107, 0.9296772480010986, 0.9742467403411865, 1.0188162326812744, 1.0633857250213623, 1.1079552173614502, 1.152524709701538, 1.197094202041626, 1.2416636943817139, 1.2862331867218018, 1.3308026790618896, 1.3753721714019775, 1.4199416637420654, 1.4645111560821533, 1.5090806484222412, 1.553650140762329, 1.598219633102417]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 3.0, 3.0, 9.0, 7.0, 8.0, 6.0, 13.0, 16.0, 27.0, 37.0, 56.0, 72.0, 111.0, 182.0, 337.0, 579.0, 1138.0, 2322.0, 5560.0, 15359.0, 50468.0, 198453.0, 475451.0, 215709.0, 54761.0, 16635.0, 6057.0, 2513.0, 1212.0, 595.0, 315.0, 175.0, 130.0, 73.0, 51.0, 28.0, 24.0, 20.0, 10.0, 11.0, 9.0, 3.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0], "bins": [-0.57177734375, -0.5547256469726562, -0.5376739501953125, -0.5206222534179688, -0.503570556640625, -0.48651885986328125, -0.4694671630859375, -0.45241546630859375, -0.43536376953125, -0.41831207275390625, -0.4012603759765625, -0.38420867919921875, -0.367156982421875, -0.35010528564453125, -0.3330535888671875, -0.31600189208984375, -0.2989501953125, -0.28189849853515625, -0.2648468017578125, -0.24779510498046875, -0.230743408203125, -0.21369171142578125, -0.1966400146484375, -0.17958831787109375, -0.16253662109375, -0.14548492431640625, -0.1284332275390625, -0.11138153076171875, -0.094329833984375, -0.07727813720703125, -0.0602264404296875, -0.04317474365234375, -0.026123046875, -0.00907135009765625, 0.0079803466796875, 0.02503204345703125, 0.042083740234375, 0.05913543701171875, 0.0761871337890625, 0.09323883056640625, 0.11029052734375, 0.12734222412109375, 0.1443939208984375, 0.16144561767578125, 0.178497314453125, 0.19554901123046875, 0.2126007080078125, 0.22965240478515625, 0.2467041015625, 0.26375579833984375, 0.2808074951171875, 0.29785919189453125, 0.314910888671875, 0.33196258544921875, 0.3490142822265625, 0.36606597900390625, 0.38311767578125, 0.40016937255859375, 0.4172210693359375, 0.43427276611328125, 0.451324462890625, 0.46837615966796875, 0.4854278564453125, 0.5024795532226562, 0.51953125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 7.0, 3.0, 7.0, 7.0, 13.0, 27.0, 17.0, 26.0, 39.0, 41.0, 45.0, 51.0, 52.0, 48.0, 56.0, 70.0, 42.0, 70.0, 65.0, 54.0, 44.0, 35.0, 33.0, 28.0, 20.0, 30.0, 14.0, 20.0, 12.0, 8.0, 4.0, 6.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2431640625, -0.2362194061279297, -0.22927474975585938, -0.22233009338378906, -0.21538543701171875, -0.20844078063964844, -0.20149612426757812, -0.1945514678955078, -0.1876068115234375, -0.1806621551513672, -0.17371749877929688, -0.16677284240722656, -0.15982818603515625, -0.15288352966308594, -0.14593887329101562, -0.1389942169189453, -0.132049560546875, -0.1251049041748047, -0.11816024780273438, -0.11121559143066406, -0.10427093505859375, -0.09732627868652344, -0.09038162231445312, -0.08343696594238281, -0.0764923095703125, -0.06954765319824219, -0.06260299682617188, -0.05565834045410156, -0.04871368408203125, -0.04176902770996094, -0.034824371337890625, -0.027879714965820312, -0.02093505859375, -0.013990402221679688, -0.007045745849609375, -0.0001010894775390625, 0.00684356689453125, 0.013788223266601562, 0.020732879638671875, 0.027677536010742188, 0.0346221923828125, 0.04156684875488281, 0.048511505126953125, 0.05545616149902344, 0.06240081787109375, 0.06934547424316406, 0.07629013061523438, 0.08323478698730469, 0.090179443359375, 0.09712409973144531, 0.10406875610351562, 0.11101341247558594, 0.11795806884765625, 0.12490272521972656, 0.13184738159179688, 0.1387920379638672, 0.1457366943359375, 0.1526813507080078, 0.15962600708007812, 0.16657066345214844, 0.17351531982421875, 0.18045997619628906, 0.18740463256835938, 0.1943492889404297, 0.2012939453125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 6.0, 1.0, 6.0, 3.0, 6.0, 16.0, 12.0, 22.0, 24.0, 42.0, 53.0, 80.0, 104.0, 142.0, 231.0, 443.0, 880.0, 2005.0, 5483.0, 19772.0, 90645.0, 508394.0, 342123.0, 57297.0, 13546.0, 3972.0, 1496.0, 704.0, 358.0, 219.0, 142.0, 103.0, 59.0, 48.0, 31.0, 29.0, 20.0, 7.0, 11.0, 10.0, 5.0, 5.0, 6.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62353515625, -0.6045608520507812, -0.5855865478515625, -0.5666122436523438, -0.547637939453125, -0.5286636352539062, -0.5096893310546875, -0.49071502685546875, -0.47174072265625, -0.45276641845703125, -0.4337921142578125, -0.41481781005859375, -0.395843505859375, -0.37686920166015625, -0.3578948974609375, -0.33892059326171875, -0.3199462890625, -0.30097198486328125, -0.2819976806640625, -0.26302337646484375, -0.244049072265625, -0.22507476806640625, -0.2061004638671875, -0.18712615966796875, -0.16815185546875, -0.14917755126953125, -0.1302032470703125, -0.11122894287109375, -0.092254638671875, -0.07328033447265625, -0.0543060302734375, -0.03533172607421875, -0.016357421875, 0.00261688232421875, 0.0215911865234375, 0.04056549072265625, 0.059539794921875, 0.07851409912109375, 0.0974884033203125, 0.11646270751953125, 0.13543701171875, 0.15441131591796875, 0.1733856201171875, 0.19235992431640625, 0.211334228515625, 0.23030853271484375, 0.2492828369140625, 0.26825714111328125, 0.2872314453125, 0.30620574951171875, 0.3251800537109375, 0.34415435791015625, 0.363128662109375, 0.38210296630859375, 0.4010772705078125, 0.42005157470703125, 0.43902587890625, 0.45800018310546875, 0.4769744873046875, 0.49594879150390625, 0.514923095703125, 0.5338973999023438, 0.5528717041015625, 0.5718460083007812, 0.5908203125]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 1.0, 2.0, 3.0, 3.0, 2.0, 4.0, 8.0, 6.0, 7.0, 7.0, 12.0, 6.0, 8.0, 19.0, 16.0, 16.0, 31.0, 31.0, 33.0, 37.0, 44.0, 39.0, 37.0, 40.0, 46.0, 41.0, 42.0, 58.0, 48.0, 45.0, 35.0, 40.0, 28.0, 29.0, 37.0, 19.0, 27.0, 17.0, 18.0, 16.0, 17.0, 3.0, 7.0, 2.0, 5.0, 7.0, 6.0, 1.0, 7.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7177734375, -0.6932449340820312, -0.6687164306640625, -0.6441879272460938, -0.619659423828125, -0.5951309204101562, -0.5706024169921875, -0.5460739135742188, -0.52154541015625, -0.49701690673828125, -0.4724884033203125, -0.44795989990234375, -0.423431396484375, -0.39890289306640625, -0.3743743896484375, -0.34984588623046875, -0.3253173828125, -0.30078887939453125, -0.2762603759765625, -0.25173187255859375, -0.227203369140625, -0.20267486572265625, -0.1781463623046875, -0.15361785888671875, -0.12908935546875, -0.10456085205078125, -0.0800323486328125, -0.05550384521484375, -0.030975341796875, -0.00644683837890625, 0.0180816650390625, 0.04261016845703125, 0.067138671875, 0.09166717529296875, 0.1161956787109375, 0.14072418212890625, 0.165252685546875, 0.18978118896484375, 0.2143096923828125, 0.23883819580078125, 0.26336669921875, 0.28789520263671875, 0.3124237060546875, 0.33695220947265625, 0.361480712890625, 0.38600921630859375, 0.4105377197265625, 0.43506622314453125, 0.4595947265625, 0.48412322998046875, 0.5086517333984375, 0.5331802368164062, 0.557708740234375, 0.5822372436523438, 0.6067657470703125, 0.6312942504882812, 0.65582275390625, 0.6803512573242188, 0.7048797607421875, 0.7294082641601562, 0.753936767578125, 0.7784652709960938, 0.8029937744140625, 0.8275222778320312, 0.85205078125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 8.0, 2.0, 2.0, 7.0, 20.0, 30.0, 38.0, 65.0, 118.0, 227.0, 413.0, 850.0, 2081.0, 7346.0, 48254.0, 753890.0, 212677.0, 16152.0, 3796.0, 1285.0, 592.0, 321.0, 166.0, 81.0, 55.0, 33.0, 15.0, 13.0, 9.0, 4.0, 3.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.43798828125, -0.4232635498046875, -0.408538818359375, -0.3938140869140625, -0.37908935546875, -0.3643646240234375, -0.349639892578125, -0.3349151611328125, -0.3201904296875, -0.3054656982421875, -0.290740966796875, -0.2760162353515625, -0.26129150390625, -0.2465667724609375, -0.231842041015625, -0.2171173095703125, -0.202392578125, -0.1876678466796875, -0.172943115234375, -0.1582183837890625, -0.14349365234375, -0.1287689208984375, -0.114044189453125, -0.0993194580078125, -0.0845947265625, -0.0698699951171875, -0.055145263671875, -0.0404205322265625, -0.02569580078125, -0.0109710693359375, 0.003753662109375, 0.0184783935546875, 0.033203125, 0.0479278564453125, 0.062652587890625, 0.0773773193359375, 0.09210205078125, 0.1068267822265625, 0.121551513671875, 0.1362762451171875, 0.1510009765625, 0.1657257080078125, 0.180450439453125, 0.1951751708984375, 0.20989990234375, 0.2246246337890625, 0.239349365234375, 0.2540740966796875, 0.268798828125, 0.2835235595703125, 0.298248291015625, 0.3129730224609375, 0.32769775390625, 0.3424224853515625, 0.357147216796875, 0.3718719482421875, 0.3865966796875, 0.4013214111328125, 0.416046142578125, 0.4307708740234375, 0.44549560546875, 0.4602203369140625, 0.474945068359375, 0.4896697998046875, 0.50439453125]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 4.0, 3.0, 3.0, 9.0, 18.0, 15.0, 17.0, 26.0, 29.0, 32.0, 58.0, 79.0, 93.0, 94.0, 99.0, 84.0, 80.0, 61.0, 51.0, 45.0, 25.0, 18.0, 13.0, 11.0, 14.0, 5.0, 5.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0], "bins": [-0.00012445449829101562, -0.00012120604515075684, -0.00011795759201049805, -0.00011470913887023926, -0.00011146068572998047, -0.00010821223258972168, -0.00010496377944946289, -0.0001017153263092041, -9.846687316894531e-05, -9.521842002868652e-05, -9.196996688842773e-05, -8.872151374816895e-05, -8.547306060791016e-05, -8.222460746765137e-05, -7.897615432739258e-05, -7.572770118713379e-05, -7.2479248046875e-05, -6.923079490661621e-05, -6.598234176635742e-05, -6.273388862609863e-05, -5.9485435485839844e-05, -5.6236982345581055e-05, -5.2988529205322266e-05, -4.9740076065063477e-05, -4.649162292480469e-05, -4.32431697845459e-05, -3.999471664428711e-05, -3.674626350402832e-05, -3.349781036376953e-05, -3.0249357223510742e-05, -2.7000904083251953e-05, -2.3752450942993164e-05, -2.0503997802734375e-05, -1.7255544662475586e-05, -1.4007091522216797e-05, -1.0758638381958008e-05, -7.510185241699219e-06, -4.26173210144043e-06, -1.0132789611816406e-06, 2.2351741790771484e-06, 5.4836273193359375e-06, 8.732080459594727e-06, 1.1980533599853516e-05, 1.5228986740112305e-05, 1.8477439880371094e-05, 2.1725893020629883e-05, 2.4974346160888672e-05, 2.822279930114746e-05, 3.147125244140625e-05, 3.471970558166504e-05, 3.796815872192383e-05, 4.121661186218262e-05, 4.4465065002441406e-05, 4.7713518142700195e-05, 5.0961971282958984e-05, 5.4210424423217773e-05, 5.745887756347656e-05, 6.070733070373535e-05, 6.395578384399414e-05, 6.720423698425293e-05, 7.045269012451172e-05, 7.370114326477051e-05, 7.69495964050293e-05, 8.019804954528809e-05, 8.344650268554688e-05]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 6.0, 6.0, 3.0, 7.0, 10.0, 17.0, 13.0, 23.0, 42.0, 72.0, 110.0, 175.0, 272.0, 525.0, 1011.0, 1900.0, 4320.0, 11817.0, 46583.0, 285028.0, 544094.0, 117162.0, 22450.0, 6798.0, 2903.0, 1438.0, 763.0, 428.0, 223.0, 128.0, 82.0, 44.0, 29.0, 24.0, 17.0, 11.0, 3.0, 8.0, 6.0, 2.0, 4.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.257080078125, -0.2488555908203125, -0.240631103515625, -0.2324066162109375, -0.22418212890625, -0.2159576416015625, -0.207733154296875, -0.1995086669921875, -0.1912841796875, -0.1830596923828125, -0.174835205078125, -0.1666107177734375, -0.15838623046875, -0.1501617431640625, -0.141937255859375, -0.1337127685546875, -0.12548828125, -0.1172637939453125, -0.109039306640625, -0.1008148193359375, -0.09259033203125, -0.0843658447265625, -0.076141357421875, -0.0679168701171875, -0.0596923828125, -0.0514678955078125, -0.043243408203125, -0.0350189208984375, -0.02679443359375, -0.0185699462890625, -0.010345458984375, -0.0021209716796875, 0.006103515625, 0.0143280029296875, 0.022552490234375, 0.0307769775390625, 0.03900146484375, 0.0472259521484375, 0.055450439453125, 0.0636749267578125, 0.0718994140625, 0.0801239013671875, 0.088348388671875, 0.0965728759765625, 0.10479736328125, 0.1130218505859375, 0.121246337890625, 0.1294708251953125, 0.1376953125, 0.1459197998046875, 0.154144287109375, 0.1623687744140625, 0.17059326171875, 0.1788177490234375, 0.187042236328125, 0.1952667236328125, 0.2034912109375, 0.2117156982421875, 0.219940185546875, 0.2281646728515625, 0.23638916015625, 0.2446136474609375, 0.252838134765625, 0.2610626220703125, 0.269287109375]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 4.0, 7.0, 7.0, 7.0, 6.0, 13.0, 13.0, 36.0, 39.0, 62.0, 88.0, 81.0, 107.0, 124.0, 98.0, 81.0, 76.0, 39.0, 35.0, 21.0, 10.0, 5.0, 14.0, 8.0, 7.0, 2.0, 1.0, 6.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.40283203125, -0.3905487060546875, -0.378265380859375, -0.3659820556640625, -0.35369873046875, -0.3414154052734375, -0.329132080078125, -0.3168487548828125, -0.3045654296875, -0.2922821044921875, -0.279998779296875, -0.2677154541015625, -0.25543212890625, -0.2431488037109375, -0.230865478515625, -0.2185821533203125, -0.206298828125, -0.1940155029296875, -0.181732177734375, -0.1694488525390625, -0.15716552734375, -0.1448822021484375, -0.132598876953125, -0.1203155517578125, -0.1080322265625, -0.0957489013671875, -0.083465576171875, -0.0711822509765625, -0.05889892578125, -0.0466156005859375, -0.034332275390625, -0.0220489501953125, -0.009765625, 0.0025177001953125, 0.014801025390625, 0.0270843505859375, 0.03936767578125, 0.0516510009765625, 0.063934326171875, 0.0762176513671875, 0.0885009765625, 0.1007843017578125, 0.113067626953125, 0.1253509521484375, 0.13763427734375, 0.1499176025390625, 0.162200927734375, 0.1744842529296875, 0.186767578125, 0.1990509033203125, 0.211334228515625, 0.2236175537109375, 0.23590087890625, 0.2481842041015625, 0.260467529296875, 0.2727508544921875, 0.2850341796875, 0.2973175048828125, 0.309600830078125, 0.3218841552734375, 0.33416748046875, 0.3464508056640625, 0.358734130859375, 0.3710174560546875, 0.38330078125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 10.0, 62.0, 289.0, 497.0, 120.0, 21.0, 8.0, 5.0, 2.0], "bins": [-31.35188865661621, -30.81293296813965, -30.27397918701172, -29.735023498535156, -29.196067810058594, -28.657114028930664, -28.1181583404541, -27.579204559326172, -27.04024887084961, -26.501293182373047, -25.962339401245117, -25.423383712768555, -24.884429931640625, -24.345474243164062, -23.8065185546875, -23.26756477355957, -22.728609085083008, -22.189653396606445, -21.650699615478516, -21.111743927001953, -20.57278823852539, -20.03383445739746, -19.4948787689209, -18.95592498779297, -18.416969299316406, -17.878013610839844, -17.339059829711914, -16.80010414123535, -16.261150360107422, -15.72219467163086, -15.183238983154297, -14.64428424835205, -14.105328559875488, -13.566373825073242, -13.02741813659668, -12.488463401794434, -11.949508666992188, -11.410553932189941, -10.871599197387695, -10.332643508911133, -9.793688774108887, -9.25473403930664, -8.715778350830078, -8.176823616027832, -7.637868881225586, -7.09891414642334, -6.5599589347839355, -6.021003723144531, -5.482048988342285, -4.943094253540039, -4.404139041900635, -3.8651840686798096, -3.3262290954589844, -2.787274122238159, -2.248319149017334, -1.7093641757965088, -1.1704089641571045, -0.6314539909362793, -0.0924990177154541, 0.4464559555053711, 0.9854109287261963, 1.5243659019470215, 2.0633208751678467, 2.602275848388672, 3.141230821609497]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 2.0, 8.0, 5.0, 7.0, 11.0, 8.0, 11.0, 16.0, 12.0, 28.0, 18.0, 20.0, 35.0, 35.0, 55.0, 47.0, 41.0, 46.0, 62.0, 63.0, 52.0, 52.0, 44.0, 55.0, 43.0, 45.0, 33.0, 29.0, 21.0, 24.0, 16.0, 14.0, 17.0, 4.0, 4.0, 8.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0], "bins": [-5.692567348480225, -5.535280227661133, -5.377992630004883, -5.220705509185791, -5.063418388366699, -4.906130790710449, -4.748843669891357, -4.591556549072266, -4.434268951416016, -4.276981830596924, -4.119694232940674, -3.962407112121582, -3.8051199913024902, -3.6478326320648193, -3.4905452728271484, -3.3332581520080566, -3.175971031188965, -3.018683671951294, -2.861396551132202, -2.7041091918945312, -2.5468220710754395, -2.3895347118377686, -2.2322473526000977, -2.074960231781006, -1.917672872543335, -1.7603856325149536, -1.6030983924865723, -1.4458110332489014, -1.28852379322052, -1.1312365531921387, -0.9739492535591125, -0.8166619539260864, -0.6593742370605469, -0.5020869970321655, -0.3447996973991394, -0.18751242756843567, -0.030225157737731934, 0.12706208229064941, 0.28434938192367554, 0.44163668155670166, 0.598923921585083, 0.7562111616134644, 0.9134984612464905, 1.0707857608795166, 1.228073000907898, 1.3853602409362793, 1.5426476001739502, 1.6999348402023315, 1.857222080230713, 2.014509439468384, 2.1717965602874756, 2.3290839195251465, 2.4863710403442383, 2.643658399581909, 2.80094575881958, 2.958232879638672, 3.1155202388763428, 3.2728075981140137, 3.4300947189331055, 3.5873820781707764, 3.7446694374084473, 3.901956558227539, 4.059243679046631, 4.216531276702881, 4.373818397521973]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 0.0, 6.0, 3.0, 2.0, 1.0, 5.0, 8.0, 7.0, 20.0, 18.0, 39.0, 36.0, 46.0, 74.0, 97.0, 148.0, 224.0, 393.0, 847.0, 2157.0, 8317.0, 77529.0, 4060059.0, 35676.0, 5268.0, 1641.0, 648.0, 363.0, 207.0, 138.0, 106.0, 68.0, 44.0, 31.0, 14.0, 9.0, 10.0, 12.0, 7.0, 5.0, 3.0, 1.0, 3.0, 4.0], "bins": [-1.2236328125, -1.1947479248046875, -1.165863037109375, -1.1369781494140625, -1.10809326171875, -1.0792083740234375, -1.050323486328125, -1.0214385986328125, -0.9925537109375, -0.9636688232421875, -0.934783935546875, -0.9058990478515625, -0.87701416015625, -0.8481292724609375, -0.819244384765625, -0.7903594970703125, -0.761474609375, -0.7325897216796875, -0.703704833984375, -0.6748199462890625, -0.64593505859375, -0.6170501708984375, -0.588165283203125, -0.5592803955078125, -0.5303955078125, -0.5015106201171875, -0.472625732421875, -0.4437408447265625, -0.41485595703125, -0.3859710693359375, -0.357086181640625, -0.3282012939453125, -0.29931640625, -0.2704315185546875, -0.241546630859375, -0.2126617431640625, -0.18377685546875, -0.1548919677734375, -0.126007080078125, -0.0971221923828125, -0.0682373046875, -0.0393524169921875, -0.010467529296875, 0.0184173583984375, 0.04730224609375, 0.0761871337890625, 0.105072021484375, 0.1339569091796875, 0.162841796875, 0.1917266845703125, 0.220611572265625, 0.2494964599609375, 0.27838134765625, 0.3072662353515625, 0.336151123046875, 0.3650360107421875, 0.3939208984375, 0.4228057861328125, 0.451690673828125, 0.4805755615234375, 0.50946044921875, 0.5383453369140625, 0.567230224609375, 0.5961151123046875, 0.625]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 8.0, 5.0, 3.0, 8.0, 13.0, 13.0, 17.0, 21.0, 26.0, 36.0, 40.0, 48.0, 50.0, 40.0, 47.0, 52.0, 42.0, 57.0, 60.0, 44.0, 43.0, 49.0, 33.0, 43.0, 37.0, 34.0, 31.0, 18.0, 16.0, 19.0, 10.0, 11.0, 8.0, 6.0, 4.0, 2.0, 5.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2529296875, -0.2456035614013672, -0.23827743530273438, -0.23095130920410156, -0.22362518310546875, -0.21629905700683594, -0.20897293090820312, -0.2016468048095703, -0.1943206787109375, -0.1869945526123047, -0.17966842651367188, -0.17234230041503906, -0.16501617431640625, -0.15769004821777344, -0.15036392211914062, -0.1430377960205078, -0.135711669921875, -0.1283855438232422, -0.12105941772460938, -0.11373329162597656, -0.10640716552734375, -0.09908103942871094, -0.09175491333007812, -0.08442878723144531, -0.0771026611328125, -0.06977653503417969, -0.062450408935546875, -0.05512428283691406, -0.04779815673828125, -0.04047203063964844, -0.033145904541015625, -0.025819778442382812, -0.01849365234375, -0.011167526245117188, -0.003841400146484375, 0.0034847259521484375, 0.01081085205078125, 0.018136978149414062, 0.025463104248046875, 0.03278923034667969, 0.0401153564453125, 0.04744148254394531, 0.054767608642578125, 0.06209373474121094, 0.06941986083984375, 0.07674598693847656, 0.08407211303710938, 0.09139823913574219, 0.098724365234375, 0.10605049133300781, 0.11337661743164062, 0.12070274353027344, 0.12802886962890625, 0.13535499572753906, 0.14268112182617188, 0.1500072479248047, 0.1573333740234375, 0.1646595001220703, 0.17198562622070312, 0.17931175231933594, 0.18663787841796875, 0.19396400451660156, 0.20129013061523438, 0.2086162567138672, 0.2159423828125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 9.0, 9.0, 5.0, 4.0, 8.0, 11.0, 14.0, 20.0, 36.0, 48.0, 70.0, 98.0, 200.0, 367.0, 691.0, 1290.0, 2917.0, 7624.0, 34848.0, 4025575.0, 101419.0, 11604.0, 3831.0, 1609.0, 778.0, 466.0, 259.0, 161.0, 100.0, 66.0, 42.0, 27.0, 14.0, 20.0, 7.0, 8.0, 7.0, 9.0, 3.0, 6.0, 0.0, 1.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.638671875, -0.6164093017578125, -0.594146728515625, -0.5718841552734375, -0.54962158203125, -0.5273590087890625, -0.505096435546875, -0.4828338623046875, -0.4605712890625, -0.4383087158203125, -0.416046142578125, -0.3937835693359375, -0.37152099609375, -0.3492584228515625, -0.326995849609375, -0.3047332763671875, -0.282470703125, -0.2602081298828125, -0.237945556640625, -0.2156829833984375, -0.19342041015625, -0.1711578369140625, -0.148895263671875, -0.1266326904296875, -0.1043701171875, -0.0821075439453125, -0.059844970703125, -0.0375823974609375, -0.01531982421875, 0.0069427490234375, 0.029205322265625, 0.0514678955078125, 0.07373046875, 0.0959930419921875, 0.118255615234375, 0.1405181884765625, 0.16278076171875, 0.1850433349609375, 0.207305908203125, 0.2295684814453125, 0.2518310546875, 0.2740936279296875, 0.296356201171875, 0.3186187744140625, 0.34088134765625, 0.3631439208984375, 0.385406494140625, 0.4076690673828125, 0.429931640625, 0.4521942138671875, 0.474456787109375, 0.4967193603515625, 0.51898193359375, 0.5412445068359375, 0.563507080078125, 0.5857696533203125, 0.6080322265625, 0.6302947998046875, 0.652557373046875, 0.6748199462890625, 0.69708251953125, 0.7193450927734375, 0.741607666015625, 0.7638702392578125, 0.7861328125]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 1.0, 3.0, 10.0, 8.0, 9.0, 20.0, 52.0, 300.0, 3549.0, 79.0, 25.0, 9.0, 7.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.19140625, -0.18317031860351562, -0.17493438720703125, -0.16669845581054688, -0.1584625244140625, -0.15022659301757812, -0.14199066162109375, -0.13375473022460938, -0.125518798828125, -0.11728286743164062, -0.10904693603515625, -0.10081100463867188, -0.0925750732421875, -0.08433914184570312, -0.07610321044921875, -0.06786727905273438, -0.05963134765625, -0.051395416259765625, -0.04315948486328125, -0.034923553466796875, -0.0266876220703125, -0.018451690673828125, -0.01021575927734375, -0.001979827880859375, 0.006256103515625, 0.014492034912109375, 0.02272796630859375, 0.030963897705078125, 0.0391998291015625, 0.047435760498046875, 0.05567169189453125, 0.06390762329101562, 0.0721435546875, 0.08037948608398438, 0.08861541748046875, 0.09685134887695312, 0.1050872802734375, 0.11332321166992188, 0.12155914306640625, 0.12979507446289062, 0.138031005859375, 0.14626693725585938, 0.15450286865234375, 0.16273880004882812, 0.1709747314453125, 0.17921066284179688, 0.18744659423828125, 0.19568252563476562, 0.20391845703125, 0.21215438842773438, 0.22039031982421875, 0.22862625122070312, 0.2368621826171875, 0.24509811401367188, 0.25333404541015625, 0.2615699768066406, 0.269805908203125, 0.2780418395996094, 0.28627777099609375, 0.2945137023925781, 0.3027496337890625, 0.3109855651855469, 0.31922149658203125, 0.3274574279785156, 0.335693359375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 26.0, 48.0, 203.0, 398.0, 253.0, 62.0, 14.0, 6.0], "bins": [-2.903275728225708, -2.854921340942383, -2.8065667152404785, -2.7582123279571533, -2.709857702255249, -2.661503314971924, -2.6131486892700195, -2.5647943019866943, -2.516439914703369, -2.468085527420044, -2.4197309017181396, -2.3713765144348145, -2.32302188873291, -2.274667501449585, -2.2263131141662598, -2.1779584884643555, -2.129603862762451, -2.081249475479126, -2.0328948497772217, -1.9845404624938965, -1.9361859560012817, -1.887831449508667, -1.8394769430160522, -1.7911224365234375, -1.7427680492401123, -1.6944135427474976, -1.6460590362548828, -1.5977046489715576, -1.5493501424789429, -1.5009956359863281, -1.4526411294937134, -1.4042866230010986, -1.3559321165084839, -1.3075776100158691, -1.2592231035232544, -1.2108685970306396, -1.1625142097473145, -1.1141597032546997, -1.065805196762085, -1.0174506902694702, -0.9690961837768555, -0.9207416772842407, -0.8723872303962708, -0.824032723903656, -0.7756782174110413, -0.7273237705230713, -0.6789692640304565, -0.6306147575378418, -0.582260251045227, -0.5339057445526123, -0.48555126786231995, -0.4371967911720276, -0.38884228467941284, -0.3404878079891205, -0.2921333312988281, -0.24377882480621338, -0.19542436301708221, -0.14706987142562866, -0.0987153872847557, -0.05036090314388275, -0.0020064115524291992, 0.04634808003902435, 0.09470255672931671, 0.14305706322193146, 0.19141153991222382]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 2.0, 4.0, 3.0, 8.0, 8.0, 13.0, 17.0, 30.0, 25.0, 23.0, 23.0, 33.0, 27.0, 37.0, 46.0, 54.0, 47.0, 42.0, 53.0, 47.0, 46.0, 47.0, 44.0, 29.0, 39.0, 33.0, 38.0, 35.0, 19.0, 25.0, 24.0, 13.0, 19.0, 14.0, 14.0, 11.0, 3.0, 4.0, 5.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.38607078790664673, -0.37245360016822815, -0.3588363826274872, -0.3452191948890686, -0.33160200715065, -0.31798481941223145, -0.3043676018714905, -0.2907504141330719, -0.2771332263946533, -0.26351603865623474, -0.24989883601665497, -0.2362816333770752, -0.22266444563865662, -0.20904724299907684, -0.19543004035949707, -0.1818128526210785, -0.16819563508033752, -0.15457843244075775, -0.14096124470233917, -0.1273440420627594, -0.11372684687376022, -0.10010965168476105, -0.08649244904518127, -0.0728752538561821, -0.05925805866718292, -0.045640863478183746, -0.03202366456389427, -0.018406465649604797, -0.004789270460605621, 0.008827924728393555, 0.022445127367973328, 0.036062322556972504, 0.04967951774597168, 0.06329671293497086, 0.07691390812397003, 0.0905311107635498, 0.10414830595254898, 0.11776550114154816, 0.13138270378112793, 0.1449998915195465, 0.15861709415912628, 0.17223429679870605, 0.18585148453712463, 0.1994686871767044, 0.21308588981628418, 0.22670307755470276, 0.24032028019428253, 0.2539374828338623, 0.2675546705722809, 0.28117185831069946, 0.29478907585144043, 0.308406263589859, 0.3220234513282776, 0.33564066886901855, 0.34925785660743713, 0.3628750443458557, 0.3764922618865967, 0.39010944962501526, 0.4037266671657562, 0.4173438549041748, 0.4309610426425934, 0.44457823038101196, 0.45819544792175293, 0.4718126356601715, 0.4854298233985901]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 3.0, 6.0, 4.0, 7.0, 5.0, 6.0, 12.0, 15.0, 24.0, 37.0, 38.0, 68.0, 115.0, 165.0, 286.0, 545.0, 1127.0, 2714.0, 7118.0, 22697.0, 85171.0, 302283.0, 417501.0, 150499.0, 39464.0, 11441.0, 3966.0, 1542.0, 703.0, 387.0, 223.0, 142.0, 83.0, 53.0, 36.0, 26.0, 21.0, 10.0, 3.0, 10.0, 4.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.7021484375, -0.6837730407714844, -0.6653976440429688, -0.6470222473144531, -0.6286468505859375, -0.6102714538574219, -0.5918960571289062, -0.5735206604003906, -0.555145263671875, -0.5367698669433594, -0.5183944702148438, -0.5000190734863281, -0.4816436767578125, -0.4632682800292969, -0.44489288330078125, -0.4265174865722656, -0.40814208984375, -0.3897666931152344, -0.37139129638671875, -0.3530158996582031, -0.3346405029296875, -0.3162651062011719, -0.29788970947265625, -0.2795143127441406, -0.261138916015625, -0.24276351928710938, -0.22438812255859375, -0.20601272583007812, -0.1876373291015625, -0.16926193237304688, -0.15088653564453125, -0.13251113891601562, -0.1141357421875, -0.09576034545898438, -0.07738494873046875, -0.059009552001953125, -0.0406341552734375, -0.022258758544921875, -0.00388336181640625, 0.014492034912109375, 0.032867431640625, 0.051242828369140625, 0.06961822509765625, 0.08799362182617188, 0.1063690185546875, 0.12474441528320312, 0.14311981201171875, 0.16149520874023438, 0.17987060546875, 0.19824600219726562, 0.21662139892578125, 0.23499679565429688, 0.2533721923828125, 0.2717475891113281, 0.29012298583984375, 0.3084983825683594, 0.326873779296875, 0.3452491760253906, 0.36362457275390625, 0.3819999694824219, 0.4003753662109375, 0.4187507629394531, 0.43712615966796875, 0.4555015563964844, 0.473876953125]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 2.0, 6.0, 5.0, 6.0, 7.0, 6.0, 7.0, 18.0, 27.0, 19.0, 29.0, 36.0, 27.0, 37.0, 48.0, 39.0, 25.0, 52.0, 68.0, 52.0, 51.0, 48.0, 42.0, 39.0, 56.0, 39.0, 33.0, 26.0, 25.0, 24.0, 19.0, 14.0, 15.0, 13.0, 9.0, 10.0, 4.0, 9.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.247802734375, -0.2404937744140625, -0.233184814453125, -0.2258758544921875, -0.21856689453125, -0.2112579345703125, -0.203948974609375, -0.1966400146484375, -0.1893310546875, -0.1820220947265625, -0.174713134765625, -0.1674041748046875, -0.16009521484375, -0.1527862548828125, -0.145477294921875, -0.1381683349609375, -0.130859375, -0.1235504150390625, -0.116241455078125, -0.1089324951171875, -0.10162353515625, -0.0943145751953125, -0.087005615234375, -0.0796966552734375, -0.0723876953125, -0.0650787353515625, -0.057769775390625, -0.0504608154296875, -0.04315185546875, -0.0358428955078125, -0.028533935546875, -0.0212249755859375, -0.013916015625, -0.0066070556640625, 0.000701904296875, 0.0080108642578125, 0.01531982421875, 0.0226287841796875, 0.029937744140625, 0.0372467041015625, 0.0445556640625, 0.0518646240234375, 0.059173583984375, 0.0664825439453125, 0.07379150390625, 0.0811004638671875, 0.088409423828125, 0.0957183837890625, 0.10302734375, 0.1103363037109375, 0.117645263671875, 0.1249542236328125, 0.13226318359375, 0.1395721435546875, 0.146881103515625, 0.1541900634765625, 0.1614990234375, 0.1688079833984375, 0.176116943359375, 0.1834259033203125, 0.19073486328125, 0.1980438232421875, 0.205352783203125, 0.2126617431640625, 0.219970703125]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 0.0, 5.0, 7.0, 8.0, 9.0, 18.0, 25.0, 24.0, 66.0, 81.0, 115.0, 200.0, 346.0, 660.0, 1438.0, 5201.0, 33276.0, 480513.0, 484911.0, 33321.0, 5328.0, 1477.0, 626.0, 322.0, 186.0, 127.0, 81.0, 60.0, 44.0, 26.0, 17.0, 14.0, 9.0, 12.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9404296875, -0.9068450927734375, -0.873260498046875, -0.8396759033203125, -0.80609130859375, -0.7725067138671875, -0.738922119140625, -0.7053375244140625, -0.6717529296875, -0.6381683349609375, -0.604583740234375, -0.5709991455078125, -0.53741455078125, -0.5038299560546875, -0.470245361328125, -0.4366607666015625, -0.403076171875, -0.3694915771484375, -0.335906982421875, -0.3023223876953125, -0.26873779296875, -0.2351531982421875, -0.201568603515625, -0.1679840087890625, -0.1343994140625, -0.1008148193359375, -0.067230224609375, -0.0336456298828125, -6.103515625e-05, 0.0335235595703125, 0.067108154296875, 0.1006927490234375, 0.13427734375, 0.1678619384765625, 0.201446533203125, 0.2350311279296875, 0.26861572265625, 0.3022003173828125, 0.335784912109375, 0.3693695068359375, 0.4029541015625, 0.4365386962890625, 0.470123291015625, 0.5037078857421875, 0.53729248046875, 0.5708770751953125, 0.604461669921875, 0.6380462646484375, 0.671630859375, 0.7052154541015625, 0.738800048828125, 0.7723846435546875, 0.80596923828125, 0.8395538330078125, 0.873138427734375, 0.9067230224609375, 0.9403076171875, 0.9738922119140625, 1.007476806640625, 1.0410614013671875, 1.07464599609375, 1.1082305908203125, 1.141815185546875, 1.1753997802734375, 1.208984375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 4.0, 6.0, 16.0, 11.0, 15.0, 36.0, 38.0, 43.0, 53.0, 74.0, 65.0, 85.0, 88.0, 100.0, 76.0, 73.0, 55.0, 42.0, 37.0, 30.0, 21.0, 15.0, 11.0, 5.0, 5.0, 4.0, 4.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.2294921875, -1.1663970947265625, -1.103302001953125, -1.0402069091796875, -0.97711181640625, -0.9140167236328125, -0.850921630859375, -0.7878265380859375, -0.7247314453125, -0.6616363525390625, -0.598541259765625, -0.5354461669921875, -0.47235107421875, -0.4092559814453125, -0.346160888671875, -0.2830657958984375, -0.219970703125, -0.1568756103515625, -0.093780517578125, -0.0306854248046875, 0.03240966796875, 0.0955047607421875, 0.158599853515625, 0.2216949462890625, 0.2847900390625, 0.3478851318359375, 0.410980224609375, 0.4740753173828125, 0.53717041015625, 0.6002655029296875, 0.663360595703125, 0.7264556884765625, 0.78955078125, 0.8526458740234375, 0.915740966796875, 0.9788360595703125, 1.04193115234375, 1.1050262451171875, 1.168121337890625, 1.2312164306640625, 1.2943115234375, 1.3574066162109375, 1.420501708984375, 1.4835968017578125, 1.54669189453125, 1.6097869873046875, 1.672882080078125, 1.7359771728515625, 1.799072265625, 1.8621673583984375, 1.925262451171875, 1.9883575439453125, 2.05145263671875, 2.1145477294921875, 2.177642822265625, 2.2407379150390625, 2.3038330078125, 2.3669281005859375, 2.430023193359375, 2.4931182861328125, 2.55621337890625, 2.6193084716796875, 2.682403564453125, 2.7454986572265625, 2.80859375]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 2.0, 0.0, 6.0, 6.0, 8.0, 15.0, 13.0, 26.0, 40.0, 76.0, 122.0, 244.0, 555.0, 1626.0, 7312.0, 1023735.0, 11379.0, 2040.0, 671.0, 315.0, 172.0, 82.0, 53.0, 20.0, 16.0, 13.0, 4.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.2890625, -2.192047119140625, -2.09503173828125, -1.998016357421875, -1.9010009765625, -1.803985595703125, -1.70697021484375, -1.609954833984375, -1.512939453125, -1.415924072265625, -1.31890869140625, -1.221893310546875, -1.1248779296875, -1.027862548828125, -0.93084716796875, -0.833831787109375, -0.73681640625, -0.639801025390625, -0.54278564453125, -0.445770263671875, -0.3487548828125, -0.251739501953125, -0.15472412109375, -0.057708740234375, 0.039306640625, 0.136322021484375, 0.23333740234375, 0.330352783203125, 0.4273681640625, 0.524383544921875, 0.62139892578125, 0.718414306640625, 0.8154296875, 0.912445068359375, 1.00946044921875, 1.106475830078125, 1.2034912109375, 1.300506591796875, 1.39752197265625, 1.494537353515625, 1.591552734375, 1.688568115234375, 1.78558349609375, 1.882598876953125, 1.9796142578125, 2.076629638671875, 2.17364501953125, 2.270660400390625, 2.36767578125, 2.464691162109375, 2.56170654296875, 2.658721923828125, 2.7557373046875, 2.852752685546875, 2.94976806640625, 3.046783447265625, 3.143798828125, 3.240814208984375, 3.33782958984375, 3.434844970703125, 3.5318603515625, 3.628875732421875, 3.72589111328125, 3.822906494140625, 3.919921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 9.0, 14.0, 24.0, 42.0, 77.0, 128.0, 130.0, 155.0, 153.0, 98.0, 60.0, 39.0, 36.0, 13.0, 8.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 6.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.00018322467803955078, -0.00017868075519800186, -0.00017413683235645294, -0.00016959290951490402, -0.0001650489866733551, -0.00016050506383180618, -0.00015596114099025726, -0.00015141721814870834, -0.00014687329530715942, -0.0001423293724656105, -0.00013778544962406158, -0.00013324152678251266, -0.00012869760394096375, -0.00012415368109941483, -0.0001196097582578659, -0.00011506583541631699, -0.00011052191257476807, -0.00010597798973321915, -0.00010143406689167023, -9.689014405012131e-05, -9.234622120857239e-05, -8.780229836702347e-05, -8.325837552547455e-05, -7.871445268392563e-05, -7.417052984237671e-05, -6.962660700082779e-05, -6.508268415927887e-05, -6.053876131772995e-05, -5.599483847618103e-05, -5.145091563463211e-05, -4.690699279308319e-05, -4.236306995153427e-05, -3.781914710998535e-05, -3.327522426843643e-05, -2.8731301426887512e-05, -2.4187378585338593e-05, -1.9643455743789673e-05, -1.5099532902240753e-05, -1.0555610060691833e-05, -6.011687219142914e-06, -1.4677643775939941e-06, 3.0761584639549255e-06, 7.620081305503845e-06, 1.2164004147052765e-05, 1.6707926988601685e-05, 2.1251849830150604e-05, 2.5795772671699524e-05, 3.0339695513248444e-05, 3.488361835479736e-05, 3.942754119634628e-05, 4.39714640378952e-05, 4.851538687944412e-05, 5.305930972099304e-05, 5.760323256254196e-05, 6.214715540409088e-05, 6.66910782456398e-05, 7.123500108718872e-05, 7.577892392873764e-05, 8.032284677028656e-05, 8.486676961183548e-05, 8.94106924533844e-05, 9.395461529493332e-05, 9.849853813648224e-05, 0.00010304246097803116, 0.00010758638381958008]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 2.0, 4.0, 3.0, 6.0, 4.0, 3.0, 12.0, 16.0, 20.0, 21.0, 45.0, 70.0, 128.0, 337.0, 936.0, 2912.0, 14481.0, 990668.0, 32881.0, 3948.0, 1239.0, 405.0, 176.0, 98.0, 50.0, 37.0, 12.0, 13.0, 7.0, 9.0, 6.0, 6.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.34375, -1.29986572265625, -1.2559814453125, -1.21209716796875, -1.168212890625, -1.12432861328125, -1.0804443359375, -1.03656005859375, -0.99267578125, -0.94879150390625, -0.9049072265625, -0.86102294921875, -0.817138671875, -0.77325439453125, -0.7293701171875, -0.68548583984375, -0.6416015625, -0.59771728515625, -0.5538330078125, -0.50994873046875, -0.466064453125, -0.42218017578125, -0.3782958984375, -0.33441162109375, -0.29052734375, -0.24664306640625, -0.2027587890625, -0.15887451171875, -0.114990234375, -0.07110595703125, -0.0272216796875, 0.01666259765625, 0.060546875, 0.10443115234375, 0.1483154296875, 0.19219970703125, 0.236083984375, 0.27996826171875, 0.3238525390625, 0.36773681640625, 0.41162109375, 0.45550537109375, 0.4993896484375, 0.54327392578125, 0.587158203125, 0.63104248046875, 0.6749267578125, 0.71881103515625, 0.7626953125, 0.80657958984375, 0.8504638671875, 0.89434814453125, 0.938232421875, 0.98211669921875, 1.0260009765625, 1.06988525390625, 1.11376953125, 1.15765380859375, 1.2015380859375, 1.24542236328125, 1.289306640625, 1.33319091796875, 1.3770751953125, 1.42095947265625, 1.46484375]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 4.0, 10.0, 33.0, 146.0, 455.0, 250.0, 62.0, 17.0, 4.0, 2.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0], "bins": [-2.69140625, -2.6235504150390625, -2.555694580078125, -2.4878387451171875, -2.41998291015625, -2.3521270751953125, -2.284271240234375, -2.2164154052734375, -2.1485595703125, -2.0807037353515625, -2.012847900390625, -1.9449920654296875, -1.87713623046875, -1.8092803955078125, -1.741424560546875, -1.6735687255859375, -1.605712890625, -1.5378570556640625, -1.470001220703125, -1.4021453857421875, -1.33428955078125, -1.2664337158203125, -1.198577880859375, -1.1307220458984375, -1.0628662109375, -0.9950103759765625, -0.927154541015625, -0.8592987060546875, -0.79144287109375, -0.7235870361328125, -0.655731201171875, -0.5878753662109375, -0.52001953125, -0.4521636962890625, -0.384307861328125, -0.3164520263671875, -0.24859619140625, -0.1807403564453125, -0.112884521484375, -0.0450286865234375, 0.0228271484375, 0.0906829833984375, 0.158538818359375, 0.2263946533203125, 0.29425048828125, 0.3621063232421875, 0.429962158203125, 0.4978179931640625, 0.565673828125, 0.6335296630859375, 0.701385498046875, 0.7692413330078125, 0.83709716796875, 0.9049530029296875, 0.972808837890625, 1.0406646728515625, 1.1085205078125, 1.1763763427734375, 1.244232177734375, 1.3120880126953125, 1.37994384765625, 1.4477996826171875, 1.515655517578125, 1.5835113525390625, 1.6513671875]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 8.0, 6.0, 7.0, 18.0, 29.0, 54.0, 122.0, 232.0, 253.0, 167.0, 61.0, 25.0, 15.0, 7.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.37656021118164, -17.87976837158203, -17.38297462463379, -16.88618278503418, -16.38939094543457, -15.892597198486328, -15.395805358886719, -14.899012565612793, -14.402219772338867, -13.905426979064941, -13.408635139465332, -12.911842346191406, -12.41504955291748, -11.918256759643555, -11.421464920043945, -10.92467212677002, -10.42788028717041, -9.931087493896484, -9.434295654296875, -8.93750286102295, -8.440710067749023, -7.943917751312256, -7.447125434875488, -6.9503326416015625, -6.453540325164795, -5.956748008728027, -5.459955215454102, -4.963162899017334, -4.466370582580566, -3.9695777893066406, -3.472785472869873, -2.9759929180145264, -2.4792003631591797, -1.982407808303833, -1.4856153726577759, -0.9888229370117188, -0.49203038215637207, 0.004762172698974609, 0.5015544891357422, 0.9983470439910889, 1.4951395988464355, 1.9919321537017822, 2.488724708557129, 2.9855170249938965, 3.482309579849243, 3.97910213470459, 4.475894451141357, 4.972686767578125, 5.469479560852051, 5.966271877288818, 6.463064670562744, 6.959856986999512, 7.4566497802734375, 7.953442096710205, 8.450234413146973, 8.947027206420898, 9.443819046020508, 9.940611839294434, 10.437403678894043, 10.934196472167969, 11.430989265441895, 11.92778205871582, 12.42457389831543, 12.921366691589355, 13.418159484863281]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 4.0, 6.0, 3.0, 5.0, 7.0, 10.0, 8.0, 11.0, 17.0, 19.0, 23.0, 22.0, 35.0, 21.0, 38.0, 22.0, 36.0, 43.0, 39.0, 54.0, 47.0, 59.0, 53.0, 49.0, 41.0, 45.0, 40.0, 31.0, 32.0, 40.0, 22.0, 16.0, 26.0, 17.0, 14.0, 12.0, 6.0, 8.0, 9.0, 9.0, 4.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.689866065979004, -7.4596943855285645, -7.229522705078125, -6.9993510246276855, -6.769179344177246, -6.539007663726807, -6.308835983276367, -6.0786638259887695, -5.848492622375488, -5.618320941925049, -5.388149261474609, -5.15797758102417, -4.9278059005737305, -4.697634220123291, -4.467462539672852, -4.237290382385254, -4.0071187019348145, -3.776947021484375, -3.5467753410339355, -3.316603660583496, -3.0864319801330566, -2.856260299682617, -2.6260883808135986, -2.395916700363159, -2.1657450199127197, -1.9355733394622803, -1.7054016590118408, -1.4752298593521118, -1.2450581789016724, -1.014886498451233, -0.7847146987915039, -0.5545430183410645, -0.324371337890625, -0.09419962763786316, 0.13597208261489868, 0.3661438226699829, 0.5963155031204224, 0.8264871835708618, 1.0566589832305908, 1.2868306636810303, 1.5170023441314697, 1.7471740245819092, 1.9773457050323486, 2.207517623901367, 2.4376893043518066, 2.667860984802246, 2.8980326652526855, 3.128204345703125, 3.3583760261535645, 3.588547706604004, 3.8187193870544434, 4.048891067504883, 4.279062747955322, 4.509234428405762, 4.739406585693359, 4.969577789306641, 5.199749946594238, 5.429921627044678, 5.660093307495117, 5.890264987945557, 6.120436668395996, 6.3506083488464355, 6.580780029296875, 6.810952186584473, 7.041123390197754]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 3.0, 5.0, 4.0, 3.0, 8.0, 9.0, 12.0, 13.0, 17.0, 28.0, 51.0, 77.0, 111.0, 169.0, 278.0, 539.0, 1393.0, 5685.0, 81739.0, 4080224.0, 19353.0, 2770.0, 886.0, 343.0, 196.0, 121.0, 87.0, 58.0, 33.0, 20.0, 11.0, 12.0, 10.0, 5.0, 3.0, 7.0, 1.0, 2.0, 0.0, 1.0], "bins": [-2.123046875, -2.0739898681640625, -2.024932861328125, -1.9758758544921875, -1.92681884765625, -1.8777618408203125, -1.828704833984375, -1.7796478271484375, -1.7305908203125, -1.6815338134765625, -1.632476806640625, -1.5834197998046875, -1.53436279296875, -1.4853057861328125, -1.436248779296875, -1.3871917724609375, -1.338134765625, -1.2890777587890625, -1.240020751953125, -1.1909637451171875, -1.14190673828125, -1.0928497314453125, -1.043792724609375, -0.9947357177734375, -0.9456787109375, -0.8966217041015625, -0.847564697265625, -0.7985076904296875, -0.74945068359375, -0.7003936767578125, -0.651336669921875, -0.6022796630859375, -0.55322265625, -0.5041656494140625, -0.455108642578125, -0.4060516357421875, -0.35699462890625, -0.3079376220703125, -0.258880615234375, -0.2098236083984375, -0.1607666015625, -0.1117095947265625, -0.062652587890625, -0.0135955810546875, 0.03546142578125, 0.0845184326171875, 0.133575439453125, 0.1826324462890625, 0.231689453125, 0.2807464599609375, 0.329803466796875, 0.3788604736328125, 0.42791748046875, 0.4769744873046875, 0.526031494140625, 0.5750885009765625, 0.6241455078125, 0.6732025146484375, 0.722259521484375, 0.7713165283203125, 0.82037353515625, 0.8694305419921875, 0.918487548828125, 0.9675445556640625, 1.0166015625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 7.0, 5.0, 11.0, 10.0, 21.0, 28.0, 22.0, 36.0, 43.0, 53.0, 52.0, 73.0, 79.0, 80.0, 60.0, 60.0, 65.0, 66.0, 54.0, 34.0, 29.0, 38.0, 20.0, 19.0, 20.0, 5.0, 5.0, 0.0, 5.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.50048828125, -0.48819732666015625, -0.4759063720703125, -0.46361541748046875, -0.451324462890625, -0.43903350830078125, -0.4267425537109375, -0.41445159912109375, -0.40216064453125, -0.38986968994140625, -0.3775787353515625, -0.36528778076171875, -0.352996826171875, -0.34070587158203125, -0.3284149169921875, -0.31612396240234375, -0.3038330078125, -0.29154205322265625, -0.2792510986328125, -0.26696014404296875, -0.254669189453125, -0.24237823486328125, -0.2300872802734375, -0.21779632568359375, -0.20550537109375, -0.19321441650390625, -0.1809234619140625, -0.16863250732421875, -0.156341552734375, -0.14405059814453125, -0.1317596435546875, -0.11946868896484375, -0.107177734375, -0.09488677978515625, -0.0825958251953125, -0.07030487060546875, -0.058013916015625, -0.04572296142578125, -0.0334320068359375, -0.02114105224609375, -0.00885009765625, 0.00344085693359375, 0.0157318115234375, 0.02802276611328125, 0.040313720703125, 0.05260467529296875, 0.0648956298828125, 0.07718658447265625, 0.0894775390625, 0.10176849365234375, 0.1140594482421875, 0.12635040283203125, 0.138641357421875, 0.15093231201171875, 0.1632232666015625, 0.17551422119140625, 0.18780517578125, 0.20009613037109375, 0.2123870849609375, 0.22467803955078125, 0.236968994140625, 0.24925994873046875, 0.2615509033203125, 0.27384185791015625, 0.2861328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 3.0, 8.0, 3.0, 9.0, 12.0, 10.0, 13.0, 12.0, 25.0, 28.0, 33.0, 46.0, 82.0, 64.0, 112.0, 145.0, 262.0, 422.0, 1138.0, 3908.0, 29265.0, 4077301.0, 72240.0, 6045.0, 1547.0, 576.0, 291.0, 165.0, 110.0, 103.0, 81.0, 52.0, 47.0, 34.0, 23.0, 14.0, 14.0, 11.0, 10.0, 2.0, 5.0, 4.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.501953125, -1.4559326171875, -1.409912109375, -1.3638916015625, -1.31787109375, -1.2718505859375, -1.225830078125, -1.1798095703125, -1.1337890625, -1.0877685546875, -1.041748046875, -0.9957275390625, -0.94970703125, -0.9036865234375, -0.857666015625, -0.8116455078125, -0.765625, -0.7196044921875, -0.673583984375, -0.6275634765625, -0.58154296875, -0.5355224609375, -0.489501953125, -0.4434814453125, -0.3974609375, -0.3514404296875, -0.305419921875, -0.2593994140625, -0.21337890625, -0.1673583984375, -0.121337890625, -0.0753173828125, -0.029296875, 0.0167236328125, 0.062744140625, 0.1087646484375, 0.15478515625, 0.2008056640625, 0.246826171875, 0.2928466796875, 0.3388671875, 0.3848876953125, 0.430908203125, 0.4769287109375, 0.52294921875, 0.5689697265625, 0.614990234375, 0.6610107421875, 0.70703125, 0.7530517578125, 0.799072265625, 0.8450927734375, 0.89111328125, 0.9371337890625, 0.983154296875, 1.0291748046875, 1.0751953125, 1.1212158203125, 1.167236328125, 1.2132568359375, 1.25927734375, 1.3052978515625, 1.351318359375, 1.3973388671875, 1.443359375]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 5.0, 6.0, 23.0, 40.0, 164.0, 3538.0, 203.0, 62.0, 17.0, 13.0, 3.0, 2.0, 1.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.64501953125, -0.6305389404296875, -0.616058349609375, -0.6015777587890625, -0.58709716796875, -0.5726165771484375, -0.558135986328125, -0.5436553955078125, -0.5291748046875, -0.5146942138671875, -0.500213623046875, -0.4857330322265625, -0.47125244140625, -0.4567718505859375, -0.442291259765625, -0.4278106689453125, -0.413330078125, -0.3988494873046875, -0.384368896484375, -0.3698883056640625, -0.35540771484375, -0.3409271240234375, -0.326446533203125, -0.3119659423828125, -0.2974853515625, -0.2830047607421875, -0.268524169921875, -0.2540435791015625, -0.23956298828125, -0.2250823974609375, -0.210601806640625, -0.1961212158203125, -0.181640625, -0.1671600341796875, -0.152679443359375, -0.1381988525390625, -0.12371826171875, -0.1092376708984375, -0.094757080078125, -0.0802764892578125, -0.0657958984375, -0.0513153076171875, -0.036834716796875, -0.0223541259765625, -0.00787353515625, 0.0066070556640625, 0.021087646484375, 0.0355682373046875, 0.050048828125, 0.0645294189453125, 0.079010009765625, 0.0934906005859375, 0.10797119140625, 0.1224517822265625, 0.136932373046875, 0.1514129638671875, 0.1658935546875, 0.1803741455078125, 0.194854736328125, 0.2093353271484375, 0.22381591796875, 0.2382965087890625, 0.252777099609375, 0.2672576904296875, 0.28173828125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 4.0, 6.0, 10.0, 18.0, 33.0, 42.0, 95.0, 106.0, 157.0, 157.0, 120.0, 106.0, 60.0, 41.0, 21.0, 9.0, 4.0, 4.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7045127153396606, -0.6737846732139587, -0.6430566310882568, -0.6123285889625549, -0.581600546836853, -0.5508725047111511, -0.5201444625854492, -0.4894164204597473, -0.4586883783340454, -0.4279603362083435, -0.3972322940826416, -0.3665042519569397, -0.3357762098312378, -0.3050481677055359, -0.274320125579834, -0.24359209835529327, -0.21286407113075256, -0.18213602900505066, -0.15140798687934875, -0.12067995220422745, -0.08995191007852554, -0.059223875403404236, -0.02849583327770233, 0.0022322088479995728, 0.03296025097370148, 0.06368829309940338, 0.09441633522510529, 0.125144362449646, 0.1558724045753479, 0.1866004467010498, 0.2173284888267517, 0.2480565309524536, 0.2787845730781555, 0.3095126152038574, 0.3402406573295593, 0.37096869945526123, 0.40169674158096313, 0.43242478370666504, 0.46315282583236694, 0.49388086795806885, 0.5246089100837708, 0.5553369522094727, 0.5860649943351746, 0.6167930364608765, 0.6475210785865784, 0.6782491207122803, 0.7089771628379822, 0.7397052049636841, 0.7704331874847412, 0.8011612296104431, 0.831889271736145, 0.8626173138618469, 0.8933453559875488, 0.9240733981132507, 0.9548014402389526, 0.9855294823646545, 1.0162575244903564, 1.0469855070114136, 1.0777136087417603, 1.1084415912628174, 1.139169692993164, 1.1698976755142212, 1.2006257772445679, 1.231353759765625, 1.2620818614959717]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 4.0, 3.0, 8.0, 9.0, 10.0, 12.0, 17.0, 33.0, 32.0, 38.0, 40.0, 48.0, 41.0, 58.0, 69.0, 52.0, 60.0, 61.0, 62.0, 56.0, 53.0, 48.0, 32.0, 39.0, 25.0, 23.0, 18.0, 12.0, 10.0, 10.0, 8.0, 5.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6715912818908691, -0.6507554650306702, -0.6299196481704712, -0.6090837717056274, -0.5882479548454285, -0.5674121379852295, -0.5465763211250305, -0.5257405042648315, -0.5049046277999878, -0.4840688109397888, -0.46323296427726746, -0.4423971474170685, -0.4215613007545471, -0.40072548389434814, -0.37988966703414917, -0.3590538501739502, -0.3382180333137512, -0.31738221645355225, -0.2965463697910309, -0.2757105529308319, -0.25487470626831055, -0.23403888940811157, -0.2132030725479126, -0.19236724078655243, -0.17153140902519226, -0.1506955772638321, -0.12985974550247192, -0.10902392864227295, -0.08818809688091278, -0.06735226511955261, -0.04651644825935364, -0.02568061649799347, -0.004844784736633301, 0.01599104329943657, 0.03682687133550644, 0.05766269564628601, 0.07849852740764618, 0.09933435916900635, 0.12017017602920532, 0.1410060077905655, 0.16184183955192566, 0.18267767131328583, 0.203513503074646, 0.22434931993484497, 0.24518515169620514, 0.2660209834575653, 0.2868568003177643, 0.30769264698028564, 0.3285284638404846, 0.3493642807006836, 0.37020012736320496, 0.39103594422340393, 0.4118717908859253, 0.43270760774612427, 0.45354342460632324, 0.4743792414665222, 0.4952150881290436, 0.5160509347915649, 0.5368867516517639, 0.5577225685119629, 0.5785583853721619, 0.5993942022323608, 0.6202300786972046, 0.6410658955574036, 0.6619017124176025]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 4.0, 7.0, 5.0, 5.0, 15.0, 14.0, 27.0, 41.0, 46.0, 80.0, 164.0, 275.0, 545.0, 1187.0, 3129.0, 9049.0, 32375.0, 133255.0, 439668.0, 318331.0, 79715.0, 20373.0, 6154.0, 2185.0, 907.0, 404.0, 224.0, 144.0, 78.0, 50.0, 34.0, 19.0, 15.0, 11.0, 8.0, 4.0, 5.0, 3.0, 5.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.62548828125, -0.6045150756835938, -0.5835418701171875, -0.5625686645507812, -0.541595458984375, -0.5206222534179688, -0.4996490478515625, -0.47867584228515625, -0.45770263671875, -0.43672943115234375, -0.4157562255859375, -0.39478302001953125, -0.373809814453125, -0.35283660888671875, -0.3318634033203125, -0.31089019775390625, -0.2899169921875, -0.26894378662109375, -0.2479705810546875, -0.22699737548828125, -0.206024169921875, -0.18505096435546875, -0.1640777587890625, -0.14310455322265625, -0.12213134765625, -0.10115814208984375, -0.0801849365234375, -0.05921173095703125, -0.038238525390625, -0.01726531982421875, 0.0037078857421875, 0.02468109130859375, 0.045654296875, 0.06662750244140625, 0.0876007080078125, 0.10857391357421875, 0.129547119140625, 0.15052032470703125, 0.1714935302734375, 0.19246673583984375, 0.21343994140625, 0.23441314697265625, 0.2553863525390625, 0.27635955810546875, 0.297332763671875, 0.31830596923828125, 0.3392791748046875, 0.36025238037109375, 0.3812255859375, 0.40219879150390625, 0.4231719970703125, 0.44414520263671875, 0.465118408203125, 0.48609161376953125, 0.5070648193359375, 0.5280380249023438, 0.54901123046875, 0.5699844360351562, 0.5909576416015625, 0.6119308471679688, 0.632904052734375, 0.6538772583007812, 0.6748504638671875, 0.6958236694335938, 0.716796875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 9.0, 6.0, 4.0, 7.0, 7.0, 19.0, 32.0, 28.0, 47.0, 46.0, 51.0, 46.0, 65.0, 74.0, 69.0, 64.0, 61.0, 73.0, 46.0, 46.0, 59.0, 22.0, 34.0, 21.0, 18.0, 20.0, 12.0, 5.0, 4.0, 6.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.484375, -0.4725074768066406, -0.46063995361328125, -0.4487724304199219, -0.4369049072265625, -0.4250373840332031, -0.41316986083984375, -0.4013023376464844, -0.389434814453125, -0.3775672912597656, -0.36569976806640625, -0.3538322448730469, -0.3419647216796875, -0.3300971984863281, -0.31822967529296875, -0.3063621520996094, -0.29449462890625, -0.2826271057128906, -0.27075958251953125, -0.2588920593261719, -0.2470245361328125, -0.23515701293945312, -0.22328948974609375, -0.21142196655273438, -0.199554443359375, -0.18768692016601562, -0.17581939697265625, -0.16395187377929688, -0.1520843505859375, -0.14021682739257812, -0.12834930419921875, -0.11648178100585938, -0.1046142578125, -0.09274673461914062, -0.08087921142578125, -0.06901168823242188, -0.0571441650390625, -0.045276641845703125, -0.03340911865234375, -0.021541595458984375, -0.009674072265625, 0.002193450927734375, 0.01406097412109375, 0.025928497314453125, 0.0377960205078125, 0.049663543701171875, 0.06153106689453125, 0.07339859008789062, 0.08526611328125, 0.09713363647460938, 0.10900115966796875, 0.12086868286132812, 0.1327362060546875, 0.14460372924804688, 0.15647125244140625, 0.16833877563476562, 0.180206298828125, 0.19207382202148438, 0.20394134521484375, 0.21580886840820312, 0.2276763916015625, 0.23954391479492188, 0.25141143798828125, 0.2632789611816406, 0.275146484375]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 6.0, 8.0, 6.0, 7.0, 15.0, 29.0, 25.0, 41.0, 72.0, 115.0, 213.0, 446.0, 988.0, 2817.0, 12199.0, 137895.0, 821505.0, 60605.0, 7848.0, 2068.0, 789.0, 363.0, 184.0, 105.0, 63.0, 40.0, 37.0, 18.0, 17.0, 10.0, 7.0, 3.0, 5.0, 4.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.708984375, -1.6592559814453125, -1.609527587890625, -1.5597991943359375, -1.51007080078125, -1.4603424072265625, -1.410614013671875, -1.3608856201171875, -1.3111572265625, -1.2614288330078125, -1.211700439453125, -1.1619720458984375, -1.11224365234375, -1.0625152587890625, -1.012786865234375, -0.9630584716796875, -0.913330078125, -0.8636016845703125, -0.813873291015625, -0.7641448974609375, -0.71441650390625, -0.6646881103515625, -0.614959716796875, -0.5652313232421875, -0.5155029296875, -0.4657745361328125, -0.416046142578125, -0.3663177490234375, -0.31658935546875, -0.2668609619140625, -0.217132568359375, -0.1674041748046875, -0.11767578125, -0.0679473876953125, -0.018218994140625, 0.0315093994140625, 0.08123779296875, 0.1309661865234375, 0.180694580078125, 0.2304229736328125, 0.2801513671875, 0.3298797607421875, 0.379608154296875, 0.4293365478515625, 0.47906494140625, 0.5287933349609375, 0.578521728515625, 0.6282501220703125, 0.677978515625, 0.7277069091796875, 0.777435302734375, 0.8271636962890625, 0.87689208984375, 0.9266204833984375, 0.976348876953125, 1.0260772705078125, 1.0758056640625, 1.1255340576171875, 1.175262451171875, 1.2249908447265625, 1.27471923828125, 1.3244476318359375, 1.374176025390625, 1.4239044189453125, 1.4736328125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 6.0, 3.0, 6.0, 6.0, 10.0, 9.0, 10.0, 11.0, 18.0, 16.0, 28.0, 32.0, 25.0, 37.0, 26.0, 48.0, 42.0, 42.0, 54.0, 50.0, 39.0, 62.0, 51.0, 47.0, 50.0, 36.0, 36.0, 33.0, 34.0, 17.0, 22.0, 18.0, 9.0, 13.0, 15.0, 11.0, 14.0, 7.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.3671875, -1.325225830078125, -1.28326416015625, -1.241302490234375, -1.1993408203125, -1.157379150390625, -1.11541748046875, -1.073455810546875, -1.031494140625, -0.989532470703125, -0.94757080078125, -0.905609130859375, -0.8636474609375, -0.821685791015625, -0.77972412109375, -0.737762451171875, -0.69580078125, -0.653839111328125, -0.61187744140625, -0.569915771484375, -0.5279541015625, -0.485992431640625, -0.44403076171875, -0.402069091796875, -0.360107421875, -0.318145751953125, -0.27618408203125, -0.234222412109375, -0.1922607421875, -0.150299072265625, -0.10833740234375, -0.066375732421875, -0.0244140625, 0.017547607421875, 0.05950927734375, 0.101470947265625, 0.1434326171875, 0.185394287109375, 0.22735595703125, 0.269317626953125, 0.311279296875, 0.353240966796875, 0.39520263671875, 0.437164306640625, 0.4791259765625, 0.521087646484375, 0.56304931640625, 0.605010986328125, 0.64697265625, 0.688934326171875, 0.73089599609375, 0.772857666015625, 0.8148193359375, 0.856781005859375, 0.89874267578125, 0.940704345703125, 0.982666015625, 1.024627685546875, 1.06658935546875, 1.108551025390625, 1.1505126953125, 1.192474365234375, 1.23443603515625, 1.276397705078125, 1.318359375]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 6.0, 7.0, 13.0, 23.0, 35.0, 52.0, 91.0, 133.0, 232.0, 447.0, 1114.0, 4144.0, 37688.0, 950055.0, 47647.0, 4551.0, 1221.0, 503.0, 221.0, 120.0, 83.0, 59.0, 37.0, 24.0, 12.0, 15.0, 12.0, 3.0, 5.0, 3.0, 3.0, 0.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.240234375, -1.1951904296875, -1.150146484375, -1.1051025390625, -1.06005859375, -1.0150146484375, -0.969970703125, -0.9249267578125, -0.8798828125, -0.8348388671875, -0.789794921875, -0.7447509765625, -0.69970703125, -0.6546630859375, -0.609619140625, -0.5645751953125, -0.51953125, -0.4744873046875, -0.429443359375, -0.3843994140625, -0.33935546875, -0.2943115234375, -0.249267578125, -0.2042236328125, -0.1591796875, -0.1141357421875, -0.069091796875, -0.0240478515625, 0.02099609375, 0.0660400390625, 0.111083984375, 0.1561279296875, 0.201171875, 0.2462158203125, 0.291259765625, 0.3363037109375, 0.38134765625, 0.4263916015625, 0.471435546875, 0.5164794921875, 0.5615234375, 0.6065673828125, 0.651611328125, 0.6966552734375, 0.74169921875, 0.7867431640625, 0.831787109375, 0.8768310546875, 0.921875, 0.9669189453125, 1.011962890625, 1.0570068359375, 1.10205078125, 1.1470947265625, 1.192138671875, 1.2371826171875, 1.2822265625, 1.3272705078125, 1.372314453125, 1.4173583984375, 1.46240234375, 1.5074462890625, 1.552490234375, 1.5975341796875, 1.642578125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 4.0, 6.0, 5.0, 12.0, 30.0, 43.0, 100.0, 173.0, 188.0, 184.0, 119.0, 70.0, 32.0, 23.0, 12.0, 8.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018668174743652344, -0.00018173642456531525, -0.00017679110169410706, -0.00017184577882289886, -0.00016690045595169067, -0.00016195513308048248, -0.0001570098102092743, -0.0001520644873380661, -0.0001471191644668579, -0.00014217384159564972, -0.00013722851872444153, -0.00013228319585323334, -0.00012733787298202515, -0.00012239255011081696, -0.00011744722723960876, -0.00011250190436840057, -0.00010755658149719238, -0.00010261125862598419, -9.7665935754776e-05, -9.272061288356781e-05, -8.777529001235962e-05, -8.282996714115143e-05, -7.788464426994324e-05, -7.293932139873505e-05, -6.799399852752686e-05, -6.304867565631866e-05, -5.8103352785110474e-05, -5.315802991390228e-05, -4.821270704269409e-05, -4.32673841714859e-05, -3.832206130027771e-05, -3.337673842906952e-05, -2.8431415557861328e-05, -2.3486092686653137e-05, -1.8540769815444946e-05, -1.3595446944236755e-05, -8.650124073028564e-06, -3.7048012018203735e-06, 1.2405216693878174e-06, 6.185844540596008e-06, 1.11311674118042e-05, 1.607649028301239e-05, 2.102181315422058e-05, 2.5967136025428772e-05, 3.091245889663696e-05, 3.5857781767845154e-05, 4.0803104639053345e-05, 4.5748427510261536e-05, 5.0693750381469727e-05, 5.563907325267792e-05, 6.058439612388611e-05, 6.55297189950943e-05, 7.047504186630249e-05, 7.542036473751068e-05, 8.036568760871887e-05, 8.531101047992706e-05, 9.025633335113525e-05, 9.520165622234344e-05, 0.00010014697909355164, 0.00010509230196475983, 0.00011003762483596802, 0.00011498294770717621, 0.0001199282705783844, 0.0001248735934495926, 0.00012981891632080078]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 7.0, 3.0, 8.0, 11.0, 11.0, 21.0, 37.0, 64.0, 96.0, 193.0, 469.0, 1199.0, 4187.0, 31337.0, 890901.0, 109355.0, 7635.0, 1804.0, 602.0, 301.0, 138.0, 61.0, 35.0, 21.0, 13.0, 17.0, 9.0, 8.0, 6.0, 4.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0693359375, -1.03558349609375, -1.0018310546875, -0.96807861328125, -0.934326171875, -0.90057373046875, -0.8668212890625, -0.83306884765625, -0.79931640625, -0.76556396484375, -0.7318115234375, -0.69805908203125, -0.664306640625, -0.63055419921875, -0.5968017578125, -0.56304931640625, -0.529296875, -0.49554443359375, -0.4617919921875, -0.42803955078125, -0.394287109375, -0.36053466796875, -0.3267822265625, -0.29302978515625, -0.25927734375, -0.22552490234375, -0.1917724609375, -0.15802001953125, -0.124267578125, -0.09051513671875, -0.0567626953125, -0.02301025390625, 0.0107421875, 0.04449462890625, 0.0782470703125, 0.11199951171875, 0.145751953125, 0.17950439453125, 0.2132568359375, 0.24700927734375, 0.28076171875, 0.31451416015625, 0.3482666015625, 0.38201904296875, 0.415771484375, 0.44952392578125, 0.4832763671875, 0.51702880859375, 0.55078125, 0.58453369140625, 0.6182861328125, 0.65203857421875, 0.685791015625, 0.71954345703125, 0.7532958984375, 0.78704833984375, 0.82080078125, 0.85455322265625, 0.8883056640625, 0.92205810546875, 0.955810546875, 0.98956298828125, 1.0233154296875, 1.05706787109375, 1.0908203125]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 3.0, 3.0, 11.0, 14.0, 21.0, 17.0, 27.0, 58.0, 53.0, 111.0, 180.0, 148.0, 138.0, 75.0, 46.0, 25.0, 22.0, 12.0, 12.0, 8.0, 3.0, 7.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.0966796875, -1.0693130493164062, -1.0419464111328125, -1.0145797729492188, -0.987213134765625, -0.9598464965820312, -0.9324798583984375, -0.9051132202148438, -0.87774658203125, -0.8503799438476562, -0.8230133056640625, -0.7956466674804688, -0.768280029296875, -0.7409133911132812, -0.7135467529296875, -0.6861801147460938, -0.6588134765625, -0.6314468383789062, -0.6040802001953125, -0.5767135620117188, -0.549346923828125, -0.5219802856445312, -0.4946136474609375, -0.46724700927734375, -0.43988037109375, -0.41251373291015625, -0.3851470947265625, -0.35778045654296875, -0.330413818359375, -0.30304718017578125, -0.2756805419921875, -0.24831390380859375, -0.220947265625, -0.19358062744140625, -0.1662139892578125, -0.13884735107421875, -0.111480712890625, -0.08411407470703125, -0.0567474365234375, -0.02938079833984375, -0.00201416015625, 0.02535247802734375, 0.0527191162109375, 0.08008575439453125, 0.107452392578125, 0.13481903076171875, 0.1621856689453125, 0.18955230712890625, 0.2169189453125, 0.24428558349609375, 0.2716522216796875, 0.29901885986328125, 0.326385498046875, 0.35375213623046875, 0.3811187744140625, 0.40848541259765625, 0.43585205078125, 0.46321868896484375, 0.4905853271484375, 0.5179519653320312, 0.545318603515625, 0.5726852416992188, 0.6000518798828125, 0.6274185180664062, 0.65478515625]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 3.0, 4.0, 10.0, 21.0, 19.0, 33.0, 39.0, 73.0, 114.0, 117.0, 139.0, 118.0, 95.0, 75.0, 50.0, 34.0, 26.0, 18.0, 2.0, 2.0, 2.0, 4.0, 3.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.249927043914795, -4.979028701782227, -4.7081298828125, -4.437231540679932, -4.166332721710205, -3.8954343795776367, -3.6245357990264893, -3.353637218475342, -3.0827386379241943, -2.811840057373047, -2.5409414768218994, -2.270042896270752, -1.999144434928894, -1.7282458543777466, -1.4573473930358887, -1.1864488124847412, -0.9155502319335938, -0.6446516513824463, -0.3737531304359436, -0.10285460948944092, 0.16804397106170654, 0.438942551612854, 0.7098410129547119, 0.9807395935058594, 1.2516381740570068, 1.5225367546081543, 1.7934353351593018, 2.064333915710449, 2.3352322578430176, 2.606131076812744, 2.8770294189453125, 3.14792799949646, 3.418826103210449, 3.6897246837615967, 3.960623264312744, 4.2315216064453125, 4.502420425415039, 4.773318767547607, 5.044217109680176, 5.315115928649902, 5.586014747619629, 5.856913089752197, 6.127811908721924, 6.398710250854492, 6.669609069824219, 6.940507411956787, 7.2114057540893555, 7.482304573059082, 7.75320291519165, 8.024101257324219, 8.295000076293945, 8.565898895263672, 8.836796760559082, 9.107695579528809, 9.378594398498535, 9.649492263793945, 9.920391082763672, 10.191289901733398, 10.462187767028809, 10.733086585998535, 11.003985404968262, 11.274884223937988, 11.545782089233398, 11.816680908203125, 12.087579727172852]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 5.0, 2.0, 11.0, 7.0, 13.0, 12.0, 15.0, 16.0, 18.0, 24.0, 23.0, 29.0, 35.0, 30.0, 40.0, 43.0, 49.0, 60.0, 52.0, 34.0, 47.0, 48.0, 29.0, 44.0, 38.0, 30.0, 33.0, 30.0, 23.0, 25.0, 23.0, 19.0, 15.0, 15.0, 9.0, 11.0, 11.0, 2.0, 9.0, 11.0, 3.0, 4.0, 0.0, 3.0, 1.0, 2.0, 1.0, 4.0, 0.0, 1.0], "bins": [-5.828307151794434, -5.654782772064209, -5.481258869171143, -5.307734489440918, -5.134210586547852, -4.960686206817627, -4.787161827087402, -4.613637924194336, -4.440113544464111, -4.266589164733887, -4.09306526184082, -3.9195408821105957, -3.74601674079895, -3.5724925994873047, -3.39896821975708, -3.2254440784454346, -3.051919937133789, -2.8783957958221436, -2.704871654510498, -2.5313472747802734, -2.357823133468628, -2.1842989921569824, -2.010774612426758, -1.8372504711151123, -1.6637263298034668, -1.4902021884918213, -1.3166779279708862, -1.1431536674499512, -0.9696295261383057, -0.7961053252220154, -0.6225811243057251, -0.44905686378479004, -0.27553272247314453, -0.10200852155685425, 0.07151567935943604, 0.24503988027572632, 0.4185640811920166, 0.5920882821083069, 0.7656124830245972, 0.9391367435455322, 1.1126608848571777, 1.2861850261688232, 1.4597092866897583, 1.6332335472106934, 1.8067576885223389, 1.9802818298339844, 2.153806209564209, 2.3273303508758545, 2.5008544921875, 2.6743786334991455, 2.847902774810791, 3.0214271545410156, 3.194951295852661, 3.3684754371643066, 3.5419998168945312, 3.7155239582061768, 3.8890480995178223, 4.062572479248047, 4.236096382141113, 4.409620761871338, 4.5831451416015625, 4.756669044494629, 4.9301934242248535, 5.103717803955078, 5.2772417068481445]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 0.0, 4.0, 2.0, 2.0, 4.0, 2.0, 6.0, 10.0, 7.0, 9.0, 17.0, 18.0, 21.0, 26.0, 63.0, 64.0, 102.0, 147.0, 234.0, 402.0, 809.0, 1744.0, 5602.0, 55693.0, 4108098.0, 15334.0, 3255.0, 1203.0, 537.0, 329.0, 160.0, 111.0, 78.0, 57.0, 45.0, 29.0, 23.0, 11.0, 11.0, 7.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-2.33203125, -2.2741241455078125, -2.216217041015625, -2.1583099365234375, -2.10040283203125, -2.0424957275390625, -1.984588623046875, -1.9266815185546875, -1.8687744140625, -1.8108673095703125, -1.752960205078125, -1.6950531005859375, -1.63714599609375, -1.5792388916015625, -1.521331787109375, -1.4634246826171875, -1.405517578125, -1.3476104736328125, -1.289703369140625, -1.2317962646484375, -1.17388916015625, -1.1159820556640625, -1.058074951171875, -1.0001678466796875, -0.9422607421875, -0.8843536376953125, -0.826446533203125, -0.7685394287109375, -0.71063232421875, -0.6527252197265625, -0.594818115234375, -0.5369110107421875, -0.47900390625, -0.4210968017578125, -0.363189697265625, -0.3052825927734375, -0.24737548828125, -0.1894683837890625, -0.131561279296875, -0.0736541748046875, -0.0157470703125, 0.0421600341796875, 0.100067138671875, 0.1579742431640625, 0.21588134765625, 0.2737884521484375, 0.331695556640625, 0.3896026611328125, 0.447509765625, 0.5054168701171875, 0.563323974609375, 0.6212310791015625, 0.67913818359375, 0.7370452880859375, 0.794952392578125, 0.8528594970703125, 0.9107666015625, 0.9686737060546875, 1.026580810546875, 1.0844879150390625, 1.14239501953125, 1.2003021240234375, 1.258209228515625, 1.3161163330078125, 1.3740234375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 5.0, 5.0, 3.0, 9.0, 9.0, 15.0, 16.0, 20.0, 38.0, 42.0, 43.0, 54.0, 66.0, 66.0, 68.0, 69.0, 72.0, 64.0, 62.0, 53.0, 56.0, 32.0, 36.0, 22.0, 18.0, 24.0, 16.0, 4.0, 5.0, 6.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.429931640625, -0.4174652099609375, -0.404998779296875, -0.3925323486328125, -0.38006591796875, -0.3675994873046875, -0.355133056640625, -0.3426666259765625, -0.3302001953125, -0.3177337646484375, -0.305267333984375, -0.2928009033203125, -0.28033447265625, -0.2678680419921875, -0.255401611328125, -0.2429351806640625, -0.23046875, -0.2180023193359375, -0.205535888671875, -0.1930694580078125, -0.18060302734375, -0.1681365966796875, -0.155670166015625, -0.1432037353515625, -0.1307373046875, -0.1182708740234375, -0.105804443359375, -0.0933380126953125, -0.08087158203125, -0.0684051513671875, -0.055938720703125, -0.0434722900390625, -0.031005859375, -0.0185394287109375, -0.006072998046875, 0.0063934326171875, 0.01885986328125, 0.0313262939453125, 0.043792724609375, 0.0562591552734375, 0.0687255859375, 0.0811920166015625, 0.093658447265625, 0.1061248779296875, 0.11859130859375, 0.1310577392578125, 0.143524169921875, 0.1559906005859375, 0.16845703125, 0.1809234619140625, 0.193389892578125, 0.2058563232421875, 0.21832275390625, 0.2307891845703125, 0.243255615234375, 0.2557220458984375, 0.2681884765625, 0.2806549072265625, 0.293121337890625, 0.3055877685546875, 0.31805419921875, 0.3305206298828125, 0.342987060546875, 0.3554534912109375, 0.367919921875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 5.0, 1.0, 4.0, 7.0, 13.0, 15.0, 25.0, 28.0, 53.0, 69.0, 77.0, 145.0, 163.0, 253.0, 368.0, 497.0, 733.0, 1103.0, 1751.0, 2982.0, 6000.0, 15181.0, 81398.0, 4009863.0, 48675.0, 12116.0, 5015.0, 2620.0, 1659.0, 1077.0, 693.0, 516.0, 383.0, 240.0, 169.0, 109.0, 105.0, 55.0, 39.0, 28.0, 14.0, 12.0, 11.0, 5.0, 5.0, 6.0, 3.0, 1.0, 3.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9013671875, -0.8735427856445312, -0.8457183837890625, -0.8178939819335938, -0.790069580078125, -0.7622451782226562, -0.7344207763671875, -0.7065963745117188, -0.67877197265625, -0.6509475708007812, -0.6231231689453125, -0.5952987670898438, -0.567474365234375, -0.5396499633789062, -0.5118255615234375, -0.48400115966796875, -0.4561767578125, -0.42835235595703125, -0.4005279541015625, -0.37270355224609375, -0.344879150390625, -0.31705474853515625, -0.2892303466796875, -0.26140594482421875, -0.23358154296875, -0.20575714111328125, -0.1779327392578125, -0.15010833740234375, -0.122283935546875, -0.09445953369140625, -0.0666351318359375, -0.03881072998046875, -0.010986328125, 0.01683807373046875, 0.0446624755859375, 0.07248687744140625, 0.100311279296875, 0.12813568115234375, 0.1559600830078125, 0.18378448486328125, 0.21160888671875, 0.23943328857421875, 0.2672576904296875, 0.29508209228515625, 0.322906494140625, 0.35073089599609375, 0.3785552978515625, 0.40637969970703125, 0.4342041015625, 0.46202850341796875, 0.4898529052734375, 0.5176773071289062, 0.545501708984375, 0.5733261108398438, 0.6011505126953125, 0.6289749145507812, 0.65679931640625, 0.6846237182617188, 0.7124481201171875, 0.7402725219726562, 0.768096923828125, 0.7959213256835938, 0.8237457275390625, 0.8515701293945312, 0.87939453125]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 2.0, 5.0, 6.0, 4.0, 5.0, 9.0, 16.0, 28.0, 55.0, 202.0, 3462.0, 139.0, 47.0, 21.0, 15.0, 15.0, 10.0, 11.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.2166748046875, -0.20931053161621094, -0.20194625854492188, -0.1945819854736328, -0.18721771240234375, -0.1798534393310547, -0.17248916625976562, -0.16512489318847656, -0.1577606201171875, -0.15039634704589844, -0.14303207397460938, -0.1356678009033203, -0.12830352783203125, -0.12093925476074219, -0.11357498168945312, -0.10621070861816406, -0.098846435546875, -0.09148216247558594, -0.08411788940429688, -0.07675361633300781, -0.06938934326171875, -0.06202507019042969, -0.054660797119140625, -0.04729652404785156, -0.0399322509765625, -0.03256797790527344, -0.025203704833984375, -0.017839431762695312, -0.01047515869140625, -0.0031108856201171875, 0.004253387451171875, 0.011617660522460938, 0.01898193359375, 0.026346206665039062, 0.033710479736328125, 0.04107475280761719, 0.04843902587890625, 0.05580329895019531, 0.06316757202148438, 0.07053184509277344, 0.0778961181640625, 0.08526039123535156, 0.09262466430664062, 0.09998893737792969, 0.10735321044921875, 0.11471748352050781, 0.12208175659179688, 0.12944602966308594, 0.136810302734375, 0.14417457580566406, 0.15153884887695312, 0.1589031219482422, 0.16626739501953125, 0.1736316680908203, 0.18099594116210938, 0.18836021423339844, 0.1957244873046875, 0.20308876037597656, 0.21045303344726562, 0.2178173065185547, 0.22518157958984375, 0.2325458526611328, 0.23991012573242188, 0.24727439880371094, 0.254638671875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 18.0, 34.0, 82.0, 116.0, 161.0, 157.0, 148.0, 103.0, 73.0, 31.0, 22.0, 17.0, 10.0, 4.0, 7.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-1.4201459884643555, -1.380935549736023, -1.3417249917984009, -1.3025145530700684, -1.2633039951324463, -1.2240935564041138, -1.1848829984664917, -1.1456725597381592, -1.106462001800537, -1.0672515630722046, -1.0280410051345825, -0.9888305068016052, -0.9496200084686279, -0.9104095697402954, -0.8711990714073181, -0.8319885730743408, -0.7927781343460083, -0.753567636013031, -0.7143571376800537, -0.6751466393470764, -0.6359361410140991, -0.5967257022857666, -0.5575152039527893, -0.518304705619812, -0.4790942072868347, -0.4398837089538574, -0.4006732106208801, -0.3614627420902252, -0.3222522437572479, -0.28304174542427063, -0.24383126199245453, -0.20462077856063843, -0.16541028022766113, -0.12619978189468384, -0.08698929846286774, -0.04777880758047104, -0.00856831669807434, 0.030642181634902954, 0.06985266506671906, 0.10906314849853516, 0.14827364683151245, 0.18748414516448975, 0.22669462859630585, 0.26590511202812195, 0.30511561036109924, 0.34432610869407654, 0.38353657722473145, 0.42274707555770874, 0.46195757389068604, 0.5011680722236633, 0.5403785705566406, 0.5795890688896179, 0.6187995672225952, 0.6580100059509277, 0.697220504283905, 0.7364310026168823, 0.7756415009498596, 0.8148519992828369, 0.8540624976158142, 0.8932729959487915, 0.932483434677124, 0.9716939926147461, 1.0109044313430786, 1.0501148700714111, 1.0893254280090332]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 7.0, 6.0, 10.0, 10.0, 14.0, 14.0, 17.0, 15.0, 31.0, 23.0, 29.0, 47.0, 33.0, 50.0, 36.0, 40.0, 44.0, 52.0, 59.0, 39.0, 45.0, 49.0, 38.0, 48.0, 31.0, 44.0, 36.0, 23.0, 22.0, 23.0, 14.0, 13.0, 7.0, 13.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5525497198104858, -0.5323319435119629, -0.5121142268180847, -0.49189645051956177, -0.4716787040233612, -0.45146095752716064, -0.4312431812286377, -0.41102543473243713, -0.3908076882362366, -0.370589941740036, -0.35037219524383545, -0.3301544189453125, -0.30993667244911194, -0.2897189259529114, -0.2695011496543884, -0.24928340315818787, -0.2290656566619873, -0.20884791016578674, -0.188630148768425, -0.16841238737106323, -0.14819464087486267, -0.1279768943786621, -0.10775913298130035, -0.0875413715839386, -0.06732362508773804, -0.04710587114095688, -0.02688811719417572, -0.006670363247394562, 0.013547390699386597, 0.033765144646167755, 0.053982898592948914, 0.07420065999031067, 0.094418466091156, 0.11463622003793716, 0.13485397398471832, 0.15507173538208008, 0.17528948187828064, 0.1955072283744812, 0.21572498977184296, 0.2359427511692047, 0.2561604976654053, 0.27637824416160583, 0.2965959906578064, 0.31681376695632935, 0.3370315134525299, 0.35724925994873047, 0.3774670362472534, 0.397684782743454, 0.41790252923965454, 0.4381202757358551, 0.45833802223205566, 0.4785557985305786, 0.4987735450267792, 0.5189912915229797, 0.5392090678215027, 0.5594267845153809, 0.5796445608139038, 0.5998623371124268, 0.6200800538063049, 0.6402978301048279, 0.660515546798706, 0.680733323097229, 0.700951099395752, 0.7211688756942749, 0.7413865923881531]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 5.0, 7.0, 8.0, 7.0, 9.0, 14.0, 18.0, 30.0, 35.0, 63.0, 73.0, 119.0, 214.0, 333.0, 599.0, 1095.0, 2281.0, 5889.0, 18834.0, 84595.0, 404279.0, 412682.0, 87163.0, 19471.0, 5904.0, 2314.0, 1103.0, 511.0, 326.0, 186.0, 149.0, 80.0, 39.0, 40.0, 27.0, 18.0, 17.0, 8.0, 7.0, 4.0, 4.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.9375, -0.9128341674804688, -0.8881683349609375, -0.8635025024414062, -0.838836669921875, -0.8141708374023438, -0.7895050048828125, -0.7648391723632812, -0.74017333984375, -0.7155075073242188, -0.6908416748046875, -0.6661758422851562, -0.641510009765625, -0.6168441772460938, -0.5921783447265625, -0.5675125122070312, -0.5428466796875, -0.5181808471679688, -0.4935150146484375, -0.46884918212890625, -0.444183349609375, -0.41951751708984375, -0.3948516845703125, -0.37018585205078125, -0.34552001953125, -0.32085418701171875, -0.2961883544921875, -0.27152252197265625, -0.246856689453125, -0.22219085693359375, -0.1975250244140625, -0.17285919189453125, -0.148193359375, -0.12352752685546875, -0.0988616943359375, -0.07419586181640625, -0.049530029296875, -0.02486419677734375, -0.0001983642578125, 0.02446746826171875, 0.04913330078125, 0.07379913330078125, 0.0984649658203125, 0.12313079833984375, 0.147796630859375, 0.17246246337890625, 0.1971282958984375, 0.22179412841796875, 0.2464599609375, 0.27112579345703125, 0.2957916259765625, 0.32045745849609375, 0.345123291015625, 0.36978912353515625, 0.3944549560546875, 0.41912078857421875, 0.44378662109375, 0.46845245361328125, 0.4931182861328125, 0.5177841186523438, 0.542449951171875, 0.5671157836914062, 0.5917816162109375, 0.6164474487304688, 0.64111328125]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 0.0, 4.0, 3.0, 5.0, 6.0, 8.0, 7.0, 8.0, 7.0, 13.0, 30.0, 37.0, 40.0, 42.0, 53.0, 51.0, 65.0, 58.0, 63.0, 67.0, 67.0, 58.0, 54.0, 58.0, 44.0, 22.0, 35.0, 24.0, 15.0, 21.0, 12.0, 10.0, 6.0, 4.0, 7.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.42529296875, -0.4131126403808594, -0.40093231201171875, -0.3887519836425781, -0.3765716552734375, -0.3643913269042969, -0.35221099853515625, -0.3400306701660156, -0.327850341796875, -0.3156700134277344, -0.30348968505859375, -0.2913093566894531, -0.2791290283203125, -0.2669486999511719, -0.25476837158203125, -0.24258804321289062, -0.23040771484375, -0.21822738647460938, -0.20604705810546875, -0.19386672973632812, -0.1816864013671875, -0.16950607299804688, -0.15732574462890625, -0.14514541625976562, -0.132965087890625, -0.12078475952148438, -0.10860443115234375, -0.09642410278320312, -0.0842437744140625, -0.07206344604492188, -0.05988311767578125, -0.047702789306640625, -0.0355224609375, -0.023342132568359375, -0.01116180419921875, 0.001018524169921875, 0.0131988525390625, 0.025379180908203125, 0.03755950927734375, 0.049739837646484375, 0.061920166015625, 0.07410049438476562, 0.08628082275390625, 0.09846115112304688, 0.1106414794921875, 0.12282180786132812, 0.13500213623046875, 0.14718246459960938, 0.15936279296875, 0.17154312133789062, 0.18372344970703125, 0.19590377807617188, 0.2080841064453125, 0.22026443481445312, 0.23244476318359375, 0.24462509155273438, 0.256805419921875, 0.2689857482910156, 0.28116607666015625, 0.2933464050292969, 0.3055267333984375, 0.3177070617675781, 0.32988739013671875, 0.3420677185058594, 0.354248046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 8.0, 4.0, 14.0, 13.0, 14.0, 29.0, 47.0, 56.0, 72.0, 127.0, 196.0, 302.0, 455.0, 909.0, 1866.0, 5380.0, 27257.0, 300886.0, 633706.0, 62632.0, 9114.0, 2661.0, 1150.0, 621.0, 343.0, 212.0, 145.0, 87.0, 69.0, 51.0, 38.0, 24.0, 13.0, 11.0, 9.0, 7.0, 8.0, 4.0, 2.0, 4.0, 2.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.087890625, -1.0540924072265625, -1.020294189453125, -0.9864959716796875, -0.95269775390625, -0.9188995361328125, -0.885101318359375, -0.8513031005859375, -0.8175048828125, -0.7837066650390625, -0.749908447265625, -0.7161102294921875, -0.68231201171875, -0.6485137939453125, -0.614715576171875, -0.5809173583984375, -0.547119140625, -0.5133209228515625, -0.479522705078125, -0.4457244873046875, -0.41192626953125, -0.3781280517578125, -0.344329833984375, -0.3105316162109375, -0.2767333984375, -0.2429351806640625, -0.209136962890625, -0.1753387451171875, -0.14154052734375, -0.1077423095703125, -0.073944091796875, -0.0401458740234375, -0.00634765625, 0.0274505615234375, 0.061248779296875, 0.0950469970703125, 0.12884521484375, 0.1626434326171875, 0.196441650390625, 0.2302398681640625, 0.2640380859375, 0.2978363037109375, 0.331634521484375, 0.3654327392578125, 0.39923095703125, 0.4330291748046875, 0.466827392578125, 0.5006256103515625, 0.534423828125, 0.5682220458984375, 0.602020263671875, 0.6358184814453125, 0.66961669921875, 0.7034149169921875, 0.737213134765625, 0.7710113525390625, 0.8048095703125, 0.8386077880859375, 0.872406005859375, 0.9062042236328125, 0.94000244140625, 0.9738006591796875, 1.007598876953125, 1.0413970947265625, 1.0751953125]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 0.0, 1.0, 3.0, 7.0, 4.0, 7.0, 9.0, 14.0, 14.0, 21.0, 19.0, 15.0, 19.0, 33.0, 25.0, 28.0, 28.0, 39.0, 37.0, 43.0, 43.0, 45.0, 40.0, 39.0, 34.0, 48.0, 36.0, 38.0, 42.0, 39.0, 24.0, 30.0, 20.0, 28.0, 29.0, 19.0, 27.0, 13.0, 9.0, 9.0, 7.0, 3.0, 2.0, 4.0, 1.0, 8.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.111328125, -1.074462890625, -1.03759765625, -1.000732421875, -0.9638671875, -0.927001953125, -0.89013671875, -0.853271484375, -0.81640625, -0.779541015625, -0.74267578125, -0.705810546875, -0.6689453125, -0.632080078125, -0.59521484375, -0.558349609375, -0.521484375, -0.484619140625, -0.44775390625, -0.410888671875, -0.3740234375, -0.337158203125, -0.30029296875, -0.263427734375, -0.2265625, -0.189697265625, -0.15283203125, -0.115966796875, -0.0791015625, -0.042236328125, -0.00537109375, 0.031494140625, 0.068359375, 0.105224609375, 0.14208984375, 0.178955078125, 0.2158203125, 0.252685546875, 0.28955078125, 0.326416015625, 0.36328125, 0.400146484375, 0.43701171875, 0.473876953125, 0.5107421875, 0.547607421875, 0.58447265625, 0.621337890625, 0.658203125, 0.695068359375, 0.73193359375, 0.768798828125, 0.8056640625, 0.842529296875, 0.87939453125, 0.916259765625, 0.953125, 0.989990234375, 1.02685546875, 1.063720703125, 1.1005859375, 1.137451171875, 1.17431640625, 1.211181640625, 1.248046875]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 5.0, 4.0, 5.0, 15.0, 18.0, 36.0, 76.0, 167.0, 475.0, 2169.0, 54753.0, 975742.0, 13287.0, 1204.0, 348.0, 126.0, 68.0, 27.0, 16.0, 11.0, 9.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.23828125, -1.187408447265625, -1.13653564453125, -1.085662841796875, -1.0347900390625, -0.983917236328125, -0.93304443359375, -0.882171630859375, -0.831298828125, -0.780426025390625, -0.72955322265625, -0.678680419921875, -0.6278076171875, -0.576934814453125, -0.52606201171875, -0.475189208984375, -0.42431640625, -0.373443603515625, -0.32257080078125, -0.271697998046875, -0.2208251953125, -0.169952392578125, -0.11907958984375, -0.068206787109375, -0.017333984375, 0.033538818359375, 0.08441162109375, 0.135284423828125, 0.1861572265625, 0.237030029296875, 0.28790283203125, 0.338775634765625, 0.3896484375, 0.440521240234375, 0.49139404296875, 0.542266845703125, 0.5931396484375, 0.644012451171875, 0.69488525390625, 0.745758056640625, 0.796630859375, 0.847503662109375, 0.89837646484375, 0.949249267578125, 1.0001220703125, 1.050994873046875, 1.10186767578125, 1.152740478515625, 1.20361328125, 1.254486083984375, 1.30535888671875, 1.356231689453125, 1.4071044921875, 1.457977294921875, 1.50885009765625, 1.559722900390625, 1.610595703125, 1.661468505859375, 1.71234130859375, 1.763214111328125, 1.8140869140625, 1.864959716796875, 1.91583251953125, 1.966705322265625, 2.017578125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 7.0, 6.0, 6.0, 33.0, 35.0, 44.0, 70.0, 87.0, 84.0, 111.0, 113.0, 109.0, 82.0, 68.0, 45.0, 28.0, 21.0, 14.0, 14.0, 5.0, 9.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.8531761169433594e-05, -5.576387047767639e-05, -5.299597978591919e-05, -5.022808909416199e-05, -4.7460198402404785e-05, -4.469230771064758e-05, -4.192441701889038e-05, -3.915652632713318e-05, -3.6388635635375977e-05, -3.3620744943618774e-05, -3.085285425186157e-05, -2.808496356010437e-05, -2.5317072868347168e-05, -2.2549182176589966e-05, -1.9781291484832764e-05, -1.701340079307556e-05, -1.424551010131836e-05, -1.1477619409561157e-05, -8.709728717803955e-06, -5.941838026046753e-06, -3.1739473342895508e-06, -4.0605664253234863e-07, 2.3618340492248535e-06, 5.129724740982056e-06, 7.897615432739258e-06, 1.066550612449646e-05, 1.3433396816253662e-05, 1.6201287508010864e-05, 1.8969178199768066e-05, 2.173706889152527e-05, 2.450495958328247e-05, 2.7272850275039673e-05, 3.0040740966796875e-05, 3.280863165855408e-05, 3.557652235031128e-05, 3.834441304206848e-05, 4.1112303733825684e-05, 4.3880194425582886e-05, 4.664808511734009e-05, 4.941597580909729e-05, 5.218386650085449e-05, 5.4951757192611694e-05, 5.7719647884368896e-05, 6.04875385761261e-05, 6.32554292678833e-05, 6.60233199596405e-05, 6.87912106513977e-05, 7.155910134315491e-05, 7.432699203491211e-05, 7.709488272666931e-05, 7.986277341842651e-05, 8.263066411018372e-05, 8.539855480194092e-05, 8.816644549369812e-05, 9.093433618545532e-05, 9.370222687721252e-05, 9.647011756896973e-05, 9.923800826072693e-05, 0.00010200589895248413, 0.00010477378964424133, 0.00010754168033599854, 0.00011030957102775574, 0.00011307746171951294, 0.00011584535241127014, 0.00011861324310302734]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 3.0, 0.0, 8.0, 10.0, 9.0, 13.0, 23.0, 37.0, 68.0, 152.0, 282.0, 670.0, 1954.0, 10111.0, 243002.0, 764419.0, 22858.0, 3236.0, 939.0, 349.0, 182.0, 98.0, 43.0, 36.0, 21.0, 10.0, 10.0, 4.0, 4.0, 4.0, 0.0, 5.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0107421875, -0.9811630249023438, -0.9515838623046875, -0.9220046997070312, -0.892425537109375, -0.8628463745117188, -0.8332672119140625, -0.8036880493164062, -0.77410888671875, -0.7445297241210938, -0.7149505615234375, -0.6853713989257812, -0.655792236328125, -0.6262130737304688, -0.5966339111328125, -0.5670547485351562, -0.5374755859375, -0.5078964233398438, -0.4783172607421875, -0.44873809814453125, -0.419158935546875, -0.38957977294921875, -0.3600006103515625, -0.33042144775390625, -0.30084228515625, -0.27126312255859375, -0.2416839599609375, -0.21210479736328125, -0.182525634765625, -0.15294647216796875, -0.1233673095703125, -0.09378814697265625, -0.064208984375, -0.03462982177734375, -0.0050506591796875, 0.02452850341796875, 0.054107666015625, 0.08368682861328125, 0.1132659912109375, 0.14284515380859375, 0.17242431640625, 0.20200347900390625, 0.2315826416015625, 0.26116180419921875, 0.290740966796875, 0.32032012939453125, 0.3498992919921875, 0.37947845458984375, 0.4090576171875, 0.43863677978515625, 0.4682159423828125, 0.49779510498046875, 0.527374267578125, 0.5569534301757812, 0.5865325927734375, 0.6161117553710938, 0.64569091796875, 0.6752700805664062, 0.7048492431640625, 0.7344284057617188, 0.764007568359375, 0.7935867309570312, 0.8231658935546875, 0.8527450561523438, 0.88232421875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 5.0, 18.0, 29.0, 40.0, 69.0, 106.0, 169.0, 170.0, 140.0, 112.0, 68.0, 35.0, 19.0, 13.0, 7.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.212890625, -1.1811447143554688, -1.1493988037109375, -1.1176528930664062, -1.085906982421875, -1.0541610717773438, -1.0224151611328125, -0.9906692504882812, -0.95892333984375, -0.9271774291992188, -0.8954315185546875, -0.8636856079101562, -0.831939697265625, -0.8001937866210938, -0.7684478759765625, -0.7367019653320312, -0.7049560546875, -0.6732101440429688, -0.6414642333984375, -0.6097183227539062, -0.577972412109375, -0.5462265014648438, -0.5144805908203125, -0.48273468017578125, -0.45098876953125, -0.41924285888671875, -0.3874969482421875, -0.35575103759765625, -0.324005126953125, -0.29225921630859375, -0.2605133056640625, -0.22876739501953125, -0.197021484375, -0.16527557373046875, -0.1335296630859375, -0.10178375244140625, -0.070037841796875, -0.03829193115234375, -0.0065460205078125, 0.02519989013671875, 0.05694580078125, 0.08869171142578125, 0.1204376220703125, 0.15218353271484375, 0.183929443359375, 0.21567535400390625, 0.2474212646484375, 0.27916717529296875, 0.3109130859375, 0.34265899658203125, 0.3744049072265625, 0.40615081787109375, 0.437896728515625, 0.46964263916015625, 0.5013885498046875, 0.5331344604492188, 0.56488037109375, 0.5966262817382812, 0.6283721923828125, 0.6601181030273438, 0.691864013671875, 0.7236099243164062, 0.7553558349609375, 0.7871017456054688, 0.81884765625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 8.0, 37.0, 70.0, 182.0, 256.0, 226.0, 119.0, 64.0, 23.0, 7.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.231990814208984, -13.80994701385498, -13.38790225982666, -12.965858459472656, -12.543813705444336, -12.121769905090332, -11.699726104736328, -11.277681350708008, -10.855636596679688, -10.433592796325684, -10.011548042297363, -9.58950424194336, -9.167459487915039, -8.745415687561035, -8.323371887207031, -7.901327133178711, -7.479283332824707, -7.057239055633545, -6.635194778442383, -6.213150978088379, -5.791106224060059, -5.369062423706055, -4.947018146514893, -4.5249738693237305, -4.102929592132568, -3.6808853149414062, -3.258841037750244, -2.836796998977661, -2.414752721786499, -1.992708444595337, -1.570664405822754, -1.1486201286315918, -0.7265748977661133, -0.30453068017959595, 0.11751353740692139, 0.539557695388794, 0.961601972579956, 1.3836462497711182, 1.8056902885437012, 2.2277345657348633, 2.6497788429260254, 3.0718231201171875, 3.4938673973083496, 3.9159114360809326, 4.337955474853516, 4.760000228881836, 5.18204402923584, 5.604088306427002, 6.026132583618164, 6.448176860809326, 6.870221138000488, 7.292264938354492, 7.7143096923828125, 8.136353492736816, 8.55839729309082, 8.98044204711914, 9.402486801147461, 9.824530601501465, 10.246575355529785, 10.668619155883789, 11.09066390991211, 11.512707710266113, 11.934751510620117, 12.356796264648438, 12.778840065002441]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 5.0, 5.0, 6.0, 3.0, 9.0, 10.0, 15.0, 9.0, 15.0, 29.0, 17.0, 22.0, 28.0, 41.0, 44.0, 44.0, 51.0, 41.0, 51.0, 50.0, 56.0, 58.0, 48.0, 45.0, 37.0, 37.0, 44.0, 38.0, 18.0, 15.0, 15.0, 16.0, 19.0, 10.0, 12.0, 7.0, 5.0, 7.0, 5.0, 3.0, 5.0, 2.0, 4.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.540613174438477, -6.347937107086182, -6.155261039733887, -5.962584972381592, -5.769908905029297, -5.577232837677002, -5.384556770324707, -5.191880702972412, -4.999204635620117, -4.806528568267822, -4.613852500915527, -4.421176433563232, -4.2285003662109375, -4.035824298858643, -3.8431482315063477, -3.6504721641540527, -3.4577958583831787, -3.265119791030884, -3.072443723678589, -2.879767656326294, -2.687091588973999, -2.494415521621704, -2.30173921585083, -2.109063148498535, -1.9163872003555298, -1.7237111330032349, -1.53103506565094, -1.3383588790893555, -1.1456828117370605, -0.9530068039894104, -0.7603306770324707, -0.5676546096801758, -0.37497854232788086, -0.18230246007442474, 0.010373622179031372, 0.20304971933364868, 0.3957257866859436, 0.5884018540382385, 0.7810779809951782, 0.9737540483474731, 1.166430115699768, 1.359106183052063, 1.551782250404358, 1.7444584369659424, 1.9371345043182373, 2.1298105716705322, 2.322486639022827, 2.515162706375122, 2.707838773727417, 2.900514841079712, 3.093190908432007, 3.2858669757843018, 3.4785430431365967, 3.6712191104888916, 3.8638954162597656, 4.0565714836120605, 4.2492475509643555, 4.44192361831665, 4.634599685668945, 4.82727575302124, 5.019951820373535, 5.21262788772583, 5.405303955078125, 5.59798002243042, 5.790656089782715]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 4.0, 8.0, 7.0, 8.0, 6.0, 11.0, 18.0, 20.0, 46.0, 60.0, 83.0, 150.0, 250.0, 419.0, 891.0, 2246.0, 7640.0, 55466.0, 4070378.0, 45885.0, 6807.0, 2085.0, 866.0, 386.0, 217.0, 129.0, 62.0, 47.0, 39.0, 21.0, 10.0, 9.0, 7.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.4072265625, -1.36639404296875, -1.3255615234375, -1.28472900390625, -1.243896484375, -1.20306396484375, -1.1622314453125, -1.12139892578125, -1.08056640625, -1.03973388671875, -0.9989013671875, -0.95806884765625, -0.917236328125, -0.87640380859375, -0.8355712890625, -0.79473876953125, -0.75390625, -0.71307373046875, -0.6722412109375, -0.63140869140625, -0.590576171875, -0.54974365234375, -0.5089111328125, -0.46807861328125, -0.42724609375, -0.38641357421875, -0.3455810546875, -0.30474853515625, -0.263916015625, -0.22308349609375, -0.1822509765625, -0.14141845703125, -0.1005859375, -0.05975341796875, -0.0189208984375, 0.02191162109375, 0.062744140625, 0.10357666015625, 0.1444091796875, 0.18524169921875, 0.22607421875, 0.26690673828125, 0.3077392578125, 0.34857177734375, 0.389404296875, 0.43023681640625, 0.4710693359375, 0.51190185546875, 0.552734375, 0.59356689453125, 0.6343994140625, 0.67523193359375, 0.716064453125, 0.75689697265625, 0.7977294921875, 0.83856201171875, 0.87939453125, 0.92022705078125, 0.9610595703125, 1.00189208984375, 1.042724609375, 1.08355712890625, 1.1243896484375, 1.16522216796875, 1.2060546875]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 4.0, 5.0, 7.0, 5.0, 9.0, 13.0, 13.0, 22.0, 20.0, 37.0, 35.0, 42.0, 45.0, 60.0, 63.0, 66.0, 71.0, 64.0, 60.0, 60.0, 52.0, 47.0, 40.0, 44.0, 29.0, 21.0, 15.0, 18.0, 7.0, 9.0, 7.0, 8.0, 4.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.43798828125, -0.4264030456542969, -0.41481781005859375, -0.4032325744628906, -0.3916473388671875, -0.3800621032714844, -0.36847686767578125, -0.3568916320800781, -0.345306396484375, -0.3337211608886719, -0.32213592529296875, -0.3105506896972656, -0.2989654541015625, -0.2873802185058594, -0.27579498291015625, -0.2642097473144531, -0.25262451171875, -0.24103927612304688, -0.22945404052734375, -0.21786880493164062, -0.2062835693359375, -0.19469833374023438, -0.18311309814453125, -0.17152786254882812, -0.159942626953125, -0.14835739135742188, -0.13677215576171875, -0.12518692016601562, -0.1136016845703125, -0.10201644897460938, -0.09043121337890625, -0.07884597778320312, -0.0672607421875, -0.055675506591796875, -0.04409027099609375, -0.032505035400390625, -0.0209197998046875, -0.009334564208984375, 0.00225067138671875, 0.013835906982421875, 0.025421142578125, 0.037006378173828125, 0.04859161376953125, 0.060176849365234375, 0.0717620849609375, 0.08334732055664062, 0.09493255615234375, 0.10651779174804688, 0.11810302734375, 0.12968826293945312, 0.14127349853515625, 0.15285873413085938, 0.1644439697265625, 0.17602920532226562, 0.18761444091796875, 0.19919967651367188, 0.210784912109375, 0.22237014770507812, 0.23395538330078125, 0.24554061889648438, 0.2571258544921875, 0.2687110900878906, 0.28029632568359375, 0.2918815612792969, 0.303466796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 8.0, 10.0, 14.0, 17.0, 19.0, 25.0, 37.0, 51.0, 77.0, 148.0, 199.0, 393.0, 691.0, 1266.0, 2633.0, 5742.0, 15746.0, 63123.0, 3625100.0, 417190.0, 40852.0, 11571.0, 4696.0, 2129.0, 1102.0, 585.0, 329.0, 177.0, 111.0, 70.0, 52.0, 39.0, 28.0, 12.0, 17.0, 10.0, 7.0, 0.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5185546875, -0.4992523193359375, -0.479949951171875, -0.4606475830078125, -0.44134521484375, -0.4220428466796875, -0.402740478515625, -0.3834381103515625, -0.3641357421875, -0.3448333740234375, -0.325531005859375, -0.3062286376953125, -0.28692626953125, -0.2676239013671875, -0.248321533203125, -0.2290191650390625, -0.209716796875, -0.1904144287109375, -0.171112060546875, -0.1518096923828125, -0.13250732421875, -0.1132049560546875, -0.093902587890625, -0.0746002197265625, -0.0552978515625, -0.0359954833984375, -0.016693115234375, 0.0026092529296875, 0.02191162109375, 0.0412139892578125, 0.060516357421875, 0.0798187255859375, 0.09912109375, 0.1184234619140625, 0.137725830078125, 0.1570281982421875, 0.17633056640625, 0.1956329345703125, 0.214935302734375, 0.2342376708984375, 0.2535400390625, 0.2728424072265625, 0.292144775390625, 0.3114471435546875, 0.33074951171875, 0.3500518798828125, 0.369354248046875, 0.3886566162109375, 0.407958984375, 0.4272613525390625, 0.446563720703125, 0.4658660888671875, 0.48516845703125, 0.5044708251953125, 0.523773193359375, 0.5430755615234375, 0.5623779296875, 0.5816802978515625, 0.600982666015625, 0.6202850341796875, 0.63958740234375, 0.6588897705078125, 0.678192138671875, 0.6974945068359375, 0.716796875]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 4.0, 4.0, 3.0, 5.0, 8.0, 21.0, 22.0, 27.0, 47.0, 72.0, 206.0, 2744.0, 549.0, 146.0, 72.0, 49.0, 20.0, 17.0, 13.0, 15.0, 3.0, 8.0, 7.0, 6.0, 1.0, 4.0, 5.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.363037109375, -0.35367774963378906, -0.3443183898925781, -0.3349590301513672, -0.32559967041015625, -0.3162403106689453, -0.3068809509277344, -0.29752159118652344, -0.2881622314453125, -0.27880287170410156, -0.2694435119628906, -0.2600841522216797, -0.25072479248046875, -0.2413654327392578, -0.23200607299804688, -0.22264671325683594, -0.213287353515625, -0.20392799377441406, -0.19456863403320312, -0.1852092742919922, -0.17584991455078125, -0.1664905548095703, -0.15713119506835938, -0.14777183532714844, -0.1384124755859375, -0.12905311584472656, -0.11969375610351562, -0.11033439636230469, -0.10097503662109375, -0.09161567687988281, -0.08225631713867188, -0.07289695739746094, -0.06353759765625, -0.05417823791503906, -0.044818878173828125, -0.03545951843261719, -0.02610015869140625, -0.016740798950195312, -0.007381439208984375, 0.0019779205322265625, 0.0113372802734375, 0.020696640014648438, 0.030055999755859375, 0.03941535949707031, 0.04877471923828125, 0.05813407897949219, 0.06749343872070312, 0.07685279846191406, 0.086212158203125, 0.09557151794433594, 0.10493087768554688, 0.11429023742675781, 0.12364959716796875, 0.1330089569091797, 0.14236831665039062, 0.15172767639160156, 0.1610870361328125, 0.17044639587402344, 0.17980575561523438, 0.1891651153564453, 0.19852447509765625, 0.2078838348388672, 0.21724319458007812, 0.22660255432128906, 0.2359619140625]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 1.0, 6.0, 2.0, 8.0, 6.0, 18.0, 26.0, 49.0, 62.0, 67.0, 85.0, 113.0, 109.0, 100.0, 108.0, 76.0, 55.0, 48.0, 17.0, 16.0, 15.0, 5.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7125715017318726, -0.6782512068748474, -0.6439309120178223, -0.6096106767654419, -0.5752903819084167, -0.5409700870513916, -0.5066497921943665, -0.4723294973373413, -0.43800923228263855, -0.4036889374256134, -0.36936867237091064, -0.3350483775138855, -0.30072808265686035, -0.2664078176021576, -0.23208752274513245, -0.1977672427892685, -0.16344696283340454, -0.1291266828775406, -0.09480639547109604, -0.06048610806465149, -0.026165828108787537, 0.008154451847076416, 0.04247474670410156, 0.07679502665996552, 0.11111530661582947, 0.14543558657169342, 0.17975586652755737, 0.21407616138458252, 0.24839644134044647, 0.2827167212963104, 0.31703701615333557, 0.35135728120803833, 0.3856775760650635, 0.4199978709220886, 0.4543181359767914, 0.48863843083381653, 0.5229586958885193, 0.5572789907455444, 0.5915992856025696, 0.6259195804595947, 0.6602398157119751, 0.6945601105690002, 0.7288804054260254, 0.7632006406784058, 0.7975209355354309, 0.831841230392456, 0.8661615252494812, 0.9004818201065063, 0.9348021149635315, 0.9691224098205566, 1.003442645072937, 1.037762999534607, 1.0720832347869873, 1.1064035892486572, 1.1407238245010376, 1.175044059753418, 1.209364414215088, 1.2436846494674683, 1.2780050039291382, 1.3123252391815186, 1.3466455936431885, 1.3809658288955688, 1.4152860641479492, 1.4496064186096191, 1.4839266538619995]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 4.0, 3.0, 3.0, 11.0, 2.0, 8.0, 7.0, 10.0, 9.0, 20.0, 16.0, 16.0, 19.0, 19.0, 29.0, 25.0, 18.0, 26.0, 24.0, 38.0, 34.0, 51.0, 42.0, 40.0, 37.0, 33.0, 36.0, 44.0, 36.0, 22.0, 36.0, 34.0, 36.0, 29.0, 31.0, 24.0, 23.0, 18.0, 24.0, 16.0, 13.0, 10.0, 9.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-0.6391416192054749, -0.6194917559623718, -0.599841833114624, -0.580191969871521, -0.560542106628418, -0.5408922433853149, -0.5212423801422119, -0.5015924572944641, -0.4819425940513611, -0.46229273080825806, -0.44264283776283264, -0.4229929447174072, -0.4033430814743042, -0.38369321823120117, -0.36404332518577576, -0.34439343214035034, -0.3247435688972473, -0.3050937056541443, -0.28544381260871887, -0.26579391956329346, -0.24614405632019043, -0.2264941781759262, -0.206844300031662, -0.18719442188739777, -0.16754454374313354, -0.14789466559886932, -0.1282447874546051, -0.10859490931034088, -0.08894503116607666, -0.06929515302181244, -0.04964527487754822, -0.029995396733283997, -0.010345458984375, 0.009304419159889221, 0.028954297304153442, 0.048604175448417664, 0.06825405359268188, 0.0879039317369461, 0.10755380988121033, 0.12720368802547455, 0.14685356616973877, 0.166503444314003, 0.1861533224582672, 0.20580320060253143, 0.22545307874679565, 0.24510295689105988, 0.2647528350353241, 0.2844027280807495, 0.30405259132385254, 0.32370245456695557, 0.343352347612381, 0.3630022406578064, 0.3826521039009094, 0.40230196714401245, 0.42195186018943787, 0.4416017532348633, 0.4612516164779663, 0.48090147972106934, 0.5005513429641724, 0.5202012658119202, 0.5398511290550232, 0.5595009922981262, 0.579150915145874, 0.598800778388977, 0.6184506416320801]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 6.0, 9.0, 13.0, 22.0, 40.0, 92.0, 144.0, 367.0, 799.0, 2951.0, 15612.0, 151838.0, 718923.0, 138955.0, 14466.0, 2791.0, 802.0, 358.0, 165.0, 80.0, 52.0, 20.0, 9.0, 12.0, 9.0, 4.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.0615234375, -1.0214385986328125, -0.981353759765625, -0.9412689208984375, -0.90118408203125, -0.8610992431640625, -0.821014404296875, -0.7809295654296875, -0.7408447265625, -0.7007598876953125, -0.660675048828125, -0.6205902099609375, -0.58050537109375, -0.5404205322265625, -0.500335693359375, -0.4602508544921875, -0.420166015625, -0.3800811767578125, -0.339996337890625, -0.2999114990234375, -0.25982666015625, -0.2197418212890625, -0.179656982421875, -0.1395721435546875, -0.0994873046875, -0.0594024658203125, -0.019317626953125, 0.0207672119140625, 0.06085205078125, 0.1009368896484375, 0.141021728515625, 0.1811065673828125, 0.22119140625, 0.2612762451171875, 0.301361083984375, 0.3414459228515625, 0.38153076171875, 0.4216156005859375, 0.461700439453125, 0.5017852783203125, 0.5418701171875, 0.5819549560546875, 0.622039794921875, 0.6621246337890625, 0.70220947265625, 0.7422943115234375, 0.782379150390625, 0.8224639892578125, 0.862548828125, 0.9026336669921875, 0.942718505859375, 0.9828033447265625, 1.02288818359375, 1.0629730224609375, 1.103057861328125, 1.1431427001953125, 1.1832275390625, 1.2233123779296875, 1.263397216796875, 1.3034820556640625, 1.34356689453125, 1.3836517333984375, 1.423736572265625, 1.4638214111328125, 1.50390625]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 4.0, 4.0, 8.0, 12.0, 17.0, 15.0, 14.0, 18.0, 30.0, 41.0, 35.0, 58.0, 66.0, 65.0, 71.0, 68.0, 53.0, 65.0, 55.0, 66.0, 46.0, 39.0, 35.0, 25.0, 24.0, 23.0, 13.0, 11.0, 9.0, 6.0, 8.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.431640625, -0.4192390441894531, -0.40683746337890625, -0.3944358825683594, -0.3820343017578125, -0.3696327209472656, -0.35723114013671875, -0.3448295593261719, -0.332427978515625, -0.3200263977050781, -0.30762481689453125, -0.2952232360839844, -0.2828216552734375, -0.2704200744628906, -0.25801849365234375, -0.24561691284179688, -0.23321533203125, -0.22081375122070312, -0.20841217041015625, -0.19601058959960938, -0.1836090087890625, -0.17120742797851562, -0.15880584716796875, -0.14640426635742188, -0.134002685546875, -0.12160110473632812, -0.10919952392578125, -0.09679794311523438, -0.0843963623046875, -0.07199478149414062, -0.05959320068359375, -0.047191619873046875, -0.0347900390625, -0.022388458251953125, -0.00998687744140625, 0.002414703369140625, 0.0148162841796875, 0.027217864990234375, 0.03961944580078125, 0.052021026611328125, 0.064422607421875, 0.07682418823242188, 0.08922576904296875, 0.10162734985351562, 0.1140289306640625, 0.12643051147460938, 0.13883209228515625, 0.15123367309570312, 0.16363525390625, 0.17603683471679688, 0.18843841552734375, 0.20083999633789062, 0.2132415771484375, 0.22564315795898438, 0.23804473876953125, 0.2504463195800781, 0.262847900390625, 0.2752494812011719, 0.28765106201171875, 0.3000526428222656, 0.3124542236328125, 0.3248558044433594, 0.33725738525390625, 0.3496589660644531, 0.362060546875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 6.0, 16.0, 8.0, 26.0, 31.0, 47.0, 78.0, 143.0, 289.0, 657.0, 1639.0, 7063.0, 83438.0, 862519.0, 82528.0, 7012.0, 1769.0, 602.0, 298.0, 152.0, 92.0, 61.0, 33.0, 23.0, 11.0, 10.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3603515625, -1.310882568359375, -1.26141357421875, -1.211944580078125, -1.1624755859375, -1.113006591796875, -1.06353759765625, -1.014068603515625, -0.964599609375, -0.915130615234375, -0.86566162109375, -0.816192626953125, -0.7667236328125, -0.717254638671875, -0.66778564453125, -0.618316650390625, -0.56884765625, -0.519378662109375, -0.46990966796875, -0.420440673828125, -0.3709716796875, -0.321502685546875, -0.27203369140625, -0.222564697265625, -0.173095703125, -0.123626708984375, -0.07415771484375, -0.024688720703125, 0.0247802734375, 0.074249267578125, 0.12371826171875, 0.173187255859375, 0.22265625, 0.272125244140625, 0.32159423828125, 0.371063232421875, 0.4205322265625, 0.470001220703125, 0.51947021484375, 0.568939208984375, 0.618408203125, 0.667877197265625, 0.71734619140625, 0.766815185546875, 0.8162841796875, 0.865753173828125, 0.91522216796875, 0.964691162109375, 1.01416015625, 1.063629150390625, 1.11309814453125, 1.162567138671875, 1.2120361328125, 1.261505126953125, 1.31097412109375, 1.360443115234375, 1.409912109375, 1.459381103515625, 1.50885009765625, 1.558319091796875, 1.6077880859375, 1.657257080078125, 1.70672607421875, 1.756195068359375, 1.8056640625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 5.0, 4.0, 10.0, 11.0, 12.0, 24.0, 33.0, 43.0, 47.0, 56.0, 70.0, 74.0, 80.0, 78.0, 77.0, 81.0, 82.0, 45.0, 41.0, 33.0, 30.0, 18.0, 21.0, 12.0, 6.0, 4.0, 5.0, 6.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.16015625, -2.095550537109375, -2.03094482421875, -1.966339111328125, -1.9017333984375, -1.837127685546875, -1.77252197265625, -1.707916259765625, -1.643310546875, -1.578704833984375, -1.51409912109375, -1.449493408203125, -1.3848876953125, -1.320281982421875, -1.25567626953125, -1.191070556640625, -1.12646484375, -1.061859130859375, -0.99725341796875, -0.932647705078125, -0.8680419921875, -0.803436279296875, -0.73883056640625, -0.674224853515625, -0.609619140625, -0.545013427734375, -0.48040771484375, -0.415802001953125, -0.3511962890625, -0.286590576171875, -0.22198486328125, -0.157379150390625, -0.0927734375, -0.028167724609375, 0.03643798828125, 0.101043701171875, 0.1656494140625, 0.230255126953125, 0.29486083984375, 0.359466552734375, 0.424072265625, 0.488677978515625, 0.55328369140625, 0.617889404296875, 0.6824951171875, 0.747100830078125, 0.81170654296875, 0.876312255859375, 0.94091796875, 1.005523681640625, 1.07012939453125, 1.134735107421875, 1.1993408203125, 1.263946533203125, 1.32855224609375, 1.393157958984375, 1.457763671875, 1.522369384765625, 1.58697509765625, 1.651580810546875, 1.7161865234375, 1.780792236328125, 1.84539794921875, 1.910003662109375, 1.974609375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 5.0, 5.0, 5.0, 7.0, 20.0, 20.0, 34.0, 58.0, 112.0, 181.0, 372.0, 774.0, 2219.0, 9961.0, 110292.0, 819148.0, 92635.0, 9016.0, 2185.0, 739.0, 342.0, 179.0, 88.0, 57.0, 37.0, 20.0, 17.0, 6.0, 9.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.499755859375, -0.48482513427734375, -0.4698944091796875, -0.45496368408203125, -0.440032958984375, -0.42510223388671875, -0.4101715087890625, -0.39524078369140625, -0.38031005859375, -0.36537933349609375, -0.3504486083984375, -0.33551788330078125, -0.320587158203125, -0.30565643310546875, -0.2907257080078125, -0.27579498291015625, -0.2608642578125, -0.24593353271484375, -0.2310028076171875, -0.21607208251953125, -0.201141357421875, -0.18621063232421875, -0.1712799072265625, -0.15634918212890625, -0.14141845703125, -0.12648773193359375, -0.1115570068359375, -0.09662628173828125, -0.081695556640625, -0.06676483154296875, -0.0518341064453125, -0.03690338134765625, -0.02197265625, -0.00704193115234375, 0.0078887939453125, 0.02281951904296875, 0.037750244140625, 0.05268096923828125, 0.0676116943359375, 0.08254241943359375, 0.09747314453125, 0.11240386962890625, 0.1273345947265625, 0.14226531982421875, 0.157196044921875, 0.17212677001953125, 0.1870574951171875, 0.20198822021484375, 0.2169189453125, 0.23184967041015625, 0.2467803955078125, 0.26171112060546875, 0.276641845703125, 0.29157257080078125, 0.3065032958984375, 0.32143402099609375, 0.33636474609375, 0.35129547119140625, 0.3662261962890625, 0.38115692138671875, 0.396087646484375, 0.41101837158203125, 0.4259490966796875, 0.44087982177734375, 0.455810546875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 0.0, 2.0, 4.0, 4.0, 5.0, 6.0, 9.0, 19.0, 10.0, 11.0, 19.0, 14.0, 19.0, 25.0, 35.0, 34.0, 51.0, 67.0, 70.0, 74.0, 93.0, 65.0, 73.0, 56.0, 52.0, 39.0, 30.0, 27.0, 21.0, 16.0, 11.0, 9.0, 9.0, 4.0, 8.0, 6.0, 4.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.449222564697266e-05, -6.277207285165787e-05, -6.105192005634308e-05, -5.933176726102829e-05, -5.76116144657135e-05, -5.589146167039871e-05, -5.417130887508392e-05, -5.2451156079769135e-05, -5.0731003284454346e-05, -4.901085048913956e-05, -4.729069769382477e-05, -4.557054489850998e-05, -4.385039210319519e-05, -4.21302393078804e-05, -4.041008651256561e-05, -3.8689933717250824e-05, -3.6969780921936035e-05, -3.5249628126621246e-05, -3.352947533130646e-05, -3.180932253599167e-05, -3.008916974067688e-05, -2.836901694536209e-05, -2.6648864150047302e-05, -2.4928711354732513e-05, -2.3208558559417725e-05, -2.1488405764102936e-05, -1.9768252968788147e-05, -1.8048100173473358e-05, -1.632794737815857e-05, -1.460779458284378e-05, -1.2887641787528992e-05, -1.1167488992214203e-05, -9.447336196899414e-06, -7.727183401584625e-06, -6.0070306062698364e-06, -4.286877810955048e-06, -2.566725015640259e-06, -8.4657222032547e-07, 8.735805749893188e-07, 2.5937333703041077e-06, 4.3138861656188965e-06, 6.034038960933685e-06, 7.754191756248474e-06, 9.474344551563263e-06, 1.1194497346878052e-05, 1.291465014219284e-05, 1.463480293750763e-05, 1.6354955732822418e-05, 1.8075108528137207e-05, 1.9795261323451996e-05, 2.1515414118766785e-05, 2.3235566914081573e-05, 2.4955719709396362e-05, 2.667587250471115e-05, 2.839602530002594e-05, 3.011617809534073e-05, 3.183633089065552e-05, 3.3556483685970306e-05, 3.5276636481285095e-05, 3.6996789276599884e-05, 3.871694207191467e-05, 4.043709486722946e-05, 4.215724766254425e-05, 4.387740045785904e-05, 4.559755325317383e-05]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 11.0, 11.0, 21.0, 36.0, 51.0, 97.0, 199.0, 426.0, 1055.0, 3565.0, 22592.0, 614552.0, 385858.0, 15571.0, 2809.0, 920.0, 348.0, 186.0, 95.0, 56.0, 33.0, 24.0, 9.0, 11.0, 4.0, 5.0, 3.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.70263671875, -0.6845855712890625, -0.666534423828125, -0.6484832763671875, -0.63043212890625, -0.6123809814453125, -0.594329833984375, -0.5762786865234375, -0.5582275390625, -0.5401763916015625, -0.522125244140625, -0.5040740966796875, -0.48602294921875, -0.4679718017578125, -0.449920654296875, -0.4318695068359375, -0.413818359375, -0.3957672119140625, -0.377716064453125, -0.3596649169921875, -0.34161376953125, -0.3235626220703125, -0.305511474609375, -0.2874603271484375, -0.2694091796875, -0.2513580322265625, -0.233306884765625, -0.2152557373046875, -0.19720458984375, -0.1791534423828125, -0.161102294921875, -0.1430511474609375, -0.125, -0.1069488525390625, -0.088897705078125, -0.0708465576171875, -0.05279541015625, -0.0347442626953125, -0.016693115234375, 0.0013580322265625, 0.0194091796875, 0.0374603271484375, 0.055511474609375, 0.0735626220703125, 0.09161376953125, 0.1096649169921875, 0.127716064453125, 0.1457672119140625, 0.163818359375, 0.1818695068359375, 0.199920654296875, 0.2179718017578125, 0.23602294921875, 0.2540740966796875, 0.272125244140625, 0.2901763916015625, 0.3082275390625, 0.3262786865234375, 0.344329833984375, 0.3623809814453125, 0.38043212890625, 0.3984832763671875, 0.416534423828125, 0.4345855712890625, 0.45263671875]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 4.0, 6.0, 3.0, 8.0, 20.0, 26.0, 58.0, 84.0, 119.0, 136.0, 138.0, 145.0, 107.0, 69.0, 40.0, 19.0, 14.0, 2.0, 10.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.69775390625, -0.6761245727539062, -0.6544952392578125, -0.6328659057617188, -0.611236572265625, -0.5896072387695312, -0.5679779052734375, -0.5463485717773438, -0.52471923828125, -0.5030899047851562, -0.4814605712890625, -0.45983123779296875, -0.438201904296875, -0.41657257080078125, -0.3949432373046875, -0.37331390380859375, -0.3516845703125, -0.33005523681640625, -0.3084259033203125, -0.28679656982421875, -0.265167236328125, -0.24353790283203125, -0.2219085693359375, -0.20027923583984375, -0.17864990234375, -0.15702056884765625, -0.1353912353515625, -0.11376190185546875, -0.092132568359375, -0.07050323486328125, -0.0488739013671875, -0.02724456787109375, -0.005615234375, 0.01601409912109375, 0.0376434326171875, 0.05927276611328125, 0.080902099609375, 0.10253143310546875, 0.1241607666015625, 0.14579010009765625, 0.16741943359375, 0.18904876708984375, 0.2106781005859375, 0.23230743408203125, 0.253936767578125, 0.27556610107421875, 0.2971954345703125, 0.31882476806640625, 0.3404541015625, 0.36208343505859375, 0.3837127685546875, 0.40534210205078125, 0.426971435546875, 0.44860076904296875, 0.4702301025390625, 0.49185943603515625, 0.51348876953125, 0.5351181030273438, 0.5567474365234375, 0.5783767700195312, 0.600006103515625, 0.6216354370117188, 0.6432647705078125, 0.6648941040039062, 0.6865234375]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 8.0, 34.0, 103.0, 218.0, 281.0, 207.0, 92.0, 38.0, 8.0, 11.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.319669723510742, -6.899855136871338, -6.480040550231934, -6.0602264404296875, -5.640411853790283, -5.220597267150879, -4.800782680511475, -4.38096809387207, -3.961153745651245, -3.541339159011841, -3.1215248107910156, -2.7017102241516113, -2.281895637512207, -1.8620812892913818, -1.4422667026519775, -1.0224523544311523, -0.602637767791748, -0.1828232705593109, 0.23699122667312622, 0.6568057537078857, 1.0766202211380005, 1.4964346885681152, 1.9162492752075195, 2.3360636234283447, 2.755878210067749, 3.1756927967071533, 3.5955071449279785, 4.015321731567383, 4.435136318206787, 4.854950904846191, 5.2747650146484375, 5.694579601287842, 6.114394187927246, 6.53420877456665, 6.954023361206055, 7.373837471008301, 7.793652057647705, 8.21346664428711, 8.633281707763672, 9.053095817565918, 9.472909927368164, 9.89272403717041, 10.312539100646973, 10.732353210449219, 11.152168273925781, 11.571982383728027, 11.991796493530273, 12.411611557006836, 12.831426620483398, 13.251240730285645, 13.671055793762207, 14.090869903564453, 14.510684967041016, 14.930499076843262, 15.350313186645508, 15.77012825012207, 16.18994140625, 16.609756469726562, 17.029569625854492, 17.449384689331055, 17.869199752807617, 18.289012908935547, 18.70882797241211, 19.128643035888672, 19.548458099365234]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 2.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 17.0, 11.0, 24.0, 27.0, 22.0, 34.0, 28.0, 37.0, 31.0, 36.0, 48.0, 61.0, 59.0, 62.0, 60.0, 61.0, 56.0, 45.0, 42.0, 38.0, 31.0, 22.0, 24.0, 18.0, 14.0, 17.0, 10.0, 12.0, 8.0, 6.0, 7.0, 4.0, 1.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.4959716796875, -5.303989887237549, -5.1120076179504395, -4.920025825500488, -4.728043556213379, -4.536061763763428, -4.344079971313477, -4.152097702026367, -3.960115909576416, -3.7681338787078857, -3.5761518478393555, -3.3841700553894043, -3.192188024520874, -3.0002059936523438, -2.8082239627838135, -2.616241931915283, -2.424259901046753, -2.2322778701782227, -2.0402958393096924, -1.8483139276504517, -1.656332015991211, -1.4643499851226807, -1.2723679542541504, -1.0803860425949097, -0.8884040117263794, -0.6964220404624939, -0.5044400691986084, -0.3124580383300781, -0.12047606706619263, 0.07150590419769287, 0.26348793506622314, 0.45546984672546387, 0.6474518775939941, 0.8394338488578796, 1.0314158201217651, 1.2233978509902954, 1.4153797626495361, 1.6073617935180664, 1.7993438243865967, 1.9913257360458374, 2.183307647705078, 2.3752896785736084, 2.5672717094421387, 2.75925350189209, 2.95123553276062, 3.1432175636291504, 3.3351995944976807, 3.527181625366211, 3.719163656234741, 3.9111456871032715, 4.103127479553223, 4.295109748840332, 4.487091541290283, 4.679073333740234, 4.871055603027344, 5.063037395477295, 5.255019664764404, 5.4470014572143555, 5.638983726501465, 5.830965518951416, 6.022947788238525, 6.214929580688477, 6.406911849975586, 6.598893642425537, 6.790875434875488]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 8.0, 10.0, 10.0, 31.0, 64.0, 90.0, 246.0, 656.0, 2032.0, 9228.0, 80667.0, 3839843.0, 240790.0, 16075.0, 3051.0, 894.0, 310.0, 131.0, 65.0, 33.0, 17.0, 11.0, 10.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.89111328125, -0.8549728393554688, -0.8188323974609375, -0.7826919555664062, -0.746551513671875, -0.7104110717773438, -0.6742706298828125, -0.6381301879882812, -0.60198974609375, -0.5658493041992188, -0.5297088623046875, -0.49356842041015625, -0.457427978515625, -0.42128753662109375, -0.3851470947265625, -0.34900665283203125, -0.3128662109375, -0.27672576904296875, -0.2405853271484375, -0.20444488525390625, -0.168304443359375, -0.13216400146484375, -0.0960235595703125, -0.05988311767578125, -0.02374267578125, 0.01239776611328125, 0.0485382080078125, 0.08467864990234375, 0.120819091796875, 0.15695953369140625, 0.1930999755859375, 0.22924041748046875, 0.265380859375, 0.30152130126953125, 0.3376617431640625, 0.37380218505859375, 0.409942626953125, 0.44608306884765625, 0.4822235107421875, 0.5183639526367188, 0.55450439453125, 0.5906448364257812, 0.6267852783203125, 0.6629257202148438, 0.699066162109375, 0.7352066040039062, 0.7713470458984375, 0.8074874877929688, 0.8436279296875, 0.8797683715820312, 0.9159088134765625, 0.9520492553710938, 0.988189697265625, 1.0243301391601562, 1.0604705810546875, 1.0966110229492188, 1.13275146484375, 1.1688919067382812, 1.2050323486328125, 1.2411727905273438, 1.277313232421875, 1.3134536743164062, 1.3495941162109375, 1.3857345581054688, 1.421875]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 3.0, 4.0, 8.0, 6.0, 8.0, 13.0, 15.0, 28.0, 29.0, 38.0, 49.0, 55.0, 63.0, 62.0, 72.0, 69.0, 71.0, 69.0, 70.0, 62.0, 45.0, 38.0, 37.0, 21.0, 21.0, 20.0, 7.0, 8.0, 5.0, 5.0, 2.0, 2.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.26416015625, -0.2520294189453125, -0.239898681640625, -0.2277679443359375, -0.21563720703125, -0.2035064697265625, -0.191375732421875, -0.1792449951171875, -0.1671142578125, -0.1549835205078125, -0.142852783203125, -0.1307220458984375, -0.11859130859375, -0.1064605712890625, -0.094329833984375, -0.0821990966796875, -0.070068359375, -0.0579376220703125, -0.045806884765625, -0.0336761474609375, -0.02154541015625, -0.0094146728515625, 0.002716064453125, 0.0148468017578125, 0.0269775390625, 0.0391082763671875, 0.051239013671875, 0.0633697509765625, 0.07550048828125, 0.0876312255859375, 0.099761962890625, 0.1118927001953125, 0.1240234375, 0.1361541748046875, 0.148284912109375, 0.1604156494140625, 0.17254638671875, 0.1846771240234375, 0.196807861328125, 0.2089385986328125, 0.2210693359375, 0.2332000732421875, 0.245330810546875, 0.2574615478515625, 0.26959228515625, 0.2817230224609375, 0.293853759765625, 0.3059844970703125, 0.318115234375, 0.3302459716796875, 0.342376708984375, 0.3545074462890625, 0.36663818359375, 0.3787689208984375, 0.390899658203125, 0.4030303955078125, 0.4151611328125, 0.4272918701171875, 0.439422607421875, 0.4515533447265625, 0.46368408203125, 0.4758148193359375, 0.487945556640625, 0.5000762939453125, 0.51220703125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 7.0, 10.0, 29.0, 38.0, 76.0, 150.0, 400.0, 1898.0, 15583.0, 915338.0, 3236041.0, 21451.0, 2381.0, 527.0, 158.0, 85.0, 44.0, 14.0, 20.0, 10.0, 7.0, 4.0, 4.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.693359375, -1.64508056640625, -1.5968017578125, -1.54852294921875, -1.500244140625, -1.45196533203125, -1.4036865234375, -1.35540771484375, -1.30712890625, -1.25885009765625, -1.2105712890625, -1.16229248046875, -1.114013671875, -1.06573486328125, -1.0174560546875, -0.96917724609375, -0.9208984375, -0.87261962890625, -0.8243408203125, -0.77606201171875, -0.727783203125, -0.67950439453125, -0.6312255859375, -0.58294677734375, -0.53466796875, -0.48638916015625, -0.4381103515625, -0.38983154296875, -0.341552734375, -0.29327392578125, -0.2449951171875, -0.19671630859375, -0.1484375, -0.10015869140625, -0.0518798828125, -0.00360107421875, 0.044677734375, 0.09295654296875, 0.1412353515625, 0.18951416015625, 0.23779296875, 0.28607177734375, 0.3343505859375, 0.38262939453125, 0.430908203125, 0.47918701171875, 0.5274658203125, 0.57574462890625, 0.6240234375, 0.67230224609375, 0.7205810546875, 0.76885986328125, 0.817138671875, 0.86541748046875, 0.9136962890625, 0.96197509765625, 1.01025390625, 1.05853271484375, 1.1068115234375, 1.15509033203125, 1.203369140625, 1.25164794921875, 1.2999267578125, 1.34820556640625, 1.396484375]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 7.0, 7.0, 7.0, 9.0, 9.0, 29.0, 28.0, 62.0, 86.0, 193.0, 692.0, 1674.0, 826.0, 229.0, 92.0, 53.0, 22.0, 23.0, 10.0, 9.0, 6.0, 3.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9091796875, -0.8722076416015625, -0.835235595703125, -0.7982635498046875, -0.76129150390625, -0.7243194580078125, -0.687347412109375, -0.6503753662109375, -0.6134033203125, -0.5764312744140625, -0.539459228515625, -0.5024871826171875, -0.46551513671875, -0.4285430908203125, -0.391571044921875, -0.3545989990234375, -0.317626953125, -0.2806549072265625, -0.243682861328125, -0.2067108154296875, -0.16973876953125, -0.1327667236328125, -0.095794677734375, -0.0588226318359375, -0.0218505859375, 0.0151214599609375, 0.052093505859375, 0.0890655517578125, 0.12603759765625, 0.1630096435546875, 0.199981689453125, 0.2369537353515625, 0.27392578125, 0.3108978271484375, 0.347869873046875, 0.3848419189453125, 0.42181396484375, 0.4587860107421875, 0.495758056640625, 0.5327301025390625, 0.5697021484375, 0.6066741943359375, 0.643646240234375, 0.6806182861328125, 0.71759033203125, 0.7545623779296875, 0.791534423828125, 0.8285064697265625, 0.865478515625, 0.9024505615234375, 0.939422607421875, 0.9763946533203125, 1.01336669921875, 1.0503387451171875, 1.087310791015625, 1.1242828369140625, 1.1612548828125, 1.1982269287109375, 1.235198974609375, 1.2721710205078125, 1.30914306640625, 1.3461151123046875, 1.383087158203125, 1.4200592041015625, 1.45703125]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 5.0, 0.0, 7.0, 7.0, 15.0, 64.0, 250.0, 366.0, 225.0, 51.0, 9.0, 7.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-16.968063354492188, -16.549407958984375, -16.13075065612793, -15.712095260620117, -15.293439865112305, -14.874783515930176, -14.456127166748047, -14.037471771240234, -13.618816375732422, -13.200160026550293, -12.78150463104248, -12.362848281860352, -11.944192886352539, -11.52553653717041, -11.106880187988281, -10.688224792480469, -10.26956844329834, -9.850912094116211, -9.432256698608398, -9.01360034942627, -8.594944953918457, -8.176288604736328, -7.757632732391357, -7.338976860046387, -6.920320987701416, -6.501665115356445, -6.083009243011475, -5.664353370666504, -5.245697021484375, -4.8270416259765625, -4.408385276794434, -3.989729404449463, -3.5710744857788086, -3.152418613433838, -2.733762741088867, -2.3151066303253174, -1.8964507579803467, -1.477794885635376, -1.0591387748718262, -0.6404829025268555, -0.22182703018188477, 0.1968289017677307, 0.6154848337173462, 1.0341408252716064, 1.4527966976165771, 1.8714525699615479, 2.2901086807250977, 2.7087645530700684, 3.127420425415039, 3.5460762977600098, 3.9647321701049805, 4.383388519287109, 4.802043914794922, 5.220700263977051, 5.6393561363220215, 6.058012008666992, 6.476667881011963, 6.895323753356934, 7.313979625701904, 7.732635498046875, 8.151291847229004, 8.569947242736816, 8.988603591918945, 9.407258987426758, 9.825915336608887]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 6.0, 5.0, 3.0, 4.0, 1.0, 3.0, 12.0, 10.0, 13.0, 18.0, 25.0, 18.0, 32.0, 24.0, 29.0, 25.0, 31.0, 28.0, 48.0, 53.0, 42.0, 39.0, 38.0, 46.0, 42.0, 35.0, 44.0, 43.0, 40.0, 33.0, 27.0, 22.0, 35.0, 24.0, 13.0, 16.0, 13.0, 11.0, 14.0, 7.0, 7.0, 5.0, 4.0, 7.0, 3.0, 3.0, 1.0, 1.0, 3.0, 1.0, 3.0], "bins": [-3.2460854053497314, -3.154895782470703, -3.063706398010254, -2.9725167751312256, -2.8813271522521973, -2.790137529373169, -2.6989479064941406, -2.6077585220336914, -2.516568899154663, -2.4253792762756348, -2.3341898918151855, -2.2430002689361572, -2.151810646057129, -2.0606210231781006, -1.9694315195083618, -1.878242015838623, -1.7870523929595947, -1.6958627700805664, -1.6046732664108276, -1.5134837627410889, -1.4222941398620605, -1.3311045169830322, -1.2399150133132935, -1.1487255096435547, -1.0575358867645264, -0.9663463234901428, -0.8751567602157593, -0.7839671969413757, -0.6927776336669922, -0.6015880703926086, -0.5103985071182251, -0.41920894384384155, -0.328019380569458, -0.23682981729507446, -0.14564025402069092, -0.05445069074630737, 0.03673887252807617, 0.12792843580245972, 0.21911799907684326, 0.3103075623512268, 0.40149712562561035, 0.4926866888999939, 0.5838762521743774, 0.675065815448761, 0.7662553787231445, 0.8574449419975281, 0.9486345052719116, 1.0398240089416504, 1.1310136318206787, 1.222203254699707, 1.3133927583694458, 1.4045822620391846, 1.495771884918213, 1.5869615077972412, 1.67815101146698, 1.7693405151367188, 1.860530138015747, 1.9517197608947754, 2.0429091453552246, 2.134098768234253, 2.2252883911132812, 2.3164780139923096, 2.407667636871338, 2.498857021331787, 2.5900466442108154]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 3.0, 5.0, 6.0, 13.0, 22.0, 34.0, 58.0, 103.0, 195.0, 330.0, 653.0, 1213.0, 2369.0, 5171.0, 11671.0, 28271.0, 76037.0, 206326.0, 362844.0, 218735.0, 81266.0, 30502.0, 12215.0, 5284.0, 2498.0, 1298.0, 619.0, 357.0, 191.0, 110.0, 70.0, 24.0, 27.0, 13.0, 7.0, 8.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.378662109375, -0.3653907775878906, -0.35211944580078125, -0.3388481140136719, -0.3255767822265625, -0.3123054504394531, -0.29903411865234375, -0.2857627868652344, -0.272491455078125, -0.2592201232910156, -0.24594879150390625, -0.23267745971679688, -0.2194061279296875, -0.20613479614257812, -0.19286346435546875, -0.17959213256835938, -0.16632080078125, -0.15304946899414062, -0.13977813720703125, -0.12650680541992188, -0.1132354736328125, -0.09996414184570312, -0.08669281005859375, -0.07342147827148438, -0.060150146484375, -0.046878814697265625, -0.03360748291015625, -0.020336151123046875, -0.0070648193359375, 0.006206512451171875, 0.01947784423828125, 0.032749176025390625, 0.0460205078125, 0.059291839599609375, 0.07256317138671875, 0.08583450317382812, 0.0991058349609375, 0.11237716674804688, 0.12564849853515625, 0.13891983032226562, 0.152191162109375, 0.16546249389648438, 0.17873382568359375, 0.19200515747070312, 0.2052764892578125, 0.21854782104492188, 0.23181915283203125, 0.24509048461914062, 0.25836181640625, 0.2716331481933594, 0.28490447998046875, 0.2981758117675781, 0.3114471435546875, 0.3247184753417969, 0.33798980712890625, 0.3512611389160156, 0.364532470703125, 0.3778038024902344, 0.39107513427734375, 0.4043464660644531, 0.4176177978515625, 0.4308891296386719, 0.44416046142578125, 0.4574317932128906, 0.470703125]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 7.0, 2.0, 7.0, 10.0, 11.0, 29.0, 23.0, 24.0, 33.0, 24.0, 40.0, 60.0, 45.0, 41.0, 44.0, 41.0, 43.0, 52.0, 63.0, 60.0, 44.0, 37.0, 41.0, 39.0, 32.0, 30.0, 26.0, 18.0, 19.0, 20.0, 9.0, 11.0, 4.0, 4.0, 3.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.259765625, -0.2508583068847656, -0.24195098876953125, -0.23304367065429688, -0.2241363525390625, -0.21522903442382812, -0.20632171630859375, -0.19741439819335938, -0.188507080078125, -0.17959976196289062, -0.17069244384765625, -0.16178512573242188, -0.1528778076171875, -0.14397048950195312, -0.13506317138671875, -0.12615585327148438, -0.11724853515625, -0.10834121704101562, -0.09943389892578125, -0.09052658081054688, -0.0816192626953125, -0.07271194458007812, -0.06380462646484375, -0.054897308349609375, -0.045989990234375, -0.037082672119140625, -0.02817535400390625, -0.019268035888671875, -0.0103607177734375, -0.001453399658203125, 0.00745391845703125, 0.016361236572265625, 0.0252685546875, 0.034175872802734375, 0.04308319091796875, 0.051990509033203125, 0.0608978271484375, 0.06980514526367188, 0.07871246337890625, 0.08761978149414062, 0.096527099609375, 0.10543441772460938, 0.11434173583984375, 0.12324905395507812, 0.1321563720703125, 0.14106369018554688, 0.14997100830078125, 0.15887832641601562, 0.16778564453125, 0.17669296264648438, 0.18560028076171875, 0.19450759887695312, 0.2034149169921875, 0.21232223510742188, 0.22122955322265625, 0.23013687133789062, 0.239044189453125, 0.24795150756835938, 0.25685882568359375, 0.2657661437988281, 0.2746734619140625, 0.2835807800292969, 0.29248809814453125, 0.3013954162597656, 0.310302734375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 6.0, 6.0, 11.0, 9.0, 10.0, 14.0, 13.0, 25.0, 28.0, 50.0, 59.0, 92.0, 133.0, 246.0, 344.0, 519.0, 952.0, 1767.0, 4505.0, 22218.0, 239045.0, 695773.0, 67810.0, 9071.0, 2650.0, 1272.0, 685.0, 431.0, 276.0, 147.0, 107.0, 99.0, 56.0, 36.0, 25.0, 23.0, 13.0, 10.0, 5.0, 5.0, 3.0, 5.0, 0.0, 3.0, 1.0, 2.0], "bins": [-0.99365234375, -0.9683380126953125, -0.943023681640625, -0.9177093505859375, -0.89239501953125, -0.8670806884765625, -0.841766357421875, -0.8164520263671875, -0.7911376953125, -0.7658233642578125, -0.740509033203125, -0.7151947021484375, -0.68988037109375, -0.6645660400390625, -0.639251708984375, -0.6139373779296875, -0.588623046875, -0.5633087158203125, -0.537994384765625, -0.5126800537109375, -0.48736572265625, -0.4620513916015625, -0.436737060546875, -0.4114227294921875, -0.3861083984375, -0.3607940673828125, -0.335479736328125, -0.3101654052734375, -0.28485107421875, -0.2595367431640625, -0.234222412109375, -0.2089080810546875, -0.18359375, -0.1582794189453125, -0.132965087890625, -0.1076507568359375, -0.08233642578125, -0.0570220947265625, -0.031707763671875, -0.0063934326171875, 0.0189208984375, 0.0442352294921875, 0.069549560546875, 0.0948638916015625, 0.12017822265625, 0.1454925537109375, 0.170806884765625, 0.1961212158203125, 0.221435546875, 0.2467498779296875, 0.272064208984375, 0.2973785400390625, 0.32269287109375, 0.3480072021484375, 0.373321533203125, 0.3986358642578125, 0.4239501953125, 0.4492645263671875, 0.474578857421875, 0.4998931884765625, 0.52520751953125, 0.5505218505859375, 0.575836181640625, 0.6011505126953125, 0.62646484375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 0.0, 2.0, 4.0, 8.0, 11.0, 11.0, 5.0, 13.0, 10.0, 12.0, 13.0, 21.0, 24.0, 32.0, 37.0, 33.0, 50.0, 34.0, 36.0, 29.0, 51.0, 41.0, 41.0, 48.0, 46.0, 44.0, 43.0, 32.0, 42.0, 29.0, 31.0, 21.0, 24.0, 18.0, 24.0, 14.0, 13.0, 13.0, 6.0, 8.0, 4.0, 10.0, 9.0, 3.0, 2.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0], "bins": [-1.052734375, -1.0234909057617188, -0.9942474365234375, -0.9650039672851562, -0.935760498046875, -0.9065170288085938, -0.8772735595703125, -0.8480300903320312, -0.81878662109375, -0.7895431518554688, -0.7602996826171875, -0.7310562133789062, -0.701812744140625, -0.6725692749023438, -0.6433258056640625, -0.6140823364257812, -0.5848388671875, -0.5555953979492188, -0.5263519287109375, -0.49710845947265625, -0.467864990234375, -0.43862152099609375, -0.4093780517578125, -0.38013458251953125, -0.35089111328125, -0.32164764404296875, -0.2924041748046875, -0.26316070556640625, -0.233917236328125, -0.20467376708984375, -0.1754302978515625, -0.14618682861328125, -0.116943359375, -0.08769989013671875, -0.0584564208984375, -0.02921295166015625, 3.0517578125e-05, 0.02927398681640625, 0.0585174560546875, 0.08776092529296875, 0.11700439453125, 0.14624786376953125, 0.1754913330078125, 0.20473480224609375, 0.233978271484375, 0.26322174072265625, 0.2924652099609375, 0.32170867919921875, 0.3509521484375, 0.38019561767578125, 0.4094390869140625, 0.43868255615234375, 0.467926025390625, 0.49716949462890625, 0.5264129638671875, 0.5556564331054688, 0.58489990234375, 0.6141433715820312, 0.6433868408203125, 0.6726303100585938, 0.701873779296875, 0.7311172485351562, 0.7603607177734375, 0.7896041870117188, 0.81884765625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0, 2.0, 3.0, 1.0, 6.0, 5.0, 10.0, 24.0, 28.0, 58.0, 119.0, 306.0, 1221.0, 12467.0, 930351.0, 99918.0, 3093.0, 560.0, 202.0, 85.0, 37.0, 23.0, 16.0, 8.0, 11.0, 5.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87646484375, -0.8526077270507812, -0.8287506103515625, -0.8048934936523438, -0.781036376953125, -0.7571792602539062, -0.7333221435546875, -0.7094650268554688, -0.68560791015625, -0.6617507934570312, -0.6378936767578125, -0.6140365600585938, -0.590179443359375, -0.5663223266601562, -0.5424652099609375, -0.5186080932617188, -0.4947509765625, -0.47089385986328125, -0.4470367431640625, -0.42317962646484375, -0.399322509765625, -0.37546539306640625, -0.3516082763671875, -0.32775115966796875, -0.30389404296875, -0.28003692626953125, -0.2561798095703125, -0.23232269287109375, -0.208465576171875, -0.18460845947265625, -0.1607513427734375, -0.13689422607421875, -0.113037109375, -0.08917999267578125, -0.0653228759765625, -0.04146575927734375, -0.017608642578125, 0.00624847412109375, 0.0301055908203125, 0.05396270751953125, 0.07781982421875, 0.10167694091796875, 0.1255340576171875, 0.14939117431640625, 0.173248291015625, 0.19710540771484375, 0.2209625244140625, 0.24481964111328125, 0.2686767578125, 0.29253387451171875, 0.3163909912109375, 0.34024810791015625, 0.364105224609375, 0.38796234130859375, 0.4118194580078125, 0.43567657470703125, 0.45953369140625, 0.48339080810546875, 0.5072479248046875, 0.5311050415039062, 0.554962158203125, 0.5788192749023438, 0.6026763916015625, 0.6265335083007812, 0.650390625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 4.0, 4.0, 5.0, 5.0, 6.0, 6.0, 6.0, 16.0, 13.0, 22.0, 26.0, 27.0, 30.0, 48.0, 65.0, 69.0, 109.0, 105.0, 85.0, 74.0, 63.0, 50.0, 28.0, 31.0, 19.0, 16.0, 16.0, 16.0, 9.0, 8.0, 6.0, 5.0, 6.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.857778549194336e-05, -4.680175334215164e-05, -4.5025721192359924e-05, -4.324968904256821e-05, -4.147365689277649e-05, -3.969762474298477e-05, -3.7921592593193054e-05, -3.614556044340134e-05, -3.436952829360962e-05, -3.25934961438179e-05, -3.0817463994026184e-05, -2.9041431844234467e-05, -2.726539969444275e-05, -2.548936754465103e-05, -2.3713335394859314e-05, -2.1937303245067596e-05, -2.016127109527588e-05, -1.838523894548416e-05, -1.6609206795692444e-05, -1.4833174645900726e-05, -1.3057142496109009e-05, -1.1281110346317291e-05, -9.505078196525574e-06, -7.729046046733856e-06, -5.953013896942139e-06, -4.176981747150421e-06, -2.4009495973587036e-06, -6.249174475669861e-07, 1.1511147022247314e-06, 2.927146852016449e-06, 4.7031790018081665e-06, 6.479211151599884e-06, 8.255243301391602e-06, 1.0031275451183319e-05, 1.1807307600975037e-05, 1.3583339750766754e-05, 1.535937190055847e-05, 1.713540405035019e-05, 1.8911436200141907e-05, 2.0687468349933624e-05, 2.2463500499725342e-05, 2.423953264951706e-05, 2.6015564799308777e-05, 2.7791596949100494e-05, 2.9567629098892212e-05, 3.134366124868393e-05, 3.311969339847565e-05, 3.4895725548267365e-05, 3.667175769805908e-05, 3.84477898478508e-05, 4.022382199764252e-05, 4.1999854147434235e-05, 4.377588629722595e-05, 4.555191844701767e-05, 4.732795059680939e-05, 4.9103982746601105e-05, 5.088001489639282e-05, 5.265604704618454e-05, 5.443207919597626e-05, 5.6208111345767975e-05, 5.798414349555969e-05, 5.976017564535141e-05, 6.153620779514313e-05, 6.331223994493484e-05, 6.508827209472656e-05]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 4.0, 6.0, 6.0, 12.0, 13.0, 34.0, 47.0, 85.0, 128.0, 284.0, 629.0, 1863.0, 7308.0, 89089.0, 874672.0, 65375.0, 6255.0, 1556.0, 556.0, 276.0, 140.0, 86.0, 38.0, 29.0, 14.0, 10.0, 12.0, 5.0, 9.0, 2.0, 7.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.55419921875, -0.5385665893554688, -0.5229339599609375, -0.5073013305664062, -0.491668701171875, -0.47603607177734375, -0.4604034423828125, -0.44477081298828125, -0.42913818359375, -0.41350555419921875, -0.3978729248046875, -0.38224029541015625, -0.366607666015625, -0.35097503662109375, -0.3353424072265625, -0.31970977783203125, -0.3040771484375, -0.28844451904296875, -0.2728118896484375, -0.25717926025390625, -0.241546630859375, -0.22591400146484375, -0.2102813720703125, -0.19464874267578125, -0.17901611328125, -0.16338348388671875, -0.1477508544921875, -0.13211822509765625, -0.116485595703125, -0.10085296630859375, -0.0852203369140625, -0.06958770751953125, -0.053955078125, -0.03832244873046875, -0.0226898193359375, -0.00705718994140625, 0.008575439453125, 0.02420806884765625, 0.0398406982421875, 0.05547332763671875, 0.07110595703125, 0.08673858642578125, 0.1023712158203125, 0.11800384521484375, 0.133636474609375, 0.14926910400390625, 0.1649017333984375, 0.18053436279296875, 0.1961669921875, 0.21179962158203125, 0.2274322509765625, 0.24306488037109375, 0.258697509765625, 0.27433013916015625, 0.2899627685546875, 0.30559539794921875, 0.32122802734375, 0.33686065673828125, 0.3524932861328125, 0.36812591552734375, 0.383758544921875, 0.39939117431640625, 0.4150238037109375, 0.43065643310546875, 0.4462890625]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 5.0, 4.0, 13.0, 10.0, 10.0, 16.0, 19.0, 27.0, 33.0, 30.0, 40.0, 54.0, 63.0, 68.0, 80.0, 57.0, 71.0, 81.0, 56.0, 50.0, 29.0, 38.0, 27.0, 25.0, 24.0, 19.0, 6.0, 9.0, 11.0, 6.0, 6.0, 3.0, 7.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2303466796875, -0.2220172882080078, -0.21368789672851562, -0.20535850524902344, -0.19702911376953125, -0.18869972229003906, -0.18037033081054688, -0.1720409393310547, -0.1637115478515625, -0.1553821563720703, -0.14705276489257812, -0.13872337341308594, -0.13039398193359375, -0.12206459045410156, -0.11373519897460938, -0.10540580749511719, -0.097076416015625, -0.08874702453613281, -0.08041763305664062, -0.07208824157714844, -0.06375885009765625, -0.05542945861816406, -0.047100067138671875, -0.03877067565917969, -0.0304412841796875, -0.022111892700195312, -0.013782501220703125, -0.0054531097412109375, 0.00287628173828125, 0.011205673217773438, 0.019535064697265625, 0.027864456176757812, 0.03619384765625, 0.04452323913574219, 0.052852630615234375, 0.06118202209472656, 0.06951141357421875, 0.07784080505371094, 0.08617019653320312, 0.09449958801269531, 0.1028289794921875, 0.11115837097167969, 0.11948776245117188, 0.12781715393066406, 0.13614654541015625, 0.14447593688964844, 0.15280532836914062, 0.1611347198486328, 0.169464111328125, 0.1777935028076172, 0.18612289428710938, 0.19445228576660156, 0.20278167724609375, 0.21111106872558594, 0.21944046020507812, 0.2277698516845703, 0.2360992431640625, 0.2444286346435547, 0.2527580261230469, 0.26108741760253906, 0.26941680908203125, 0.27774620056152344, 0.2860755920410156, 0.2944049835205078, 0.302734375]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 6.0, 5.0, 22.0, 95.0, 325.0, 385.0, 134.0, 21.0, 4.0, 5.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.046024322509766, -14.641167640686035, -14.236310958862305, -13.831453323364258, -13.426596641540527, -13.021739959716797, -12.61688232421875, -12.21202564239502, -11.807168960571289, -11.402312278747559, -10.997455596923828, -10.592597961425781, -10.18774127960205, -9.78288459777832, -9.378026962280273, -8.973170280456543, -8.568313598632812, -8.163456916809082, -7.758599758148193, -7.353742599487305, -6.948885917663574, -6.544029235839844, -6.139172077178955, -5.734314918518066, -5.329458236694336, -4.9246015548706055, -4.519744396209717, -4.114887237548828, -3.7100305557250977, -3.305173635482788, -2.9003167152404785, -2.495459794998169, -2.090603828430176, -1.6857469081878662, -1.2808899879455566, -0.8760330677032471, -0.4711761474609375, -0.06631922721862793, 0.33853769302368164, 0.7433946132659912, 1.1482515335083008, 1.5531084537506104, 1.95796537399292, 2.3628222942352295, 2.767679214477539, 3.1725361347198486, 3.577393054962158, 3.9822499752044678, 4.387106895446777, 4.791963577270508, 5.1968207359313965, 5.601677894592285, 6.006534576416016, 6.411391258239746, 6.816248416900635, 7.221105575561523, 7.625962257385254, 8.030818939208984, 8.435676574707031, 8.840533256530762, 9.245389938354492, 9.650246620178223, 10.055103302001953, 10.4599609375, 10.86481761932373]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 2.0, 10.0, 14.0, 8.0, 13.0, 31.0, 32.0, 34.0, 28.0, 44.0, 51.0, 54.0, 79.0, 99.0, 82.0, 56.0, 63.0, 36.0, 67.0, 41.0, 35.0, 27.0, 26.0, 16.0, 15.0, 8.0, 8.0, 10.0, 3.0, 4.0, 2.0, 4.0, 2.0, 2.0, 2.0], "bins": [-7.669978141784668, -7.492786407470703, -7.315594673156738, -7.138402938842773, -6.961211204528809, -6.784019947052002, -6.606828212738037, -6.429636478424072, -6.252444744110107, -6.075253009796143, -5.898061275482178, -5.720869541168213, -5.543678283691406, -5.366486549377441, -5.189294815063477, -5.012103080749512, -4.834911346435547, -4.657719612121582, -4.480527877807617, -4.303336143493652, -4.1261444091796875, -3.9489529132843018, -3.771761417388916, -3.594569683074951, -3.4173779487609863, -3.2401862144470215, -3.0629944801330566, -2.885802984237671, -2.708611249923706, -2.531419515609741, -2.3542280197143555, -2.1770362854003906, -1.999845027923584, -1.8226532936096191, -1.6454616785049438, -1.4682700634002686, -1.2910783290863037, -1.1138865947723389, -0.9366949796676636, -0.7595033645629883, -0.5823116302490234, -0.40511995553970337, -0.2279282808303833, -0.05073660612106323, 0.12645506858825684, 0.3036467432975769, 0.480838418006897, 0.6580300331115723, 0.8352217674255371, 1.012413501739502, 1.1896051168441772, 1.3667967319488525, 1.5439884662628174, 1.7211802005767822, 1.8983718156814575, 2.075563430786133, 2.2527551651000977, 2.4299468994140625, 2.6071386337280273, 2.784330129623413, 2.961521863937378, 3.1387135982513428, 3.3159050941467285, 3.4930968284606934, 3.670288562774658]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 5.0, 5.0, 2.0, 8.0, 9.0, 11.0, 23.0, 22.0, 25.0, 42.0, 54.0, 74.0, 95.0, 160.0, 262.0, 732.0, 8265.0, 4038276.0, 143213.0, 2056.0, 345.0, 168.0, 107.0, 72.0, 65.0, 43.0, 30.0, 22.0, 26.0, 15.0, 9.0, 8.0, 11.0, 5.0, 5.0, 3.0, 2.0, 0.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.15234375, -2.0921783447265625, -2.032012939453125, -1.9718475341796875, -1.91168212890625, -1.8515167236328125, -1.791351318359375, -1.7311859130859375, -1.6710205078125, -1.6108551025390625, -1.550689697265625, -1.4905242919921875, -1.43035888671875, -1.3701934814453125, -1.310028076171875, -1.2498626708984375, -1.189697265625, -1.1295318603515625, -1.069366455078125, -1.0092010498046875, -0.94903564453125, -0.8888702392578125, -0.828704833984375, -0.7685394287109375, -0.7083740234375, -0.6482086181640625, -0.588043212890625, -0.5278778076171875, -0.46771240234375, -0.4075469970703125, -0.347381591796875, -0.2872161865234375, -0.22705078125, -0.1668853759765625, -0.106719970703125, -0.0465545654296875, 0.01361083984375, 0.0737762451171875, 0.133941650390625, 0.1941070556640625, 0.2542724609375, 0.3144378662109375, 0.374603271484375, 0.4347686767578125, 0.49493408203125, 0.5550994873046875, 0.615264892578125, 0.6754302978515625, 0.735595703125, 0.7957611083984375, 0.855926513671875, 0.9160919189453125, 0.97625732421875, 1.0364227294921875, 1.096588134765625, 1.1567535400390625, 1.2169189453125, 1.2770843505859375, 1.337249755859375, 1.3974151611328125, 1.45758056640625, 1.5177459716796875, 1.577911376953125, 1.6380767822265625, 1.6982421875]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 7.0, 18.0, 18.0, 22.0, 43.0, 39.0, 50.0, 66.0, 59.0, 83.0, 84.0, 115.0, 98.0, 85.0, 57.0, 46.0, 40.0, 24.0, 17.0, 20.0, 7.0, 3.0, 9.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.57763671875, -0.5634689331054688, -0.5493011474609375, -0.5351333618164062, -0.520965576171875, -0.5067977905273438, -0.4926300048828125, -0.47846221923828125, -0.46429443359375, -0.45012664794921875, -0.4359588623046875, -0.42179107666015625, -0.407623291015625, -0.39345550537109375, -0.3792877197265625, -0.36511993408203125, -0.3509521484375, -0.33678436279296875, -0.3226165771484375, -0.30844879150390625, -0.294281005859375, -0.28011322021484375, -0.2659454345703125, -0.25177764892578125, -0.23760986328125, -0.22344207763671875, -0.2092742919921875, -0.19510650634765625, -0.180938720703125, -0.16677093505859375, -0.1526031494140625, -0.13843536376953125, -0.124267578125, -0.11009979248046875, -0.0959320068359375, -0.08176422119140625, -0.067596435546875, -0.05342864990234375, -0.0392608642578125, -0.02509307861328125, -0.01092529296875, 0.00324249267578125, 0.0174102783203125, 0.03157806396484375, 0.045745849609375, 0.05991363525390625, 0.0740814208984375, 0.08824920654296875, 0.1024169921875, 0.11658477783203125, 0.1307525634765625, 0.14492034912109375, 0.159088134765625, 0.17325592041015625, 0.1874237060546875, 0.20159149169921875, 0.21575927734375, 0.22992706298828125, 0.2440948486328125, 0.25826263427734375, 0.272430419921875, 0.28659820556640625, 0.3007659912109375, 0.31493377685546875, 0.3291015625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 0.0, 0.0, 0.0, 2.0, 7.0, 7.0, 7.0, 7.0, 11.0, 12.0, 17.0, 20.0, 49.0, 89.0, 155.0, 294.0, 577.0, 1112.0, 2182.0, 4426.0, 10039.0, 26821.0, 101476.0, 1091139.0, 2688761.0, 202406.0, 40239.0, 13343.0, 5746.0, 2669.0, 1265.0, 641.0, 334.0, 183.0, 94.0, 55.0, 32.0, 17.0, 16.0, 14.0, 2.0, 8.0, 3.0, 3.0, 5.0, 3.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.359375, -0.3474693298339844, -0.33556365966796875, -0.3236579895019531, -0.3117523193359375, -0.2998466491699219, -0.28794097900390625, -0.2760353088378906, -0.264129638671875, -0.2522239685058594, -0.24031829833984375, -0.22841262817382812, -0.2165069580078125, -0.20460128784179688, -0.19269561767578125, -0.18078994750976562, -0.16888427734375, -0.15697860717773438, -0.14507293701171875, -0.13316726684570312, -0.1212615966796875, -0.10935592651367188, -0.09745025634765625, -0.08554458618164062, -0.073638916015625, -0.061733245849609375, -0.04982757568359375, -0.037921905517578125, -0.0260162353515625, -0.014110565185546875, -0.00220489501953125, 0.009700775146484375, 0.0216064453125, 0.033512115478515625, 0.04541778564453125, 0.057323455810546875, 0.0692291259765625, 0.08113479614257812, 0.09304046630859375, 0.10494613647460938, 0.116851806640625, 0.12875747680664062, 0.14066314697265625, 0.15256881713867188, 0.1644744873046875, 0.17638015747070312, 0.18828582763671875, 0.20019149780273438, 0.21209716796875, 0.22400283813476562, 0.23590850830078125, 0.24781417846679688, 0.2597198486328125, 0.2716255187988281, 0.28353118896484375, 0.2954368591308594, 0.307342529296875, 0.3192481994628906, 0.33115386962890625, 0.3430595397949219, 0.3549652099609375, 0.3668708801269531, 0.37877655029296875, 0.3906822204589844, 0.402587890625]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 3.0, 4.0, 6.0, 9.0, 14.0, 14.0, 25.0, 35.0, 38.0, 57.0, 88.0, 178.0, 330.0, 571.0, 868.0, 773.0, 421.0, 247.0, 136.0, 83.0, 51.0, 31.0, 20.0, 11.0, 6.0, 12.0, 4.0, 3.0, 4.0, 6.0, 3.0, 1.0, 7.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.51611328125, -0.5012588500976562, -0.4864044189453125, -0.47154998779296875, -0.456695556640625, -0.44184112548828125, -0.4269866943359375, -0.41213226318359375, -0.39727783203125, -0.38242340087890625, -0.3675689697265625, -0.35271453857421875, -0.337860107421875, -0.32300567626953125, -0.3081512451171875, -0.29329681396484375, -0.2784423828125, -0.26358795166015625, -0.2487335205078125, -0.23387908935546875, -0.219024658203125, -0.20417022705078125, -0.1893157958984375, -0.17446136474609375, -0.15960693359375, -0.14475250244140625, -0.1298980712890625, -0.11504364013671875, -0.100189208984375, -0.08533477783203125, -0.0704803466796875, -0.05562591552734375, -0.040771484375, -0.02591705322265625, -0.0110626220703125, 0.00379180908203125, 0.018646240234375, 0.03350067138671875, 0.0483551025390625, 0.06320953369140625, 0.07806396484375, 0.09291839599609375, 0.1077728271484375, 0.12262725830078125, 0.137481689453125, 0.15233612060546875, 0.1671905517578125, 0.18204498291015625, 0.1968994140625, 0.21175384521484375, 0.2266082763671875, 0.24146270751953125, 0.256317138671875, 0.27117156982421875, 0.2860260009765625, 0.30088043212890625, 0.31573486328125, 0.33058929443359375, 0.3454437255859375, 0.36029815673828125, 0.375152587890625, 0.39000701904296875, 0.4048614501953125, 0.41971588134765625, 0.4345703125]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 5.0, 4.0, 8.0, 20.0, 93.0, 244.0, 346.0, 191.0, 54.0, 18.0, 8.0, 3.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0992560386657715, -6.858548164367676, -6.617840766906738, -6.377132892608643, -6.136425495147705, -5.895717620849609, -5.655010223388672, -5.414302349090576, -5.1735944747924805, -4.932886600494385, -4.692179203033447, -4.451471328735352, -4.210763931274414, -3.9700560569763184, -3.7293484210968018, -3.488640785217285, -3.2479333877563477, -3.007225751876831, -2.7665181159973145, -2.5258102416992188, -2.2851028442382812, -2.0443949699401855, -1.803687334060669, -1.5629796981811523, -1.3222720623016357, -1.0815644264221191, -0.8408567309379578, -0.6001490354537964, -0.3594413995742798, -0.11873376369476318, 0.12197399139404297, 0.36268162727355957, 0.603388786315918, 0.8440964221954346, 1.0848040580749512, 1.3255118131637573, 1.566219449043274, 1.8069270849227905, 2.0476348400115967, 2.2883424758911133, 2.52905011177063, 2.7697577476501465, 3.010465383529663, 3.2511730194091797, 3.4918808937072754, 3.732588291168213, 3.9732961654663086, 4.214003562927246, 4.454711437225342, 4.6954193115234375, 4.936126708984375, 5.176834583282471, 5.417541980743408, 5.658249855041504, 5.898957252502441, 6.139665126800537, 6.380373001098633, 6.6210808753967285, 6.861788272857666, 7.102496147155762, 7.343203544616699, 7.583911418914795, 7.824619293212891, 8.065326690673828, 8.306034088134766]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 3.0, 6.0, 8.0, 11.0, 10.0, 12.0, 26.0, 19.0, 25.0, 32.0, 41.0, 56.0, 50.0, 61.0, 72.0, 70.0, 59.0, 59.0, 56.0, 52.0, 49.0, 44.0, 44.0, 20.0, 19.0, 25.0, 21.0, 15.0, 13.0, 14.0, 7.0, 4.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9894845485687256, -1.9106454849243164, -1.8318064212799072, -1.752967357635498, -1.6741282939910889, -1.5952892303466797, -1.516450047492981, -1.4376109838485718, -1.3587719202041626, -1.2799328565597534, -1.2010937929153442, -1.122254729270935, -1.0434155464172363, -0.9645765423774719, -0.885737419128418, -0.8068983554840088, -0.7280592918395996, -0.6492202281951904, -0.5703811645507812, -0.4915420413017273, -0.4127029776573181, -0.33386391401290894, -0.25502482056617737, -0.1761857271194458, -0.09734666347503662, -0.018507584929466248, 0.060331493616104126, 0.1391705721616745, 0.21800965070724487, 0.29684871435165405, 0.3756878077983856, 0.4545269012451172, 0.5333657264709473, 0.6122047901153564, 0.6910438537597656, 0.7698829770088196, 0.8487220406532288, 0.9275611042976379, 1.006400227546692, 1.085239291191101, 1.1640783548355103, 1.2429174184799194, 1.3217564821243286, 1.4005955457687378, 1.4794347286224365, 1.5582737922668457, 1.6371128559112549, 1.715951919555664, 1.7947909832000732, 1.8736300468444824, 1.9524691104888916, 2.031308174133301, 2.11014723777771, 2.188986301422119, 2.2678253650665283, 2.3466644287109375, 2.425503730773926, 2.504342794418335, 2.583181858062744, 2.6620209217071533, 2.7408599853515625, 2.8196990489959717, 2.898538112640381, 2.977377414703369, 3.056216239929199]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 4.0, 1.0, 3.0, 0.0, 3.0, 5.0, 3.0, 13.0, 12.0, 24.0, 21.0, 45.0, 67.0, 99.0, 164.0, 267.0, 403.0, 643.0, 1210.0, 2225.0, 4129.0, 8388.0, 18064.0, 40113.0, 98506.0, 237731.0, 332307.0, 175529.0, 71153.0, 29876.0, 13679.0, 6447.0, 3284.0, 1677.0, 939.0, 542.0, 346.0, 230.0, 139.0, 84.0, 61.0, 44.0, 21.0, 12.0, 15.0, 12.0, 9.0, 5.0, 6.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.30712890625, -0.2962837219238281, -0.28543853759765625, -0.2745933532714844, -0.2637481689453125, -0.2529029846191406, -0.24205780029296875, -0.23121261596679688, -0.220367431640625, -0.20952224731445312, -0.19867706298828125, -0.18783187866210938, -0.1769866943359375, -0.16614151000976562, -0.15529632568359375, -0.14445114135742188, -0.13360595703125, -0.12276077270507812, -0.11191558837890625, -0.10107040405273438, -0.0902252197265625, -0.07938003540039062, -0.06853485107421875, -0.057689666748046875, -0.046844482421875, -0.035999298095703125, -0.02515411376953125, -0.014308929443359375, -0.0034637451171875, 0.007381439208984375, 0.01822662353515625, 0.029071807861328125, 0.0399169921875, 0.050762176513671875, 0.06160736083984375, 0.07245254516601562, 0.0832977294921875, 0.09414291381835938, 0.10498809814453125, 0.11583328247070312, 0.126678466796875, 0.13752365112304688, 0.14836883544921875, 0.15921401977539062, 0.1700592041015625, 0.18090438842773438, 0.19174957275390625, 0.20259475708007812, 0.21343994140625, 0.22428512573242188, 0.23513031005859375, 0.24597549438476562, 0.2568206787109375, 0.2676658630371094, 0.27851104736328125, 0.2893562316894531, 0.300201416015625, 0.3110466003417969, 0.32189178466796875, 0.3327369689941406, 0.3435821533203125, 0.3544273376464844, 0.36527252197265625, 0.3761177062988281, 0.386962890625]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 3.0, 8.0, 7.0, 12.0, 12.0, 14.0, 19.0, 14.0, 12.0, 21.0, 26.0, 33.0, 36.0, 46.0, 26.0, 41.0, 37.0, 59.0, 49.0, 56.0, 50.0, 47.0, 46.0, 45.0, 55.0, 28.0, 37.0, 29.0, 24.0, 14.0, 24.0, 16.0, 11.0, 12.0, 2.0, 12.0, 6.0, 3.0, 1.0, 4.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21044921875, -0.20273590087890625, -0.1950225830078125, -0.18730926513671875, -0.179595947265625, -0.17188262939453125, -0.1641693115234375, -0.15645599365234375, -0.14874267578125, -0.14102935791015625, -0.1333160400390625, -0.12560272216796875, -0.117889404296875, -0.11017608642578125, -0.1024627685546875, -0.09474945068359375, -0.0870361328125, -0.07932281494140625, -0.0716094970703125, -0.06389617919921875, -0.056182861328125, -0.04846954345703125, -0.0407562255859375, -0.03304290771484375, -0.02532958984375, -0.01761627197265625, -0.0099029541015625, -0.00218963623046875, 0.005523681640625, 0.01323699951171875, 0.0209503173828125, 0.02866363525390625, 0.036376953125, 0.04409027099609375, 0.0518035888671875, 0.05951690673828125, 0.067230224609375, 0.07494354248046875, 0.0826568603515625, 0.09037017822265625, 0.09808349609375, 0.10579681396484375, 0.1135101318359375, 0.12122344970703125, 0.128936767578125, 0.13665008544921875, 0.1443634033203125, 0.15207672119140625, 0.1597900390625, 0.16750335693359375, 0.1752166748046875, 0.18292999267578125, 0.190643310546875, 0.19835662841796875, 0.2060699462890625, 0.21378326416015625, 0.22149658203125, 0.22920989990234375, 0.2369232177734375, 0.24463653564453125, 0.252349853515625, 0.26006317138671875, 0.2677764892578125, 0.27548980712890625, 0.283203125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 4.0, 1.0, 1.0, 2.0, 3.0, 8.0, 11.0, 14.0, 17.0, 28.0, 50.0, 74.0, 108.0, 179.0, 325.0, 605.0, 1352.0, 4166.0, 22296.0, 242783.0, 697854.0, 65954.0, 8560.0, 2190.0, 877.0, 454.0, 243.0, 133.0, 98.0, 48.0, 38.0, 23.0, 15.0, 14.0, 8.0, 6.0, 3.0, 8.0, 2.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.7939453125, -0.7676925659179688, -0.7414398193359375, -0.7151870727539062, -0.688934326171875, -0.6626815795898438, -0.6364288330078125, -0.6101760864257812, -0.58392333984375, -0.5576705932617188, -0.5314178466796875, -0.5051651000976562, -0.478912353515625, -0.45265960693359375, -0.4264068603515625, -0.40015411376953125, -0.3739013671875, -0.34764862060546875, -0.3213958740234375, -0.29514312744140625, -0.268890380859375, -0.24263763427734375, -0.2163848876953125, -0.19013214111328125, -0.16387939453125, -0.13762664794921875, -0.1113739013671875, -0.08512115478515625, -0.058868408203125, -0.03261566162109375, -0.0063629150390625, 0.01988983154296875, 0.046142578125, 0.07239532470703125, 0.0986480712890625, 0.12490081787109375, 0.151153564453125, 0.17740631103515625, 0.2036590576171875, 0.22991180419921875, 0.25616455078125, 0.28241729736328125, 0.3086700439453125, 0.33492279052734375, 0.361175537109375, 0.38742828369140625, 0.4136810302734375, 0.43993377685546875, 0.4661865234375, 0.49243927001953125, 0.5186920166015625, 0.5449447631835938, 0.571197509765625, 0.5974502563476562, 0.6237030029296875, 0.6499557495117188, 0.67620849609375, 0.7024612426757812, 0.7287139892578125, 0.7549667358398438, 0.781219482421875, 0.8074722290039062, 0.8337249755859375, 0.8599777221679688, 0.88623046875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 3.0, 3.0, 1.0, 4.0, 5.0, 15.0, 5.0, 17.0, 15.0, 9.0, 22.0, 24.0, 34.0, 35.0, 28.0, 40.0, 25.0, 38.0, 37.0, 49.0, 43.0, 48.0, 53.0, 47.0, 37.0, 39.0, 38.0, 42.0, 26.0, 30.0, 29.0, 31.0, 20.0, 23.0, 21.0, 13.0, 15.0, 5.0, 8.0, 8.0, 5.0, 3.0, 4.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.8837890625, -0.8575439453125, -0.831298828125, -0.8050537109375, -0.77880859375, -0.7525634765625, -0.726318359375, -0.7000732421875, -0.673828125, -0.6475830078125, -0.621337890625, -0.5950927734375, -0.56884765625, -0.5426025390625, -0.516357421875, -0.4901123046875, -0.4638671875, -0.4376220703125, -0.411376953125, -0.3851318359375, -0.35888671875, -0.3326416015625, -0.306396484375, -0.2801513671875, -0.25390625, -0.2276611328125, -0.201416015625, -0.1751708984375, -0.14892578125, -0.1226806640625, -0.096435546875, -0.0701904296875, -0.0439453125, -0.0177001953125, 0.008544921875, 0.0347900390625, 0.06103515625, 0.0872802734375, 0.113525390625, 0.1397705078125, 0.166015625, 0.1922607421875, 0.218505859375, 0.2447509765625, 0.27099609375, 0.2972412109375, 0.323486328125, 0.3497314453125, 0.3759765625, 0.4022216796875, 0.428466796875, 0.4547119140625, 0.48095703125, 0.5072021484375, 0.533447265625, 0.5596923828125, 0.5859375, 0.6121826171875, 0.638427734375, 0.6646728515625, 0.69091796875, 0.7171630859375, 0.743408203125, 0.7696533203125, 0.7958984375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 1.0, 5.0, 11.0, 7.0, 26.0, 43.0, 78.0, 195.0, 683.0, 5023.0, 782412.0, 256144.0, 3067.0, 521.0, 176.0, 61.0, 37.0, 18.0, 9.0, 4.0, 12.0, 3.0, 6.0, 4.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7978515625, -0.7682037353515625, -0.738555908203125, -0.7089080810546875, -0.67926025390625, -0.6496124267578125, -0.619964599609375, -0.5903167724609375, -0.5606689453125, -0.5310211181640625, -0.501373291015625, -0.4717254638671875, -0.44207763671875, -0.4124298095703125, -0.382781982421875, -0.3531341552734375, -0.323486328125, -0.2938385009765625, -0.264190673828125, -0.2345428466796875, -0.20489501953125, -0.1752471923828125, -0.145599365234375, -0.1159515380859375, -0.0863037109375, -0.0566558837890625, -0.027008056640625, 0.0026397705078125, 0.03228759765625, 0.0619354248046875, 0.091583251953125, 0.1212310791015625, 0.15087890625, 0.1805267333984375, 0.210174560546875, 0.2398223876953125, 0.26947021484375, 0.2991180419921875, 0.328765869140625, 0.3584136962890625, 0.3880615234375, 0.4177093505859375, 0.447357177734375, 0.4770050048828125, 0.50665283203125, 0.5363006591796875, 0.565948486328125, 0.5955963134765625, 0.625244140625, 0.6548919677734375, 0.684539794921875, 0.7141876220703125, 0.74383544921875, 0.7734832763671875, 0.803131103515625, 0.8327789306640625, 0.8624267578125, 0.8920745849609375, 0.921722412109375, 0.9513702392578125, 0.98101806640625, 1.0106658935546875, 1.040313720703125, 1.0699615478515625, 1.099609375]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 4.0, 5.0, 3.0, 2.0, 11.0, 9.0, 15.0, 15.0, 17.0, 30.0, 31.0, 44.0, 59.0, 74.0, 89.0, 95.0, 103.0, 86.0, 81.0, 53.0, 38.0, 32.0, 23.0, 18.0, 15.0, 6.0, 8.0, 12.0, 6.0, 2.0, 3.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.173683166503906e-05, -5.011633038520813e-05, -4.84958291053772e-05, -4.6875327825546265e-05, -4.525482654571533e-05, -4.36343252658844e-05, -4.201382398605347e-05, -4.0393322706222534e-05, -3.87728214263916e-05, -3.715232014656067e-05, -3.5531818866729736e-05, -3.3911317586898804e-05, -3.229081630706787e-05, -3.067031502723694e-05, -2.9049813747406006e-05, -2.7429312467575073e-05, -2.580881118774414e-05, -2.4188309907913208e-05, -2.2567808628082275e-05, -2.0947307348251343e-05, -1.932680606842041e-05, -1.7706304788589478e-05, -1.6085803508758545e-05, -1.4465302228927612e-05, -1.284480094909668e-05, -1.1224299669265747e-05, -9.603798389434814e-06, -7.983297109603882e-06, -6.362795829772949e-06, -4.742294549942017e-06, -3.121793270111084e-06, -1.5012919902801514e-06, 1.1920928955078125e-07, 1.7397105693817139e-06, 3.3602118492126465e-06, 4.980713129043579e-06, 6.601214408874512e-06, 8.221715688705444e-06, 9.842216968536377e-06, 1.146271824836731e-05, 1.3083219528198242e-05, 1.4703720808029175e-05, 1.6324222087860107e-05, 1.794472336769104e-05, 1.9565224647521973e-05, 2.1185725927352905e-05, 2.2806227207183838e-05, 2.442672848701477e-05, 2.6047229766845703e-05, 2.7667731046676636e-05, 2.928823232650757e-05, 3.09087336063385e-05, 3.2529234886169434e-05, 3.4149736166000366e-05, 3.57702374458313e-05, 3.739073872566223e-05, 3.9011240005493164e-05, 4.06317412853241e-05, 4.225224256515503e-05, 4.387274384498596e-05, 4.5493245124816895e-05, 4.711374640464783e-05, 4.873424768447876e-05, 5.035474896430969e-05, 5.1975250244140625e-05]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 1.0, 6.0, 4.0, 5.0, 7.0, 20.0, 27.0, 24.0, 43.0, 55.0, 109.0, 143.0, 233.0, 482.0, 1041.0, 2667.0, 9433.0, 64682.0, 680097.0, 256417.0, 24695.0, 4955.0, 1700.0, 775.0, 376.0, 207.0, 104.0, 83.0, 53.0, 38.0, 21.0, 13.0, 10.0, 12.0, 2.0, 4.0, 4.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.302490234375, -0.2923316955566406, -0.28217315673828125, -0.2720146179199219, -0.2618560791015625, -0.2516975402832031, -0.24153900146484375, -0.23138046264648438, -0.221221923828125, -0.21106338500976562, -0.20090484619140625, -0.19074630737304688, -0.1805877685546875, -0.17042922973632812, -0.16027069091796875, -0.15011215209960938, -0.13995361328125, -0.12979507446289062, -0.11963653564453125, -0.10947799682617188, -0.0993194580078125, -0.08916091918945312, -0.07900238037109375, -0.06884384155273438, -0.058685302734375, -0.048526763916015625, -0.03836822509765625, -0.028209686279296875, -0.0180511474609375, -0.007892608642578125, 0.00226593017578125, 0.012424468994140625, 0.0225830078125, 0.032741546630859375, 0.04290008544921875, 0.053058624267578125, 0.0632171630859375, 0.07337570190429688, 0.08353424072265625, 0.09369277954101562, 0.103851318359375, 0.11400985717773438, 0.12416839599609375, 0.13432693481445312, 0.1444854736328125, 0.15464401245117188, 0.16480255126953125, 0.17496109008789062, 0.18511962890625, 0.19527816772460938, 0.20543670654296875, 0.21559524536132812, 0.2257537841796875, 0.23591232299804688, 0.24607086181640625, 0.2562294006347656, 0.266387939453125, 0.2765464782714844, 0.28670501708984375, 0.2968635559082031, 0.3070220947265625, 0.3171806335449219, 0.32733917236328125, 0.3374977111816406, 0.34765625]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 4.0, 4.0, 7.0, 4.0, 9.0, 10.0, 23.0, 24.0, 30.0, 33.0, 54.0, 63.0, 62.0, 84.0, 78.0, 78.0, 81.0, 73.0, 53.0, 48.0, 38.0, 34.0, 28.0, 19.0, 13.0, 13.0, 8.0, 10.0, 3.0, 5.0, 0.0, 4.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0], "bins": [-0.260498046875, -0.2523765563964844, -0.24425506591796875, -0.23613357543945312, -0.2280120849609375, -0.21989059448242188, -0.21176910400390625, -0.20364761352539062, -0.195526123046875, -0.18740463256835938, -0.17928314208984375, -0.17116165161132812, -0.1630401611328125, -0.15491867065429688, -0.14679718017578125, -0.13867568969726562, -0.13055419921875, -0.12243270874023438, -0.11431121826171875, -0.10618972778320312, -0.0980682373046875, -0.08994674682617188, -0.08182525634765625, -0.07370376586914062, -0.065582275390625, -0.057460784912109375, -0.04933929443359375, -0.041217803955078125, -0.0330963134765625, -0.024974822998046875, -0.01685333251953125, -0.008731842041015625, -0.0006103515625, 0.007511138916015625, 0.01563262939453125, 0.023754119873046875, 0.0318756103515625, 0.039997100830078125, 0.04811859130859375, 0.056240081787109375, 0.064361572265625, 0.07248306274414062, 0.08060455322265625, 0.08872604370117188, 0.0968475341796875, 0.10496902465820312, 0.11309051513671875, 0.12121200561523438, 0.12933349609375, 0.13745498657226562, 0.14557647705078125, 0.15369796752929688, 0.1618194580078125, 0.16994094848632812, 0.17806243896484375, 0.18618392944335938, 0.194305419921875, 0.20242691040039062, 0.21054840087890625, 0.21866989135742188, 0.2267913818359375, 0.23491287231445312, 0.24303436279296875, 0.2511558532714844, 0.25927734375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 6.0, 1.0, 5.0, 16.0, 63.0, 263.0, 471.0, 133.0, 36.0, 10.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.664222717285156, -13.24209213256836, -12.819961547851562, -12.397830963134766, -11.975700378417969, -11.553569793701172, -11.131439208984375, -10.709308624267578, -10.287178039550781, -9.865047454833984, -9.442916870117188, -9.02078628540039, -8.598655700683594, -8.176525115966797, -7.754394054412842, -7.332263469696045, -6.91013240814209, -6.488001823425293, -6.065871238708496, -5.643740653991699, -5.221610069274902, -4.7994794845581055, -4.37734842300415, -3.9552178382873535, -3.5330872535705566, -3.1109566688537598, -2.688826084136963, -2.266695261001587, -1.84456467628479, -1.4224340915679932, -1.0003032684326172, -0.5781726837158203, -0.15604209899902344, 0.2660885453224182, 0.6882191896438599, 1.1103498935699463, 1.5324804782867432, 1.95461106300354, 2.376741886138916, 2.798872470855713, 3.2210030555725098, 3.6431336402893066, 4.0652642250061035, 4.487395286560059, 4.9095258712768555, 5.331656455993652, 5.753787040710449, 6.175917625427246, 6.598048210144043, 7.02017879486084, 7.442309379577637, 7.864439964294434, 8.28657054901123, 8.708701133728027, 9.13083267211914, 9.552963256835938, 9.975093841552734, 10.397224426269531, 10.819355010986328, 11.241485595703125, 11.663616180419922, 12.085746765136719, 12.507877349853516, 12.930007934570312, 13.35213851928711]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 5.0, 4.0, 10.0, 4.0, 6.0, 8.0, 5.0, 14.0, 12.0, 19.0, 22.0, 18.0, 36.0, 30.0, 34.0, 24.0, 26.0, 39.0, 41.0, 47.0, 52.0, 69.0, 63.0, 61.0, 42.0, 44.0, 27.0, 42.0, 23.0, 32.0, 31.0, 26.0, 16.0, 14.0, 13.0, 4.0, 8.0, 9.0, 13.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.147916793823242, -3.034193754196167, -2.920470714569092, -2.8067476749420166, -2.6930246353149414, -2.579301595687866, -2.465578556060791, -2.3518552780151367, -2.2381324768066406, -2.1244094371795654, -2.0106863975524902, -1.896963357925415, -1.7832403182983398, -1.6695172786712646, -1.5557941198349, -1.4420710802078247, -1.32834792137146, -1.2146248817443848, -1.1009018421173096, -0.9871787428855896, -0.8734557032585144, -0.7597326636314392, -0.6460095643997192, -0.532286524772644, -0.41856348514556885, -0.30484044551849365, -0.19111737608909607, -0.07739430665969849, 0.03632873296737671, 0.1500517725944519, 0.2637748718261719, 0.37749791145324707, 0.49122095108032227, 0.6049439907073975, 0.7186670303344727, 0.8323901295661926, 0.9461131691932678, 1.0598361492156982, 1.173559308052063, 1.2872823476791382, 1.4010053873062134, 1.5147284269332886, 1.6284514665603638, 1.7421746253967285, 1.8558976650238037, 1.969620704650879, 2.083343744277954, 2.1970667839050293, 2.3107898235321045, 2.4245128631591797, 2.538235902786255, 2.65195894241333, 2.7656819820404053, 2.8794050216674805, 2.9931282997131348, 3.106851100921631, 3.220574378967285, 3.3342974185943604, 3.4480204582214355, 3.5617434978485107, 3.675466537475586, 3.789189577102661, 3.9029126167297363, 4.016635894775391, 4.130358695983887]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 4.0, 6.0, 13.0, 8.0, 12.0, 23.0, 29.0, 30.0, 37.0, 66.0, 97.0, 184.0, 356.0, 845.0, 2396.0, 8530.0, 43403.0, 632133.0, 3253616.0, 219506.0, 24360.0, 5630.0, 1741.0, 612.0, 302.0, 146.0, 78.0, 44.0, 21.0, 17.0, 16.0, 10.0, 5.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.466796875, -0.45032501220703125, -0.4338531494140625, -0.41738128662109375, -0.400909423828125, -0.38443756103515625, -0.3679656982421875, -0.35149383544921875, -0.33502197265625, -0.31855010986328125, -0.3020782470703125, -0.28560638427734375, -0.269134521484375, -0.25266265869140625, -0.2361907958984375, -0.21971893310546875, -0.2032470703125, -0.18677520751953125, -0.1703033447265625, -0.15383148193359375, -0.137359619140625, -0.12088775634765625, -0.1044158935546875, -0.08794403076171875, -0.07147216796875, -0.05500030517578125, -0.0385284423828125, -0.02205657958984375, -0.005584716796875, 0.01088714599609375, 0.0273590087890625, 0.04383087158203125, 0.060302734375, 0.07677459716796875, 0.0932464599609375, 0.10971832275390625, 0.126190185546875, 0.14266204833984375, 0.1591339111328125, 0.17560577392578125, 0.19207763671875, 0.20854949951171875, 0.2250213623046875, 0.24149322509765625, 0.257965087890625, 0.27443695068359375, 0.2909088134765625, 0.30738067626953125, 0.3238525390625, 0.34032440185546875, 0.3567962646484375, 0.37326812744140625, 0.389739990234375, 0.40621185302734375, 0.4226837158203125, 0.43915557861328125, 0.45562744140625, 0.47209930419921875, 0.4885711669921875, 0.5050430297851562, 0.521514892578125, 0.5379867553710938, 0.5544586181640625, 0.5709304809570312, 0.58740234375]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 7.0, 9.0, 9.0, 14.0, 12.0, 16.0, 22.0, 18.0, 41.0, 37.0, 38.0, 41.0, 51.0, 55.0, 60.0, 50.0, 64.0, 47.0, 43.0, 49.0, 61.0, 51.0, 34.0, 38.0, 24.0, 24.0, 19.0, 12.0, 13.0, 18.0, 8.0, 7.0, 4.0, 4.0, 3.0, 1.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2030029296875, -0.1946887969970703, -0.18637466430664062, -0.17806053161621094, -0.16974639892578125, -0.16143226623535156, -0.15311813354492188, -0.1448040008544922, -0.1364898681640625, -0.1281757354736328, -0.11986160278320312, -0.11154747009277344, -0.10323333740234375, -0.09491920471191406, -0.08660507202148438, -0.07829093933105469, -0.069976806640625, -0.06166267395019531, -0.053348541259765625, -0.04503440856933594, -0.03672027587890625, -0.028406143188476562, -0.020092010498046875, -0.011777877807617188, -0.0034637451171875, 0.0048503875732421875, 0.013164520263671875, 0.021478652954101562, 0.02979278564453125, 0.03810691833496094, 0.046421051025390625, 0.05473518371582031, 0.06304931640625, 0.07136344909667969, 0.07967758178710938, 0.08799171447753906, 0.09630584716796875, 0.10461997985839844, 0.11293411254882812, 0.12124824523925781, 0.1295623779296875, 0.1378765106201172, 0.14619064331054688, 0.15450477600097656, 0.16281890869140625, 0.17113304138183594, 0.17944717407226562, 0.1877613067626953, 0.196075439453125, 0.2043895721435547, 0.21270370483398438, 0.22101783752441406, 0.22933197021484375, 0.23764610290527344, 0.24596023559570312, 0.2542743682861328, 0.2625885009765625, 0.2709026336669922, 0.2792167663574219, 0.28753089904785156, 0.29584503173828125, 0.30415916442871094, 0.3124732971191406, 0.3207874298095703, 0.3291015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 5.0, 8.0, 5.0, 4.0, 11.0, 14.0, 31.0, 52.0, 59.0, 107.0, 203.0, 469.0, 1018.0, 3078.0, 11516.0, 61332.0, 1050182.0, 2941594.0, 102356.0, 15921.0, 3964.0, 1345.0, 511.0, 218.0, 112.0, 69.0, 35.0, 17.0, 15.0, 9.0, 8.0, 5.0, 3.0, 4.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6044921875, -0.5856857299804688, -0.5668792724609375, -0.5480728149414062, -0.529266357421875, -0.5104598999023438, -0.4916534423828125, -0.47284698486328125, -0.45404052734375, -0.43523406982421875, -0.4164276123046875, -0.39762115478515625, -0.378814697265625, -0.36000823974609375, -0.3412017822265625, -0.32239532470703125, -0.3035888671875, -0.28478240966796875, -0.2659759521484375, -0.24716949462890625, -0.228363037109375, -0.20955657958984375, -0.1907501220703125, -0.17194366455078125, -0.15313720703125, -0.13433074951171875, -0.1155242919921875, -0.09671783447265625, -0.077911376953125, -0.05910491943359375, -0.0402984619140625, -0.02149200439453125, -0.002685546875, 0.01612091064453125, 0.0349273681640625, 0.05373382568359375, 0.072540283203125, 0.09134674072265625, 0.1101531982421875, 0.12895965576171875, 0.14776611328125, 0.16657257080078125, 0.1853790283203125, 0.20418548583984375, 0.222991943359375, 0.24179840087890625, 0.2606048583984375, 0.27941131591796875, 0.2982177734375, 0.31702423095703125, 0.3358306884765625, 0.35463714599609375, 0.373443603515625, 0.39225006103515625, 0.4110565185546875, 0.42986297607421875, 0.44866943359375, 0.46747589111328125, 0.4862823486328125, 0.5050888061523438, 0.523895263671875, 0.5427017211914062, 0.5615081787109375, 0.5803146362304688, 0.59912109375]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 4.0, 2.0, 8.0, 7.0, 13.0, 11.0, 21.0, 21.0, 21.0, 37.0, 51.0, 72.0, 96.0, 166.0, 305.0, 548.0, 887.0, 703.0, 437.0, 248.0, 143.0, 98.0, 58.0, 33.0, 21.0, 9.0, 8.0, 14.0, 4.0, 10.0, 1.0, 6.0, 1.0, 1.0, 3.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.52734375, -0.5102310180664062, -0.4931182861328125, -0.47600555419921875, -0.458892822265625, -0.44178009033203125, -0.4246673583984375, -0.40755462646484375, -0.39044189453125, -0.37332916259765625, -0.3562164306640625, -0.33910369873046875, -0.321990966796875, -0.30487823486328125, -0.2877655029296875, -0.27065277099609375, -0.2535400390625, -0.23642730712890625, -0.2193145751953125, -0.20220184326171875, -0.185089111328125, -0.16797637939453125, -0.1508636474609375, -0.13375091552734375, -0.11663818359375, -0.09952545166015625, -0.0824127197265625, -0.06529998779296875, -0.048187255859375, -0.03107452392578125, -0.0139617919921875, 0.00315093994140625, 0.020263671875, 0.03737640380859375, 0.0544891357421875, 0.07160186767578125, 0.088714599609375, 0.10582733154296875, 0.1229400634765625, 0.14005279541015625, 0.15716552734375, 0.17427825927734375, 0.1913909912109375, 0.20850372314453125, 0.225616455078125, 0.24272918701171875, 0.2598419189453125, 0.27695465087890625, 0.2940673828125, 0.31118011474609375, 0.3282928466796875, 0.34540557861328125, 0.362518310546875, 0.37963104248046875, 0.3967437744140625, 0.41385650634765625, 0.43096923828125, 0.44808197021484375, 0.4651947021484375, 0.48230743408203125, 0.499420166015625, 0.5165328979492188, 0.5336456298828125, 0.5507583618164062, 0.56787109375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 3.0, 4.0, 6.0, 19.0, 55.0, 96.0, 203.0, 242.0, 180.0, 104.0, 43.0, 18.0, 7.0, 6.0, 6.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.125303268432617, -4.931992053985596, -4.738680839538574, -4.545370101928711, -4.3520588874816895, -4.158747673034668, -3.9654364585876465, -3.772125244140625, -3.5788142681121826, -3.385503053665161, -3.1921920776367188, -2.9988808631896973, -2.805569648742676, -2.6122586727142334, -2.418947458267212, -2.2256364822387695, -2.032325267791748, -1.8390141725540161, -1.6457030773162842, -1.4523918628692627, -1.2590807676315308, -1.0657696723937988, -0.8724584579467773, -0.6791473627090454, -0.4858362674713135, -0.29252514243125916, -0.09921401739120483, 0.09409713745117188, 0.2874082326889038, 0.48071932792663574, 0.6740305423736572, 0.8673416376113892, 1.0606532096862793, 1.2539643049240112, 1.4472754001617432, 1.6405866146087646, 1.8338977098464966, 2.0272088050842285, 2.22052001953125, 2.4138312339782715, 2.607142210006714, 2.8004534244537354, 2.9937644004821777, 3.187075614929199, 3.3803868293762207, 3.573697805404663, 3.7670090198516846, 3.960319995880127, 4.153631210327148, 4.34694242477417, 4.540253639221191, 4.733564376831055, 4.926875591278076, 5.120186805725098, 5.313498020172119, 5.506809234619141, 5.700119972229004, 5.893431186676025, 6.086742401123047, 6.28005313873291, 6.473364353179932, 6.666675567626953, 6.859986782073975, 7.053297996520996, 7.246609210968018]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 8.0, 6.0, 8.0, 10.0, 21.0, 12.0, 17.0, 18.0, 18.0, 23.0, 30.0, 40.0, 41.0, 35.0, 39.0, 53.0, 56.0, 49.0, 53.0, 61.0, 46.0, 34.0, 55.0, 41.0, 38.0, 22.0, 29.0, 33.0, 18.0, 19.0, 19.0, 10.0, 12.0, 7.0, 6.0, 4.0, 4.0, 8.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4401419162750244, -2.3595619201660156, -2.278981924057007, -2.198401927947998, -2.1178219318389893, -2.0372419357299805, -1.9566619396209717, -1.876081943511963, -1.795501947402954, -1.7149219512939453, -1.6343419551849365, -1.5537619590759277, -1.473181962966919, -1.3926019668579102, -1.3120219707489014, -1.2314419746398926, -1.1508619785308838, -1.070281982421875, -0.9897019863128662, -0.9091219902038574, -0.8285419940948486, -0.7479619979858398, -0.667382001876831, -0.5868020057678223, -0.5062220096588135, -0.4256420135498047, -0.3450620174407959, -0.2644820213317871, -0.18390202522277832, -0.10332202911376953, -0.022742033004760742, 0.05783796310424805, 0.13841819763183594, 0.21899819374084473, 0.2995781898498535, 0.3801581859588623, 0.4607381820678711, 0.5413181781768799, 0.6218981742858887, 0.7024781703948975, 0.7830581665039062, 0.863638162612915, 0.9442181587219238, 1.0247981548309326, 1.1053781509399414, 1.1859581470489502, 1.266538143157959, 1.3471181392669678, 1.4276981353759766, 1.5082781314849854, 1.5888581275939941, 1.669438123703003, 1.7500181198120117, 1.8305981159210205, 1.9111781120300293, 1.991758108139038, 2.072338104248047, 2.1529181003570557, 2.2334980964660645, 2.3140780925750732, 2.394658088684082, 2.475238084793091, 2.5558180809020996, 2.6363980770111084, 2.716978073120117]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 3.0, 1.0, 6.0, 10.0, 14.0, 20.0, 20.0, 32.0, 59.0, 101.0, 184.0, 389.0, 883.0, 2130.0, 5507.0, 15193.0, 46087.0, 140214.0, 337351.0, 313904.0, 123770.0, 40666.0, 13643.0, 4886.0, 1906.0, 796.0, 359.0, 197.0, 103.0, 45.0, 30.0, 18.0, 12.0, 10.0, 6.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.37548828125, -0.3625144958496094, -0.34954071044921875, -0.3365669250488281, -0.3235931396484375, -0.3106193542480469, -0.29764556884765625, -0.2846717834472656, -0.271697998046875, -0.2587242126464844, -0.24575042724609375, -0.23277664184570312, -0.2198028564453125, -0.20682907104492188, -0.19385528564453125, -0.18088150024414062, -0.16790771484375, -0.15493392944335938, -0.14196014404296875, -0.12898635864257812, -0.1160125732421875, -0.10303878784179688, -0.09006500244140625, -0.07709121704101562, -0.064117431640625, -0.051143646240234375, -0.03816986083984375, -0.025196075439453125, -0.0122222900390625, 0.000751495361328125, 0.01372528076171875, 0.026699066162109375, 0.0396728515625, 0.052646636962890625, 0.06562042236328125, 0.07859420776367188, 0.0915679931640625, 0.10454177856445312, 0.11751556396484375, 0.13048934936523438, 0.143463134765625, 0.15643692016601562, 0.16941070556640625, 0.18238449096679688, 0.1953582763671875, 0.20833206176757812, 0.22130584716796875, 0.23427963256835938, 0.24725341796875, 0.2602272033691406, 0.27320098876953125, 0.2861747741699219, 0.2991485595703125, 0.3121223449707031, 0.32509613037109375, 0.3380699157714844, 0.351043701171875, 0.3640174865722656, 0.37699127197265625, 0.3899650573730469, 0.4029388427734375, 0.4159126281738281, 0.42888641357421875, 0.4418601989746094, 0.454833984375]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 5.0, 7.0, 3.0, 11.0, 11.0, 11.0, 14.0, 18.0, 16.0, 20.0, 24.0, 34.0, 24.0, 26.0, 29.0, 38.0, 33.0, 35.0, 36.0, 37.0, 38.0, 42.0, 34.0, 31.0, 34.0, 47.0, 40.0, 45.0, 30.0, 31.0, 32.0, 19.0, 25.0, 17.0, 15.0, 16.0, 10.0, 11.0, 6.0, 9.0, 8.0, 7.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 0.0, 1.0, 2.0], "bins": [-0.1722412109375, -0.16643142700195312, -0.16062164306640625, -0.15481185913085938, -0.1490020751953125, -0.14319229125976562, -0.13738250732421875, -0.13157272338867188, -0.125762939453125, -0.11995315551757812, -0.11414337158203125, -0.10833358764648438, -0.1025238037109375, -0.09671401977539062, -0.09090423583984375, -0.08509445190429688, -0.07928466796875, -0.07347488403320312, -0.06766510009765625, -0.061855316162109375, -0.0560455322265625, -0.050235748291015625, -0.04442596435546875, -0.038616180419921875, -0.032806396484375, -0.026996612548828125, -0.02118682861328125, -0.015377044677734375, -0.0095672607421875, -0.003757476806640625, 0.00205230712890625, 0.007862091064453125, 0.013671875, 0.019481658935546875, 0.02529144287109375, 0.031101226806640625, 0.0369110107421875, 0.042720794677734375, 0.04853057861328125, 0.054340362548828125, 0.060150146484375, 0.06595993041992188, 0.07176971435546875, 0.07757949829101562, 0.0833892822265625, 0.08919906616210938, 0.09500885009765625, 0.10081863403320312, 0.10662841796875, 0.11243820190429688, 0.11824798583984375, 0.12405776977539062, 0.1298675537109375, 0.13567733764648438, 0.14148712158203125, 0.14729690551757812, 0.153106689453125, 0.15891647338867188, 0.16472625732421875, 0.17053604125976562, 0.1763458251953125, 0.18215560913085938, 0.18796539306640625, 0.19377517700195312, 0.1995849609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 5.0, 1.0, 4.0, 1.0, 4.0, 5.0, 10.0, 11.0, 25.0, 17.0, 26.0, 38.0, 50.0, 76.0, 110.0, 135.0, 196.0, 278.0, 353.0, 538.0, 937.0, 1551.0, 3375.0, 10952.0, 65494.0, 597866.0, 313105.0, 39299.0, 7604.0, 2635.0, 1360.0, 754.0, 498.0, 352.0, 266.0, 149.0, 135.0, 80.0, 65.0, 53.0, 37.0, 27.0, 28.0, 16.0, 16.0, 10.0, 5.0, 6.0, 2.0, 3.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.6201171875, -0.5993576049804688, -0.5785980224609375, -0.5578384399414062, -0.537078857421875, -0.5163192749023438, -0.4955596923828125, -0.47480010986328125, -0.45404052734375, -0.43328094482421875, -0.4125213623046875, -0.39176177978515625, -0.371002197265625, -0.35024261474609375, -0.3294830322265625, -0.30872344970703125, -0.2879638671875, -0.26720428466796875, -0.2464447021484375, -0.22568511962890625, -0.204925537109375, -0.18416595458984375, -0.1634063720703125, -0.14264678955078125, -0.12188720703125, -0.10112762451171875, -0.0803680419921875, -0.05960845947265625, -0.038848876953125, -0.01808929443359375, 0.0026702880859375, 0.02342987060546875, 0.044189453125, 0.06494903564453125, 0.0857086181640625, 0.10646820068359375, 0.127227783203125, 0.14798736572265625, 0.1687469482421875, 0.18950653076171875, 0.21026611328125, 0.23102569580078125, 0.2517852783203125, 0.27254486083984375, 0.293304443359375, 0.31406402587890625, 0.3348236083984375, 0.35558319091796875, 0.3763427734375, 0.39710235595703125, 0.4178619384765625, 0.43862152099609375, 0.459381103515625, 0.48014068603515625, 0.5009002685546875, 0.5216598510742188, 0.54241943359375, 0.5631790161132812, 0.5839385986328125, 0.6046981811523438, 0.625457763671875, 0.6462173461914062, 0.6669769287109375, 0.6877365112304688, 0.70849609375]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 5.0, 0.0, 5.0, 3.0, 8.0, 5.0, 11.0, 11.0, 22.0, 17.0, 13.0, 28.0, 33.0, 35.0, 42.0, 55.0, 46.0, 46.0, 47.0, 70.0, 52.0, 59.0, 51.0, 53.0, 42.0, 34.0, 32.0, 28.0, 35.0, 15.0, 14.0, 22.0, 17.0, 10.0, 9.0, 10.0, 2.0, 7.0, 8.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9775390625, -0.946197509765625, -0.91485595703125, -0.883514404296875, -0.8521728515625, -0.820831298828125, -0.78948974609375, -0.758148193359375, -0.726806640625, -0.695465087890625, -0.66412353515625, -0.632781982421875, -0.6014404296875, -0.570098876953125, -0.53875732421875, -0.507415771484375, -0.47607421875, -0.444732666015625, -0.41339111328125, -0.382049560546875, -0.3507080078125, -0.319366455078125, -0.28802490234375, -0.256683349609375, -0.225341796875, -0.194000244140625, -0.16265869140625, -0.131317138671875, -0.0999755859375, -0.068634033203125, -0.03729248046875, -0.005950927734375, 0.025390625, 0.056732177734375, 0.08807373046875, 0.119415283203125, 0.1507568359375, 0.182098388671875, 0.21343994140625, 0.244781494140625, 0.276123046875, 0.307464599609375, 0.33880615234375, 0.370147705078125, 0.4014892578125, 0.432830810546875, 0.46417236328125, 0.495513916015625, 0.52685546875, 0.558197021484375, 0.58953857421875, 0.620880126953125, 0.6522216796875, 0.683563232421875, 0.71490478515625, 0.746246337890625, 0.777587890625, 0.808929443359375, 0.84027099609375, 0.871612548828125, 0.9029541015625, 0.934295654296875, 0.96563720703125, 0.996978759765625, 1.0283203125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 9.0, 16.0, 16.0, 19.0, 24.0, 34.0, 73.0, 99.0, 144.0, 351.0, 779.0, 1757.0, 4735.0, 18656.0, 130279.0, 744426.0, 121514.0, 17895.0, 4522.0, 1628.0, 687.0, 366.0, 196.0, 112.0, 66.0, 48.0, 28.0, 32.0, 9.0, 8.0, 7.0, 8.0, 3.0, 2.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.241455078125, -0.23266983032226562, -0.22388458251953125, -0.21509933471679688, -0.2063140869140625, -0.19752883911132812, -0.18874359130859375, -0.17995834350585938, -0.171173095703125, -0.16238784790039062, -0.15360260009765625, -0.14481735229492188, -0.1360321044921875, -0.12724685668945312, -0.11846160888671875, -0.10967636108398438, -0.10089111328125, -0.09210586547851562, -0.08332061767578125, -0.07453536987304688, -0.0657501220703125, -0.056964874267578125, -0.04817962646484375, -0.039394378662109375, -0.030609130859375, -0.021823883056640625, -0.01303863525390625, -0.004253387451171875, 0.0045318603515625, 0.013317108154296875, 0.02210235595703125, 0.030887603759765625, 0.0396728515625, 0.048458099365234375, 0.05724334716796875, 0.06602859497070312, 0.0748138427734375, 0.08359909057617188, 0.09238433837890625, 0.10116958618164062, 0.109954833984375, 0.11874008178710938, 0.12752532958984375, 0.13631057739257812, 0.1450958251953125, 0.15388107299804688, 0.16266632080078125, 0.17145156860351562, 0.18023681640625, 0.18902206420898438, 0.19780731201171875, 0.20659255981445312, 0.2153778076171875, 0.22416305541992188, 0.23294830322265625, 0.24173355102539062, 0.250518798828125, 0.2593040466308594, 0.26808929443359375, 0.2768745422363281, 0.2856597900390625, 0.2944450378417969, 0.30323028564453125, 0.3120155334472656, 0.32080078125]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 3.0, 4.0, 3.0, 7.0, 9.0, 6.0, 9.0, 15.0, 13.0, 22.0, 20.0, 22.0, 22.0, 40.0, 51.0, 49.0, 72.0, 73.0, 93.0, 71.0, 93.0, 44.0, 57.0, 41.0, 35.0, 19.0, 24.0, 25.0, 18.0, 10.0, 11.0, 10.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0590763092041016e-05, -3.8798898458480835e-05, -3.7007033824920654e-05, -3.5215169191360474e-05, -3.342330455780029e-05, -3.163143992424011e-05, -2.983957529067993e-05, -2.804771065711975e-05, -2.625584602355957e-05, -2.446398138999939e-05, -2.267211675643921e-05, -2.088025212287903e-05, -1.9088387489318848e-05, -1.7296522855758667e-05, -1.5504658222198486e-05, -1.3712793588638306e-05, -1.1920928955078125e-05, -1.0129064321517944e-05, -8.337199687957764e-06, -6.545335054397583e-06, -4.753470420837402e-06, -2.9616057872772217e-06, -1.169741153717041e-06, 6.221234798431396e-07, 2.4139881134033203e-06, 4.205852746963501e-06, 5.997717380523682e-06, 7.789582014083862e-06, 9.581446647644043e-06, 1.1373311281204224e-05, 1.3165175914764404e-05, 1.4957040548324585e-05, 1.6748905181884766e-05, 1.8540769815444946e-05, 2.0332634449005127e-05, 2.2124499082565308e-05, 2.3916363716125488e-05, 2.570822834968567e-05, 2.750009298324585e-05, 2.929195761680603e-05, 3.108382225036621e-05, 3.287568688392639e-05, 3.466755151748657e-05, 3.645941615104675e-05, 3.8251280784606934e-05, 4.0043145418167114e-05, 4.1835010051727295e-05, 4.3626874685287476e-05, 4.5418739318847656e-05, 4.721060395240784e-05, 4.900246858596802e-05, 5.07943332195282e-05, 5.258619785308838e-05, 5.437806248664856e-05, 5.616992712020874e-05, 5.796179175376892e-05, 5.97536563873291e-05, 6.154552102088928e-05, 6.333738565444946e-05, 6.512925028800964e-05, 6.692111492156982e-05, 6.871297955513e-05, 7.050484418869019e-05, 7.229670882225037e-05, 7.408857345581055e-05]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 4.0, 7.0, 6.0, 10.0, 9.0, 15.0, 25.0, 34.0, 56.0, 76.0, 143.0, 252.0, 482.0, 976.0, 2588.0, 7998.0, 39956.0, 432982.0, 508736.0, 41108.0, 8260.0, 2526.0, 1089.0, 505.0, 274.0, 170.0, 79.0, 57.0, 46.0, 22.0, 21.0, 15.0, 6.0, 5.0, 7.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0], "bins": [-0.3623046875, -0.35324859619140625, -0.3441925048828125, -0.33513641357421875, -0.326080322265625, -0.31702423095703125, -0.3079681396484375, -0.29891204833984375, -0.28985595703125, -0.28079986572265625, -0.2717437744140625, -0.26268768310546875, -0.253631591796875, -0.24457550048828125, -0.2355194091796875, -0.22646331787109375, -0.2174072265625, -0.20835113525390625, -0.1992950439453125, -0.19023895263671875, -0.181182861328125, -0.17212677001953125, -0.1630706787109375, -0.15401458740234375, -0.14495849609375, -0.13590240478515625, -0.1268463134765625, -0.11779022216796875, -0.108734130859375, -0.09967803955078125, -0.0906219482421875, -0.08156585693359375, -0.072509765625, -0.06345367431640625, -0.0543975830078125, -0.04534149169921875, -0.036285400390625, -0.02722930908203125, -0.0181732177734375, -0.00911712646484375, -6.103515625e-05, 0.00899505615234375, 0.0180511474609375, 0.02710723876953125, 0.036163330078125, 0.04521942138671875, 0.0542755126953125, 0.06333160400390625, 0.0723876953125, 0.08144378662109375, 0.0904998779296875, 0.09955596923828125, 0.108612060546875, 0.11766815185546875, 0.1267242431640625, 0.13578033447265625, 0.14483642578125, 0.15389251708984375, 0.1629486083984375, 0.17200469970703125, 0.181060791015625, 0.19011688232421875, 0.1991729736328125, 0.20822906494140625, 0.21728515625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 4.0, 6.0, 8.0, 2.0, 6.0, 11.0, 16.0, 17.0, 27.0, 47.0, 47.0, 60.0, 85.0, 89.0, 72.0, 92.0, 76.0, 84.0, 61.0, 43.0, 44.0, 25.0, 23.0, 18.0, 10.0, 6.0, 8.0, 3.0, 8.0, 3.0, 2.0, 3.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.280517578125, -0.2722644805908203, -0.2640113830566406, -0.25575828552246094, -0.24750518798828125, -0.23925209045410156, -0.23099899291992188, -0.2227458953857422, -0.2144927978515625, -0.2062397003173828, -0.19798660278320312, -0.18973350524902344, -0.18148040771484375, -0.17322731018066406, -0.16497421264648438, -0.1567211151123047, -0.148468017578125, -0.1402149200439453, -0.13196182250976562, -0.12370872497558594, -0.11545562744140625, -0.10720252990722656, -0.09894943237304688, -0.09069633483886719, -0.0824432373046875, -0.07419013977050781, -0.06593704223632812, -0.05768394470214844, -0.04943084716796875, -0.04117774963378906, -0.032924652099609375, -0.024671554565429688, -0.01641845703125, -0.008165359497070312, 8.7738037109375e-05, 0.008340835571289062, 0.01659393310546875, 0.024847030639648438, 0.033100128173828125, 0.04135322570800781, 0.0496063232421875, 0.05785942077636719, 0.06611251831054688, 0.07436561584472656, 0.08261871337890625, 0.09087181091308594, 0.09912490844726562, 0.10737800598144531, 0.115631103515625, 0.12388420104980469, 0.13213729858398438, 0.14039039611816406, 0.14864349365234375, 0.15689659118652344, 0.16514968872070312, 0.1734027862548828, 0.1816558837890625, 0.1899089813232422, 0.19816207885742188, 0.20641517639160156, 0.21466827392578125, 0.22292137145996094, 0.23117446899414062, 0.2394275665283203, 0.2476806640625]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 5.0, 5.0, 16.0, 39.0, 126.0, 251.0, 306.0, 147.0, 67.0, 17.0, 9.0, 3.0, 4.0, 4.0, 3.0, 0.0, 0.0, 4.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.301182508468628, -3.048675775527954, -2.7961692810058594, -2.5436625480651855, -2.2911558151245117, -2.038649320602417, -1.7861425876617432, -1.5336359739303589, -1.2811293601989746, -1.0286227464675903, -0.7761160731315613, -0.5236093997955322, -0.27110278606414795, -0.018596172332763672, 0.23391056060791016, 0.48641717433929443, 0.7389237880706787, 0.991430401802063, 1.2439370155334473, 1.496443748474121, 1.7489503622055054, 2.0014569759368896, 2.2539637088775635, 2.506470203399658, 2.758976936340332, 3.011483669281006, 3.2639901638031006, 3.5164968967437744, 3.769003391265869, 4.021510124206543, 4.274016857147217, 4.526523590087891, 4.779029846191406, 5.03153657913208, 5.284043312072754, 5.5365495681762695, 5.789056301116943, 6.041563034057617, 6.294069766998291, 6.546576499938965, 6.7990827560424805, 7.051589488983154, 7.304096221923828, 7.556602478027344, 7.809109210968018, 8.061615943908691, 8.314123153686523, 8.566629409790039, 8.819135665893555, 9.07164192199707, 9.324149131774902, 9.576655387878418, 9.82916259765625, 10.081668853759766, 10.334175109863281, 10.586682319641113, 10.839189529418945, 11.091695785522461, 11.344202995300293, 11.596709251403809, 11.84921646118164, 12.101722717285156, 12.354228973388672, 12.606736183166504, 12.85924243927002]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 6.0, 6.0, 2.0, 5.0, 6.0, 6.0, 10.0, 9.0, 14.0, 16.0, 20.0, 26.0, 24.0, 22.0, 36.0, 44.0, 41.0, 48.0, 58.0, 64.0, 74.0, 75.0, 50.0, 42.0, 42.0, 37.0, 32.0, 31.0, 21.0, 18.0, 26.0, 16.0, 9.0, 20.0, 13.0, 11.0, 6.0, 4.0, 11.0, 6.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.084724187850952, -2.972348213195801, -2.8599720001220703, -2.747596025466919, -2.6352200508117676, -2.522843837738037, -2.4104678630828857, -2.2980918884277344, -2.185715675354004, -2.0733397006988525, -1.9609636068344116, -1.8485875129699707, -1.7362115383148193, -1.6238354444503784, -1.5114593505859375, -1.3990833759307861, -1.2867074012756348, -1.1743313074111938, -1.0619553327560425, -0.9495792388916016, -0.8372032046318054, -0.7248271703720093, -0.6124510765075684, -0.5000750422477722, -0.3876990079879761, -0.27532297372817993, -0.1629469096660614, -0.05057084560394287, 0.06180518865585327, 0.17418122291564941, 0.28655731678009033, 0.3989333510398865, 0.5113091468811035, 0.6236851811408997, 0.7360612154006958, 0.8484373092651367, 0.9608133435249329, 1.073189377784729, 1.18556547164917, 1.2979414463043213, 1.4103175401687622, 1.5226936340332031, 1.6350696086883545, 1.7474457025527954, 1.8598217964172363, 1.9721977710723877, 2.084573745727539, 2.1969499588012695, 2.309325933456421, 2.4217019081115723, 2.5340781211853027, 2.646454095840454, 2.7588300704956055, 2.871206283569336, 2.9835822582244873, 3.0959582328796387, 3.208334445953369, 3.3207104206085205, 3.433086633682251, 3.5454626083374023, 3.6578385829925537, 3.770214557647705, 3.8825907707214355, 3.994966745376587, 4.107342720031738]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 4.0, 7.0, 4.0, 11.0, 9.0, 17.0, 18.0, 30.0, 64.0, 80.0, 162.0, 254.0, 550.0, 1175.0, 3708.0, 17150.0, 160605.0, 3144881.0, 813492.0, 41263.0, 7246.0, 2072.0, 737.0, 346.0, 172.0, 101.0, 51.0, 27.0, 16.0, 12.0, 10.0, 6.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.515625, -0.49884796142578125, -0.4820709228515625, -0.46529388427734375, -0.448516845703125, -0.43173980712890625, -0.4149627685546875, -0.39818572998046875, -0.38140869140625, -0.36463165283203125, -0.3478546142578125, -0.33107757568359375, -0.314300537109375, -0.29752349853515625, -0.2807464599609375, -0.26396942138671875, -0.2471923828125, -0.23041534423828125, -0.2136383056640625, -0.19686126708984375, -0.180084228515625, -0.16330718994140625, -0.1465301513671875, -0.12975311279296875, -0.11297607421875, -0.09619903564453125, -0.0794219970703125, -0.06264495849609375, -0.045867919921875, -0.02909088134765625, -0.0123138427734375, 0.00446319580078125, 0.021240234375, 0.03801727294921875, 0.0547943115234375, 0.07157135009765625, 0.088348388671875, 0.10512542724609375, 0.1219024658203125, 0.13867950439453125, 0.15545654296875, 0.17223358154296875, 0.1890106201171875, 0.20578765869140625, 0.222564697265625, 0.23934173583984375, 0.2561187744140625, 0.27289581298828125, 0.2896728515625, 0.30644989013671875, 0.3232269287109375, 0.34000396728515625, 0.356781005859375, 0.37355804443359375, 0.3903350830078125, 0.40711212158203125, 0.42388916015625, 0.44066619873046875, 0.4574432373046875, 0.47422027587890625, 0.490997314453125, 0.5077743530273438, 0.5245513916015625, 0.5413284301757812, 0.55810546875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 6.0, 5.0, 7.0, 5.0, 7.0, 10.0, 13.0, 29.0, 29.0, 33.0, 59.0, 51.0, 63.0, 51.0, 62.0, 72.0, 50.0, 56.0, 60.0, 69.0, 65.0, 60.0, 29.0, 31.0, 23.0, 22.0, 9.0, 14.0, 4.0, 5.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1861572265625, -0.17647743225097656, -0.16679763793945312, -0.1571178436279297, -0.14743804931640625, -0.1377582550048828, -0.12807846069335938, -0.11839866638183594, -0.1087188720703125, -0.09903907775878906, -0.08935928344726562, -0.07967948913574219, -0.06999969482421875, -0.06031990051269531, -0.050640106201171875, -0.04096031188964844, -0.031280517578125, -0.021600723266601562, -0.011920928955078125, -0.0022411346435546875, 0.00743865966796875, 0.017118453979492188, 0.026798248291015625, 0.03647804260253906, 0.0461578369140625, 0.05583763122558594, 0.06551742553710938, 0.07519721984863281, 0.08487701416015625, 0.09455680847167969, 0.10423660278320312, 0.11391639709472656, 0.12359619140625, 0.13327598571777344, 0.14295578002929688, 0.1526355743408203, 0.16231536865234375, 0.1719951629638672, 0.18167495727539062, 0.19135475158691406, 0.2010345458984375, 0.21071434020996094, 0.22039413452148438, 0.2300739288330078, 0.23975372314453125, 0.2494335174560547, 0.2591133117675781, 0.26879310607910156, 0.278472900390625, 0.28815269470214844, 0.2978324890136719, 0.3075122833251953, 0.31719207763671875, 0.3268718719482422, 0.3365516662597656, 0.34623146057128906, 0.3559112548828125, 0.36559104919433594, 0.3752708435058594, 0.3849506378173828, 0.39463043212890625, 0.4043102264404297, 0.4139900207519531, 0.42366981506347656, 0.433349609375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 3.0, 3.0, 6.0, 12.0, 9.0, 13.0, 14.0, 22.0, 46.0, 60.0, 130.0, 196.0, 288.0, 544.0, 1129.0, 2398.0, 7173.0, 27742.0, 169867.0, 3023474.0, 884024.0, 59003.0, 12195.0, 3417.0, 1281.0, 529.0, 258.0, 164.0, 99.0, 69.0, 37.0, 19.0, 23.0, 14.0, 10.0, 4.0, 6.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.495361328125, -0.4806976318359375, -0.466033935546875, -0.4513702392578125, -0.43670654296875, -0.4220428466796875, -0.407379150390625, -0.3927154541015625, -0.3780517578125, -0.3633880615234375, -0.348724365234375, -0.3340606689453125, -0.31939697265625, -0.3047332763671875, -0.290069580078125, -0.2754058837890625, -0.2607421875, -0.2460784912109375, -0.231414794921875, -0.2167510986328125, -0.20208740234375, -0.1874237060546875, -0.172760009765625, -0.1580963134765625, -0.1434326171875, -0.1287689208984375, -0.114105224609375, -0.0994415283203125, -0.08477783203125, -0.0701141357421875, -0.055450439453125, -0.0407867431640625, -0.026123046875, -0.0114593505859375, 0.003204345703125, 0.0178680419921875, 0.03253173828125, 0.0471954345703125, 0.061859130859375, 0.0765228271484375, 0.0911865234375, 0.1058502197265625, 0.120513916015625, 0.1351776123046875, 0.14984130859375, 0.1645050048828125, 0.179168701171875, 0.1938323974609375, 0.20849609375, 0.2231597900390625, 0.237823486328125, 0.2524871826171875, 0.26715087890625, 0.2818145751953125, 0.296478271484375, 0.3111419677734375, 0.3258056640625, 0.3404693603515625, 0.355133056640625, 0.3697967529296875, 0.38446044921875, 0.3991241455078125, 0.413787841796875, 0.4284515380859375, 0.443115234375]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 5.0, 7.0, 11.0, 14.0, 19.0, 25.0, 33.0, 58.0, 67.0, 121.0, 212.0, 444.0, 751.0, 978.0, 659.0, 336.0, 155.0, 76.0, 34.0, 19.0, 12.0, 9.0, 9.0, 9.0, 6.0, 3.0, 3.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.86083984375, -0.8409538269042969, -0.8210678100585938, -0.8011817932128906, -0.7812957763671875, -0.7614097595214844, -0.7415237426757812, -0.7216377258300781, -0.701751708984375, -0.6818656921386719, -0.6619796752929688, -0.6420936584472656, -0.6222076416015625, -0.6023216247558594, -0.5824356079101562, -0.5625495910644531, -0.54266357421875, -0.5227775573730469, -0.5028915405273438, -0.4830055236816406, -0.4631195068359375, -0.4432334899902344, -0.42334747314453125, -0.4034614562988281, -0.383575439453125, -0.3636894226074219, -0.34380340576171875, -0.3239173889160156, -0.3040313720703125, -0.2841453552246094, -0.26425933837890625, -0.24437332153320312, -0.2244873046875, -0.20460128784179688, -0.18471527099609375, -0.16482925415039062, -0.1449432373046875, -0.12505722045898438, -0.10517120361328125, -0.08528518676757812, -0.065399169921875, -0.045513153076171875, -0.02562713623046875, -0.005741119384765625, 0.0141448974609375, 0.034030914306640625, 0.05391693115234375, 0.07380294799804688, 0.09368896484375, 0.11357498168945312, 0.13346099853515625, 0.15334701538085938, 0.1732330322265625, 0.19311904907226562, 0.21300506591796875, 0.23289108276367188, 0.252777099609375, 0.2726631164550781, 0.29254913330078125, 0.3124351501464844, 0.3323211669921875, 0.3522071838378906, 0.37209320068359375, 0.3919792175292969, 0.411865234375]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 5.0, 1.0, 1.0, 2.0, 3.0, 5.0, 6.0, 16.0, 71.0, 209.0, 309.0, 242.0, 97.0, 30.0, 8.0, 2.0, 1.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.322185516357422, -9.082605361938477, -8.843026161193848, -8.603446006774902, -8.363866806030273, -8.124286651611328, -7.884707450866699, -7.645127773284912, -7.405548095703125, -7.165968418121338, -6.926388740539551, -6.686809062957764, -6.447229385375977, -6.2076497077941895, -5.968070030212402, -5.728490352630615, -5.488910675048828, -5.249330997467041, -5.009751319885254, -4.770171642303467, -4.53059196472168, -4.291012287139893, -4.0514326095581055, -3.8118529319763184, -3.572272777557373, -3.332693099975586, -3.093113422393799, -2.8535337448120117, -2.6139540672302246, -2.3743743896484375, -2.1347947120666504, -1.8952149152755737, -1.6556353569030762, -1.416055679321289, -1.176476001739502, -0.9368962645530701, -0.697316586971283, -0.4577368497848511, -0.21815717220306396, 0.021422505378723145, 0.26100218296051025, 0.5005818605422974, 0.7401615381240845, 0.9797412753105164, 1.2193210124969482, 1.4589006900787354, 1.6984803676605225, 1.9380600452423096, 2.1776397228240967, 2.417219400405884, 2.656799077987671, 2.896378755569458, 3.135958433151245, 3.3755383491516113, 3.6151180267333984, 3.8546977043151855, 4.094277381896973, 4.33385705947876, 4.573436737060547, 4.813016414642334, 5.052596092224121, 5.292175769805908, 5.531755447387695, 5.771335124969482, 6.0109148025512695]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 3.0, 0.0, 3.0, 4.0, 3.0, 5.0, 3.0, 3.0, 10.0, 14.0, 17.0, 24.0, 22.0, 26.0, 35.0, 40.0, 49.0, 56.0, 45.0, 47.0, 64.0, 69.0, 64.0, 55.0, 45.0, 45.0, 48.0, 38.0, 31.0, 26.0, 13.0, 19.0, 16.0, 15.0, 13.0, 6.0, 8.0, 5.0, 6.0, 6.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.016331672668457, -2.9301891326904297, -2.8440465927124023, -2.757903814315796, -2.6717612743377686, -2.585618734359741, -2.499476194381714, -2.4133334159851074, -2.32719087600708, -2.2410483360290527, -2.1549057960510254, -2.068763017654419, -1.9826204776763916, -1.8964779376983643, -1.810335397720337, -1.72419273853302, -1.6380501985549927, -1.5519076585769653, -1.4657649993896484, -1.379622459411621, -1.2934798002243042, -1.2073372602462769, -1.12119460105896, -1.0350520610809326, -0.9489094614982605, -0.8627668619155884, -0.7766242623329163, -0.6904816627502441, -0.6043391227722168, -0.5181964635848999, -0.43205392360687256, -0.34591132402420044, -0.2597687244415283, -0.1736261248588562, -0.08748354017734528, -0.0013409554958343506, 0.08480164408683777, 0.1709442436695099, 0.2570868134498596, 0.34322941303253174, 0.42937201261520386, 0.515514612197876, 0.6016572117805481, 0.6877998113632202, 0.7739423513412476, 0.8600850105285645, 0.9462275505065918, 1.0323700904846191, 1.118512749671936, 1.2046552896499634, 1.2907979488372803, 1.3769404888153076, 1.4630831480026245, 1.5492256879806519, 1.6353683471679688, 1.721510887145996, 1.8076534271240234, 1.8937959671020508, 1.9799386262893677, 2.0660812854766846, 2.152223825454712, 2.2383663654327393, 2.3245089054107666, 2.410651683807373, 2.4967942237854004]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 5.0, 5.0, 5.0, 3.0, 5.0, 15.0, 13.0, 27.0, 29.0, 38.0, 56.0, 111.0, 162.0, 223.0, 456.0, 770.0, 1591.0, 3329.0, 6840.0, 15831.0, 38240.0, 91208.0, 213475.0, 329633.0, 199504.0, 84585.0, 35090.0, 14438.0, 6494.0, 2985.0, 1520.0, 746.0, 410.0, 269.0, 168.0, 104.0, 52.0, 37.0, 27.0, 21.0, 13.0, 10.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.30023956298828125, -0.2896881103515625, -0.27913665771484375, -0.268585205078125, -0.25803375244140625, -0.2474822998046875, -0.23693084716796875, -0.22637939453125, -0.21582794189453125, -0.2052764892578125, -0.19472503662109375, -0.184173583984375, -0.17362213134765625, -0.1630706787109375, -0.15251922607421875, -0.1419677734375, -0.13141632080078125, -0.1208648681640625, -0.11031341552734375, -0.099761962890625, -0.08921051025390625, -0.0786590576171875, -0.06810760498046875, -0.05755615234375, -0.04700469970703125, -0.0364532470703125, -0.02590179443359375, -0.015350341796875, -0.00479888916015625, 0.0057525634765625, 0.01630401611328125, 0.02685546875, 0.03740692138671875, 0.0479583740234375, 0.05850982666015625, 0.069061279296875, 0.07961273193359375, 0.0901641845703125, 0.10071563720703125, 0.11126708984375, 0.12181854248046875, 0.1323699951171875, 0.14292144775390625, 0.153472900390625, 0.16402435302734375, 0.1745758056640625, 0.18512725830078125, 0.1956787109375, 0.20623016357421875, 0.2167816162109375, 0.22733306884765625, 0.237884521484375, 0.24843597412109375, 0.2589874267578125, 0.26953887939453125, 0.28009033203125, 0.29064178466796875, 0.3011932373046875, 0.31174468994140625, 0.322296142578125, 0.33284759521484375, 0.3433990478515625, 0.35395050048828125, 0.364501953125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 6.0, 5.0, 6.0, 4.0, 7.0, 8.0, 5.0, 16.0, 9.0, 16.0, 17.0, 25.0, 22.0, 23.0, 41.0, 30.0, 33.0, 38.0, 39.0, 36.0, 53.0, 55.0, 42.0, 40.0, 42.0, 43.0, 48.0, 36.0, 40.0, 39.0, 41.0, 20.0, 22.0, 23.0, 13.0, 13.0, 9.0, 7.0, 5.0, 7.0, 6.0, 6.0, 3.0, 2.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.2064208984375, -0.20001983642578125, -0.1936187744140625, -0.18721771240234375, -0.180816650390625, -0.17441558837890625, -0.1680145263671875, -0.16161346435546875, -0.15521240234375, -0.14881134033203125, -0.1424102783203125, -0.13600921630859375, -0.129608154296875, -0.12320709228515625, -0.1168060302734375, -0.11040496826171875, -0.10400390625, -0.09760284423828125, -0.0912017822265625, -0.08480072021484375, -0.078399658203125, -0.07199859619140625, -0.0655975341796875, -0.05919647216796875, -0.05279541015625, -0.04639434814453125, -0.0399932861328125, -0.03359222412109375, -0.027191162109375, -0.02079010009765625, -0.0143890380859375, -0.00798797607421875, -0.0015869140625, 0.00481414794921875, 0.0112152099609375, 0.01761627197265625, 0.024017333984375, 0.03041839599609375, 0.0368194580078125, 0.04322052001953125, 0.04962158203125, 0.05602264404296875, 0.0624237060546875, 0.06882476806640625, 0.075225830078125, 0.08162689208984375, 0.0880279541015625, 0.09442901611328125, 0.100830078125, 0.10723114013671875, 0.1136322021484375, 0.12003326416015625, 0.126434326171875, 0.13283538818359375, 0.1392364501953125, 0.14563751220703125, 0.15203857421875, 0.15843963623046875, 0.1648406982421875, 0.17124176025390625, 0.177642822265625, 0.18404388427734375, 0.1904449462890625, 0.19684600830078125, 0.2032470703125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 4.0, 7.0, 2.0, 8.0, 7.0, 9.0, 10.0, 22.0, 27.0, 26.0, 44.0, 52.0, 74.0, 109.0, 150.0, 170.0, 272.0, 396.0, 591.0, 1001.0, 1835.0, 4420.0, 16840.0, 101963.0, 660323.0, 214604.0, 32525.0, 6987.0, 2460.0, 1227.0, 733.0, 489.0, 313.0, 243.0, 162.0, 106.0, 84.0, 83.0, 48.0, 38.0, 24.0, 27.0, 13.0, 7.0, 7.0, 7.0, 3.0, 3.0, 3.0, 4.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.51708984375, -0.4969635009765625, -0.476837158203125, -0.4567108154296875, -0.43658447265625, -0.4164581298828125, -0.396331787109375, -0.3762054443359375, -0.3560791015625, -0.3359527587890625, -0.315826416015625, -0.2957000732421875, -0.27557373046875, -0.2554473876953125, -0.235321044921875, -0.2151947021484375, -0.195068359375, -0.1749420166015625, -0.154815673828125, -0.1346893310546875, -0.11456298828125, -0.0944366455078125, -0.074310302734375, -0.0541839599609375, -0.0340576171875, -0.0139312744140625, 0.006195068359375, 0.0263214111328125, 0.04644775390625, 0.0665740966796875, 0.086700439453125, 0.1068267822265625, 0.126953125, 0.1470794677734375, 0.167205810546875, 0.1873321533203125, 0.20745849609375, 0.2275848388671875, 0.247711181640625, 0.2678375244140625, 0.2879638671875, 0.3080902099609375, 0.328216552734375, 0.3483428955078125, 0.36846923828125, 0.3885955810546875, 0.408721923828125, 0.4288482666015625, 0.448974609375, 0.4691009521484375, 0.489227294921875, 0.5093536376953125, 0.52947998046875, 0.5496063232421875, 0.569732666015625, 0.5898590087890625, 0.6099853515625, 0.6301116943359375, 0.650238037109375, 0.6703643798828125, 0.69049072265625, 0.7106170654296875, 0.730743408203125, 0.7508697509765625, 0.77099609375]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 6.0, 7.0, 6.0, 8.0, 13.0, 7.0, 14.0, 16.0, 19.0, 16.0, 30.0, 21.0, 16.0, 23.0, 40.0, 39.0, 35.0, 55.0, 55.0, 47.0, 50.0, 52.0, 47.0, 41.0, 36.0, 32.0, 43.0, 28.0, 33.0, 23.0, 20.0, 29.0, 20.0, 10.0, 7.0, 13.0, 9.0, 6.0, 7.0, 7.0, 10.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.76318359375, -0.739410400390625, -0.71563720703125, -0.691864013671875, -0.6680908203125, -0.644317626953125, -0.62054443359375, -0.596771240234375, -0.572998046875, -0.549224853515625, -0.52545166015625, -0.501678466796875, -0.4779052734375, -0.454132080078125, -0.43035888671875, -0.406585693359375, -0.3828125, -0.359039306640625, -0.33526611328125, -0.311492919921875, -0.2877197265625, -0.263946533203125, -0.24017333984375, -0.216400146484375, -0.192626953125, -0.168853759765625, -0.14508056640625, -0.121307373046875, -0.0975341796875, -0.073760986328125, -0.04998779296875, -0.026214599609375, -0.00244140625, 0.021331787109375, 0.04510498046875, 0.068878173828125, 0.0926513671875, 0.116424560546875, 0.14019775390625, 0.163970947265625, 0.187744140625, 0.211517333984375, 0.23529052734375, 0.259063720703125, 0.2828369140625, 0.306610107421875, 0.33038330078125, 0.354156494140625, 0.3779296875, 0.401702880859375, 0.42547607421875, 0.449249267578125, 0.4730224609375, 0.496795654296875, 0.52056884765625, 0.544342041015625, 0.568115234375, 0.591888427734375, 0.61566162109375, 0.639434814453125, 0.6632080078125, 0.686981201171875, 0.71075439453125, 0.734527587890625, 0.75830078125]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 3.0, 3.0, 2.0, 6.0, 7.0, 7.0, 13.0, 15.0, 14.0, 19.0, 22.0, 31.0, 59.0, 71.0, 128.0, 237.0, 474.0, 1290.0, 4416.0, 23265.0, 165600.0, 714773.0, 115755.0, 16775.0, 3495.0, 1046.0, 434.0, 219.0, 115.0, 82.0, 44.0, 43.0, 19.0, 20.0, 16.0, 4.0, 3.0, 8.0, 8.0, 4.0, 3.0, 7.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2337646484375, -0.2258167266845703, -0.21786880493164062, -0.20992088317871094, -0.20197296142578125, -0.19402503967285156, -0.18607711791992188, -0.1781291961669922, -0.1701812744140625, -0.1622333526611328, -0.15428543090820312, -0.14633750915527344, -0.13838958740234375, -0.13044166564941406, -0.12249374389648438, -0.11454582214355469, -0.106597900390625, -0.09864997863769531, -0.09070205688476562, -0.08275413513183594, -0.07480621337890625, -0.06685829162597656, -0.058910369873046875, -0.05096244812011719, -0.0430145263671875, -0.03506660461425781, -0.027118682861328125, -0.019170761108398438, -0.01122283935546875, -0.0032749176025390625, 0.004673004150390625, 0.012620925903320312, 0.02056884765625, 0.028516769409179688, 0.036464691162109375, 0.04441261291503906, 0.05236053466796875, 0.06030845642089844, 0.06825637817382812, 0.07620429992675781, 0.0841522216796875, 0.09210014343261719, 0.10004806518554688, 0.10799598693847656, 0.11594390869140625, 0.12389183044433594, 0.13183975219726562, 0.1397876739501953, 0.147735595703125, 0.1556835174560547, 0.16363143920898438, 0.17157936096191406, 0.17952728271484375, 0.18747520446777344, 0.19542312622070312, 0.2033710479736328, 0.2113189697265625, 0.2192668914794922, 0.22721481323242188, 0.23516273498535156, 0.24311065673828125, 0.25105857849121094, 0.2590065002441406, 0.2669544219970703, 0.27490234375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 6.0, 5.0, 9.0, 9.0, 8.0, 9.0, 8.0, 17.0, 11.0, 23.0, 15.0, 32.0, 40.0, 38.0, 47.0, 60.0, 75.0, 77.0, 70.0, 82.0, 54.0, 53.0, 35.0, 42.0, 27.0, 39.0, 18.0, 15.0, 10.0, 12.0, 14.0, 8.0, 5.0, 6.0, 4.0, 5.0, 1.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.8279762268066406e-05, -4.6688131988048553e-05, -4.50965017080307e-05, -4.350487142801285e-05, -4.1913241147994995e-05, -4.032161086797714e-05, -3.872998058795929e-05, -3.713835030794144e-05, -3.5546720027923584e-05, -3.395508974790573e-05, -3.236345946788788e-05, -3.0771829187870026e-05, -2.9180198907852173e-05, -2.758856862783432e-05, -2.5996938347816467e-05, -2.4405308067798615e-05, -2.2813677787780762e-05, -2.122204750776291e-05, -1.9630417227745056e-05, -1.8038786947727203e-05, -1.644715666770935e-05, -1.4855526387691498e-05, -1.3263896107673645e-05, -1.1672265827655792e-05, -1.008063554763794e-05, -8.489005267620087e-06, -6.897374987602234e-06, -5.305744707584381e-06, -3.7141144275665283e-06, -2.1224841475486755e-06, -5.308538675308228e-07, 1.06077641248703e-06, 2.652406692504883e-06, 4.244036972522736e-06, 5.835667252540588e-06, 7.427297532558441e-06, 9.018927812576294e-06, 1.0610558092594147e-05, 1.2202188372612e-05, 1.3793818652629852e-05, 1.5385448932647705e-05, 1.6977079212665558e-05, 1.856870949268341e-05, 2.0160339772701263e-05, 2.1751970052719116e-05, 2.334360033273697e-05, 2.4935230612754822e-05, 2.6526860892772675e-05, 2.8118491172790527e-05, 2.971012145280838e-05, 3.130175173282623e-05, 3.2893382012844086e-05, 3.448501229286194e-05, 3.607664257287979e-05, 3.7668272852897644e-05, 3.92599031329155e-05, 4.085153341293335e-05, 4.24431636929512e-05, 4.4034793972969055e-05, 4.562642425298691e-05, 4.721805453300476e-05, 4.8809684813022614e-05, 5.0401315093040466e-05, 5.199294537305832e-05, 5.358457565307617e-05]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 2.0, 8.0, 4.0, 10.0, 10.0, 18.0, 29.0, 40.0, 56.0, 90.0, 137.0, 234.0, 413.0, 883.0, 1982.0, 5358.0, 21299.0, 117259.0, 645442.0, 206781.0, 35465.0, 7950.0, 2704.0, 1111.0, 555.0, 270.0, 162.0, 83.0, 54.0, 40.0, 32.0, 27.0, 18.0, 8.0, 12.0, 4.0, 9.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2001953125, -0.19344520568847656, -0.18669509887695312, -0.1799449920654297, -0.17319488525390625, -0.1664447784423828, -0.15969467163085938, -0.15294456481933594, -0.1461944580078125, -0.13944435119628906, -0.13269424438476562, -0.1259441375732422, -0.11919403076171875, -0.11244392395019531, -0.10569381713867188, -0.09894371032714844, -0.092193603515625, -0.08544349670410156, -0.07869338989257812, -0.07194328308105469, -0.06519317626953125, -0.05844306945800781, -0.051692962646484375, -0.04494285583496094, -0.0381927490234375, -0.03144264221191406, -0.024692535400390625, -0.017942428588867188, -0.01119232177734375, -0.0044422149658203125, 0.002307891845703125, 0.009057998657226562, 0.01580810546875, 0.022558212280273438, 0.029308319091796875, 0.03605842590332031, 0.04280853271484375, 0.04955863952636719, 0.056308746337890625, 0.06305885314941406, 0.0698089599609375, 0.07655906677246094, 0.08330917358398438, 0.09005928039550781, 0.09680938720703125, 0.10355949401855469, 0.11030960083007812, 0.11705970764160156, 0.123809814453125, 0.13055992126464844, 0.13731002807617188, 0.1440601348876953, 0.15081024169921875, 0.1575603485107422, 0.16431045532226562, 0.17106056213378906, 0.1778106689453125, 0.18456077575683594, 0.19131088256835938, 0.1980609893798828, 0.20481109619140625, 0.2115612030029297, 0.21831130981445312, 0.22506141662597656, 0.2318115234375]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 2.0, 9.0, 6.0, 7.0, 13.0, 21.0, 17.0, 30.0, 45.0, 48.0, 52.0, 70.0, 56.0, 73.0, 83.0, 81.0, 60.0, 72.0, 52.0, 40.0, 33.0, 36.0, 23.0, 18.0, 18.0, 8.0, 7.0, 3.0, 5.0, 4.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.23193359375, -0.2253875732421875, -0.218841552734375, -0.2122955322265625, -0.20574951171875, -0.1992034912109375, -0.192657470703125, -0.1861114501953125, -0.1795654296875, -0.1730194091796875, -0.166473388671875, -0.1599273681640625, -0.15338134765625, -0.1468353271484375, -0.140289306640625, -0.1337432861328125, -0.127197265625, -0.1206512451171875, -0.114105224609375, -0.1075592041015625, -0.10101318359375, -0.0944671630859375, -0.087921142578125, -0.0813751220703125, -0.0748291015625, -0.0682830810546875, -0.061737060546875, -0.0551910400390625, -0.04864501953125, -0.0420989990234375, -0.035552978515625, -0.0290069580078125, -0.0224609375, -0.0159149169921875, -0.009368896484375, -0.0028228759765625, 0.00372314453125, 0.0102691650390625, 0.016815185546875, 0.0233612060546875, 0.0299072265625, 0.0364532470703125, 0.042999267578125, 0.0495452880859375, 0.05609130859375, 0.0626373291015625, 0.069183349609375, 0.0757293701171875, 0.082275390625, 0.0888214111328125, 0.095367431640625, 0.1019134521484375, 0.10845947265625, 0.1150054931640625, 0.121551513671875, 0.1280975341796875, 0.1346435546875, 0.1411895751953125, 0.147735595703125, 0.1542816162109375, 0.16082763671875, 0.1673736572265625, 0.173919677734375, 0.1804656982421875, 0.18701171875]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 5.0, 4.0, 7.0, 12.0, 21.0, 36.0, 52.0, 110.0, 155.0, 214.0, 160.0, 84.0, 50.0, 35.0, 21.0, 10.0, 5.0, 6.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-4.2026286125183105, -4.068789482116699, -3.934950113296509, -3.8011107444763184, -3.667271614074707, -3.5334324836730957, -3.3995931148529053, -3.265753746032715, -3.1319146156311035, -2.998075485229492, -2.8642361164093018, -2.7303967475891113, -2.5965576171875, -2.4627184867858887, -2.3288791179656982, -2.195039749145508, -2.0612006187438965, -1.9273613691329956, -1.7935221195220947, -1.6596828699111938, -1.525843620300293, -1.392004370689392, -1.2581651210784912, -1.1243258714675903, -0.9904866218566895, -0.8566473722457886, -0.7228081226348877, -0.5889688730239868, -0.45512962341308594, -0.32129037380218506, -0.18745112419128418, -0.0536118745803833, 0.08022689819335938, 0.21406614780426025, 0.34790539741516113, 0.481744647026062, 0.6155838966369629, 0.7494231462478638, 0.8832623958587646, 1.0171016454696655, 1.1509408950805664, 1.2847801446914673, 1.4186193943023682, 1.552458643913269, 1.68629789352417, 1.8201371431350708, 1.9539763927459717, 2.087815761566162, 2.2216548919677734, 2.3554940223693848, 2.489333391189575, 2.6231727600097656, 2.757011890411377, 2.8908510208129883, 3.0246903896331787, 3.158529758453369, 3.2923688888549805, 3.426208019256592, 3.5600473880767822, 3.6938867568969727, 3.827725887298584, 3.9615650177001953, 4.095404624938965, 4.229243755340576, 4.3630828857421875]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 5.0, 4.0, 5.0, 14.0, 8.0, 16.0, 8.0, 26.0, 27.0, 34.0, 24.0, 28.0, 23.0, 34.0, 33.0, 37.0, 54.0, 70.0, 70.0, 72.0, 54.0, 30.0, 46.0, 33.0, 30.0, 35.0, 19.0, 23.0, 12.0, 14.0, 19.0, 5.0, 12.0, 14.0, 8.0, 6.0, 8.0, 11.0, 4.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.987926721572876, -2.891068696975708, -2.794210910797119, -2.697352886199951, -2.600494861602783, -2.5036368370056152, -2.4067790508270264, -2.3099210262298584, -2.2130630016326904, -2.1162049770355225, -2.0193471908569336, -1.9224891662597656, -1.8256311416625977, -1.7287732362747192, -1.6319153308868408, -1.5350573062896729, -1.4381994009017944, -1.341341495513916, -1.244483470916748, -1.1476255655288696, -1.0507675409317017, -0.9539096355438232, -0.8570516705513, -0.7601937055587769, -0.6633357405662537, -0.5664777755737305, -0.4696198105812073, -0.37276187539100647, -0.2759039103984833, -0.17904594540596008, -0.08218801021575928, 0.014669954776763916, 0.11152791976928711, 0.2083858847618103, 0.3052438497543335, 0.4021017849445343, 0.4989597499370575, 0.5958176851272583, 0.6926756501197815, 0.7895336151123047, 0.8863915801048279, 0.9832495450973511, 1.0801074504852295, 1.1769654750823975, 1.2738233804702759, 1.3706814050674438, 1.4675393104553223, 1.5643973350524902, 1.6612552404403687, 1.758113145828247, 1.854971170425415, 1.9518290758132935, 2.048686981201172, 2.14554500579834, 2.242403030395508, 2.339261054992676, 2.4361188411712646, 2.5329768657684326, 2.6298346519470215, 2.7266926765441895, 2.8235507011413574, 2.9204087257385254, 3.0172665119171143, 3.1141245365142822, 3.21098256111145]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 10.0, 7.0, 10.0, 11.0, 15.0, 24.0, 39.0, 47.0, 62.0, 87.0, 100.0, 151.0, 217.0, 394.0, 771.0, 1746.0, 5103.0, 18701.0, 119142.0, 1992382.0, 1917366.0, 112223.0, 17560.0, 4685.0, 1635.0, 682.0, 384.0, 225.0, 149.0, 99.0, 66.0, 44.0, 36.0, 33.0, 18.0, 10.0, 13.0, 4.0, 11.0, 7.0, 7.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3642578125, -0.35076141357421875, -0.3372650146484375, -0.32376861572265625, -0.310272216796875, -0.29677581787109375, -0.2832794189453125, -0.26978302001953125, -0.25628662109375, -0.24279022216796875, -0.2292938232421875, -0.21579742431640625, -0.202301025390625, -0.18880462646484375, -0.1753082275390625, -0.16181182861328125, -0.1483154296875, -0.13481903076171875, -0.1213226318359375, -0.10782623291015625, -0.094329833984375, -0.08083343505859375, -0.0673370361328125, -0.05384063720703125, -0.04034423828125, -0.02684783935546875, -0.0133514404296875, 0.00014495849609375, 0.013641357421875, 0.02713775634765625, 0.0406341552734375, 0.05413055419921875, 0.067626953125, 0.08112335205078125, 0.0946197509765625, 0.10811614990234375, 0.121612548828125, 0.13510894775390625, 0.1486053466796875, 0.16210174560546875, 0.17559814453125, 0.18909454345703125, 0.2025909423828125, 0.21608734130859375, 0.229583740234375, 0.24308013916015625, 0.2565765380859375, 0.27007293701171875, 0.2835693359375, 0.29706573486328125, 0.3105621337890625, 0.32405853271484375, 0.337554931640625, 0.35105133056640625, 0.3645477294921875, 0.37804412841796875, 0.39154052734375, 0.40503692626953125, 0.4185333251953125, 0.43202972412109375, 0.445526123046875, 0.45902252197265625, 0.4725189208984375, 0.48601531982421875, 0.49951171875]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 2.0, 4.0, 4.0, 6.0, 6.0, 9.0, 17.0, 21.0, 24.0, 45.0, 48.0, 53.0, 68.0, 78.0, 63.0, 63.0, 59.0, 74.0, 62.0, 65.0, 48.0, 50.0, 44.0, 35.0, 19.0, 11.0, 9.0, 4.0, 7.0, 5.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2222900390625, -0.2130451202392578, -0.20380020141601562, -0.19455528259277344, -0.18531036376953125, -0.17606544494628906, -0.16682052612304688, -0.1575756072998047, -0.1483306884765625, -0.1390857696533203, -0.12984085083007812, -0.12059593200683594, -0.11135101318359375, -0.10210609436035156, -0.09286117553710938, -0.08361625671386719, -0.074371337890625, -0.06512641906738281, -0.055881500244140625, -0.04663658142089844, -0.03739166259765625, -0.028146743774414062, -0.018901824951171875, -0.009656906127929688, -0.0004119873046875, 0.008832931518554688, 0.018077850341796875, 0.027322769165039062, 0.03656768798828125, 0.04581260681152344, 0.055057525634765625, 0.06430244445800781, 0.07354736328125, 0.08279228210449219, 0.09203720092773438, 0.10128211975097656, 0.11052703857421875, 0.11977195739746094, 0.12901687622070312, 0.1382617950439453, 0.1475067138671875, 0.1567516326904297, 0.16599655151367188, 0.17524147033691406, 0.18448638916015625, 0.19373130798339844, 0.20297622680664062, 0.2122211456298828, 0.221466064453125, 0.2307109832763672, 0.23995590209960938, 0.24920082092285156, 0.25844573974609375, 0.26769065856933594, 0.2769355773925781, 0.2861804962158203, 0.2954254150390625, 0.3046703338623047, 0.3139152526855469, 0.32316017150878906, 0.33240509033203125, 0.34165000915527344, 0.3508949279785156, 0.3601398468017578, 0.369384765625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 9.0, 15.0, 19.0, 29.0, 61.0, 105.0, 211.0, 377.0, 839.0, 2198.0, 11614.0, 225547.0, 3864264.0, 79324.0, 6640.0, 1513.0, 667.0, 357.0, 211.0, 122.0, 81.0, 28.0, 27.0, 7.0, 8.0, 6.0, 2.0, 6.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.81005859375, -0.7824783325195312, -0.7548980712890625, -0.7273178100585938, -0.699737548828125, -0.6721572875976562, -0.6445770263671875, -0.6169967651367188, -0.58941650390625, -0.5618362426757812, -0.5342559814453125, -0.5066757202148438, -0.479095458984375, -0.45151519775390625, -0.4239349365234375, -0.39635467529296875, -0.3687744140625, -0.34119415283203125, -0.3136138916015625, -0.28603363037109375, -0.258453369140625, -0.23087310791015625, -0.2032928466796875, -0.17571258544921875, -0.14813232421875, -0.12055206298828125, -0.0929718017578125, -0.06539154052734375, -0.037811279296875, -0.01023101806640625, 0.0173492431640625, 0.04492950439453125, 0.072509765625, 0.10009002685546875, 0.1276702880859375, 0.15525054931640625, 0.182830810546875, 0.21041107177734375, 0.2379913330078125, 0.26557159423828125, 0.29315185546875, 0.32073211669921875, 0.3483123779296875, 0.37589263916015625, 0.403472900390625, 0.43105316162109375, 0.4586334228515625, 0.48621368408203125, 0.5137939453125, 0.5413742065429688, 0.5689544677734375, 0.5965347290039062, 0.624114990234375, 0.6516952514648438, 0.6792755126953125, 0.7068557739257812, 0.73443603515625, 0.7620162963867188, 0.7895965576171875, 0.8171768188476562, 0.844757080078125, 0.8723373413085938, 0.8999176025390625, 0.9274978637695312, 0.955078125]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 3.0, 1.0, 8.0, 14.0, 9.0, 16.0, 32.0, 73.0, 125.0, 306.0, 754.0, 1268.0, 859.0, 352.0, 123.0, 55.0, 34.0, 22.0, 13.0, 6.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.904296875, -0.8773345947265625, -0.850372314453125, -0.8234100341796875, -0.79644775390625, -0.7694854736328125, -0.742523193359375, -0.7155609130859375, -0.6885986328125, -0.6616363525390625, -0.634674072265625, -0.6077117919921875, -0.58074951171875, -0.5537872314453125, -0.526824951171875, -0.4998626708984375, -0.472900390625, -0.4459381103515625, -0.418975830078125, -0.3920135498046875, -0.36505126953125, -0.3380889892578125, -0.311126708984375, -0.2841644287109375, -0.2572021484375, -0.2302398681640625, -0.203277587890625, -0.1763153076171875, -0.14935302734375, -0.1223907470703125, -0.095428466796875, -0.0684661865234375, -0.04150390625, -0.0145416259765625, 0.012420654296875, 0.0393829345703125, 0.06634521484375, 0.0933074951171875, 0.120269775390625, 0.1472320556640625, 0.1741943359375, 0.2011566162109375, 0.228118896484375, 0.2550811767578125, 0.28204345703125, 0.3090057373046875, 0.335968017578125, 0.3629302978515625, 0.389892578125, 0.4168548583984375, 0.443817138671875, 0.4707794189453125, 0.49774169921875, 0.5247039794921875, 0.551666259765625, 0.5786285400390625, 0.6055908203125, 0.6325531005859375, 0.659515380859375, 0.6864776611328125, 0.71343994140625, 0.7404022216796875, 0.767364501953125, 0.7943267822265625, 0.8212890625]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 3.0, 2.0, 1.0, 2.0, 3.0, 4.0, 12.0, 8.0, 12.0, 39.0, 72.0, 133.0, 199.0, 192.0, 135.0, 100.0, 42.0, 20.0, 14.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.1621832847595215, -2.996473789215088, -2.8307642936706543, -2.6650547981262207, -2.499345302581787, -2.3336358070373535, -2.167926549911499, -2.0022170543670654, -1.8365075588226318, -1.6707980632781982, -1.5050885677337646, -1.3393791913986206, -1.173669695854187, -1.0079602003097534, -0.8422507643699646, -0.6765413284301758, -0.5108318328857422, -0.345122367143631, -0.17941290140151978, -0.01370343565940857, 0.15200603008270264, 0.31771552562713623, 0.48342496156692505, 0.6491343975067139, 0.8148438930511475, 0.980553388595581, 1.1462628841400146, 1.3119722604751587, 1.4776817560195923, 1.6433912515640259, 1.80910062789917, 1.9748101234436035, 2.1405200958251953, 2.306229591369629, 2.4719390869140625, 2.637648582458496, 2.8033580780029297, 2.9690675735473633, 3.1347768306732178, 3.3004863262176514, 3.466195821762085, 3.6319053173065186, 3.797614812850952, 3.9633243083953857, 4.12903356552124, 4.294743061065674, 4.460452556610107, 4.626162052154541, 4.791871547698975, 4.957581043243408, 5.123290538787842, 5.289000034332275, 5.454709529876709, 5.620419025421143, 5.786128520965576, 5.951837539672852, 6.117547035217285, 6.283256530761719, 6.448966026306152, 6.614675521850586, 6.7803850173950195, 6.946094512939453, 7.111804008483887, 7.27751350402832, 7.443222999572754]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 4.0, 9.0, 4.0, 8.0, 11.0, 12.0, 15.0, 20.0, 25.0, 17.0, 21.0, 42.0, 40.0, 43.0, 48.0, 54.0, 60.0, 52.0, 56.0, 51.0, 44.0, 48.0, 44.0, 42.0, 34.0, 37.0, 23.0, 24.0, 17.0, 18.0, 20.0, 14.0, 8.0, 11.0, 5.0, 3.0, 7.0, 5.0, 0.0, 5.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0], "bins": [-2.3516716957092285, -2.27836012840271, -2.2050487995147705, -2.131737232208252, -2.0584256649017334, -1.9851142168045044, -1.9118027687072754, -1.8384912014007568, -1.7651797533035278, -1.6918683052062988, -1.6185567378997803, -1.5452452898025513, -1.4719338417053223, -1.3986222743988037, -1.3253108263015747, -1.2519993782043457, -1.1786878108978271, -1.1053763628005981, -1.0320647954940796, -0.9587533473968506, -0.8854418396949768, -0.812130331993103, -0.738818883895874, -0.6655073761940002, -0.5921958684921265, -0.5188843607902527, -0.4455728828907013, -0.3722614049911499, -0.2989498972892761, -0.22563838958740234, -0.15232691168785095, -0.07901543378829956, -0.00570368766784668, 0.0676078051328659, 0.1409192979335785, 0.21423079073429108, 0.28754228353500366, 0.36085379123687744, 0.43416526913642883, 0.5074767470359802, 0.580788254737854, 0.6540997624397278, 0.7274112701416016, 0.8007227182388306, 0.8740342259407043, 0.9473457336425781, 1.0206571817398071, 1.0939686298370361, 1.1672801971435547, 1.2405916452407837, 1.3139032125473022, 1.3872146606445312, 1.4605262279510498, 1.5338376760482788, 1.6071491241455078, 1.6804606914520264, 1.7537721395492554, 1.8270835876464844, 1.900395154953003, 1.973706603050232, 2.047018051147461, 2.1203296184539795, 2.193641185760498, 2.2669525146484375, 2.340264081954956]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 4.0, 3.0, 7.0, 8.0, 9.0, 19.0, 24.0, 37.0, 78.0, 165.0, 304.0, 848.0, 2340.0, 7728.0, 33931.0, 191050.0, 558380.0, 205204.0, 36287.0, 8187.0, 2394.0, 832.0, 391.0, 166.0, 58.0, 31.0, 24.0, 15.0, 8.0, 7.0, 10.0, 4.0, 1.0, 6.0, 3.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.78955078125, -0.7705345153808594, -0.7515182495117188, -0.7325019836425781, -0.7134857177734375, -0.6944694519042969, -0.6754531860351562, -0.6564369201660156, -0.637420654296875, -0.6184043884277344, -0.5993881225585938, -0.5803718566894531, -0.5613555908203125, -0.5423393249511719, -0.5233230590820312, -0.5043067932128906, -0.48529052734375, -0.4662742614746094, -0.44725799560546875, -0.4282417297363281, -0.4092254638671875, -0.3902091979980469, -0.37119293212890625, -0.3521766662597656, -0.333160400390625, -0.3141441345214844, -0.29512786865234375, -0.2761116027832031, -0.2570953369140625, -0.23807907104492188, -0.21906280517578125, -0.20004653930664062, -0.1810302734375, -0.16201400756835938, -0.14299774169921875, -0.12398147583007812, -0.1049652099609375, -0.08594894409179688, -0.06693267822265625, -0.047916412353515625, -0.028900146484375, -0.009883880615234375, 0.00913238525390625, 0.028148651123046875, 0.0471649169921875, 0.06618118286132812, 0.08519744873046875, 0.10421371459960938, 0.12322998046875, 0.14224624633789062, 0.16126251220703125, 0.18027877807617188, 0.1992950439453125, 0.21831130981445312, 0.23732757568359375, 0.2563438415527344, 0.275360107421875, 0.2943763732910156, 0.31339263916015625, 0.3324089050292969, 0.3514251708984375, 0.3704414367675781, 0.38945770263671875, 0.4084739685058594, 0.427490234375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 0.0, 2.0, 2.0, 3.0, 2.0, 4.0, 14.0, 20.0, 23.0, 28.0, 31.0, 44.0, 42.0, 49.0, 56.0, 59.0, 74.0, 71.0, 67.0, 59.0, 79.0, 46.0, 60.0, 38.0, 31.0, 29.0, 30.0, 15.0, 8.0, 8.0, 5.0, 2.0, 5.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17724609375, -0.16785049438476562, -0.15845489501953125, -0.14905929565429688, -0.1396636962890625, -0.13026809692382812, -0.12087249755859375, -0.11147689819335938, -0.102081298828125, -0.09268569946289062, -0.08329010009765625, -0.07389450073242188, -0.0644989013671875, -0.055103302001953125, -0.04570770263671875, -0.036312103271484375, -0.02691650390625, -0.017520904541015625, -0.00812530517578125, 0.001270294189453125, 0.0106658935546875, 0.020061492919921875, 0.02945709228515625, 0.038852691650390625, 0.048248291015625, 0.057643890380859375, 0.06703948974609375, 0.07643508911132812, 0.0858306884765625, 0.09522628784179688, 0.10462188720703125, 0.11401748657226562, 0.1234130859375, 0.13280868530273438, 0.14220428466796875, 0.15159988403320312, 0.1609954833984375, 0.17039108276367188, 0.17978668212890625, 0.18918228149414062, 0.198577880859375, 0.20797348022460938, 0.21736907958984375, 0.22676467895507812, 0.2361602783203125, 0.24555587768554688, 0.25495147705078125, 0.2643470764160156, 0.27374267578125, 0.2831382751464844, 0.29253387451171875, 0.3019294738769531, 0.3113250732421875, 0.3207206726074219, 0.33011627197265625, 0.3395118713378906, 0.348907470703125, 0.3583030700683594, 0.36769866943359375, 0.3770942687988281, 0.3864898681640625, 0.3958854675292969, 0.40528106689453125, 0.4146766662597656, 0.424072265625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 2.0, 9.0, 10.0, 10.0, 10.0, 12.0, 14.0, 14.0, 21.0, 38.0, 45.0, 60.0, 121.0, 171.0, 274.0, 471.0, 1034.0, 2996.0, 10389.0, 48846.0, 260740.0, 598757.0, 97180.0, 19275.0, 4940.0, 1521.0, 679.0, 313.0, 176.0, 111.0, 98.0, 51.0, 38.0, 35.0, 19.0, 16.0, 13.0, 7.0, 9.0, 5.0, 2.0, 5.0, 6.0, 0.0, 4.0, 4.0, 3.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.58447265625, -0.5668716430664062, -0.5492706298828125, -0.5316696166992188, -0.514068603515625, -0.49646759033203125, -0.4788665771484375, -0.46126556396484375, -0.44366455078125, -0.42606353759765625, -0.4084625244140625, -0.39086151123046875, -0.373260498046875, -0.35565948486328125, -0.3380584716796875, -0.32045745849609375, -0.3028564453125, -0.28525543212890625, -0.2676544189453125, -0.25005340576171875, -0.232452392578125, -0.21485137939453125, -0.1972503662109375, -0.17964935302734375, -0.16204833984375, -0.14444732666015625, -0.1268463134765625, -0.10924530029296875, -0.091644287109375, -0.07404327392578125, -0.0564422607421875, -0.03884124755859375, -0.021240234375, -0.00363922119140625, 0.0139617919921875, 0.03156280517578125, 0.049163818359375, 0.06676483154296875, 0.0843658447265625, 0.10196685791015625, 0.11956787109375, 0.13716888427734375, 0.1547698974609375, 0.17237091064453125, 0.189971923828125, 0.20757293701171875, 0.2251739501953125, 0.24277496337890625, 0.2603759765625, 0.27797698974609375, 0.2955780029296875, 0.31317901611328125, 0.330780029296875, 0.34838104248046875, 0.3659820556640625, 0.38358306884765625, 0.40118408203125, 0.41878509521484375, 0.4363861083984375, 0.45398712158203125, 0.471588134765625, 0.48918914794921875, 0.5067901611328125, 0.5243911743164062, 0.5419921875]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 3.0, 9.0, 5.0, 8.0, 3.0, 14.0, 21.0, 19.0, 17.0, 20.0, 23.0, 30.0, 30.0, 35.0, 37.0, 47.0, 32.0, 43.0, 34.0, 46.0, 52.0, 45.0, 61.0, 31.0, 40.0, 33.0, 25.0, 35.0, 24.0, 22.0, 22.0, 14.0, 26.0, 15.0, 13.0, 12.0, 12.0, 7.0, 6.0, 8.0, 5.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59765625, -0.57684326171875, -0.5560302734375, -0.53521728515625, -0.514404296875, -0.49359130859375, -0.4727783203125, -0.45196533203125, -0.43115234375, -0.41033935546875, -0.3895263671875, -0.36871337890625, -0.347900390625, -0.32708740234375, -0.3062744140625, -0.28546142578125, -0.2646484375, -0.24383544921875, -0.2230224609375, -0.20220947265625, -0.181396484375, -0.16058349609375, -0.1397705078125, -0.11895751953125, -0.09814453125, -0.07733154296875, -0.0565185546875, -0.03570556640625, -0.014892578125, 0.00592041015625, 0.0267333984375, 0.04754638671875, 0.068359375, 0.08917236328125, 0.1099853515625, 0.13079833984375, 0.151611328125, 0.17242431640625, 0.1932373046875, 0.21405029296875, 0.23486328125, 0.25567626953125, 0.2764892578125, 0.29730224609375, 0.318115234375, 0.33892822265625, 0.3597412109375, 0.38055419921875, 0.4013671875, 0.42218017578125, 0.4429931640625, 0.46380615234375, 0.484619140625, 0.50543212890625, 0.5262451171875, 0.54705810546875, 0.56787109375, 0.58868408203125, 0.6094970703125, 0.63031005859375, 0.651123046875, 0.67193603515625, 0.6927490234375, 0.71356201171875, 0.734375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 11.0, 9.0, 5.0, 11.0, 19.0, 26.0, 61.0, 89.0, 146.0, 208.0, 378.0, 725.0, 1356.0, 2897.0, 6142.0, 14569.0, 39336.0, 122858.0, 537470.0, 216687.0, 65632.0, 22846.0, 9098.0, 3911.0, 1908.0, 932.0, 501.0, 294.0, 162.0, 97.0, 52.0, 31.0, 24.0, 22.0, 14.0, 6.0, 8.0, 8.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.151123046875, -0.1463603973388672, -0.14159774780273438, -0.13683509826660156, -0.13207244873046875, -0.12730979919433594, -0.12254714965820312, -0.11778450012207031, -0.1130218505859375, -0.10825920104980469, -0.10349655151367188, -0.09873390197753906, -0.09397125244140625, -0.08920860290527344, -0.08444595336914062, -0.07968330383300781, -0.074920654296875, -0.07015800476074219, -0.06539535522460938, -0.06063270568847656, -0.05587005615234375, -0.05110740661621094, -0.046344757080078125, -0.04158210754394531, -0.0368194580078125, -0.03205680847167969, -0.027294158935546875, -0.022531509399414062, -0.01776885986328125, -0.013006210327148438, -0.008243560791015625, -0.0034809112548828125, 0.00128173828125, 0.0060443878173828125, 0.010807037353515625, 0.015569686889648438, 0.02033233642578125, 0.025094985961914062, 0.029857635498046875, 0.03462028503417969, 0.0393829345703125, 0.04414558410644531, 0.048908233642578125, 0.05367088317871094, 0.05843353271484375, 0.06319618225097656, 0.06795883178710938, 0.07272148132324219, 0.077484130859375, 0.08224678039550781, 0.08700942993164062, 0.09177207946777344, 0.09653472900390625, 0.10129737854003906, 0.10606002807617188, 0.11082267761230469, 0.1155853271484375, 0.12034797668457031, 0.12511062622070312, 0.12987327575683594, 0.13463592529296875, 0.13939857482910156, 0.14416122436523438, 0.1489238739013672, 0.1536865234375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 4.0, 4.0, 6.0, 9.0, 23.0, 24.0, 39.0, 48.0, 70.0, 90.0, 130.0, 141.0, 116.0, 76.0, 67.0, 45.0, 38.0, 26.0, 15.0, 9.0, 6.0, 6.0, 5.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.732080459594727e-05, -8.498877286911011e-05, -8.265674114227295e-05, -8.032470941543579e-05, -7.799267768859863e-05, -7.566064596176147e-05, -7.332861423492432e-05, -7.099658250808716e-05, -6.866455078125e-05, -6.633251905441284e-05, -6.400048732757568e-05, -6.166845560073853e-05, -5.933642387390137e-05, -5.700439214706421e-05, -5.467236042022705e-05, -5.234032869338989e-05, -5.0008296966552734e-05, -4.7676265239715576e-05, -4.534423351287842e-05, -4.301220178604126e-05, -4.06801700592041e-05, -3.834813833236694e-05, -3.6016106605529785e-05, -3.368407487869263e-05, -3.135204315185547e-05, -2.902001142501831e-05, -2.6687979698181152e-05, -2.4355947971343994e-05, -2.2023916244506836e-05, -1.9691884517669678e-05, -1.735985279083252e-05, -1.5027821063995361e-05, -1.2695789337158203e-05, -1.0363757610321045e-05, -8.031725883483887e-06, -5.6996941566467285e-06, -3.3676624298095703e-06, -1.0356307029724121e-06, 1.296401023864746e-06, 3.6284327507019043e-06, 5.9604644775390625e-06, 8.29249620437622e-06, 1.0624527931213379e-05, 1.2956559658050537e-05, 1.5288591384887695e-05, 1.7620623111724854e-05, 1.9952654838562012e-05, 2.228468656539917e-05, 2.4616718292236328e-05, 2.6948750019073486e-05, 2.9280781745910645e-05, 3.16128134727478e-05, 3.394484519958496e-05, 3.627687692642212e-05, 3.860890865325928e-05, 4.0940940380096436e-05, 4.3272972106933594e-05, 4.560500383377075e-05, 4.793703556060791e-05, 5.026906728744507e-05, 5.2601099014282227e-05, 5.4933130741119385e-05, 5.726516246795654e-05, 5.95971941947937e-05, 6.192922592163086e-05]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 4.0, 14.0, 14.0, 35.0, 43.0, 82.0, 142.0, 289.0, 754.0, 2336.0, 9416.0, 51476.0, 384524.0, 531629.0, 54108.0, 9814.0, 2409.0, 802.0, 328.0, 144.0, 78.0, 30.0, 30.0, 20.0, 12.0, 3.0, 11.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3017578125, -0.2933788299560547, -0.2849998474121094, -0.27662086486816406, -0.26824188232421875, -0.25986289978027344, -0.2514839172363281, -0.2431049346923828, -0.2347259521484375, -0.2263469696044922, -0.21796798706054688, -0.20958900451660156, -0.20121002197265625, -0.19283103942871094, -0.18445205688476562, -0.1760730743408203, -0.167694091796875, -0.1593151092529297, -0.15093612670898438, -0.14255714416503906, -0.13417816162109375, -0.12579917907714844, -0.11742019653320312, -0.10904121398925781, -0.1006622314453125, -0.09228324890136719, -0.08390426635742188, -0.07552528381347656, -0.06714630126953125, -0.05876731872558594, -0.050388336181640625, -0.04200935363769531, -0.03363037109375, -0.025251388549804688, -0.016872406005859375, -0.008493423461914062, -0.00011444091796875, 0.008264541625976562, 0.016643524169921875, 0.025022506713867188, 0.0334014892578125, 0.04178047180175781, 0.050159454345703125, 0.05853843688964844, 0.06691741943359375, 0.07529640197753906, 0.08367538452148438, 0.09205436706542969, 0.100433349609375, 0.10881233215332031, 0.11719131469726562, 0.12557029724121094, 0.13394927978515625, 0.14232826232910156, 0.15070724487304688, 0.1590862274169922, 0.1674652099609375, 0.1758441925048828, 0.18422317504882812, 0.19260215759277344, 0.20098114013671875, 0.20936012268066406, 0.21773910522460938, 0.2261180877685547, 0.2344970703125]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 6.0, 5.0, 2.0, 9.0, 28.0, 22.0, 31.0, 53.0, 62.0, 76.0, 99.0, 102.0, 111.0, 106.0, 97.0, 55.0, 39.0, 35.0, 28.0, 23.0, 5.0, 7.0, 5.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.28857421875, -0.28009796142578125, -0.2716217041015625, -0.26314544677734375, -0.254669189453125, -0.24619293212890625, -0.2377166748046875, -0.22924041748046875, -0.22076416015625, -0.21228790283203125, -0.2038116455078125, -0.19533538818359375, -0.186859130859375, -0.17838287353515625, -0.1699066162109375, -0.16143035888671875, -0.1529541015625, -0.14447784423828125, -0.1360015869140625, -0.12752532958984375, -0.119049072265625, -0.11057281494140625, -0.1020965576171875, -0.09362030029296875, -0.08514404296875, -0.07666778564453125, -0.0681915283203125, -0.05971527099609375, -0.051239013671875, -0.04276275634765625, -0.0342864990234375, -0.02581024169921875, -0.017333984375, -0.00885772705078125, -0.0003814697265625, 0.00809478759765625, 0.016571044921875, 0.02504730224609375, 0.0335235595703125, 0.04199981689453125, 0.05047607421875, 0.05895233154296875, 0.0674285888671875, 0.07590484619140625, 0.084381103515625, 0.09285736083984375, 0.1013336181640625, 0.10980987548828125, 0.1182861328125, 0.12676239013671875, 0.1352386474609375, 0.14371490478515625, 0.152191162109375, 0.16066741943359375, 0.1691436767578125, 0.17761993408203125, 0.18609619140625, 0.19457244873046875, 0.2030487060546875, 0.21152496337890625, 0.220001220703125, 0.22847747802734375, 0.2369537353515625, 0.24542999267578125, 0.25390625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 8.0, 10.0, 24.0, 39.0, 66.0, 134.0, 226.0, 155.0, 108.0, 77.0, 43.0, 28.0, 29.0, 18.0, 8.0, 8.0, 5.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-2.7052805423736572, -2.590704917907715, -2.4761290550231934, -2.361553430557251, -2.2469775676727295, -2.132401943206787, -2.0178260803222656, -1.9032504558563232, -1.7886747121810913, -1.6740989685058594, -1.5595232248306274, -1.4449474811553955, -1.3303718566894531, -1.2157959938049316, -1.1012203693389893, -0.9866446256637573, -0.8720688819885254, -0.7574931383132935, -0.6429173946380615, -0.5283417105674744, -0.41376596689224243, -0.2991902232170105, -0.18461453914642334, -0.0700387954711914, 0.04453694820404053, 0.15911267697811127, 0.273688405752182, 0.38826411962509155, 0.5028398633003235, 0.6174156069755554, 0.7319912910461426, 0.8465670347213745, 0.9611425399780273, 1.0757182836532593, 1.1902940273284912, 1.3048696517944336, 1.419445514678955, 1.5340211391448975, 1.6485968828201294, 1.7631726264953613, 1.8777483701705933, 1.9923241138458252, 2.1068997383117676, 2.221475601196289, 2.3360512256622314, 2.450627088546753, 2.5652027130126953, 2.679778575897217, 2.794354200363159, 2.9089298248291016, 3.023505687713623, 3.1380813121795654, 3.252657175064087, 3.3672327995300293, 3.481808662414551, 3.596384286880493, 3.7109599113464355, 3.825535535812378, 3.9401113986968994, 4.054687023162842, 4.169262886047363, 4.283838748931885, 4.398414134979248, 4.5129899978637695, 4.627565860748291]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 3.0, 1.0, 2.0, 5.0, 2.0, 3.0, 6.0, 7.0, 3.0, 10.0, 6.0, 10.0, 7.0, 10.0, 8.0, 14.0, 20.0, 27.0, 10.0, 20.0, 29.0, 42.0, 31.0, 31.0, 33.0, 77.0, 55.0, 70.0, 69.0, 43.0, 38.0, 44.0, 43.0, 31.0, 25.0, 15.0, 26.0, 25.0, 18.0, 15.0, 12.0, 11.0, 15.0, 7.0, 8.0, 5.0, 5.0, 9.0, 3.0, 0.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-2.6322755813598633, -2.552201986312866, -2.4721286296844482, -2.392055034637451, -2.311981439590454, -2.231907844543457, -2.151834487915039, -2.071760892868042, -1.9916874170303345, -1.911613941192627, -1.8315403461456299, -1.7514668703079224, -1.6713933944702148, -1.5913197994232178, -1.5112463235855103, -1.4311728477478027, -1.3510992527008057, -1.2710257768630981, -1.190952181816101, -1.1108787059783936, -1.0308051109313965, -0.950731635093689, -0.8706581592559814, -0.7905846238136292, -0.7105110883712769, -0.6304375529289246, -0.5503640174865723, -0.47029054164886475, -0.39021700620651245, -0.31014347076416016, -0.23006996512413025, -0.14999645948410034, -0.06992292404174805, 0.010150596499443054, 0.09022411704063416, 0.17029763758182526, 0.25037115812301636, 0.33044469356536865, 0.41051819920539856, 0.49059170484542847, 0.5706652402877808, 0.6507387757301331, 0.7308123111724854, 0.8108857870101929, 0.8909593224525452, 0.9710328578948975, 1.051106333732605, 1.1311798095703125, 1.2112534046173096, 1.291326880455017, 1.3714004755020142, 1.4514739513397217, 1.5315475463867188, 1.6116210222244263, 1.6916944980621338, 1.7717680931091309, 1.8518415689468384, 1.931915044784546, 2.011988639831543, 2.09206223487854, 2.172135591506958, 2.252209186553955, 2.332282781600952, 2.41235613822937, 2.492429733276367]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 17.0, 25.0, 53.0, 100.0, 178.0, 355.0, 656.0, 1544.0, 4823.0, 23796.0, 383402.0, 3494686.0, 259117.0, 18915.0, 3969.0, 1335.0, 613.0, 326.0, 172.0, 76.0, 47.0, 32.0, 14.0, 9.0, 4.0, 6.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6484375, -0.630645751953125, -0.61285400390625, -0.595062255859375, -0.5772705078125, -0.559478759765625, -0.54168701171875, -0.523895263671875, -0.506103515625, -0.488311767578125, -0.47052001953125, -0.452728271484375, -0.4349365234375, -0.417144775390625, -0.39935302734375, -0.381561279296875, -0.36376953125, -0.345977783203125, -0.32818603515625, -0.310394287109375, -0.2926025390625, -0.274810791015625, -0.25701904296875, -0.239227294921875, -0.221435546875, -0.203643798828125, -0.18585205078125, -0.168060302734375, -0.1502685546875, -0.132476806640625, -0.11468505859375, -0.096893310546875, -0.0791015625, -0.061309814453125, -0.04351806640625, -0.025726318359375, -0.0079345703125, 0.009857177734375, 0.02764892578125, 0.045440673828125, 0.063232421875, 0.081024169921875, 0.09881591796875, 0.116607666015625, 0.1343994140625, 0.152191162109375, 0.16998291015625, 0.187774658203125, 0.20556640625, 0.223358154296875, 0.24114990234375, 0.258941650390625, 0.2767333984375, 0.294525146484375, 0.31231689453125, 0.330108642578125, 0.347900390625, 0.365692138671875, 0.38348388671875, 0.401275634765625, 0.4190673828125, 0.436859130859375, 0.45465087890625, 0.472442626953125, 0.490234375]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 1.0, 2.0, 7.0, 4.0, 6.0, 15.0, 26.0, 20.0, 21.0, 35.0, 29.0, 31.0, 44.0, 54.0, 58.0, 59.0, 82.0, 74.0, 68.0, 68.0, 64.0, 49.0, 45.0, 41.0, 31.0, 26.0, 13.0, 8.0, 11.0, 4.0, 4.0, 4.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1776123046875, -0.1687641143798828, -0.15991592407226562, -0.15106773376464844, -0.14221954345703125, -0.13337135314941406, -0.12452316284179688, -0.11567497253417969, -0.1068267822265625, -0.09797859191894531, -0.08913040161132812, -0.08028221130371094, -0.07143402099609375, -0.06258583068847656, -0.053737640380859375, -0.04488945007324219, -0.036041259765625, -0.027193069458007812, -0.018344879150390625, -0.009496688842773438, -0.00064849853515625, 0.008199691772460938, 0.017047882080078125, 0.025896072387695312, 0.0347442626953125, 0.04359245300292969, 0.052440643310546875, 0.06128883361816406, 0.07013702392578125, 0.07898521423339844, 0.08783340454101562, 0.09668159484863281, 0.10552978515625, 0.11437797546386719, 0.12322616577148438, 0.13207435607910156, 0.14092254638671875, 0.14977073669433594, 0.15861892700195312, 0.1674671173095703, 0.1763153076171875, 0.1851634979248047, 0.19401168823242188, 0.20285987854003906, 0.21170806884765625, 0.22055625915527344, 0.22940444946289062, 0.2382526397705078, 0.247100830078125, 0.2559490203857422, 0.2647972106933594, 0.27364540100097656, 0.28249359130859375, 0.29134178161621094, 0.3001899719238281, 0.3090381622314453, 0.3178863525390625, 0.3267345428466797, 0.3355827331542969, 0.34443092346191406, 0.35327911376953125, 0.36212730407714844, 0.3709754943847656, 0.3798236846923828, 0.388671875]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 7.0, 7.0, 3.0, 8.0, 17.0, 18.0, 24.0, 57.0, 121.0, 225.0, 494.0, 1322.0, 5637.0, 70146.0, 3787100.0, 313999.0, 11791.0, 1968.0, 705.0, 300.0, 133.0, 80.0, 32.0, 41.0, 17.0, 14.0, 7.0, 2.0, 5.0, 2.0, 3.0, 6.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.99169921875, -0.9631118774414062, -0.9345245361328125, -0.9059371948242188, -0.877349853515625, -0.8487625122070312, -0.8201751708984375, -0.7915878295898438, -0.76300048828125, -0.7344131469726562, -0.7058258056640625, -0.6772384643554688, -0.648651123046875, -0.6200637817382812, -0.5914764404296875, -0.5628890991210938, -0.5343017578125, -0.5057144165039062, -0.4771270751953125, -0.44853973388671875, -0.419952392578125, -0.39136505126953125, -0.3627777099609375, -0.33419036865234375, -0.30560302734375, -0.27701568603515625, -0.2484283447265625, -0.21984100341796875, -0.191253662109375, -0.16266632080078125, -0.1340789794921875, -0.10549163818359375, -0.076904296875, -0.04831695556640625, -0.0197296142578125, 0.00885772705078125, 0.037445068359375, 0.06603240966796875, 0.0946197509765625, 0.12320709228515625, 0.15179443359375, 0.18038177490234375, 0.2089691162109375, 0.23755645751953125, 0.266143798828125, 0.29473114013671875, 0.3233184814453125, 0.35190582275390625, 0.3804931640625, 0.40908050537109375, 0.4376678466796875, 0.46625518798828125, 0.494842529296875, 0.5234298706054688, 0.5520172119140625, 0.5806045532226562, 0.60919189453125, 0.6377792358398438, 0.6663665771484375, 0.6949539184570312, 0.723541259765625, 0.7521286010742188, 0.7807159423828125, 0.8093032836914062, 0.837890625]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 3.0, 3.0, 9.0, 8.0, 10.0, 24.0, 29.0, 35.0, 55.0, 88.0, 137.0, 267.0, 523.0, 886.0, 848.0, 516.0, 257.0, 159.0, 79.0, 57.0, 22.0, 23.0, 13.0, 9.0, 11.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.62255859375, -0.6024627685546875, -0.582366943359375, -0.5622711181640625, -0.54217529296875, -0.5220794677734375, -0.501983642578125, -0.4818878173828125, -0.4617919921875, -0.4416961669921875, -0.421600341796875, -0.4015045166015625, -0.38140869140625, -0.3613128662109375, -0.341217041015625, -0.3211212158203125, -0.301025390625, -0.2809295654296875, -0.260833740234375, -0.2407379150390625, -0.22064208984375, -0.2005462646484375, -0.180450439453125, -0.1603546142578125, -0.1402587890625, -0.1201629638671875, -0.100067138671875, -0.0799713134765625, -0.05987548828125, -0.0397796630859375, -0.019683837890625, 0.0004119873046875, 0.0205078125, 0.0406036376953125, 0.060699462890625, 0.0807952880859375, 0.10089111328125, 0.1209869384765625, 0.141082763671875, 0.1611785888671875, 0.1812744140625, 0.2013702392578125, 0.221466064453125, 0.2415618896484375, 0.26165771484375, 0.2817535400390625, 0.301849365234375, 0.3219451904296875, 0.342041015625, 0.3621368408203125, 0.382232666015625, 0.4023284912109375, 0.42242431640625, 0.4425201416015625, 0.462615966796875, 0.4827117919921875, 0.5028076171875, 0.5229034423828125, 0.542999267578125, 0.5630950927734375, 0.58319091796875, 0.6032867431640625, 0.623382568359375, 0.6434783935546875, 0.66357421875]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 2.0, 4.0, 10.0, 11.0, 30.0, 90.0, 235.0, 302.0, 204.0, 77.0, 19.0, 17.0, 2.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.960099220275879, -7.698525428771973, -7.436951160430908, -7.175377368927002, -6.9138031005859375, -6.652229309082031, -6.390655517578125, -6.129081726074219, -5.867507457733154, -5.605933666229248, -5.344359397888184, -5.082785606384277, -4.821211814880371, -4.559637546539307, -4.2980637550354, -4.036489486694336, -3.7749156951904297, -3.5133416652679443, -3.251767635345459, -2.9901938438415527, -2.7286198139190674, -2.467045783996582, -2.205471992492676, -1.9438979625701904, -1.682323932647705, -1.4207499027252197, -1.159175992012024, -0.8976020216941833, -0.6360280513763428, -0.3744540214538574, -0.11288011074066162, 0.14869379997253418, 0.41026782989501953, 0.6718418002128601, 0.9334157705307007, 1.1949896812438965, 1.4565637111663818, 1.7181377410888672, 1.979711651802063, 2.241285562515259, 2.502859592437744, 2.7644336223602295, 3.026007652282715, 3.287581443786621, 3.5491554737091064, 3.810729503631592, 4.072303295135498, 4.3338775634765625, 4.595451354980469, 4.857025146484375, 5.1185994148254395, 5.380173206329346, 5.64174747467041, 5.903321266174316, 6.164895057678223, 6.426468849182129, 6.688043117523193, 6.9496169090271, 7.211191177368164, 7.47276496887207, 7.734338760375977, 7.995913028717041, 8.257487297058105, 8.519061088562012, 8.780634880065918]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 7.0, 5.0, 3.0, 3.0, 11.0, 7.0, 12.0, 14.0, 18.0, 16.0, 30.0, 25.0, 31.0, 31.0, 30.0, 56.0, 49.0, 57.0, 47.0, 51.0, 46.0, 51.0, 57.0, 41.0, 54.0, 31.0, 34.0, 40.0, 20.0, 25.0, 21.0, 20.0, 16.0, 9.0, 9.0, 8.0, 2.0, 4.0, 4.0, 3.0, 2.0, 2.0, 5.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.0736961364746094, -1.9984891414642334, -1.9232821464538574, -1.8480751514434814, -1.7728681564331055, -1.6976611614227295, -1.622454047203064, -1.547247052192688, -1.472040057182312, -1.396833062171936, -1.32162606716156, -1.246419072151184, -1.1712119579315186, -1.0960049629211426, -1.0207979679107666, -0.9455909729003906, -0.8703839778900146, -0.7951769828796387, -0.7199699878692627, -0.6447629332542419, -0.569555938243866, -0.49434894323349, -0.4191419184207916, -0.34393489360809326, -0.2687278985977173, -0.19352088868618011, -0.11831387877464294, -0.043106868863105774, 0.032100141048431396, 0.10730713605880737, 0.18251416087150574, 0.2577211856842041, 0.3329284191131592, 0.40813541412353516, 0.4833424389362335, 0.5585494637489319, 0.6337564587593079, 0.7089634537696838, 0.7841705083847046, 0.8593775033950806, 0.9345844984054565, 1.0097914934158325, 1.0849984884262085, 1.1602054834365845, 1.23541259765625, 1.310619592666626, 1.385826587677002, 1.461033582687378, 1.536240577697754, 1.6114475727081299, 1.6866545677185059, 1.7618615627288818, 1.8370685577392578, 1.9122755527496338, 1.9874826669692993, 2.062689781188965, 2.1378965377807617, 2.2131035327911377, 2.2883105278015137, 2.3635175228118896, 2.4387245178222656, 2.5139315128326416, 2.5891385078430176, 2.6643457412719727, 2.7395527362823486]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 4.0, 5.0, 9.0, 13.0, 11.0, 18.0, 26.0, 49.0, 57.0, 123.0, 174.0, 257.0, 479.0, 885.0, 1727.0, 3520.0, 7986.0, 18821.0, 48423.0, 131956.0, 329403.0, 309016.0, 119623.0, 44192.0, 17616.0, 7237.0, 3381.0, 1582.0, 791.0, 471.0, 275.0, 173.0, 78.0, 39.0, 46.0, 20.0, 20.0, 10.0, 13.0, 6.0, 10.0, 7.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0], "bins": [-0.358642578125, -0.3480796813964844, -0.33751678466796875, -0.3269538879394531, -0.3163909912109375, -0.3058280944824219, -0.29526519775390625, -0.2847023010253906, -0.274139404296875, -0.2635765075683594, -0.25301361083984375, -0.24245071411132812, -0.2318878173828125, -0.22132492065429688, -0.21076202392578125, -0.20019912719726562, -0.18963623046875, -0.17907333374023438, -0.16851043701171875, -0.15794754028320312, -0.1473846435546875, -0.13682174682617188, -0.12625885009765625, -0.11569595336914062, -0.105133056640625, -0.09457015991210938, -0.08400726318359375, -0.07344436645507812, -0.0628814697265625, -0.052318572998046875, -0.04175567626953125, -0.031192779541015625, -0.0206298828125, -0.010066986083984375, 0.00049591064453125, 0.011058807373046875, 0.0216217041015625, 0.032184600830078125, 0.04274749755859375, 0.053310394287109375, 0.063873291015625, 0.07443618774414062, 0.08499908447265625, 0.09556198120117188, 0.1061248779296875, 0.11668777465820312, 0.12725067138671875, 0.13781356811523438, 0.14837646484375, 0.15893936157226562, 0.16950225830078125, 0.18006515502929688, 0.1906280517578125, 0.20119094848632812, 0.21175384521484375, 0.22231674194335938, 0.232879638671875, 0.24344253540039062, 0.25400543212890625, 0.2645683288574219, 0.2751312255859375, 0.2856941223144531, 0.29625701904296875, 0.3068199157714844, 0.3173828125]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 2.0, 7.0, 5.0, 11.0, 13.0, 17.0, 13.0, 37.0, 31.0, 42.0, 53.0, 40.0, 38.0, 65.0, 68.0, 71.0, 72.0, 61.0, 64.0, 56.0, 51.0, 35.0, 38.0, 27.0, 27.0, 16.0, 8.0, 9.0, 4.0, 10.0, 9.0, 2.0, 1.0, 1.0, 5.0, 1.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2015380859375, -0.1923084259033203, -0.18307876586914062, -0.17384910583496094, -0.16461944580078125, -0.15538978576660156, -0.14616012573242188, -0.1369304656982422, -0.1277008056640625, -0.11847114562988281, -0.10924148559570312, -0.10001182556152344, -0.09078216552734375, -0.08155250549316406, -0.07232284545898438, -0.06309318542480469, -0.053863525390625, -0.04463386535644531, -0.035404205322265625, -0.026174545288085938, -0.01694488525390625, -0.0077152252197265625, 0.001514434814453125, 0.010744094848632812, 0.0199737548828125, 0.029203414916992188, 0.038433074951171875, 0.04766273498535156, 0.05689239501953125, 0.06612205505371094, 0.07535171508789062, 0.08458137512207031, 0.09381103515625, 0.10304069519042969, 0.11227035522460938, 0.12150001525878906, 0.13072967529296875, 0.13995933532714844, 0.14918899536132812, 0.1584186553955078, 0.1676483154296875, 0.1768779754638672, 0.18610763549804688, 0.19533729553222656, 0.20456695556640625, 0.21379661560058594, 0.22302627563476562, 0.2322559356689453, 0.241485595703125, 0.2507152557373047, 0.2599449157714844, 0.26917457580566406, 0.27840423583984375, 0.28763389587402344, 0.2968635559082031, 0.3060932159423828, 0.3153228759765625, 0.3245525360107422, 0.3337821960449219, 0.34301185607910156, 0.35224151611328125, 0.36147117614746094, 0.3707008361816406, 0.3799304962158203, 0.38916015625]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 3.0, 5.0, 7.0, 5.0, 6.0, 14.0, 13.0, 25.0, 36.0, 62.0, 78.0, 112.0, 136.0, 206.0, 293.0, 444.0, 907.0, 2181.0, 7018.0, 35141.0, 234599.0, 664928.0, 81685.0, 14079.0, 3460.0, 1271.0, 651.0, 354.0, 224.0, 212.0, 123.0, 87.0, 49.0, 40.0, 32.0, 16.0, 19.0, 12.0, 12.0, 4.0, 3.0, 4.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.625, -0.6056060791015625, -0.586212158203125, -0.5668182373046875, -0.54742431640625, -0.5280303955078125, -0.508636474609375, -0.4892425537109375, -0.4698486328125, -0.4504547119140625, -0.431060791015625, -0.4116668701171875, -0.39227294921875, -0.3728790283203125, -0.353485107421875, -0.3340911865234375, -0.314697265625, -0.2953033447265625, -0.275909423828125, -0.2565155029296875, -0.23712158203125, -0.2177276611328125, -0.198333740234375, -0.1789398193359375, -0.1595458984375, -0.1401519775390625, -0.120758056640625, -0.1013641357421875, -0.08197021484375, -0.0625762939453125, -0.043182373046875, -0.0237884521484375, -0.00439453125, 0.0149993896484375, 0.034393310546875, 0.0537872314453125, 0.07318115234375, 0.0925750732421875, 0.111968994140625, 0.1313629150390625, 0.1507568359375, 0.1701507568359375, 0.189544677734375, 0.2089385986328125, 0.22833251953125, 0.2477264404296875, 0.267120361328125, 0.2865142822265625, 0.305908203125, 0.3253021240234375, 0.344696044921875, 0.3640899658203125, 0.38348388671875, 0.4028778076171875, 0.422271728515625, 0.4416656494140625, 0.4610595703125, 0.4804534912109375, 0.499847412109375, 0.5192413330078125, 0.53863525390625, 0.5580291748046875, 0.577423095703125, 0.5968170166015625, 0.6162109375]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 1.0, 5.0, 6.0, 4.0, 5.0, 12.0, 9.0, 8.0, 13.0, 13.0, 16.0, 12.0, 25.0, 17.0, 33.0, 34.0, 35.0, 38.0, 34.0, 42.0, 66.0, 53.0, 58.0, 57.0, 42.0, 48.0, 35.0, 40.0, 29.0, 36.0, 31.0, 17.0, 26.0, 14.0, 16.0, 9.0, 19.0, 9.0, 11.0, 6.0, 7.0, 6.0, 4.0, 6.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.72802734375, -0.704254150390625, -0.68048095703125, -0.656707763671875, -0.6329345703125, -0.609161376953125, -0.58538818359375, -0.561614990234375, -0.537841796875, -0.514068603515625, -0.49029541015625, -0.466522216796875, -0.4427490234375, -0.418975830078125, -0.39520263671875, -0.371429443359375, -0.34765625, -0.323883056640625, -0.30010986328125, -0.276336669921875, -0.2525634765625, -0.228790283203125, -0.20501708984375, -0.181243896484375, -0.157470703125, -0.133697509765625, -0.10992431640625, -0.086151123046875, -0.0623779296875, -0.038604736328125, -0.01483154296875, 0.008941650390625, 0.03271484375, 0.056488037109375, 0.08026123046875, 0.104034423828125, 0.1278076171875, 0.151580810546875, 0.17535400390625, 0.199127197265625, 0.222900390625, 0.246673583984375, 0.27044677734375, 0.294219970703125, 0.3179931640625, 0.341766357421875, 0.36553955078125, 0.389312744140625, 0.4130859375, 0.436859130859375, 0.46063232421875, 0.484405517578125, 0.5081787109375, 0.531951904296875, 0.55572509765625, 0.579498291015625, 0.603271484375, 0.627044677734375, 0.65081787109375, 0.674591064453125, 0.6983642578125, 0.722137451171875, 0.74591064453125, 0.769683837890625, 0.79345703125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 6.0, 11.0, 14.0, 20.0, 20.0, 29.0, 65.0, 77.0, 152.0, 296.0, 552.0, 1378.0, 3693.0, 11390.0, 39976.0, 189204.0, 676941.0, 90550.0, 23102.0, 6736.0, 2426.0, 961.0, 387.0, 201.0, 116.0, 81.0, 48.0, 37.0, 21.0, 21.0, 5.0, 7.0, 7.0, 5.0, 3.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1712646484375, -0.16560935974121094, -0.15995407104492188, -0.1542987823486328, -0.14864349365234375, -0.1429882049560547, -0.13733291625976562, -0.13167762756347656, -0.1260223388671875, -0.12036705017089844, -0.11471176147460938, -0.10905647277832031, -0.10340118408203125, -0.09774589538574219, -0.09209060668945312, -0.08643531799316406, -0.080780029296875, -0.07512474060058594, -0.06946945190429688, -0.06381416320800781, -0.05815887451171875, -0.05250358581542969, -0.046848297119140625, -0.04119300842285156, -0.0355377197265625, -0.029882431030273438, -0.024227142333984375, -0.018571853637695312, -0.01291656494140625, -0.0072612762451171875, -0.001605987548828125, 0.0040493011474609375, 0.00970458984375, 0.015359878540039062, 0.021015167236328125, 0.026670455932617188, 0.03232574462890625, 0.03798103332519531, 0.043636322021484375, 0.04929161071777344, 0.0549468994140625, 0.06060218811035156, 0.06625747680664062, 0.07191276550292969, 0.07756805419921875, 0.08322334289550781, 0.08887863159179688, 0.09453392028808594, 0.100189208984375, 0.10584449768066406, 0.11149978637695312, 0.11715507507324219, 0.12281036376953125, 0.1284656524658203, 0.13412094116210938, 0.13977622985839844, 0.1454315185546875, 0.15108680725097656, 0.15674209594726562, 0.1623973846435547, 0.16805267333984375, 0.1737079620361328, 0.17936325073242188, 0.18501853942871094, 0.190673828125]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 7.0, 6.0, 7.0, 8.0, 3.0, 13.0, 15.0, 20.0, 27.0, 32.0, 35.0, 52.0, 52.0, 73.0, 68.0, 90.0, 75.0, 81.0, 47.0, 54.0, 48.0, 45.0, 28.0, 23.0, 13.0, 14.0, 13.0, 15.0, 6.0, 10.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 3.0, 1.0, 4.0, 0.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.3451786041259766e-05, -4.2242929339408875e-05, -4.1034072637557983e-05, -3.982521593570709e-05, -3.86163592338562e-05, -3.740750253200531e-05, -3.619864583015442e-05, -3.498978912830353e-05, -3.378093242645264e-05, -3.2572075724601746e-05, -3.1363219022750854e-05, -3.0154362320899963e-05, -2.8945505619049072e-05, -2.773664891719818e-05, -2.652779221534729e-05, -2.53189355134964e-05, -2.4110078811645508e-05, -2.2901222109794617e-05, -2.1692365407943726e-05, -2.0483508706092834e-05, -1.9274652004241943e-05, -1.8065795302391052e-05, -1.685693860054016e-05, -1.564808189868927e-05, -1.4439225196838379e-05, -1.3230368494987488e-05, -1.2021511793136597e-05, -1.0812655091285706e-05, -9.603798389434814e-06, -8.394941687583923e-06, -7.186084985733032e-06, -5.977228283882141e-06, -4.76837158203125e-06, -3.559514880180359e-06, -2.3506581783294678e-06, -1.1418014764785767e-06, 6.705522537231445e-08, 1.2759119272232056e-06, 2.4847686290740967e-06, 3.693625330924988e-06, 4.902482032775879e-06, 6.11133873462677e-06, 7.320195436477661e-06, 8.529052138328552e-06, 9.737908840179443e-06, 1.0946765542030334e-05, 1.2155622243881226e-05, 1.3364478945732117e-05, 1.4573335647583008e-05, 1.57821923494339e-05, 1.699104905128479e-05, 1.819990575313568e-05, 1.9408762454986572e-05, 2.0617619156837463e-05, 2.1826475858688354e-05, 2.3035332560539246e-05, 2.4244189262390137e-05, 2.5453045964241028e-05, 2.666190266609192e-05, 2.787075936794281e-05, 2.90796160697937e-05, 3.0288472771644592e-05, 3.1497329473495483e-05, 3.2706186175346375e-05, 3.3915042877197266e-05]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 6.0, 10.0, 3.0, 8.0, 10.0, 7.0, 10.0, 18.0, 27.0, 43.0, 46.0, 89.0, 123.0, 216.0, 389.0, 772.0, 1678.0, 3877.0, 11100.0, 39134.0, 181768.0, 670878.0, 100923.0, 24463.0, 7409.0, 2828.0, 1239.0, 614.0, 314.0, 203.0, 107.0, 59.0, 55.0, 48.0, 23.0, 17.0, 14.0, 13.0, 3.0, 7.0, 2.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.1983642578125, -0.19258499145507812, -0.18680572509765625, -0.18102645874023438, -0.1752471923828125, -0.16946792602539062, -0.16368865966796875, -0.15790939331054688, -0.152130126953125, -0.14635086059570312, -0.14057159423828125, -0.13479232788085938, -0.1290130615234375, -0.12323379516601562, -0.11745452880859375, -0.11167526245117188, -0.10589599609375, -0.10011672973632812, -0.09433746337890625, -0.08855819702148438, -0.0827789306640625, -0.07699966430664062, -0.07122039794921875, -0.06544113159179688, -0.059661865234375, -0.053882598876953125, -0.04810333251953125, -0.042324066162109375, -0.0365447998046875, -0.030765533447265625, -0.02498626708984375, -0.019207000732421875, -0.013427734375, -0.007648468017578125, -0.00186920166015625, 0.003910064697265625, 0.0096893310546875, 0.015468597412109375, 0.02124786376953125, 0.027027130126953125, 0.032806396484375, 0.038585662841796875, 0.04436492919921875, 0.050144195556640625, 0.0559234619140625, 0.061702728271484375, 0.06748199462890625, 0.07326126098632812, 0.07904052734375, 0.08481979370117188, 0.09059906005859375, 0.09637832641601562, 0.1021575927734375, 0.10793685913085938, 0.11371612548828125, 0.11949539184570312, 0.125274658203125, 0.13105392456054688, 0.13683319091796875, 0.14261245727539062, 0.1483917236328125, 0.15417098999023438, 0.15995025634765625, 0.16572952270507812, 0.1715087890625]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 2.0, 7.0, 10.0, 6.0, 6.0, 11.0, 27.0, 27.0, 45.0, 63.0, 85.0, 89.0, 112.0, 124.0, 95.0, 82.0, 47.0, 35.0, 37.0, 28.0, 18.0, 16.0, 12.0, 8.0, 1.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.2266845703125, -0.21959495544433594, -0.21250534057617188, -0.2054157257080078, -0.19832611083984375, -0.1912364959716797, -0.18414688110351562, -0.17705726623535156, -0.1699676513671875, -0.16287803649902344, -0.15578842163085938, -0.1486988067626953, -0.14160919189453125, -0.1345195770263672, -0.12742996215820312, -0.12034034729003906, -0.113250732421875, -0.10616111755371094, -0.09907150268554688, -0.09198188781738281, -0.08489227294921875, -0.07780265808105469, -0.07071304321289062, -0.06362342834472656, -0.0565338134765625, -0.04944419860839844, -0.042354583740234375, -0.03526496887207031, -0.02817535400390625, -0.021085739135742188, -0.013996124267578125, -0.0069065093994140625, 0.00018310546875, 0.0072727203369140625, 0.014362335205078125, 0.021451950073242188, 0.02854156494140625, 0.03563117980957031, 0.042720794677734375, 0.04981040954589844, 0.0569000244140625, 0.06398963928222656, 0.07107925415039062, 0.07816886901855469, 0.08525848388671875, 0.09234809875488281, 0.09943771362304688, 0.10652732849121094, 0.113616943359375, 0.12070655822753906, 0.12779617309570312, 0.1348857879638672, 0.14197540283203125, 0.1490650177001953, 0.15615463256835938, 0.16324424743652344, 0.1703338623046875, 0.17742347717285156, 0.18451309204101562, 0.1916027069091797, 0.19869232177734375, 0.2057819366455078, 0.21287155151367188, 0.21996116638183594, 0.22705078125]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 0.0, 0.0, 3.0, 3.0, 4.0, 18.0, 27.0, 80.0, 118.0, 270.0, 249.0, 103.0, 64.0, 37.0, 11.0, 7.0, 5.0, 4.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.340597629547119, -5.156380653381348, -4.972163677215576, -4.787946701049805, -4.603730201721191, -4.41951322555542, -4.235296249389648, -4.051079273223877, -3.8668625354766846, -3.682645559310913, -3.4984288215637207, -3.314211845397949, -3.1299948692321777, -2.9457781314849854, -2.761561155319214, -2.5773444175720215, -2.39312744140625, -2.2089104652404785, -2.024693727493286, -1.8404767513275146, -1.6562598943710327, -1.4720430374145508, -1.2878260612487793, -1.1036092042922974, -0.9193923473358154, -0.7351754903793335, -0.5509585738182068, -0.3667416572570801, -0.18252480030059814, 0.001692056655883789, 0.18590903282165527, 0.3701258897781372, 0.5543432235717773, 0.7385600805282593, 0.922776997089386, 1.1069939136505127, 1.2912107706069946, 1.4754276275634766, 1.659644603729248, 1.84386146068573, 2.028078317642212, 2.2122952938079834, 2.396512031555176, 2.5807290077209473, 2.7649459838867188, 2.949162721633911, 3.1333796977996826, 3.317596435546875, 3.5018134117126465, 3.686030387878418, 3.8702471256256104, 4.054464340209961, 4.238680839538574, 4.422897815704346, 4.607114791870117, 4.791331768035889, 4.97554874420166, 5.159765720367432, 5.343982696533203, 5.528199195861816, 5.712416172027588, 5.896633148193359, 6.080850124359131, 6.265067100524902, 6.449283599853516]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 3.0, 5.0, 2.0, 10.0, 9.0, 7.0, 16.0, 11.0, 8.0, 21.0, 17.0, 21.0, 24.0, 24.0, 45.0, 31.0, 28.0, 54.0, 83.0, 93.0, 106.0, 72.0, 43.0, 45.0, 25.0, 28.0, 23.0, 15.0, 16.0, 18.0, 26.0, 14.0, 10.0, 15.0, 6.0, 4.0, 4.0, 7.0, 4.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0], "bins": [-3.094390869140625, -2.9970617294311523, -2.8997323513031006, -2.802403211593628, -2.705073833465576, -2.6077446937561035, -2.510415554046631, -2.413086175918579, -2.3157570362091064, -2.218427896499634, -2.121098518371582, -2.0237693786621094, -1.9264401197433472, -1.829110860824585, -1.7317816019058228, -1.6344523429870605, -1.5371230840682983, -1.4397938251495361, -1.342464566230774, -1.2451353073120117, -1.147806167602539, -1.0504769086837769, -0.9531476497650146, -0.8558184504508972, -0.758489191532135, -0.6611599326133728, -0.5638307332992554, -0.46650147438049316, -0.36917224526405334, -0.2718430161476135, -0.17451375722885132, -0.07718455791473389, 0.02014470100402832, 0.11747393757104874, 0.21480317413806915, 0.31213241815567017, 0.40946164727211, 0.5067908763885498, 0.604120135307312, 0.7014493346214294, 0.7987785935401917, 0.8961078524589539, 0.9934370517730713, 1.0907663106918335, 1.1880955696105957, 1.2854247093200684, 1.3827540874481201, 1.4800832271575928, 1.577412486076355, 1.6747417449951172, 1.7720710039138794, 1.8694002628326416, 1.9667294025421143, 2.064058780670166, 2.1613879203796387, 2.2587170600891113, 2.356046438217163, 2.4533755779266357, 2.5507049560546875, 2.64803409576416, 2.745363473892212, 2.8426926136016846, 2.9400219917297363, 3.037351131439209, 3.1346802711486816]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 5.0, 2.0, 5.0, 1.0, 3.0, 4.0, 6.0, 6.0, 17.0, 10.0, 22.0, 31.0, 40.0, 56.0, 69.0, 151.0, 269.0, 489.0, 1103.0, 2568.0, 7047.0, 25203.0, 147019.0, 1351138.0, 2298150.0, 302512.0, 41671.0, 10469.0, 3565.0, 1360.0, 619.0, 302.0, 142.0, 90.0, 48.0, 24.0, 33.0, 16.0, 5.0, 5.0, 6.0, 1.0, 2.0, 3.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.392822265625, -0.38132476806640625, -0.3698272705078125, -0.35832977294921875, -0.346832275390625, -0.33533477783203125, -0.3238372802734375, -0.31233978271484375, -0.30084228515625, -0.28934478759765625, -0.2778472900390625, -0.26634979248046875, -0.254852294921875, -0.24335479736328125, -0.2318572998046875, -0.22035980224609375, -0.2088623046875, -0.19736480712890625, -0.1858673095703125, -0.17436981201171875, -0.162872314453125, -0.15137481689453125, -0.1398773193359375, -0.12837982177734375, -0.11688232421875, -0.10538482666015625, -0.0938873291015625, -0.08238983154296875, -0.070892333984375, -0.05939483642578125, -0.0478973388671875, -0.03639984130859375, -0.02490234375, -0.01340484619140625, -0.0019073486328125, 0.00959014892578125, 0.021087646484375, 0.03258514404296875, 0.0440826416015625, 0.05558013916015625, 0.06707763671875, 0.07857513427734375, 0.0900726318359375, 0.10157012939453125, 0.113067626953125, 0.12456512451171875, 0.1360626220703125, 0.14756011962890625, 0.1590576171875, 0.17055511474609375, 0.1820526123046875, 0.19355010986328125, 0.205047607421875, 0.21654510498046875, 0.2280426025390625, 0.23954010009765625, 0.25103759765625, 0.26253509521484375, 0.2740325927734375, 0.28553009033203125, 0.297027587890625, 0.30852508544921875, 0.3200225830078125, 0.33152008056640625, 0.343017578125]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 9.0, 8.0, 7.0, 7.0, 8.0, 13.0, 16.0, 15.0, 11.0, 16.0, 33.0, 20.0, 33.0, 26.0, 27.0, 28.0, 39.0, 46.0, 57.0, 35.0, 48.0, 48.0, 38.0, 46.0, 31.0, 47.0, 34.0, 34.0, 29.0, 32.0, 28.0, 22.0, 29.0, 14.0, 12.0, 13.0, 7.0, 6.0, 5.0, 8.0, 4.0, 3.0, 2.0, 4.0, 0.0, 4.0, 1.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0], "bins": [-0.202392578125, -0.19609451293945312, -0.18979644775390625, -0.18349838256835938, -0.1772003173828125, -0.17090225219726562, -0.16460418701171875, -0.15830612182617188, -0.152008056640625, -0.14570999145507812, -0.13941192626953125, -0.13311386108398438, -0.1268157958984375, -0.12051773071289062, -0.11421966552734375, -0.10792160034179688, -0.10162353515625, -0.09532546997070312, -0.08902740478515625, -0.08272933959960938, -0.0764312744140625, -0.07013320922851562, -0.06383514404296875, -0.057537078857421875, -0.051239013671875, -0.044940948486328125, -0.03864288330078125, -0.032344818115234375, -0.0260467529296875, -0.019748687744140625, -0.01345062255859375, -0.007152557373046875, -0.0008544921875, 0.005443572998046875, 0.01174163818359375, 0.018039703369140625, 0.0243377685546875, 0.030635833740234375, 0.03693389892578125, 0.043231964111328125, 0.049530029296875, 0.055828094482421875, 0.06212615966796875, 0.06842422485351562, 0.0747222900390625, 0.08102035522460938, 0.08731842041015625, 0.09361648559570312, 0.09991455078125, 0.10621261596679688, 0.11251068115234375, 0.11880874633789062, 0.1251068115234375, 0.13140487670898438, 0.13770294189453125, 0.14400100708007812, 0.150299072265625, 0.15659713745117188, 0.16289520263671875, 0.16919326782226562, 0.1754913330078125, 0.18178939819335938, 0.18808746337890625, 0.19438552856445312, 0.20068359375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 6.0, 10.0, 11.0, 7.0, 23.0, 37.0, 36.0, 61.0, 94.0, 193.0, 298.0, 772.0, 2858.0, 21980.0, 757444.0, 3348441.0, 54896.0, 5076.0, 1066.0, 404.0, 217.0, 127.0, 71.0, 50.0, 38.0, 25.0, 17.0, 12.0, 2.0, 2.0, 5.0, 5.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7392578125, -0.7120513916015625, -0.684844970703125, -0.6576385498046875, -0.63043212890625, -0.6032257080078125, -0.576019287109375, -0.5488128662109375, -0.5216064453125, -0.4944000244140625, -0.467193603515625, -0.4399871826171875, -0.41278076171875, -0.3855743408203125, -0.358367919921875, -0.3311614990234375, -0.303955078125, -0.2767486572265625, -0.249542236328125, -0.2223358154296875, -0.19512939453125, -0.1679229736328125, -0.140716552734375, -0.1135101318359375, -0.0863037109375, -0.0590972900390625, -0.031890869140625, -0.0046844482421875, 0.02252197265625, 0.0497283935546875, 0.076934814453125, 0.1041412353515625, 0.13134765625, 0.1585540771484375, 0.185760498046875, 0.2129669189453125, 0.24017333984375, 0.2673797607421875, 0.294586181640625, 0.3217926025390625, 0.3489990234375, 0.3762054443359375, 0.403411865234375, 0.4306182861328125, 0.45782470703125, 0.4850311279296875, 0.512237548828125, 0.5394439697265625, 0.566650390625, 0.5938568115234375, 0.621063232421875, 0.6482696533203125, 0.67547607421875, 0.7026824951171875, 0.729888916015625, 0.7570953369140625, 0.7843017578125, 0.8115081787109375, 0.838714599609375, 0.8659210205078125, 0.89312744140625, 0.9203338623046875, 0.947540283203125, 0.9747467041015625, 1.001953125]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 5.0, 6.0, 10.0, 16.0, 17.0, 21.0, 26.0, 54.0, 79.0, 104.0, 140.0, 247.0, 379.0, 621.0, 733.0, 584.0, 398.0, 194.0, 155.0, 93.0, 68.0, 33.0, 25.0, 21.0, 14.0, 7.0, 8.0, 4.0, 6.0, 5.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.56689453125, -0.548828125, -0.53076171875, -0.5126953125, -0.49462890625, -0.4765625, -0.45849609375, -0.4404296875, -0.42236328125, -0.404296875, -0.38623046875, -0.3681640625, -0.35009765625, -0.33203125, -0.31396484375, -0.2958984375, -0.27783203125, -0.259765625, -0.24169921875, -0.2236328125, -0.20556640625, -0.1875, -0.16943359375, -0.1513671875, -0.13330078125, -0.115234375, -0.09716796875, -0.0791015625, -0.06103515625, -0.04296875, -0.02490234375, -0.0068359375, 0.01123046875, 0.029296875, 0.04736328125, 0.0654296875, 0.08349609375, 0.1015625, 0.11962890625, 0.1376953125, 0.15576171875, 0.173828125, 0.19189453125, 0.2099609375, 0.22802734375, 0.24609375, 0.26416015625, 0.2822265625, 0.30029296875, 0.318359375, 0.33642578125, 0.3544921875, 0.37255859375, 0.390625, 0.40869140625, 0.4267578125, 0.44482421875, 0.462890625, 0.48095703125, 0.4990234375, 0.51708984375, 0.53515625, 0.55322265625, 0.5712890625, 0.58935546875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 3.0, 4.0, 7.0, 15.0, 36.0, 85.0, 185.0, 294.0, 208.0, 101.0, 43.0, 19.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-11.564440727233887, -11.305808067321777, -11.047175407409668, -10.788542747497559, -10.52991008758545, -10.27127742767334, -10.01264476776123, -9.754013061523438, -9.495380401611328, -9.236747741699219, -8.97811508178711, -8.719482421875, -8.46084976196289, -8.202217102050781, -7.94358491897583, -7.684952259063721, -7.426319122314453, -7.167686462402344, -6.909053802490234, -6.650421142578125, -6.391788482666016, -6.133155822753906, -5.874523639678955, -5.615890979766846, -5.357258319854736, -5.098625659942627, -4.839993000030518, -4.581360340118408, -4.322728157043457, -4.064095497131348, -3.8054628372192383, -3.546830177307129, -3.288198471069336, -3.0295658111572266, -2.770933151245117, -2.512300729751587, -2.2536680698394775, -1.9950354099273682, -1.7364028692245483, -1.4777703285217285, -1.2191376686096191, -0.9605050683021545, -0.7018724679946899, -0.44323986768722534, -0.18460726737976074, 0.07402539253234863, 0.33265793323516846, 0.5912904739379883, 0.8499231338500977, 1.108555793762207, 1.3671883344650269, 1.6258208751678467, 1.884453535079956, 2.1430861949920654, 2.4017186164855957, 2.660351276397705, 2.9189839363098145, 3.177616596221924, 3.436249256134033, 3.6948816776275635, 3.953514337539673, 4.212146759033203, 4.4707794189453125, 4.729412078857422, 4.988044738769531]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 1.0, 4.0, 7.0, 6.0, 7.0, 8.0, 7.0, 11.0, 11.0, 10.0, 18.0, 11.0, 16.0, 33.0, 24.0, 32.0, 27.0, 37.0, 43.0, 53.0, 55.0, 46.0, 46.0, 54.0, 58.0, 40.0, 53.0, 38.0, 32.0, 34.0, 23.0, 20.0, 21.0, 23.0, 17.0, 19.0, 13.0, 13.0, 10.0, 12.0, 4.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1057796478271484, -2.0328540802001953, -1.959928274154663, -1.8870025873184204, -1.8140769004821777, -1.7411513328552246, -1.668225646018982, -1.5952999591827393, -1.5223742723464966, -1.449448585510254, -1.3765228986740112, -1.3035972118377686, -1.2306716442108154, -1.1577458381652832, -1.08482027053833, -1.0118945837020874, -0.9389688968658447, -0.866043210029602, -0.7931175231933594, -0.7201918959617615, -0.6472662091255188, -0.5743405222892761, -0.5014148950576782, -0.42848920822143555, -0.35556352138519287, -0.2826378345489502, -0.2097121775150299, -0.13678650557994843, -0.06386083364486694, 0.009064853191375732, 0.08199051022529602, 0.1549161672592163, 0.22784161567687988, 0.30076730251312256, 0.37369295954704285, 0.44661861658096313, 0.5195443034172058, 0.5924699902534485, 0.6653956174850464, 0.7383213043212891, 0.8112469911575317, 0.8841726779937744, 0.9570983648300171, 1.0300240516662598, 1.102949619293213, 1.1758754253387451, 1.2488009929656982, 1.321726679801941, 1.3946523666381836, 1.4675780534744263, 1.540503740310669, 1.6134294271469116, 1.6863551139831543, 1.7592806816101074, 1.83220636844635, 1.9051320552825928, 1.9780577421188354, 2.050983428955078, 2.1239089965820312, 2.1968348026275635, 2.2697603702545166, 2.342686176300049, 2.415611743927002, 2.488537311553955, 2.5614631175994873]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 2.0, 3.0, 4.0, 6.0, 12.0, 26.0, 32.0, 44.0, 86.0, 127.0, 207.0, 356.0, 606.0, 1290.0, 2628.0, 5677.0, 13424.0, 37914.0, 127126.0, 433049.0, 300831.0, 81023.0, 25759.0, 9710.0, 4269.0, 2042.0, 994.0, 539.0, 321.0, 174.0, 95.0, 59.0, 41.0, 25.0, 18.0, 14.0, 9.0, 5.0, 10.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.482666015625, -0.4670066833496094, -0.45134735107421875, -0.4356880187988281, -0.4200286865234375, -0.4043693542480469, -0.38871002197265625, -0.3730506896972656, -0.357391357421875, -0.3417320251464844, -0.32607269287109375, -0.3104133605957031, -0.2947540283203125, -0.2790946960449219, -0.26343536376953125, -0.24777603149414062, -0.23211669921875, -0.21645736694335938, -0.20079803466796875, -0.18513870239257812, -0.1694793701171875, -0.15382003784179688, -0.13816070556640625, -0.12250137329101562, -0.106842041015625, -0.09118270874023438, -0.07552337646484375, -0.059864044189453125, -0.0442047119140625, -0.028545379638671875, -0.01288604736328125, 0.002773284912109375, 0.0184326171875, 0.034091949462890625, 0.04975128173828125, 0.06541061401367188, 0.0810699462890625, 0.09672927856445312, 0.11238861083984375, 0.12804794311523438, 0.143707275390625, 0.15936660766601562, 0.17502593994140625, 0.19068527221679688, 0.2063446044921875, 0.22200393676757812, 0.23766326904296875, 0.2533226013183594, 0.26898193359375, 0.2846412658691406, 0.30030059814453125, 0.3159599304199219, 0.3316192626953125, 0.3472785949707031, 0.36293792724609375, 0.3785972595214844, 0.394256591796875, 0.4099159240722656, 0.42557525634765625, 0.4412345886230469, 0.4568939208984375, 0.4725532531738281, 0.48821258544921875, 0.5038719177246094, 0.51953125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 2.0, 10.0, 13.0, 7.0, 9.0, 8.0, 12.0, 11.0, 17.0, 17.0, 21.0, 30.0, 33.0, 21.0, 40.0, 29.0, 42.0, 53.0, 44.0, 49.0, 39.0, 53.0, 41.0, 49.0, 40.0, 44.0, 33.0, 24.0, 35.0, 30.0, 19.0, 24.0, 19.0, 13.0, 14.0, 10.0, 11.0, 10.0, 6.0, 2.0, 2.0, 3.0, 5.0, 1.0, 4.0, 3.0, 3.0, 3.0, 2.0, 3.0], "bins": [-0.2440185546875, -0.237030029296875, -0.23004150390625, -0.223052978515625, -0.216064453125, -0.209075927734375, -0.20208740234375, -0.195098876953125, -0.1881103515625, -0.181121826171875, -0.17413330078125, -0.167144775390625, -0.16015625, -0.153167724609375, -0.14617919921875, -0.139190673828125, -0.1322021484375, -0.125213623046875, -0.11822509765625, -0.111236572265625, -0.104248046875, -0.097259521484375, -0.09027099609375, -0.083282470703125, -0.0762939453125, -0.069305419921875, -0.06231689453125, -0.055328369140625, -0.04833984375, -0.041351318359375, -0.03436279296875, -0.027374267578125, -0.0203857421875, -0.013397216796875, -0.00640869140625, 0.000579833984375, 0.007568359375, 0.014556884765625, 0.02154541015625, 0.028533935546875, 0.0355224609375, 0.042510986328125, 0.04949951171875, 0.056488037109375, 0.0634765625, 0.070465087890625, 0.07745361328125, 0.084442138671875, 0.0914306640625, 0.098419189453125, 0.10540771484375, 0.112396240234375, 0.119384765625, 0.126373291015625, 0.13336181640625, 0.140350341796875, 0.1473388671875, 0.154327392578125, 0.16131591796875, 0.168304443359375, 0.17529296875, 0.182281494140625, 0.18927001953125, 0.196258544921875, 0.2032470703125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 4.0, 11.0, 15.0, 24.0, 29.0, 43.0, 62.0, 75.0, 132.0, 205.0, 377.0, 606.0, 1097.0, 2842.0, 14924.0, 267443.0, 730418.0, 23564.0, 3658.0, 1300.0, 683.0, 399.0, 203.0, 130.0, 99.0, 66.0, 40.0, 33.0, 24.0, 16.0, 15.0, 12.0, 3.0, 0.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.109375, -1.0777664184570312, -1.0461578369140625, -1.0145492553710938, -0.982940673828125, -0.9513320922851562, -0.9197235107421875, -0.8881149291992188, -0.85650634765625, -0.8248977661132812, -0.7932891845703125, -0.7616806030273438, -0.730072021484375, -0.6984634399414062, -0.6668548583984375, -0.6352462768554688, -0.6036376953125, -0.5720291137695312, -0.5404205322265625, -0.5088119506835938, -0.477203369140625, -0.44559478759765625, -0.4139862060546875, -0.38237762451171875, -0.35076904296875, -0.31916046142578125, -0.2875518798828125, -0.25594329833984375, -0.224334716796875, -0.19272613525390625, -0.1611175537109375, -0.12950897216796875, -0.097900390625, -0.06629180908203125, -0.0346832275390625, -0.00307464599609375, 0.028533935546875, 0.06014251708984375, 0.0917510986328125, 0.12335968017578125, 0.15496826171875, 0.18657684326171875, 0.2181854248046875, 0.24979400634765625, 0.281402587890625, 0.31301116943359375, 0.3446197509765625, 0.37622833251953125, 0.4078369140625, 0.43944549560546875, 0.4710540771484375, 0.5026626586914062, 0.534271240234375, 0.5658798217773438, 0.5974884033203125, 0.6290969848632812, 0.66070556640625, 0.6923141479492188, 0.7239227294921875, 0.7555313110351562, 0.787139892578125, 0.8187484741210938, 0.8503570556640625, 0.8819656372070312, 0.91357421875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 4.0, 3.0, 5.0, 3.0, 6.0, 8.0, 9.0, 14.0, 13.0, 14.0, 20.0, 28.0, 40.0, 51.0, 43.0, 53.0, 63.0, 77.0, 74.0, 71.0, 62.0, 55.0, 49.0, 39.0, 50.0, 33.0, 33.0, 23.0, 13.0, 13.0, 7.0, 9.0, 9.0, 9.0, 2.0, 4.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.78857421875, -0.7539749145507812, -0.7193756103515625, -0.6847763061523438, -0.650177001953125, -0.6155776977539062, -0.5809783935546875, -0.5463790893554688, -0.51177978515625, -0.47718048095703125, -0.4425811767578125, -0.40798187255859375, -0.373382568359375, -0.33878326416015625, -0.3041839599609375, -0.26958465576171875, -0.2349853515625, -0.20038604736328125, -0.1657867431640625, -0.13118743896484375, -0.096588134765625, -0.06198883056640625, -0.0273895263671875, 0.00720977783203125, 0.04180908203125, 0.07640838623046875, 0.1110076904296875, 0.14560699462890625, 0.180206298828125, 0.21480560302734375, 0.2494049072265625, 0.28400421142578125, 0.318603515625, 0.35320281982421875, 0.3878021240234375, 0.42240142822265625, 0.457000732421875, 0.49160003662109375, 0.5261993408203125, 0.5607986450195312, 0.59539794921875, 0.6299972534179688, 0.6645965576171875, 0.6991958618164062, 0.733795166015625, 0.7683944702148438, 0.8029937744140625, 0.8375930786132812, 0.8721923828125, 0.9067916870117188, 0.9413909912109375, 0.9759902954101562, 1.010589599609375, 1.0451889038085938, 1.0797882080078125, 1.1143875122070312, 1.14898681640625, 1.1835861206054688, 1.2181854248046875, 1.2527847290039062, 1.287384033203125, 1.3219833374023438, 1.3565826416015625, 1.3911819458007812, 1.42578125]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 5.0, 0.0, 7.0, 6.0, 9.0, 7.0, 12.0, 14.0, 22.0, 24.0, 36.0, 57.0, 85.0, 131.0, 276.0, 560.0, 1379.0, 4342.0, 22274.0, 205298.0, 757744.0, 45255.0, 7414.0, 2005.0, 763.0, 317.0, 194.0, 105.0, 61.0, 50.0, 27.0, 30.0, 10.0, 12.0, 3.0, 7.0, 6.0, 3.0, 3.0, 5.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.2156982421875, -0.20830726623535156, -0.20091629028320312, -0.1935253143310547, -0.18613433837890625, -0.1787433624267578, -0.17135238647460938, -0.16396141052246094, -0.1565704345703125, -0.14917945861816406, -0.14178848266601562, -0.1343975067138672, -0.12700653076171875, -0.11961555480957031, -0.11222457885742188, -0.10483360290527344, -0.097442626953125, -0.09005165100097656, -0.08266067504882812, -0.07526969909667969, -0.06787872314453125, -0.06048774719238281, -0.053096771240234375, -0.04570579528808594, -0.0383148193359375, -0.030923843383789062, -0.023532867431640625, -0.016141891479492188, -0.00875091552734375, -0.0013599395751953125, 0.006031036376953125, 0.013422012329101562, 0.02081298828125, 0.028203964233398438, 0.035594940185546875, 0.04298591613769531, 0.05037689208984375, 0.05776786804199219, 0.06515884399414062, 0.07254981994628906, 0.0799407958984375, 0.08733177185058594, 0.09472274780273438, 0.10211372375488281, 0.10950469970703125, 0.11689567565917969, 0.12428665161132812, 0.13167762756347656, 0.139068603515625, 0.14645957946777344, 0.15385055541992188, 0.1612415313720703, 0.16863250732421875, 0.1760234832763672, 0.18341445922851562, 0.19080543518066406, 0.1981964111328125, 0.20558738708496094, 0.21297836303710938, 0.2203693389892578, 0.22776031494140625, 0.2351512908935547, 0.24254226684570312, 0.24993324279785156, 0.25732421875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 8.0, 3.0, 6.0, 6.0, 13.0, 10.0, 23.0, 13.0, 36.0, 47.0, 65.0, 73.0, 130.0, 129.0, 100.0, 93.0, 58.0, 41.0, 34.0, 26.0, 21.0, 16.0, 15.0, 10.0, 5.0, 4.0, 6.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.687641143798828e-05, -6.481911987066269e-05, -6.27618283033371e-05, -6.0704536736011505e-05, -5.864724516868591e-05, -5.658995360136032e-05, -5.453266203403473e-05, -5.247537046670914e-05, -5.0418078899383545e-05, -4.836078733205795e-05, -4.630349576473236e-05, -4.424620419740677e-05, -4.218891263008118e-05, -4.0131621062755585e-05, -3.807432949542999e-05, -3.60170379281044e-05, -3.395974636077881e-05, -3.1902454793453217e-05, -2.9845163226127625e-05, -2.7787871658802032e-05, -2.573058009147644e-05, -2.367328852415085e-05, -2.1615996956825256e-05, -1.9558705389499664e-05, -1.7501413822174072e-05, -1.544412225484848e-05, -1.3386830687522888e-05, -1.1329539120197296e-05, -9.272247552871704e-06, -7.214955985546112e-06, -5.15766441822052e-06, -3.100372850894928e-06, -1.043081283569336e-06, 1.014210283756256e-06, 3.071501851081848e-06, 5.12879341840744e-06, 7.186084985733032e-06, 9.243376553058624e-06, 1.1300668120384216e-05, 1.3357959687709808e-05, 1.54152512550354e-05, 1.7472542822360992e-05, 1.9529834389686584e-05, 2.1587125957012177e-05, 2.364441752433777e-05, 2.570170909166336e-05, 2.7759000658988953e-05, 2.9816292226314545e-05, 3.187358379364014e-05, 3.393087536096573e-05, 3.598816692829132e-05, 3.804545849561691e-05, 4.0102750062942505e-05, 4.21600416302681e-05, 4.421733319759369e-05, 4.627462476491928e-05, 4.833191633224487e-05, 5.0389207899570465e-05, 5.244649946689606e-05, 5.450379103422165e-05, 5.656108260154724e-05, 5.861837416887283e-05, 6.0675665736198425e-05, 6.273295730352402e-05, 6.479024887084961e-05]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 3.0, 17.0, 11.0, 17.0, 28.0, 25.0, 31.0, 53.0, 72.0, 98.0, 173.0, 338.0, 613.0, 1139.0, 2461.0, 7072.0, 28783.0, 178364.0, 726128.0, 79621.0, 15387.0, 4392.0, 1735.0, 852.0, 415.0, 234.0, 175.0, 107.0, 61.0, 41.0, 25.0, 28.0, 11.0, 10.0, 7.0, 5.0, 9.0, 6.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.193359375, -0.18755149841308594, -0.18174362182617188, -0.1759357452392578, -0.17012786865234375, -0.1643199920654297, -0.15851211547851562, -0.15270423889160156, -0.1468963623046875, -0.14108848571777344, -0.13528060913085938, -0.1294727325439453, -0.12366485595703125, -0.11785697937011719, -0.11204910278320312, -0.10624122619628906, -0.100433349609375, -0.09462547302246094, -0.08881759643554688, -0.08300971984863281, -0.07720184326171875, -0.07139396667480469, -0.06558609008789062, -0.05977821350097656, -0.0539703369140625, -0.04816246032714844, -0.042354583740234375, -0.03654670715332031, -0.03073883056640625, -0.024930953979492188, -0.019123077392578125, -0.013315200805664062, -0.00750732421875, -0.0016994476318359375, 0.004108428955078125, 0.009916305541992188, 0.01572418212890625, 0.021532058715820312, 0.027339935302734375, 0.03314781188964844, 0.0389556884765625, 0.04476356506347656, 0.050571441650390625, 0.05637931823730469, 0.06218719482421875, 0.06799507141113281, 0.07380294799804688, 0.07961082458496094, 0.085418701171875, 0.09122657775878906, 0.09703445434570312, 0.10284233093261719, 0.10865020751953125, 0.11445808410644531, 0.12026596069335938, 0.12607383728027344, 0.1318817138671875, 0.13768959045410156, 0.14349746704101562, 0.1493053436279297, 0.15511322021484375, 0.1609210968017578, 0.16672897338867188, 0.17253684997558594, 0.1783447265625]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 3.0, 4.0, 6.0, 6.0, 13.0, 10.0, 11.0, 13.0, 13.0, 12.0, 27.0, 25.0, 29.0, 34.0, 52.0, 48.0, 56.0, 67.0, 81.0, 69.0, 78.0, 59.0, 52.0, 57.0, 33.0, 25.0, 19.0, 16.0, 18.0, 10.0, 10.0, 12.0, 9.0, 6.0, 4.0, 2.0, 4.0, 2.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 3.0], "bins": [-0.1552734375, -0.15093040466308594, -0.14658737182617188, -0.1422443389892578, -0.13790130615234375, -0.1335582733154297, -0.12921524047851562, -0.12487220764160156, -0.1205291748046875, -0.11618614196777344, -0.11184310913085938, -0.10750007629394531, -0.10315704345703125, -0.09881401062011719, -0.09447097778320312, -0.09012794494628906, -0.085784912109375, -0.08144187927246094, -0.07709884643554688, -0.07275581359863281, -0.06841278076171875, -0.06406974792480469, -0.059726715087890625, -0.05538368225097656, -0.0510406494140625, -0.04669761657714844, -0.042354583740234375, -0.03801155090332031, -0.03366851806640625, -0.029325485229492188, -0.024982452392578125, -0.020639419555664062, -0.01629638671875, -0.011953353881835938, -0.007610321044921875, -0.0032672882080078125, 0.00107574462890625, 0.0054187774658203125, 0.009761810302734375, 0.014104843139648438, 0.0184478759765625, 0.022790908813476562, 0.027133941650390625, 0.03147697448730469, 0.03582000732421875, 0.04016304016113281, 0.044506072998046875, 0.04884910583496094, 0.053192138671875, 0.05753517150878906, 0.061878204345703125, 0.06622123718261719, 0.07056427001953125, 0.07490730285644531, 0.07925033569335938, 0.08359336853027344, 0.0879364013671875, 0.09227943420410156, 0.09662246704101562, 0.10096549987792969, 0.10530853271484375, 0.10965156555175781, 0.11399459838867188, 0.11833763122558594, 0.1226806640625]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 6.0, 10.0, 21.0, 54.0, 105.0, 351.0, 247.0, 118.0, 41.0, 15.0, 11.0, 10.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.291942596435547, -5.087686538696289, -4.883430004119873, -4.679173946380615, -4.474917411804199, -4.270661354064941, -4.066405296325684, -3.8621490001678467, -3.6578927040100098, -3.453636407852173, -3.249380111694336, -3.045124053955078, -2.840867757797241, -2.6366114616394043, -2.4323554039001465, -2.2280991077423096, -2.0238428115844727, -1.8195865154266357, -1.6153303384780884, -1.411074161529541, -1.206817865371704, -1.0025615692138672, -0.7983053922653198, -0.5940492153167725, -0.38979291915893555, -0.1855366826057434, 0.01871955394744873, 0.22297579050064087, 0.427232027053833, 0.6314883232116699, 0.8357445001602173, 1.0400006771087646, 1.2442569732666016, 1.4485132694244385, 1.6527694463729858, 1.8570256233215332, 2.06128191947937, 2.265538215637207, 2.469794273376465, 2.6740505695343018, 2.8783068656921387, 3.0825631618499756, 3.2868194580078125, 3.4910755157470703, 3.6953318119049072, 3.899588108062744, 4.103844165802002, 4.308100700378418, 4.512356758117676, 4.716612815856934, 4.92086935043335, 5.125125408172607, 5.329381942749023, 5.533638000488281, 5.737894058227539, 5.942150115966797, 6.146406650543213, 6.350662708282471, 6.554919242858887, 6.7591753005981445, 6.963431358337402, 7.167687892913818, 7.371943950653076, 7.576200485229492, 7.78045654296875]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 2.0, 4.0, 9.0, 5.0, 12.0, 10.0, 9.0, 16.0, 10.0, 20.0, 20.0, 19.0, 24.0, 23.0, 40.0, 38.0, 57.0, 93.0, 167.0, 98.0, 41.0, 40.0, 31.0, 27.0, 27.0, 28.0, 20.0, 24.0, 13.0, 10.0, 11.0, 12.0, 8.0, 8.0, 4.0, 4.0, 5.0, 3.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.988544225692749, -2.8904993534088135, -2.792454481124878, -2.6944098472595215, -2.596364974975586, -2.4983201026916504, -2.400275230407715, -2.3022303581237793, -2.2041854858398438, -2.106140613555908, -2.0080957412719727, -1.9100509881973267, -1.8120062351226807, -1.7139613628387451, -1.6159164905548096, -1.517871618270874, -1.4198269844055176, -1.321782112121582, -1.223737359046936, -1.1256924867630005, -1.0276477336883545, -0.929602861404419, -0.8315579891204834, -0.7335131764411926, -0.6354683637619019, -0.5374235510826111, -0.4393787086009979, -0.34133386611938477, -0.243289053440094, -0.14524424076080322, -0.047199368476867676, 0.050845444202423096, 0.14889049530029297, 0.24693532288074493, 0.3449801504611969, 0.44302499294281006, 0.5410698056221008, 0.6391146183013916, 0.7371594905853271, 0.8352043032646179, 0.9332491159439087, 1.0312939882278442, 1.1293387413024902, 1.2273836135864258, 1.3254284858703613, 1.4234732389450073, 1.5215181112289429, 1.6195628643035889, 1.7176077365875244, 1.81565260887146, 1.913697361946106, 2.011742115020752, 2.1097869873046875, 2.207831859588623, 2.3058767318725586, 2.403921604156494, 2.5019664764404297, 2.6000113487243652, 2.698056221008301, 2.7961010932922363, 2.8941457271575928, 2.9921905994415283, 3.090235471725464, 3.1882803440093994, 3.286324977874756]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 4.0, 6.0, 3.0, 12.0, 18.0, 28.0, 43.0, 74.0, 110.0, 191.0, 287.0, 532.0, 840.0, 1534.0, 2869.0, 6309.0, 16311.0, 54928.0, 254471.0, 1131101.0, 1908143.0, 636525.0, 128394.0, 31121.0, 10718.0, 4617.0, 2254.0, 1145.0, 666.0, 403.0, 212.0, 151.0, 111.0, 48.0, 37.0, 20.0, 14.0, 14.0, 7.0, 6.0, 2.0, 2.0, 3.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.310791015625, -0.2998046875, -0.288818359375, -0.27783203125, -0.266845703125, -0.255859375, -0.244873046875, -0.23388671875, -0.222900390625, -0.2119140625, -0.200927734375, -0.18994140625, -0.178955078125, -0.16796875, -0.156982421875, -0.14599609375, -0.135009765625, -0.1240234375, -0.113037109375, -0.10205078125, -0.091064453125, -0.080078125, -0.069091796875, -0.05810546875, -0.047119140625, -0.0361328125, -0.025146484375, -0.01416015625, -0.003173828125, 0.0078125, 0.018798828125, 0.02978515625, 0.040771484375, 0.0517578125, 0.062744140625, 0.07373046875, 0.084716796875, 0.095703125, 0.106689453125, 0.11767578125, 0.128662109375, 0.1396484375, 0.150634765625, 0.16162109375, 0.172607421875, 0.18359375, 0.194580078125, 0.20556640625, 0.216552734375, 0.2275390625, 0.238525390625, 0.24951171875, 0.260498046875, 0.271484375, 0.282470703125, 0.29345703125, 0.304443359375, 0.3154296875, 0.326416015625, 0.33740234375, 0.348388671875, 0.359375, 0.370361328125, 0.38134765625, 0.392333984375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 3.0, 2.0, 2.0, 7.0, 5.0, 6.0, 4.0, 7.0, 5.0, 8.0, 7.0, 12.0, 14.0, 12.0, 28.0, 24.0, 35.0, 26.0, 34.0, 27.0, 27.0, 47.0, 42.0, 42.0, 43.0, 49.0, 50.0, 38.0, 34.0, 41.0, 40.0, 17.0, 37.0, 32.0, 34.0, 28.0, 18.0, 17.0, 21.0, 21.0, 8.0, 10.0, 11.0, 10.0, 11.0, 4.0, 3.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1798095703125, -0.17360687255859375, -0.1674041748046875, -0.16120147705078125, -0.154998779296875, -0.14879608154296875, -0.1425933837890625, -0.13639068603515625, -0.13018798828125, -0.12398529052734375, -0.1177825927734375, -0.11157989501953125, -0.105377197265625, -0.09917449951171875, -0.0929718017578125, -0.08676910400390625, -0.08056640625, -0.07436370849609375, -0.0681610107421875, -0.06195831298828125, -0.055755615234375, -0.04955291748046875, -0.0433502197265625, -0.03714752197265625, -0.03094482421875, -0.02474212646484375, -0.0185394287109375, -0.01233673095703125, -0.006134033203125, 6.866455078125e-05, 0.0062713623046875, 0.01247406005859375, 0.0186767578125, 0.02487945556640625, 0.0310821533203125, 0.03728485107421875, 0.043487548828125, 0.04969024658203125, 0.0558929443359375, 0.06209564208984375, 0.06829833984375, 0.07450103759765625, 0.0807037353515625, 0.08690643310546875, 0.093109130859375, 0.09931182861328125, 0.1055145263671875, 0.11171722412109375, 0.117919921875, 0.12412261962890625, 0.1303253173828125, 0.13652801513671875, 0.142730712890625, 0.14893341064453125, 0.1551361083984375, 0.16133880615234375, 0.16754150390625, 0.17374420166015625, 0.1799468994140625, 0.18614959716796875, 0.192352294921875, 0.19855499267578125, 0.2047576904296875, 0.21096038818359375, 0.2171630859375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 4.0, 1.0, 0.0, 1.0, 3.0, 3.0, 2.0, 6.0, 2.0, 9.0, 7.0, 13.0, 20.0, 25.0, 38.0, 53.0, 77.0, 138.0, 245.0, 395.0, 661.0, 1301.0, 3230.0, 14734.0, 350979.0, 3756577.0, 55383.0, 6241.0, 1987.0, 918.0, 484.0, 294.0, 158.0, 94.0, 70.0, 53.0, 31.0, 15.0, 10.0, 8.0, 9.0, 6.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.130859375, -1.089385986328125, -1.04791259765625, -1.006439208984375, -0.9649658203125, -0.923492431640625, -0.88201904296875, -0.840545654296875, -0.799072265625, -0.757598876953125, -0.71612548828125, -0.674652099609375, -0.6331787109375, -0.591705322265625, -0.55023193359375, -0.508758544921875, -0.46728515625, -0.425811767578125, -0.38433837890625, -0.342864990234375, -0.3013916015625, -0.259918212890625, -0.21844482421875, -0.176971435546875, -0.135498046875, -0.094024658203125, -0.05255126953125, -0.011077880859375, 0.0303955078125, 0.071868896484375, 0.11334228515625, 0.154815673828125, 0.1962890625, 0.237762451171875, 0.27923583984375, 0.320709228515625, 0.3621826171875, 0.403656005859375, 0.44512939453125, 0.486602783203125, 0.528076171875, 0.569549560546875, 0.61102294921875, 0.652496337890625, 0.6939697265625, 0.735443115234375, 0.77691650390625, 0.818389892578125, 0.85986328125, 0.901336669921875, 0.94281005859375, 0.984283447265625, 1.0257568359375, 1.067230224609375, 1.10870361328125, 1.150177001953125, 1.191650390625, 1.233123779296875, 1.27459716796875, 1.316070556640625, 1.3575439453125, 1.399017333984375, 1.44049072265625, 1.481964111328125, 1.5234375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 0.0, 6.0, 4.0, 4.0, 7.0, 11.0, 10.0, 15.0, 32.0, 39.0, 58.0, 62.0, 73.0, 133.0, 206.0, 290.0, 394.0, 536.0, 586.0, 464.0, 316.0, 256.0, 174.0, 118.0, 90.0, 45.0, 41.0, 35.0, 20.0, 17.0, 9.0, 5.0, 6.0, 3.0, 6.0, 2.0, 3.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.748046875, -0.723236083984375, -0.69842529296875, -0.673614501953125, -0.6488037109375, -0.623992919921875, -0.59918212890625, -0.574371337890625, -0.549560546875, -0.524749755859375, -0.49993896484375, -0.475128173828125, -0.4503173828125, -0.425506591796875, -0.40069580078125, -0.375885009765625, -0.35107421875, -0.326263427734375, -0.30145263671875, -0.276641845703125, -0.2518310546875, -0.227020263671875, -0.20220947265625, -0.177398681640625, -0.152587890625, -0.127777099609375, -0.10296630859375, -0.078155517578125, -0.0533447265625, -0.028533935546875, -0.00372314453125, 0.021087646484375, 0.0458984375, 0.070709228515625, 0.09552001953125, 0.120330810546875, 0.1451416015625, 0.169952392578125, 0.19476318359375, 0.219573974609375, 0.244384765625, 0.269195556640625, 0.29400634765625, 0.318817138671875, 0.3436279296875, 0.368438720703125, 0.39324951171875, 0.418060302734375, 0.44287109375, 0.467681884765625, 0.49249267578125, 0.517303466796875, 0.5421142578125, 0.566925048828125, 0.59173583984375, 0.616546630859375, 0.641357421875, 0.666168212890625, 0.69097900390625, 0.715789794921875, 0.7406005859375, 0.765411376953125, 0.79022216796875, 0.815032958984375, 0.83984375]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 23.0, 44.0, 137.0, 269.0, 275.0, 138.0, 39.0, 29.0, 16.0, 10.0, 4.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-20.627559661865234, -20.12334632873535, -19.61913299560547, -19.114917755126953, -18.61070442199707, -18.106491088867188, -17.602277755737305, -17.098064422607422, -16.593849182128906, -16.089635848999023, -15.585421562194824, -15.081208229064941, -14.576993942260742, -14.07278060913086, -13.568567276000977, -13.064353942871094, -12.560140609741211, -12.055927276611328, -11.551712989807129, -11.047499656677246, -10.543285369873047, -10.039072036743164, -9.534858703613281, -9.030645370483398, -8.5264310836792, -8.022217750549316, -7.518003463745117, -7.013790130615234, -6.509576320648193, -6.005362510681152, -5.5011491775512695, -4.9969353675842285, -4.492719650268555, -3.9885058403015137, -3.4842922687530518, -2.98007869720459, -2.475864887237549, -1.9716510772705078, -1.467437505722046, -0.963223934173584, -0.45901012420654297, 0.045203566551208496, 0.54941725730896, 1.0536309480667114, 1.557844638824463, 2.062058448791504, 2.566272020339966, 3.0704855918884277, 3.5746994018554688, 4.07891321182251, 4.583127021789551, 5.087340354919434, 5.591554164886475, 6.095767974853516, 6.599981307983398, 7.1041951179504395, 7.6084089279174805, 8.112622261047363, 8.616836547851562, 9.121049880981445, 9.625263214111328, 10.129477500915527, 10.63369083404541, 11.13790512084961, 11.642118453979492]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 7.0, 8.0, 10.0, 16.0, 12.0, 30.0, 34.0, 39.0, 62.0, 62.0, 81.0, 69.0, 108.0, 95.0, 82.0, 54.0, 51.0, 45.0, 40.0, 25.0, 26.0, 16.0, 11.0, 7.0, 4.0, 6.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.38444709777832, -9.158693313598633, -8.932940483093262, -8.70718765258789, -8.481433868408203, -8.255680084228516, -8.029927253723145, -7.804173946380615, -7.578420639038086, -7.352667331695557, -7.126914024353027, -6.901160717010498, -6.675407409667969, -6.4496541023254395, -6.22390079498291, -5.998147487640381, -5.772394180297852, -5.546640872955322, -5.320887565612793, -5.095134258270264, -4.869380950927734, -4.643627643585205, -4.417874336242676, -4.1921210289001465, -3.966367721557617, -3.740614414215088, -3.5148611068725586, -3.2891077995300293, -3.0633544921875, -2.8376011848449707, -2.6118478775024414, -2.386094570159912, -2.160341262817383, -1.9345879554748535, -1.7088346481323242, -1.483081340789795, -1.2573280334472656, -1.0315747261047363, -0.805821418762207, -0.5800681114196777, -0.35431480407714844, -0.12856149673461914, 0.09719181060791016, 0.32294511795043945, 0.5486984252929688, 0.774451732635498, 1.0002050399780273, 1.2259583473205566, 1.451711654663086, 1.6774649620056152, 1.9032182693481445, 2.128971576690674, 2.354724884033203, 2.5804781913757324, 2.8062314987182617, 3.031984806060791, 3.2577381134033203, 3.4834914207458496, 3.709244728088379, 3.934998035430908, 4.1607513427734375, 4.386504650115967, 4.612257957458496, 4.838011264801025, 5.063764572143555]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 4.0, 8.0, 5.0, 7.0, 4.0, 10.0, 15.0, 19.0, 31.0, 57.0, 126.0, 180.0, 371.0, 916.0, 2145.0, 6626.0, 28088.0, 262560.0, 684214.0, 48595.0, 9535.0, 2837.0, 1146.0, 487.0, 215.0, 145.0, 81.0, 45.0, 23.0, 17.0, 11.0, 11.0, 8.0, 5.0, 3.0, 1.0, 5.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-0.92578125, -0.9001693725585938, -0.8745574951171875, -0.8489456176757812, -0.823333740234375, -0.7977218627929688, -0.7721099853515625, -0.7464981079101562, -0.72088623046875, -0.6952743530273438, -0.6696624755859375, -0.6440505981445312, -0.618438720703125, -0.5928268432617188, -0.5672149658203125, -0.5416030883789062, -0.5159912109375, -0.49037933349609375, -0.4647674560546875, -0.43915557861328125, -0.413543701171875, -0.38793182373046875, -0.3623199462890625, -0.33670806884765625, -0.31109619140625, -0.28548431396484375, -0.2598724365234375, -0.23426055908203125, -0.208648681640625, -0.18303680419921875, -0.1574249267578125, -0.13181304931640625, -0.106201171875, -0.08058929443359375, -0.0549774169921875, -0.02936553955078125, -0.003753662109375, 0.02185821533203125, 0.0474700927734375, 0.07308197021484375, 0.09869384765625, 0.12430572509765625, 0.1499176025390625, 0.17552947998046875, 0.201141357421875, 0.22675323486328125, 0.2523651123046875, 0.27797698974609375, 0.3035888671875, 0.32920074462890625, 0.3548126220703125, 0.38042449951171875, 0.406036376953125, 0.43164825439453125, 0.4572601318359375, 0.48287200927734375, 0.50848388671875, 0.5340957641601562, 0.5597076416015625, 0.5853195190429688, 0.610931396484375, 0.6365432739257812, 0.6621551513671875, 0.6877670288085938, 0.71337890625]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 4.0, 10.0, 16.0, 27.0, 42.0, 52.0, 71.0, 85.0, 84.0, 100.0, 99.0, 110.0, 81.0, 75.0, 48.0, 29.0, 16.0, 19.0, 16.0, 7.0, 5.0, 6.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.75, -0.7316970825195312, -0.7133941650390625, -0.6950912475585938, -0.676788330078125, -0.6584854125976562, -0.6401824951171875, -0.6218795776367188, -0.60357666015625, -0.5852737426757812, -0.5669708251953125, -0.5486679077148438, -0.530364990234375, -0.5120620727539062, -0.4937591552734375, -0.47545623779296875, -0.4571533203125, -0.43885040283203125, -0.4205474853515625, -0.40224456787109375, -0.383941650390625, -0.36563873291015625, -0.3473358154296875, -0.32903289794921875, -0.31072998046875, -0.29242706298828125, -0.2741241455078125, -0.25582122802734375, -0.237518310546875, -0.21921539306640625, -0.2009124755859375, -0.18260955810546875, -0.164306640625, -0.14600372314453125, -0.1277008056640625, -0.10939788818359375, -0.091094970703125, -0.07279205322265625, -0.0544891357421875, -0.03618621826171875, -0.01788330078125, 0.00041961669921875, 0.0187225341796875, 0.03702545166015625, 0.055328369140625, 0.07363128662109375, 0.0919342041015625, 0.11023712158203125, 0.1285400390625, 0.14684295654296875, 0.1651458740234375, 0.18344879150390625, 0.201751708984375, 0.22005462646484375, 0.2383575439453125, 0.25666046142578125, 0.27496337890625, 0.29326629638671875, 0.3115692138671875, 0.32987213134765625, 0.348175048828125, 0.36647796630859375, 0.3847808837890625, 0.40308380126953125, 0.42138671875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 2.0, 7.0, 8.0, 3.0, 11.0, 14.0, 17.0, 21.0, 33.0, 37.0, 53.0, 91.0, 103.0, 165.0, 333.0, 567.0, 1237.0, 3375.0, 14442.0, 131360.0, 853844.0, 33102.0, 5929.0, 1852.0, 800.0, 399.0, 243.0, 156.0, 91.0, 64.0, 45.0, 43.0, 34.0, 21.0, 11.0, 10.0, 10.0, 5.0, 9.0, 6.0, 5.0, 3.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53759765625, -0.5178451538085938, -0.4980926513671875, -0.47834014892578125, -0.458587646484375, -0.43883514404296875, -0.4190826416015625, -0.39933013916015625, -0.37957763671875, -0.35982513427734375, -0.3400726318359375, -0.32032012939453125, -0.300567626953125, -0.28081512451171875, -0.2610626220703125, -0.24131011962890625, -0.2215576171875, -0.20180511474609375, -0.1820526123046875, -0.16230010986328125, -0.142547607421875, -0.12279510498046875, -0.1030426025390625, -0.08329010009765625, -0.06353759765625, -0.04378509521484375, -0.0240325927734375, -0.00428009033203125, 0.015472412109375, 0.03522491455078125, 0.0549774169921875, 0.07472991943359375, 0.094482421875, 0.11423492431640625, 0.1339874267578125, 0.15373992919921875, 0.173492431640625, 0.19324493408203125, 0.2129974365234375, 0.23274993896484375, 0.25250244140625, 0.27225494384765625, 0.2920074462890625, 0.31175994873046875, 0.331512451171875, 0.35126495361328125, 0.3710174560546875, 0.39076995849609375, 0.4105224609375, 0.43027496337890625, 0.4500274658203125, 0.46977996826171875, 0.489532470703125, 0.5092849731445312, 0.5290374755859375, 0.5487899780273438, 0.56854248046875, 0.5882949829101562, 0.6080474853515625, 0.6277999877929688, 0.647552490234375, 0.6673049926757812, 0.6870574951171875, 0.7068099975585938, 0.7265625]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 1.0, 6.0, 4.0, 10.0, 3.0, 5.0, 13.0, 10.0, 18.0, 13.0, 21.0, 17.0, 31.0, 25.0, 36.0, 49.0, 53.0, 69.0, 74.0, 85.0, 79.0, 60.0, 46.0, 47.0, 32.0, 40.0, 29.0, 22.0, 19.0, 19.0, 13.0, 7.0, 9.0, 8.0, 4.0, 7.0, 4.0, 5.0, 2.0, 2.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9169921875, -0.883087158203125, -0.84918212890625, -0.815277099609375, -0.7813720703125, -0.747467041015625, -0.71356201171875, -0.679656982421875, -0.645751953125, -0.611846923828125, -0.57794189453125, -0.544036865234375, -0.5101318359375, -0.476226806640625, -0.44232177734375, -0.408416748046875, -0.37451171875, -0.340606689453125, -0.30670166015625, -0.272796630859375, -0.2388916015625, -0.204986572265625, -0.17108154296875, -0.137176513671875, -0.103271484375, -0.069366455078125, -0.03546142578125, -0.001556396484375, 0.0323486328125, 0.066253662109375, 0.10015869140625, 0.134063720703125, 0.16796875, 0.201873779296875, 0.23577880859375, 0.269683837890625, 0.3035888671875, 0.337493896484375, 0.37139892578125, 0.405303955078125, 0.439208984375, 0.473114013671875, 0.50701904296875, 0.540924072265625, 0.5748291015625, 0.608734130859375, 0.64263916015625, 0.676544189453125, 0.71044921875, 0.744354248046875, 0.77825927734375, 0.812164306640625, 0.8460693359375, 0.879974365234375, 0.91387939453125, 0.947784423828125, 0.981689453125, 1.015594482421875, 1.04949951171875, 1.083404541015625, 1.1173095703125, 1.151214599609375, 1.18511962890625, 1.219024658203125, 1.2529296875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 4.0, 1.0, 3.0, 6.0, 7.0, 9.0, 9.0, 11.0, 22.0, 26.0, 26.0, 35.0, 39.0, 63.0, 102.0, 196.0, 313.0, 538.0, 1099.0, 2405.0, 6311.0, 25138.0, 832290.0, 154908.0, 16291.0, 4694.0, 1871.0, 885.0, 489.0, 269.0, 165.0, 110.0, 63.0, 45.0, 31.0, 16.0, 18.0, 11.0, 11.0, 8.0, 7.0, 5.0, 3.0, 5.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.130615234375, -0.12651634216308594, -0.12241744995117188, -0.11831855773925781, -0.11421966552734375, -0.11012077331542969, -0.10602188110351562, -0.10192298889160156, -0.0978240966796875, -0.09372520446777344, -0.08962631225585938, -0.08552742004394531, -0.08142852783203125, -0.07732963562011719, -0.07323074340820312, -0.06913185119628906, -0.065032958984375, -0.06093406677246094, -0.056835174560546875, -0.05273628234863281, -0.04863739013671875, -0.04453849792480469, -0.040439605712890625, -0.03634071350097656, -0.0322418212890625, -0.028142929077148438, -0.024044036865234375, -0.019945144653320312, -0.01584625244140625, -0.011747360229492188, -0.007648468017578125, -0.0035495758056640625, 0.00054931640625, 0.0046482086181640625, 0.008747100830078125, 0.012845993041992188, 0.01694488525390625, 0.021043777465820312, 0.025142669677734375, 0.029241561889648438, 0.0333404541015625, 0.03743934631347656, 0.041538238525390625, 0.04563713073730469, 0.04973602294921875, 0.05383491516113281, 0.057933807373046875, 0.06203269958496094, 0.066131591796875, 0.07023048400878906, 0.07432937622070312, 0.07842826843261719, 0.08252716064453125, 0.08662605285644531, 0.09072494506835938, 0.09482383728027344, 0.0989227294921875, 0.10302162170410156, 0.10712051391601562, 0.11121940612792969, 0.11531829833984375, 0.11941719055175781, 0.12351608276367188, 0.12761497497558594, 0.1317138671875]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 3.0, 4.0, 3.0, 1.0, 1.0, 3.0, 5.0, 9.0, 9.0, 24.0, 36.0, 35.0, 43.0, 54.0, 91.0, 108.0, 143.0, 114.0, 88.0, 55.0, 45.0, 35.0, 19.0, 15.0, 13.0, 13.0, 5.0, 5.0, 2.0, 3.0, 6.0, 4.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-4.559755325317383e-05, -4.405435174703598e-05, -4.251115024089813e-05, -4.0967948734760284e-05, -3.9424747228622437e-05, -3.788154572248459e-05, -3.633834421634674e-05, -3.479514271020889e-05, -3.3251941204071045e-05, -3.17087396979332e-05, -3.016553819179535e-05, -2.86223366856575e-05, -2.7079135179519653e-05, -2.5535933673381805e-05, -2.3992732167243958e-05, -2.244953066110611e-05, -2.0906329154968262e-05, -1.9363127648830414e-05, -1.7819926142692566e-05, -1.6276724636554718e-05, -1.473352313041687e-05, -1.3190321624279022e-05, -1.1647120118141174e-05, -1.0103918612003326e-05, -8.560717105865479e-06, -7.017515599727631e-06, -5.474314093589783e-06, -3.931112587451935e-06, -2.387911081314087e-06, -8.44709575176239e-07, 6.984919309616089e-07, 2.2416934370994568e-06, 3.7848949432373047e-06, 5.328096449375153e-06, 6.8712979555130005e-06, 8.414499461650848e-06, 9.957700967788696e-06, 1.1500902473926544e-05, 1.3044103980064392e-05, 1.458730548620224e-05, 1.6130506992340088e-05, 1.7673708498477936e-05, 1.9216910004615784e-05, 2.076011151075363e-05, 2.230331301689148e-05, 2.3846514523029327e-05, 2.5389716029167175e-05, 2.6932917535305023e-05, 2.847611904144287e-05, 3.001932054758072e-05, 3.156252205371857e-05, 3.3105723559856415e-05, 3.464892506599426e-05, 3.619212657213211e-05, 3.773532807826996e-05, 3.9278529584407806e-05, 4.0821731090545654e-05, 4.23649325966835e-05, 4.390813410282135e-05, 4.54513356089592e-05, 4.6994537115097046e-05, 4.8537738621234894e-05, 5.008094012737274e-05, 5.162414163351059e-05, 5.316734313964844e-05]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 3.0, 8.0, 9.0, 11.0, 15.0, 24.0, 35.0, 34.0, 56.0, 98.0, 167.0, 248.0, 432.0, 853.0, 1719.0, 3705.0, 10175.0, 36080.0, 782056.0, 174181.0, 24700.0, 7813.0, 3056.0, 1430.0, 696.0, 373.0, 208.0, 119.0, 85.0, 56.0, 22.0, 24.0, 17.0, 13.0, 6.0, 7.0, 6.0, 2.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0], "bins": [-0.11810302734375, -0.1148996353149414, -0.11169624328613281, -0.10849285125732422, -0.10528945922851562, -0.10208606719970703, -0.09888267517089844, -0.09567928314208984, -0.09247589111328125, -0.08927249908447266, -0.08606910705566406, -0.08286571502685547, -0.07966232299804688, -0.07645893096923828, -0.07325553894042969, -0.0700521469116211, -0.0668487548828125, -0.0636453628540039, -0.06044197082519531, -0.05723857879638672, -0.054035186767578125, -0.05083179473876953, -0.04762840270996094, -0.044425010681152344, -0.04122161865234375, -0.038018226623535156, -0.03481483459472656, -0.03161144256591797, -0.028408050537109375, -0.02520465850830078, -0.022001266479492188, -0.018797874450683594, -0.015594482421875, -0.012391090393066406, -0.009187698364257812, -0.005984306335449219, -0.002780914306640625, 0.00042247772216796875, 0.0036258697509765625, 0.006829261779785156, 0.01003265380859375, 0.013236045837402344, 0.016439437866210938, 0.01964282989501953, 0.022846221923828125, 0.02604961395263672, 0.029253005981445312, 0.032456398010253906, 0.0356597900390625, 0.038863182067871094, 0.04206657409667969, 0.04526996612548828, 0.048473358154296875, 0.05167675018310547, 0.05488014221191406, 0.058083534240722656, 0.06128692626953125, 0.06449031829833984, 0.06769371032714844, 0.07089710235595703, 0.07410049438476562, 0.07730388641357422, 0.08050727844238281, 0.0837106704711914, 0.0869140625]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 4.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 9.0, 6.0, 5.0, 16.0, 10.0, 18.0, 17.0, 18.0, 23.0, 32.0, 64.0, 95.0, 114.0, 143.0, 104.0, 83.0, 58.0, 28.0, 35.0, 22.0, 19.0, 18.0, 13.0, 6.0, 5.0, 7.0, 3.0, 3.0, 1.0, 4.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 1.0], "bins": [-0.12213134765625, -0.11867904663085938, -0.11522674560546875, -0.11177444458007812, -0.1083221435546875, -0.10486984252929688, -0.10141754150390625, -0.09796524047851562, -0.094512939453125, -0.09106063842773438, -0.08760833740234375, -0.08415603637695312, -0.0807037353515625, -0.07725143432617188, -0.07379913330078125, -0.07034683227539062, -0.06689453125, -0.06344223022460938, -0.05998992919921875, -0.056537628173828125, -0.0530853271484375, -0.049633026123046875, -0.04618072509765625, -0.042728424072265625, -0.039276123046875, -0.035823822021484375, -0.03237152099609375, -0.028919219970703125, -0.0254669189453125, -0.022014617919921875, -0.01856231689453125, -0.015110015869140625, -0.01165771484375, -0.008205413818359375, -0.00475311279296875, -0.001300811767578125, 0.0021514892578125, 0.005603790283203125, 0.00905609130859375, 0.012508392333984375, 0.015960693359375, 0.019412994384765625, 0.02286529541015625, 0.026317596435546875, 0.0297698974609375, 0.033222198486328125, 0.03667449951171875, 0.040126800537109375, 0.0435791015625, 0.047031402587890625, 0.05048370361328125, 0.053936004638671875, 0.0573883056640625, 0.060840606689453125, 0.06429290771484375, 0.06774520874023438, 0.071197509765625, 0.07464981079101562, 0.07810211181640625, 0.08155441284179688, 0.0850067138671875, 0.08845901489257812, 0.09191131591796875, 0.09536361694335938, 0.09881591796875]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 4.0, 7.0, 13.0, 30.0, 39.0, 71.0, 134.0, 489.0, 85.0, 48.0, 26.0, 20.0, 12.0, 13.0, 7.0, 3.0, 4.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.5760087966918945, -4.429663181304932, -4.283317565917969, -4.136972427368164, -3.990626573562622, -3.8442811965942383, -3.6979355812072754, -3.5515899658203125, -3.4052443504333496, -3.2588987350463867, -3.112553358078003, -2.96620774269104, -2.819862127304077, -2.6735167503356934, -2.5271711349487305, -2.3808255195617676, -2.234480142593384, -2.088134527206421, -1.9417890310287476, -1.7954435348510742, -1.6490979194641113, -1.502752423286438, -1.3564069271087646, -1.2100613117218018, -1.0637158155441284, -0.9173702597618103, -0.7710247039794922, -0.6246792078018188, -0.47833365201950073, -0.3319880962371826, -0.18564260005950928, -0.03929698467254639, 0.10704851150512695, 0.25339406728744507, 0.3997395932674408, 0.5460851192474365, 0.6924306750297546, 0.8387762308120728, 0.9851217269897461, 1.131467342376709, 1.2778128385543823, 1.4241583347320557, 1.5705039501190186, 1.716849446296692, 1.8631949424743652, 2.009540557861328, 2.155886173248291, 2.302231788635254, 2.4485771656036377, 2.5949227809906006, 2.7412681579589844, 2.8876137733459473, 3.03395938873291, 3.180305004119873, 3.326650381088257, 3.4729959964752197, 3.6193413734436035, 3.7656869888305664, 3.91203236579895, 4.058378219604492, 4.204723358154297, 4.35106897354126, 4.497414588928223, 4.6437602043151855, 4.790105819702148]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 6.0, 4.0, 6.0, 16.0, 10.0, 12.0, 11.0, 11.0, 17.0, 13.0, 22.0, 15.0, 18.0, 22.0, 29.0, 30.0, 44.0, 252.0, 202.0, 41.0, 22.0, 25.0, 21.0, 24.0, 19.0, 20.0, 17.0, 13.0, 8.0, 8.0, 5.0, 9.0, 11.0, 7.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.171809673309326, -3.080932855606079, -2.990056276321411, -2.899179458618164, -2.808302879333496, -2.717426061630249, -2.626549243927002, -2.535672664642334, -2.444795846939087, -2.35391902923584, -2.263042449951172, -2.172165632247925, -2.081289052963257, -1.9904122352600098, -1.8995355367660522, -1.8086588382720947, -1.7177821397781372, -1.6269054412841797, -1.5360287427902222, -1.4451520442962646, -1.3542752265930176, -1.26339852809906, -1.1725218296051025, -1.0816450119018555, -0.9907683730125427, -0.8998916745185852, -0.8090149164199829, -0.7181382179260254, -0.6272615194320679, -0.5363847613334656, -0.44550806283950806, -0.35463130474090576, -0.26375460624694824, -0.17287787795066833, -0.08200116455554962, 0.008875548839569092, 0.099752277135849, 0.1906290054321289, 0.2815057039260864, 0.3723824620246887, 0.46325916051864624, 0.5541358590126038, 0.645012617111206, 0.7358893156051636, 0.8267660140991211, 0.9176427721977234, 1.0085194110870361, 1.0993962287902832, 1.1902729272842407, 1.2811496257781982, 1.3720263242721558, 1.4629030227661133, 1.5537798404693604, 1.6446565389633179, 1.7355332374572754, 1.8264100551605225, 1.9172866344451904, 2.0081634521484375, 2.0990400314331055, 2.1899168491363525, 2.2807934284210205, 2.3716702461242676, 2.4625468254089355, 2.5534236431121826, 2.6443004608154297]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 4.0, 1.0, 5.0, 6.0, 2.0, 4.0, 6.0, 6.0, 6.0, 15.0, 12.0, 7.0, 21.0, 18.0, 21.0, 25.0, 22.0, 26.0, 32.0, 41.0, 98.0, 242.0, 91.0, 45.0, 36.0, 33.0, 34.0, 20.0, 22.0, 15.0, 15.0, 15.0, 12.0, 14.0, 7.0, 4.0, 9.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.291015625, -0.2828330993652344, -0.27465057373046875, -0.2664680480957031, -0.2582855224609375, -0.2501029968261719, -0.24192047119140625, -0.23373794555664062, -0.225555419921875, -0.21737289428710938, -0.20919036865234375, -0.20100784301757812, -0.1928253173828125, -0.18464279174804688, -0.17646026611328125, -0.16827774047851562, -0.16009521484375, -0.15191268920898438, -0.14373016357421875, -0.13554763793945312, -0.1273651123046875, -0.11918258666992188, -0.11100006103515625, -0.10281753540039062, -0.094635009765625, -0.08645248413085938, -0.07826995849609375, -0.07008743286132812, -0.0619049072265625, -0.053722381591796875, -0.04553985595703125, -0.037357330322265625, -0.0291748046875, -0.020992279052734375, -0.01280975341796875, -0.004627227783203125, 0.0035552978515625, 0.011737823486328125, 0.01992034912109375, 0.028102874755859375, 0.036285400390625, 0.044467926025390625, 0.05265045166015625, 0.060832977294921875, 0.0690155029296875, 0.07719802856445312, 0.08538055419921875, 0.09356307983398438, 0.10174560546875, 0.10992813110351562, 0.11811065673828125, 0.12629318237304688, 0.1344757080078125, 0.14265823364257812, 0.15084075927734375, 0.15902328491210938, 0.167205810546875, 0.17538833618164062, 0.18357086181640625, 0.19175338745117188, 0.1999359130859375, 0.20811843872070312, 0.21630096435546875, 0.22448348999023438, 0.232666015625]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 4.0, 5.0, 12.0, 8.0, 7.0, 15.0, 13.0, 22.0, 48.0, 55.0, 80.0, 114.0, 207.0, 412.0, 783.0, 1980.0, 5623.0, 34932.0, 8320021.0, 16969.0, 4154.0, 1556.0, 645.0, 327.0, 183.0, 109.0, 88.0, 68.0, 38.0, 18.0, 20.0, 8.0, 13.0, 9.0, 3.0, 6.0, 2.0, 10.0, 3.0, 3.0, 2.0, 0.0, 2.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0], "bins": [-1.9451676607131958, -1.8850535154342651, -1.824939489364624, -1.7648253440856934, -1.7047113180160522, -1.6445971727371216, -1.5844831466674805, -1.5243690013885498, -1.4642548561096191, -1.4041407108306885, -1.3440266847610474, -1.2839125394821167, -1.2237985134124756, -1.163684368133545, -1.1035702228546143, -1.0434561967849731, -0.9833421111106873, -0.9232280254364014, -0.8631139397621155, -0.8029998540878296, -0.7428857088088989, -0.682771623134613, -0.6226575374603271, -0.5625433921813965, -0.5024293661117554, -0.4423152804374695, -0.3822011649608612, -0.3220870792865753, -0.26197296380996704, -0.20185887813568115, -0.14174479246139526, -0.08163067698478699, -0.02151656150817871, 0.03859753534197807, 0.09871163219213486, 0.15882572531700134, 0.21893982589244843, 0.2790539264678955, 0.3391680121421814, 0.3992821276187897, 0.45939621329307556, 0.5195103287696838, 0.5796244144439697, 0.6397385001182556, 0.6998525857925415, 0.7599667310714722, 0.8200807571411133, 0.880194902420044, 0.9403089880943298, 1.0004230737686157, 1.0605372190475464, 1.1206512451171875, 1.1807653903961182, 1.2408795356750488, 1.30099356174469, 1.3611077070236206, 1.4212217330932617, 1.4813358783721924, 1.5414499044418335, 1.6015640497207642, 1.6616780757904053, 1.721792221069336, 1.7819063663482666, 1.8420203924179077, 1.9021345376968384]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 1.0, 4.0, 1.0, 5.0, 9.0, 9.0, 7.0, 11.0, 6.0, 6.0, 9.0, 10.0, 3.0, 6.0, 6.0, 4.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.424314498901367, -3.269782066345215, -3.1152496337890625, -2.960716962814331, -2.8061845302581787, -2.6516520977020264, -2.497119426727295, -2.3425869941711426, -2.1880545616149902, -2.033522129058838, -1.878989577293396, -1.724457025527954, -1.5699245929718018, -1.4153921604156494, -1.2608596086502075, -1.1063270568847656, -0.9517946243286133, -0.7972621321678162, -0.642729640007019, -0.4881971478462219, -0.3336646556854248, -0.17913216352462769, -0.024599671363830566, 0.12993288040161133, 0.28446531295776367, 0.4389978051185608, 0.5935302972793579, 0.748062789440155, 0.9025952816009521, 1.0571277141571045, 1.2116602659225464, 1.3661928176879883, 1.5207257270812988, 1.6752581596374512, 1.829790711402893, 1.984323263168335, 2.1388556957244873, 2.2933881282806396, 2.447920799255371, 2.6024532318115234, 2.756985664367676, 2.911518096923828, 3.0660505294799805, 3.220583200454712, 3.3751156330108643, 3.5296480655670166, 3.684180736541748, 3.8387131690979004, 3.9932456016540527, 4.147778034210205, 4.302310466766357, 4.45684289932251, 4.61137580871582, 4.765908241271973, 4.920440673828125, 5.074973106384277, 5.22950553894043, 5.384037971496582, 5.538570404052734, 5.693102836608887, 5.847635269165039, 6.00216817855835, 6.156700611114502, 6.311233043670654, 6.465765476226807]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 3.0, 3.0, 13.0, 10.0, 11.0, 14.0, 9.0, 17.0, 33.0, 40.0, 68.0, 113.0, 180.0, 340.0, 897.0, 3984.0, 32137.0, 289559.0, 175173.0, 17649.0, 2585.0, 713.0, 265.0, 150.0, 102.0, 57.0, 39.0, 31.0, 21.0, 24.0, 9.0, 6.0, 4.0, 5.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.61328125, -5.46099853515625, -5.3087158203125, -5.15643310546875, -5.004150390625, -4.85186767578125, -4.6995849609375, -4.54730224609375, -4.39501953125, -4.24273681640625, -4.0904541015625, -3.93817138671875, -3.785888671875, -3.63360595703125, -3.4813232421875, -3.32904052734375, -3.1767578125, -3.02447509765625, -2.8721923828125, -2.71990966796875, -2.567626953125, -2.41534423828125, -2.2630615234375, -2.11077880859375, -1.95849609375, -1.80621337890625, -1.6539306640625, -1.50164794921875, -1.349365234375, -1.19708251953125, -1.0447998046875, -0.89251708984375, -0.740234375, -0.58795166015625, -0.4356689453125, -0.28338623046875, -0.131103515625, 0.02117919921875, 0.1734619140625, 0.32574462890625, 0.47802734375, 0.63031005859375, 0.7825927734375, 0.93487548828125, 1.087158203125, 1.23944091796875, 1.3917236328125, 1.54400634765625, 1.6962890625, 1.84857177734375, 2.0008544921875, 2.15313720703125, 2.305419921875, 2.45770263671875, 2.6099853515625, 2.76226806640625, 2.91455078125, 3.06683349609375, 3.2191162109375, 3.37139892578125, 3.523681640625, 3.67596435546875, 3.8282470703125, 3.98052978515625, 4.1328125]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 3.0, 8.0, 21.0, 25.0, 37.0, 49.0, 76.0, 87.0, 120.0, 121.0, 99.0, 99.0, 75.0, 56.0, 52.0, 30.0, 17.0, 5.0, 6.0, 8.0, 1.0, 7.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.7060546875, -0.6886482238769531, -0.6712417602539062, -0.6538352966308594, -0.6364288330078125, -0.6190223693847656, -0.6016159057617188, -0.5842094421386719, -0.566802978515625, -0.5493965148925781, -0.5319900512695312, -0.5145835876464844, -0.4971771240234375, -0.4797706604003906, -0.46236419677734375, -0.4449577331542969, -0.42755126953125, -0.4101448059082031, -0.39273834228515625, -0.3753318786621094, -0.3579254150390625, -0.3405189514160156, -0.32311248779296875, -0.3057060241699219, -0.288299560546875, -0.2708930969238281, -0.25348663330078125, -0.23608016967773438, -0.2186737060546875, -0.20126724243164062, -0.18386077880859375, -0.16645431518554688, -0.1490478515625, -0.13164138793945312, -0.11423492431640625, -0.09682846069335938, -0.0794219970703125, -0.062015533447265625, -0.04460906982421875, -0.027202606201171875, -0.009796142578125, 0.007610321044921875, 0.02501678466796875, 0.042423248291015625, 0.0598297119140625, 0.07723617553710938, 0.09464263916015625, 0.11204910278320312, 0.12945556640625, 0.14686203002929688, 0.16426849365234375, 0.18167495727539062, 0.1990814208984375, 0.21648788452148438, 0.23389434814453125, 0.2513008117675781, 0.268707275390625, 0.2861137390136719, 0.30352020263671875, 0.3209266662597656, 0.3383331298828125, 0.3557395935058594, 0.37314605712890625, 0.3905525207519531, 0.407958984375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 6.0, 11.0, 9.0, 22.0, 45.0, 98.0, 133.0, 101.0, 37.0, 12.0, 4.0, 4.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 1.0, 2.0], "bins": [-6.965106010437012, -6.8206095695495605, -6.676112651824951, -6.5316162109375, -6.387119293212891, -6.2426228523254395, -6.098126411437988, -5.953629493713379, -5.809133052825928, -5.664636611938477, -5.520139694213867, -5.375643253326416, -5.231146812438965, -5.0866498947143555, -4.942153453826904, -4.797657012939453, -4.653160095214844, -4.508663654327393, -4.364166736602783, -4.219670295715332, -4.075173377990723, -3.9306769371032715, -3.7861804962158203, -3.64168381690979, -3.4971871376037598, -3.3526904582977295, -3.208193778991699, -3.063697338104248, -2.9192006587982178, -2.7747039794921875, -2.6302075386047363, -2.485710859298706, -2.341214418411255, -2.1967177391052246, -2.0522212982177734, -1.9077246189117432, -1.763227939605713, -1.6187312602996826, -1.474234700202942, -1.3297381401062012, -1.185241460800171, -1.0407447814941406, -0.8962482213973999, -0.7517516016960144, -0.6072549819946289, -0.4627583622932434, -0.3182617425918579, -0.1737651824951172, -0.029268503189086914, 0.11522811651229858, 0.2597247362136841, 0.4042213559150696, 0.5487179756164551, 0.6932145953178406, 0.8377112150192261, 0.9822077751159668, 1.126704454421997, 1.2712011337280273, 1.415697693824768, 1.5601942539215088, 1.704690933227539, 1.8491876125335693, 1.99368417263031, 2.138180732727051, 2.282677412033081]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 6.0, 3.0, 10.0, 3.0, 4.0, 5.0, 3.0, 4.0, 22.0, 51.0, 142.0, 123.0, 51.0, 23.0, 10.0, 8.0, 8.0, 6.0, 2.0, 3.0, 3.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.147279739379883, -3.055356025695801, -2.9634323120117188, -2.8715085983276367, -2.7795848846435547, -2.6876611709594727, -2.5957374572753906, -2.5038135051727295, -2.4118897914886475, -2.3199660778045654, -2.2280423641204834, -2.1361186504364014, -2.0441949367523193, -1.9522711038589478, -1.8603473901748657, -1.7684235572814941, -1.6764999628067017, -1.5845762491226196, -1.4926525354385376, -1.400728702545166, -1.308804988861084, -1.216881275177002, -1.12495756149292, -1.033033847808838, -0.9411100745201111, -0.849186360836029, -0.7572625875473022, -0.6653388738632202, -0.5734151601791382, -0.4814913868904114, -0.38956767320632935, -0.29764389991760254, -0.2057201862335205, -0.11379645019769669, -0.021872714161872864, 0.07005101442337036, 0.16197475790977478, 0.2538985013961792, 0.34582221508026123, 0.43774598836898804, 0.5296697020530701, 0.6215934157371521, 0.7135171890258789, 0.8054409027099609, 0.897364616394043, 0.9892883896827698, 1.081212043762207, 1.1731358766555786, 1.2650595903396606, 1.3569833040237427, 1.4489070177078247, 1.5408308506011963, 1.6327545642852783, 1.7246782779693604, 1.8166019916534424, 1.9085257053375244, 2.0004494190216064, 2.0923731327056885, 2.1842968463897705, 2.2762205600738525, 2.3681442737579346, 2.4600682258605957, 2.5519919395446777, 2.6439156532287598, 2.735839366912842]}, "eval/loss": 4.169541358947754, "eval/wer": 2.381138437128124, "eval/runtime": 1123.3815, "eval/samples_per_second": 2.352, "eval/steps_per_second": 0.295, "train/train_runtime": 6250.8757, "train/train_samples_per_second": 4.565, "train/train_steps_per_second": 0.143, "train/total_flos": 0.0, "train/train_loss": 4.249312744012328, "_wandb": {"runtime": 7715}}