diff --git "a/wandb/run-20220302_233655-33dtvgaa/files/wandb-summary.json" "b/wandb/run-20220302_233655-33dtvgaa/files/wandb-summary.json" new file mode 100644--- /dev/null +++ "b/wandb/run-20220302_233655-33dtvgaa/files/wandb-summary.json" @@ -0,0 +1 @@ +{"train/loss": 4.3323, "train/learning_rate": 0.0001194, "train/epoch": 0.78, "train/global_step": 200, "_runtime": 3718, "_timestamp": 1646267933, "_step": 199, "gradients/decoder.transformer.ln_f.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 10.0, 904.0, 101.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-176.83297729492188, -145.7891387939453, -114.74528503417969, -83.70144653320312, -52.65760040283203, -21.613754272460938, 9.430084228515625, 40.47393798828125, 71.51777648925781, 102.5616226196289, 133.60546875, 164.64930725097656, 195.69314575195312, 226.73699951171875, 257.78082275390625, 288.82470703125, 319.8685302734375, 350.9123840332031, 381.9562072753906, 413.00006103515625, 444.0439147949219, 475.0877685546875, 506.131591796875, 537.1754150390625, 568.2192993164062, 599.2631225585938, 630.3070068359375, 661.350830078125, 692.3946533203125, 723.4385375976562, 754.4823608398438, 785.5262451171875, 816.5700073242188, 847.6138305664062, 878.65771484375, 909.7015380859375, 940.745361328125, 971.7892456054688, 1002.8330688476562, 1033.876953125, 1064.9207763671875, 1095.964599609375, 1127.0084228515625, 1158.05224609375, 1189.09619140625, 1220.1400146484375, 1251.183837890625, 1282.2276611328125, 1313.271484375, 1344.3153076171875, 1375.359130859375, 1406.403076171875, 1437.4468994140625, 1468.49072265625, 1499.5345458984375, 1530.578369140625, 1561.622314453125, 1592.6661376953125, 1623.7099609375, 1654.75390625, 1685.7977294921875, 1716.841552734375, 1747.8853759765625, 1778.92919921875, 1809.9730224609375]}, "gradients/decoder.transformer.ln_f.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 2.0, 0.0, 3.0, 5.0, 6.0, 2.0, 10.0, 8.0, 10.0, 12.0, 14.0, 14.0, 20.0, 19.0, 33.0, 40.0, 40.0, 46.0, 46.0, 49.0, 48.0, 54.0, 58.0, 53.0, 58.0, 49.0, 47.0, 50.0, 38.0, 39.0, 26.0, 20.0, 24.0, 17.0, 9.0, 11.0, 6.0, 10.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.36355590820312, -110.03234100341797, -105.70112609863281, -101.36991119384766, -97.0386962890625, -92.70748901367188, -88.37627410888672, -84.04505920410156, -79.7138442993164, -75.38262939453125, -71.0514144897461, -66.72019958496094, -62.38898849487305, -58.05777359008789, -53.7265625, -49.395347595214844, -45.06413269042969, -40.73291778564453, -36.401702880859375, -32.070491790771484, -27.739276885986328, -23.408061981201172, -19.07684898376465, -14.745635986328125, -10.414421081542969, -6.083207130432129, -1.751993179321289, 2.579220771789551, 6.910434722900391, 11.241649627685547, 15.57286262512207, 19.904075622558594, 24.23529052734375, 28.566505432128906, 32.89772033691406, 37.22893142700195, 41.56014633178711, 45.891361236572266, 50.222572326660156, 54.55378723144531, 58.88500213623047, 63.216217041015625, 67.54743194580078, 71.87864685058594, 76.20985412597656, 80.54107666015625, 84.87228393554688, 89.20349884033203, 93.53471374511719, 97.86592864990234, 102.1971435546875, 106.52835845947266, 110.85957336425781, 115.19078063964844, 119.5219955444336, 123.85321044921875, 128.18441772460938, 132.515625, 136.8468475341797, 141.1780548095703, 145.50927734375, 149.84048461914062, 154.1717071533203, 158.50291442871094, 162.83413696289062]}, "gradients/decoder.transformer.h.23.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 4.0, 5.0, 7.0, 7.0, 9.0, 10.0, 18.0, 7.0, 21.0, 33.0, 21.0, 35.0, 41.0, 51.0, 52.0, 46.0, 46.0, 49.0, 48.0, 64.0, 59.0, 51.0, 65.0, 47.0, 32.0, 26.0, 33.0, 23.0, 22.0, 20.0, 17.0, 13.0, 7.0, 5.0, 7.0, 4.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-7.36328125, -7.15606689453125, -6.9488525390625, -6.74163818359375, -6.534423828125, -6.32720947265625, -6.1199951171875, -5.91278076171875, -5.70556640625, -5.49835205078125, -5.2911376953125, -5.08392333984375, -4.876708984375, -4.66949462890625, -4.4622802734375, -4.25506591796875, -4.0478515625, -3.84063720703125, -3.6334228515625, -3.42620849609375, -3.218994140625, -3.01177978515625, -2.8045654296875, -2.59735107421875, -2.39013671875, -2.18292236328125, -1.9757080078125, -1.76849365234375, -1.561279296875, -1.35406494140625, -1.1468505859375, -0.93963623046875, -0.732421875, -0.52520751953125, -0.3179931640625, -0.11077880859375, 0.096435546875, 0.30364990234375, 0.5108642578125, 0.71807861328125, 0.92529296875, 1.13250732421875, 1.3397216796875, 1.54693603515625, 1.754150390625, 1.96136474609375, 2.1685791015625, 2.37579345703125, 2.5830078125, 2.79022216796875, 2.9974365234375, 3.20465087890625, 3.411865234375, 3.61907958984375, 3.8262939453125, 4.03350830078125, 4.24072265625, 4.44793701171875, 4.6551513671875, 4.86236572265625, 5.069580078125, 5.27679443359375, 5.4840087890625, 5.69122314453125, 5.8984375]}, "gradients/decoder.transformer.h.23.mlp.c_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 5.0, 1.0, 5.0, 16.0, 11.0, 19.0, 23.0, 37.0, 51.0, 84.0, 121.0, 199.0, 322.0, 583.0, 1102.0, 2449.0, 6142.0, 21555.0, 135995.0, 2666167.0, 1260344.0, 75531.0, 15057.0, 4574.0, 1794.0, 887.0, 464.0, 255.0, 165.0, 106.0, 77.0, 49.0, 27.0, 19.0, 14.0, 8.0, 9.0, 5.0, 5.0, 6.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-28.796875, -27.89306640625, -26.9892578125, -26.08544921875, -25.181640625, -24.27783203125, -23.3740234375, -22.47021484375, -21.56640625, -20.66259765625, -19.7587890625, -18.85498046875, -17.951171875, -17.04736328125, -16.1435546875, -15.23974609375, -14.3359375, -13.43212890625, -12.5283203125, -11.62451171875, -10.720703125, -9.81689453125, -8.9130859375, -8.00927734375, -7.10546875, -6.20166015625, -5.2978515625, -4.39404296875, -3.490234375, -2.58642578125, -1.6826171875, -0.77880859375, 0.125, 1.02880859375, 1.9326171875, 2.83642578125, 3.740234375, 4.64404296875, 5.5478515625, 6.45166015625, 7.35546875, 8.25927734375, 9.1630859375, 10.06689453125, 10.970703125, 11.87451171875, 12.7783203125, 13.68212890625, 14.5859375, 15.48974609375, 16.3935546875, 17.29736328125, 18.201171875, 19.10498046875, 20.0087890625, 20.91259765625, 21.81640625, 22.72021484375, 23.6240234375, 24.52783203125, 25.431640625, 26.33544921875, 27.2392578125, 28.14306640625, 29.046875]}, "gradients/decoder.transformer.h.23.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 6.0, 5.0, 15.0, 29.0, 45.0, 77.0, 115.0, 211.0, 456.0, 807.0, 860.0, 645.0, 356.0, 181.0, 110.0, 78.0, 31.0, 19.0, 18.0, 6.0, 3.0, 4.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-32.625, -31.42529296875, -30.2255859375, -29.02587890625, -27.826171875, -26.62646484375, -25.4267578125, -24.22705078125, -23.02734375, -21.82763671875, -20.6279296875, -19.42822265625, -18.228515625, -17.02880859375, -15.8291015625, -14.62939453125, -13.4296875, -12.22998046875, -11.0302734375, -9.83056640625, -8.630859375, -7.43115234375, -6.2314453125, -5.03173828125, -3.83203125, -2.63232421875, -1.4326171875, -0.23291015625, 0.966796875, 2.16650390625, 3.3662109375, 4.56591796875, 5.765625, 6.96533203125, 8.1650390625, 9.36474609375, 10.564453125, 11.76416015625, 12.9638671875, 14.16357421875, 15.36328125, 16.56298828125, 17.7626953125, 18.96240234375, 20.162109375, 21.36181640625, 22.5615234375, 23.76123046875, 24.9609375, 26.16064453125, 27.3603515625, 28.56005859375, 29.759765625, 30.95947265625, 32.1591796875, 33.35888671875, 34.55859375, 35.75830078125, 36.9580078125, 38.15771484375, 39.357421875, 40.55712890625, 41.7568359375, 42.95654296875, 44.15625]}, "gradients/decoder.transformer.h.23.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 3.0, 5.0, 3.0, 6.0, 6.0, 12.0, 19.0, 24.0, 62.0, 115.0, 218.0, 500.0, 1092.0, 4233.0, 439348.0, 3735414.0, 10128.0, 1794.0, 634.0, 325.0, 156.0, 80.0, 49.0, 29.0, 11.0, 9.0, 4.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-116.1875, -112.2041015625, -108.220703125, -104.2373046875, -100.25390625, -96.2705078125, -92.287109375, -88.3037109375, -84.3203125, -80.3369140625, -76.353515625, -72.3701171875, -68.38671875, -64.4033203125, -60.419921875, -56.4365234375, -52.453125, -48.4697265625, -44.486328125, -40.5029296875, -36.51953125, -32.5361328125, -28.552734375, -24.5693359375, -20.5859375, -16.6025390625, -12.619140625, -8.6357421875, -4.65234375, -0.6689453125, 3.314453125, 7.2978515625, 11.28125, 15.2646484375, 19.248046875, 23.2314453125, 27.21484375, 31.1982421875, 35.181640625, 39.1650390625, 43.1484375, 47.1318359375, 51.115234375, 55.0986328125, 59.08203125, 63.0654296875, 67.048828125, 71.0322265625, 75.015625, 78.9990234375, 82.982421875, 86.9658203125, 90.94921875, 94.9326171875, 98.916015625, 102.8994140625, 106.8828125, 110.8662109375, 114.849609375, 118.8330078125, 122.81640625, 126.7998046875, 130.783203125, 134.7666015625, 138.75]}, "gradients/decoder.transformer.h.23.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 103.0, 785.0, 118.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-905.34814453125, -888.7216186523438, -872.0950927734375, -855.468505859375, -838.8419799804688, -822.2154541015625, -805.5889282226562, -788.96240234375, -772.3358154296875, -755.7092895507812, -739.082763671875, -722.4561767578125, -705.8296508789062, -689.203125, -672.5765991210938, -655.9500732421875, -639.3235473632812, -622.697021484375, -606.0704956054688, -589.4439086914062, -572.8173828125, -556.1908569335938, -539.5643310546875, -522.9378051757812, -506.3112487792969, -489.6847229003906, -473.05816650390625, -456.431640625, -439.80511474609375, -423.1785583496094, -406.5520324707031, -389.92547607421875, -373.2989501953125, -356.67242431640625, -340.0458679199219, -323.4193420410156, -306.79278564453125, -290.166259765625, -273.53973388671875, -256.9132080078125, -240.28665161132812, -223.6601104736328, -207.0335693359375, -190.40704345703125, -173.78050231933594, -157.15396118164062, -140.52743530273438, -123.90089416503906, -107.27435302734375, -90.64781188964844, -74.02127838134766, -57.39474105834961, -40.76820373535156, -24.14166259765625, -7.515129089355469, 9.111404418945312, 25.737945556640625, 42.36448287963867, 58.99102020263672, 75.6175537109375, 92.24409484863281, 108.87063598632812, 125.4971694946289, 142.1237030029297, 158.750244140625]}, "gradients/decoder.transformer.h.23.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 0.0, 3.0, 0.0, 3.0, 3.0, 3.0, 8.0, 8.0, 11.0, 13.0, 11.0, 29.0, 29.0, 20.0, 25.0, 30.0, 28.0, 36.0, 32.0, 57.0, 49.0, 50.0, 42.0, 36.0, 43.0, 49.0, 40.0, 54.0, 44.0, 39.0, 39.0, 32.0, 31.0, 24.0, 21.0, 14.0, 8.0, 13.0, 9.0, 4.0, 7.0, 6.0, 5.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-96.62782287597656, -93.78887939453125, -90.94994354248047, -88.11100769042969, -85.27206420898438, -82.43312072753906, -79.59418487548828, -76.7552490234375, -73.91630554199219, -71.07736206054688, -68.2384262084961, -65.39949035644531, -62.560546875, -59.72160720825195, -56.882667541503906, -54.04372787475586, -51.20478820800781, -48.365848541259766, -45.52690887451172, -42.68796920776367, -39.849029541015625, -37.01008987426758, -34.17115020751953, -31.332210540771484, -28.493270874023438, -25.65433120727539, -22.815391540527344, -19.976451873779297, -17.13751220703125, -14.298572540283203, -11.459632873535156, -8.62069320678711, -5.781761169433594, -2.942821502685547, -0.1038818359375, 2.735057830810547, 5.573997497558594, 8.41293716430664, 11.251876831054688, 14.090816497802734, 16.92975616455078, 19.768695831298828, 22.607635498046875, 25.446575164794922, 28.28551483154297, 31.124454498291016, 33.96339416503906, 36.80233383178711, 39.641273498535156, 42.4802131652832, 45.31915283203125, 48.1580924987793, 50.997032165527344, 53.83597183227539, 56.67491149902344, 59.513851165771484, 62.35279083251953, 65.19172668457031, 68.03067016601562, 70.86961364746094, 73.70854949951172, 76.5474853515625, 79.38642883300781, 82.22537231445312, 85.0643081665039]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 4.0, 5.0, 3.0, 18.0, 15.0, 12.0, 16.0, 24.0, 15.0, 24.0, 24.0, 32.0, 42.0, 31.0, 42.0, 38.0, 42.0, 48.0, 46.0, 47.0, 47.0, 52.0, 47.0, 47.0, 30.0, 42.0, 36.0, 29.0, 31.0, 14.0, 21.0, 11.0, 19.0, 9.0, 13.0, 8.0, 3.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.01171875, -5.8240966796875, -5.636474609375, -5.4488525390625, -5.26123046875, -5.0736083984375, -4.885986328125, -4.6983642578125, -4.5107421875, -4.3231201171875, -4.135498046875, -3.9478759765625, -3.76025390625, -3.5726318359375, -3.385009765625, -3.1973876953125, -3.009765625, -2.8221435546875, -2.634521484375, -2.4468994140625, -2.25927734375, -2.0716552734375, -1.884033203125, -1.6964111328125, -1.5087890625, -1.3211669921875, -1.133544921875, -0.9459228515625, -0.75830078125, -0.5706787109375, -0.383056640625, -0.1954345703125, -0.0078125, 0.1798095703125, 0.367431640625, 0.5550537109375, 0.74267578125, 0.9302978515625, 1.117919921875, 1.3055419921875, 1.4931640625, 1.6807861328125, 1.868408203125, 2.0560302734375, 2.24365234375, 2.4312744140625, 2.618896484375, 2.8065185546875, 2.994140625, 3.1817626953125, 3.369384765625, 3.5570068359375, 3.74462890625, 3.9322509765625, 4.119873046875, 4.3074951171875, 4.4951171875, 4.6827392578125, 4.870361328125, 5.0579833984375, 5.24560546875, 5.4332275390625, 5.620849609375, 5.8084716796875, 5.99609375]}, "gradients/decoder.transformer.h.23.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 7.0, 6.0, 15.0, 20.0, 22.0, 51.0, 50.0, 80.0, 109.0, 162.0, 250.0, 380.0, 546.0, 924.0, 1376.0, 2036.0, 3259.0, 5287.0, 8127.0, 13410.0, 21760.0, 36516.0, 62365.0, 108913.0, 182356.0, 224664.0, 154715.0, 90031.0, 51405.0, 30492.0, 18257.0, 11346.0, 7138.0, 4469.0, 2844.0, 1772.0, 1137.0, 733.0, 524.0, 333.0, 227.0, 154.0, 109.0, 55.0, 33.0, 29.0, 19.0, 19.0, 9.0, 7.0, 8.0, 4.0, 2.0, 1.0, 3.0, 2.0], "bins": [-0.6865234375, -0.665924072265625, -0.64532470703125, -0.624725341796875, -0.6041259765625, -0.583526611328125, -0.56292724609375, -0.542327880859375, -0.521728515625, -0.501129150390625, -0.48052978515625, -0.459930419921875, -0.4393310546875, -0.418731689453125, -0.39813232421875, -0.377532958984375, -0.35693359375, -0.336334228515625, -0.31573486328125, -0.295135498046875, -0.2745361328125, -0.253936767578125, -0.23333740234375, -0.212738037109375, -0.192138671875, -0.171539306640625, -0.15093994140625, -0.130340576171875, -0.1097412109375, -0.089141845703125, -0.06854248046875, -0.047943115234375, -0.02734375, -0.006744384765625, 0.01385498046875, 0.034454345703125, 0.0550537109375, 0.075653076171875, 0.09625244140625, 0.116851806640625, 0.137451171875, 0.158050537109375, 0.17864990234375, 0.199249267578125, 0.2198486328125, 0.240447998046875, 0.26104736328125, 0.281646728515625, 0.30224609375, 0.322845458984375, 0.34344482421875, 0.364044189453125, 0.3846435546875, 0.405242919921875, 0.42584228515625, 0.446441650390625, 0.467041015625, 0.487640380859375, 0.50823974609375, 0.528839111328125, 0.5494384765625, 0.570037841796875, 0.59063720703125, 0.611236572265625, 0.6318359375]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 6.0, 4.0, 3.0, 6.0, 7.0, 11.0, 8.0, 14.0, 17.0, 15.0, 22.0, 21.0, 19.0, 32.0, 29.0, 33.0, 45.0, 40.0, 36.0, 33.0, 34.0, 45.0, 1066.0, 32.0, 33.0, 32.0, 36.0, 36.0, 40.0, 26.0, 31.0, 36.0, 22.0, 21.0, 20.0, 16.0, 16.0, 16.0, 14.0, 9.0, 11.0, 6.0, 4.0, 1.0, 9.0, 2.0, 5.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-3.1953125, -3.095947265625, -2.99658203125, -2.897216796875, -2.7978515625, -2.698486328125, -2.59912109375, -2.499755859375, -2.400390625, -2.301025390625, -2.20166015625, -2.102294921875, -2.0029296875, -1.903564453125, -1.80419921875, -1.704833984375, -1.60546875, -1.506103515625, -1.40673828125, -1.307373046875, -1.2080078125, -1.108642578125, -1.00927734375, -0.909912109375, -0.810546875, -0.711181640625, -0.61181640625, -0.512451171875, -0.4130859375, -0.313720703125, -0.21435546875, -0.114990234375, -0.015625, 0.083740234375, 0.18310546875, 0.282470703125, 0.3818359375, 0.481201171875, 0.58056640625, 0.679931640625, 0.779296875, 0.878662109375, 0.97802734375, 1.077392578125, 1.1767578125, 1.276123046875, 1.37548828125, 1.474853515625, 1.57421875, 1.673583984375, 1.77294921875, 1.872314453125, 1.9716796875, 2.071044921875, 2.17041015625, 2.269775390625, 2.369140625, 2.468505859375, 2.56787109375, 2.667236328125, 2.7666015625, 2.865966796875, 2.96533203125, 3.064697265625, 3.1640625]}, "gradients/decoder.transformer.h.23.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 0.0, 5.0, 4.0, 4.0, 14.0, 15.0, 29.0, 33.0, 59.0, 76.0, 125.0, 179.0, 269.0, 409.0, 585.0, 809.0, 1242.0, 1861.0, 2744.0, 4067.0, 6240.0, 9404.0, 14470.0, 22590.0, 35200.0, 55854.0, 86912.0, 130051.0, 1151383.0, 224499.0, 121943.0, 80864.0, 51733.0, 32740.0, 20881.0, 13555.0, 8735.0, 5825.0, 3841.0, 2577.0, 1708.0, 1107.0, 797.0, 559.0, 333.0, 256.0, 169.0, 124.0, 79.0, 56.0, 45.0, 28.0, 18.0, 15.0, 8.0, 5.0, 5.0, 4.0, 1.0, 2.0], "bins": [-0.413818359375, -0.4012451171875, -0.388671875, -0.3760986328125, -0.363525390625, -0.3509521484375, -0.33837890625, -0.3258056640625, -0.313232421875, -0.3006591796875, -0.2880859375, -0.2755126953125, -0.262939453125, -0.2503662109375, -0.23779296875, -0.2252197265625, -0.212646484375, -0.2000732421875, -0.1875, -0.1749267578125, -0.162353515625, -0.1497802734375, -0.13720703125, -0.1246337890625, -0.112060546875, -0.0994873046875, -0.0869140625, -0.0743408203125, -0.061767578125, -0.0491943359375, -0.03662109375, -0.0240478515625, -0.011474609375, 0.0010986328125, 0.013671875, 0.0262451171875, 0.038818359375, 0.0513916015625, 0.06396484375, 0.0765380859375, 0.089111328125, 0.1016845703125, 0.1142578125, 0.1268310546875, 0.139404296875, 0.1519775390625, 0.16455078125, 0.1771240234375, 0.189697265625, 0.2022705078125, 0.21484375, 0.2274169921875, 0.239990234375, 0.2525634765625, 0.26513671875, 0.2777099609375, 0.290283203125, 0.3028564453125, 0.3154296875, 0.3280029296875, 0.340576171875, 0.3531494140625, 0.36572265625, 0.3782958984375, 0.390869140625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 1.0, 1.0, 2.0, 1.0, 0.0, 7.0, 5.0, 6.0, 10.0, 5.0, 17.0, 17.0, 16.0, 21.0, 23.0, 28.0, 30.0, 32.0, 43.0, 38.0, 53.0, 57.0, 60.0, 54.0, 57.0, 58.0, 45.0, 52.0, 34.0, 41.0, 28.0, 35.0, 19.0, 19.0, 15.0, 14.0, 4.0, 14.0, 4.0, 10.0, 6.0, 5.0, 5.0, 6.0, 3.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0], "bins": [-0.0038471221923828125, -0.003740847110748291, -0.0036345720291137695, -0.003528296947479248, -0.0034220218658447266, -0.003315746784210205, -0.0032094717025756836, -0.003103196620941162, -0.0029969215393066406, -0.002890646457672119, -0.0027843713760375977, -0.002678096294403076, -0.0025718212127685547, -0.002465546131134033, -0.0023592710494995117, -0.0022529959678649902, -0.0021467208862304688, -0.0020404458045959473, -0.0019341707229614258, -0.0018278956413269043, -0.0017216205596923828, -0.0016153454780578613, -0.0015090703964233398, -0.0014027953147888184, -0.0012965202331542969, -0.0011902451515197754, -0.001083970069885254, -0.0009776949882507324, -0.0008714199066162109, -0.0007651448249816895, -0.000658869743347168, -0.0005525946617126465, -0.000446319580078125, -0.0003400444984436035, -0.00023376941680908203, -0.00012749433517456055, -2.1219253540039062e-05, 8.505582809448242e-05, 0.0001913309097290039, 0.0002976059913635254, 0.0004038810729980469, 0.0005101561546325684, 0.0006164312362670898, 0.0007227063179016113, 0.0008289813995361328, 0.0009352564811706543, 0.0010415315628051758, 0.0011478066444396973, 0.0012540817260742188, 0.0013603568077087402, 0.0014666318893432617, 0.0015729069709777832, 0.0016791820526123047, 0.0017854571342468262, 0.0018917322158813477, 0.001998007297515869, 0.0021042823791503906, 0.002210557460784912, 0.0023168325424194336, 0.002423107624053955, 0.0025293827056884766, 0.002635657787322998, 0.0027419328689575195, 0.002848207950592041, 0.0029544830322265625]}, "gradients/decoder.transformer.h.23.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 7.0, 2.0, 4.0, 4.0, 5.0, 4.0, 11.0, 13.0, 10.0, 13.0, 17.0, 17.0, 26.0, 40.0, 40.0, 70.0, 77.0, 107.0, 124.0, 170.0, 242.0, 324.0, 600.0, 19736.0, 1023575.0, 1687.0, 425.0, 283.0, 209.0, 154.0, 136.0, 95.0, 72.0, 62.0, 40.0, 25.0, 37.0, 29.0, 12.0, 19.0, 12.0, 10.0, 4.0, 5.0, 4.0, 0.0, 4.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.06866455078125, -0.06639766693115234, -0.06413078308105469, -0.06186389923095703, -0.059597015380859375, -0.05733013153076172, -0.05506324768066406, -0.052796363830566406, -0.05052947998046875, -0.048262596130371094, -0.04599571228027344, -0.04372882843017578, -0.041461944580078125, -0.03919506072998047, -0.03692817687988281, -0.034661293029785156, -0.0323944091796875, -0.030127525329589844, -0.027860641479492188, -0.02559375762939453, -0.023326873779296875, -0.02105998992919922, -0.018793106079101562, -0.016526222229003906, -0.01425933837890625, -0.011992454528808594, -0.009725570678710938, -0.007458686828613281, -0.005191802978515625, -0.0029249191284179688, -0.0006580352783203125, 0.0016088485717773438, 0.003875732421875, 0.006142616271972656, 0.008409500122070312, 0.010676383972167969, 0.012943267822265625, 0.015210151672363281, 0.017477035522460938, 0.019743919372558594, 0.02201080322265625, 0.024277687072753906, 0.026544570922851562, 0.02881145477294922, 0.031078338623046875, 0.03334522247314453, 0.03561210632324219, 0.037878990173339844, 0.0401458740234375, 0.042412757873535156, 0.04467964172363281, 0.04694652557373047, 0.049213409423828125, 0.05148029327392578, 0.05374717712402344, 0.056014060974121094, 0.05828094482421875, 0.060547828674316406, 0.06281471252441406, 0.06508159637451172, 0.06734848022460938, 0.06961536407470703, 0.07188224792480469, 0.07414913177490234, 0.076416015625]}, "gradients/decoder.transformer.h.23.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 32.0, 734.0, 243.0, 7.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008459459990262985, -0.008007566444575787, -0.007555673830211163, -0.007103780750185251, -0.00665188767015934, -0.006199994124472141, -0.005748101510107517, -0.005296207964420319, -0.004844315350055695, -0.004392422270029783, -0.003940529190003872, -0.0034886361099779606, -0.0030367430299520493, -0.0025848497170954943, -0.002132956637069583, -0.0016810635570436716, -0.0012291702441871166, -0.0007772771641612053, -0.00032538402592763305, 0.0001265091123059392, 0.0005784021923318505, 0.0010302953887730837, 0.001482188468798995, 0.0019340815488249063, 0.0023859746288508177, 0.002837867708876729, 0.0032897607889026403, 0.0037416541017591953, 0.004193547181785107, 0.004645440261811018, 0.005097333341836929, 0.005549226421862841, 0.006001119501888752, 0.006453012581914663, 0.006904905661940575, 0.007356798741966486, 0.007808691821992397, 0.008260585367679596, 0.00871247798204422, 0.009164371527731419, 0.009616264142096043, 0.010068157687783241, 0.010520050302147865, 0.010971943847835064, 0.011423836462199688, 0.011875730007886887, 0.01232762262225151, 0.01277951616793871, 0.013231409713625908, 0.013683303259313107, 0.01413519587367773, 0.01458708941936493, 0.015038982033729553, 0.015490875579416752, 0.01594276912510395, 0.016394661739468575, 0.0168465543538332, 0.017298446968197823, 0.017750341445207596, 0.01820223405957222, 0.018654126673936844, 0.019106019288301468, 0.01955791376531124, 0.020009806379675865, 0.02046169899404049]}, "gradients/decoder.transformer.h.23.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 5.0, 3.0, 7.0, 6.0, 7.0, 10.0, 11.0, 16.0, 19.0, 38.0, 44.0, 38.0, 46.0, 44.0, 48.0, 69.0, 43.0, 37.0, 69.0, 62.0, 60.0, 51.0, 48.0, 34.0, 37.0, 32.0, 19.0, 17.0, 15.0, 19.0, 16.0, 8.0, 12.0, 8.0, 6.0, 6.0, 1.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0022068023681640625, -0.0021236399188637733, -0.002040477469563484, -0.001957315020263195, -0.0018741525709629059, -0.0017909901216626167, -0.0017078276723623276, -0.0016246652230620384, -0.0015415027737617493, -0.0014583403244614601, -0.001375177875161171, -0.0012920154258608818, -0.0012088529765605927, -0.0011256905272603035, -0.0010425280779600143, -0.0009593656286597252, -0.000876203179359436, -0.0007930407300591469, -0.0007098782807588577, -0.0006267158314585686, -0.0005435533821582794, -0.00046039093285799026, -0.0003772284835577011, -0.00029406603425741196, -0.0002109035849571228, -0.00012774113565683365, -4.4578686356544495e-05, 3.858376294374466e-05, 0.00012174621224403381, 0.00020490866154432297, 0.0002880711108446121, 0.0003712335601449013, 0.00045439600944519043, 0.0005375584587454796, 0.0006207209080457687, 0.0007038833573460579, 0.000787045806646347, 0.0008702082559466362, 0.0009533707052469254, 0.0010365331545472145, 0.0011196956038475037, 0.0012028580531477928, 0.001286020502448082, 0.0013691829517483711, 0.0014523454010486603, 0.0015355078503489494, 0.0016186702996492386, 0.0017018327489495277, 0.001784995198249817, 0.001868157647550106, 0.0019513200968503952, 0.0020344825461506844, 0.0021176449954509735, 0.0022008074447512627, 0.002283969894051552, 0.002367132343351841, 0.00245029479265213, 0.0025334572419524193, 0.0026166196912527084, 0.0026997821405529976, 0.0027829445898532867, 0.002866107039153576, 0.002949269488453865, 0.003032431937754154, 0.0031155943870544434]}, "gradients/decoder.transformer.h.23.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 5.0, 4.0, 5.0, 3.0, 18.0, 15.0, 12.0, 16.0, 24.0, 15.0, 24.0, 24.0, 32.0, 42.0, 31.0, 42.0, 38.0, 43.0, 47.0, 46.0, 47.0, 47.0, 52.0, 47.0, 47.0, 30.0, 42.0, 36.0, 29.0, 31.0, 14.0, 21.0, 11.0, 19.0, 9.0, 13.0, 9.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.01171875, -5.8240966796875, -5.636474609375, -5.4488525390625, -5.26123046875, -5.0736083984375, -4.885986328125, -4.6983642578125, -4.5107421875, -4.3231201171875, -4.135498046875, -3.9478759765625, -3.76025390625, -3.5726318359375, -3.385009765625, -3.1973876953125, -3.009765625, -2.8221435546875, -2.634521484375, -2.4468994140625, -2.25927734375, -2.0716552734375, -1.884033203125, -1.6964111328125, -1.5087890625, -1.3211669921875, -1.133544921875, -0.9459228515625, -0.75830078125, -0.5706787109375, -0.383056640625, -0.1954345703125, -0.0078125, 0.1798095703125, 0.367431640625, 0.5550537109375, 0.74267578125, 0.9302978515625, 1.117919921875, 1.3055419921875, 1.4931640625, 1.6807861328125, 1.868408203125, 2.0560302734375, 2.24365234375, 2.4312744140625, 2.618896484375, 2.8065185546875, 2.994140625, 3.1817626953125, 3.369384765625, 3.5570068359375, 3.74462890625, 3.9322509765625, 4.119873046875, 4.3074951171875, 4.4951171875, 4.6827392578125, 4.870361328125, 5.0579833984375, 5.24560546875, 5.4332275390625, 5.620849609375, 5.8084716796875, 5.99609375]}, "gradients/decoder.transformer.h.23.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 8.0, 3.0, 9.0, 3.0, 18.0, 27.0, 25.0, 43.0, 56.0, 82.0, 116.0, 123.0, 254.0, 315.0, 468.0, 659.0, 1012.0, 1552.0, 2386.0, 4162.0, 7265.0, 13891.0, 39581.0, 411770.0, 487690.0, 43170.0, 14710.0, 7457.0, 4322.0, 2549.0, 1562.0, 975.0, 712.0, 480.0, 306.0, 238.0, 166.0, 111.0, 72.0, 65.0, 47.0, 22.0, 27.0, 21.0, 13.0, 3.0, 9.0, 2.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-29.828125, -28.925048828125, -28.02197265625, -27.118896484375, -26.2158203125, -25.312744140625, -24.40966796875, -23.506591796875, -22.603515625, -21.700439453125, -20.79736328125, -19.894287109375, -18.9912109375, -18.088134765625, -17.18505859375, -16.281982421875, -15.37890625, -14.475830078125, -13.57275390625, -12.669677734375, -11.7666015625, -10.863525390625, -9.96044921875, -9.057373046875, -8.154296875, -7.251220703125, -6.34814453125, -5.445068359375, -4.5419921875, -3.638916015625, -2.73583984375, -1.832763671875, -0.9296875, -0.026611328125, 0.87646484375, 1.779541015625, 2.6826171875, 3.585693359375, 4.48876953125, 5.391845703125, 6.294921875, 7.197998046875, 8.10107421875, 9.004150390625, 9.9072265625, 10.810302734375, 11.71337890625, 12.616455078125, 13.51953125, 14.422607421875, 15.32568359375, 16.228759765625, 17.1318359375, 18.034912109375, 18.93798828125, 19.841064453125, 20.744140625, 21.647216796875, 22.55029296875, 23.453369140625, 24.3564453125, 25.259521484375, 26.16259765625, 27.065673828125, 27.96875]}, "gradients/decoder.transformer.h.23.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 2.0, 1.0, 3.0, 3.0, 2.0, 2.0, 7.0, 3.0, 7.0, 10.0, 8.0, 15.0, 12.0, 14.0, 21.0, 17.0, 19.0, 34.0, 38.0, 31.0, 58.0, 53.0, 62.0, 67.0, 124.0, 263.0, 1451.0, 200.0, 95.0, 62.0, 50.0, 52.0, 24.0, 32.0, 30.0, 30.0, 22.0, 20.0, 21.0, 22.0, 14.0, 10.0, 14.0, 9.0, 9.0, 7.0, 3.0, 1.0, 3.0, 2.0, 3.0, 1.0, 1.0], "bins": [-19.875, -19.3426513671875, -18.810302734375, -18.2779541015625, -17.74560546875, -17.2132568359375, -16.680908203125, -16.1485595703125, -15.6162109375, -15.0838623046875, -14.551513671875, -14.0191650390625, -13.48681640625, -12.9544677734375, -12.422119140625, -11.8897705078125, -11.357421875, -10.8250732421875, -10.292724609375, -9.7603759765625, -9.22802734375, -8.6956787109375, -8.163330078125, -7.6309814453125, -7.0986328125, -6.5662841796875, -6.033935546875, -5.5015869140625, -4.96923828125, -4.4368896484375, -3.904541015625, -3.3721923828125, -2.83984375, -2.3074951171875, -1.775146484375, -1.2427978515625, -0.71044921875, -0.1781005859375, 0.354248046875, 0.8865966796875, 1.4189453125, 1.9512939453125, 2.483642578125, 3.0159912109375, 3.54833984375, 4.0806884765625, 4.613037109375, 5.1453857421875, 5.677734375, 6.2100830078125, 6.742431640625, 7.2747802734375, 7.80712890625, 8.3394775390625, 8.871826171875, 9.4041748046875, 9.9365234375, 10.4688720703125, 11.001220703125, 11.5335693359375, 12.06591796875, 12.5982666015625, 13.130615234375, 13.6629638671875, 14.1953125]}, "gradients/decoder.transformer.h.23.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 2.0, 3.0, 6.0, 8.0, 8.0, 8.0, 11.0, 10.0, 14.0, 17.0, 11.0, 22.0, 23.0, 36.0, 25.0, 46.0, 46.0, 73.0, 127.0, 197.0, 734.0, 5952.0, 3027636.0, 108154.0, 1522.0, 417.0, 163.0, 117.0, 65.0, 45.0, 37.0, 34.0, 15.0, 20.0, 18.0, 15.0, 9.0, 10.0, 10.0, 10.0, 11.0, 9.0, 4.0, 3.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-58.875, -56.5888671875, -54.302734375, -52.0166015625, -49.73046875, -47.4443359375, -45.158203125, -42.8720703125, -40.5859375, -38.2998046875, -36.013671875, -33.7275390625, -31.44140625, -29.1552734375, -26.869140625, -24.5830078125, -22.296875, -20.0107421875, -17.724609375, -15.4384765625, -13.15234375, -10.8662109375, -8.580078125, -6.2939453125, -4.0078125, -1.7216796875, 0.564453125, 2.8505859375, 5.13671875, 7.4228515625, 9.708984375, 11.9951171875, 14.28125, 16.5673828125, 18.853515625, 21.1396484375, 23.42578125, 25.7119140625, 27.998046875, 30.2841796875, 32.5703125, 34.8564453125, 37.142578125, 39.4287109375, 41.71484375, 44.0009765625, 46.287109375, 48.5732421875, 50.859375, 53.1455078125, 55.431640625, 57.7177734375, 60.00390625, 62.2900390625, 64.576171875, 66.8623046875, 69.1484375, 71.4345703125, 73.720703125, 76.0068359375, 78.29296875, 80.5791015625, 82.865234375, 85.1513671875, 87.4375]}, "gradients/decoder.transformer.h.23.ln_1.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 117.0, 804.0, 88.0, 6.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-164.1995391845703, -158.19998168945312, -152.20042419433594, -146.20086669921875, -140.20130920410156, -134.20175170898438, -128.20220947265625, -122.20264434814453, -116.20308685302734, -110.20352935791016, -104.20397186279297, -98.20442199707031, -92.20486450195312, -86.20530700683594, -80.20574951171875, -74.20619201660156, -68.20663452148438, -62.20707702636719, -56.20751953125, -50.20796585083008, -44.20840835571289, -38.2088508605957, -32.20929718017578, -26.209739685058594, -20.210182189941406, -14.210625648498535, -8.211069107055664, -2.2115135192871094, 3.788043975830078, 9.787601470947266, 15.787155151367188, 21.786712646484375, 27.7862548828125, 33.78581237792969, 39.785369873046875, 45.7849235534668, 51.784481048583984, 57.78403854370117, 63.783592224121094, 69.78314971923828, 75.78270721435547, 81.78226470947266, 87.78182220458984, 93.7813720703125, 99.78092956542969, 105.78048706054688, 111.78004455566406, 117.77960205078125, 123.77915954589844, 129.77871704101562, 135.7782745361328, 141.77783203125, 147.7773895263672, 153.77694702148438, 159.7764892578125, 165.77606201171875, 171.77560424804688, 177.77516174316406, 183.77471923828125, 189.77427673339844, 195.77383422851562, 201.7733917236328, 207.77294921875, 213.77249145507812, 219.77206420898438]}, "gradients/decoder.transformer.h.23.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 2.0, 6.0, 5.0, 7.0, 8.0, 11.0, 15.0, 14.0, 14.0, 27.0, 25.0, 24.0, 20.0, 30.0, 32.0, 30.0, 38.0, 24.0, 44.0, 44.0, 47.0, 50.0, 57.0, 52.0, 42.0, 48.0, 33.0, 28.0, 30.0, 30.0, 30.0, 28.0, 25.0, 24.0, 17.0, 10.0, 12.0, 7.0, 6.0, 5.0, 1.0, 5.0, 2.0, 1.0, 2.0, 2.0], "bins": [-68.90167999267578, -67.07246398925781, -65.24324798583984, -63.41402816772461, -61.584808349609375, -59.755592346191406, -57.92637634277344, -56.09716033935547, -54.267940521240234, -52.438724517822266, -50.60950469970703, -48.78028869628906, -46.951072692871094, -45.12185287475586, -43.29263687133789, -41.463417053222656, -39.63420104980469, -37.80498504638672, -35.975765228271484, -34.146549224853516, -32.31732940673828, -30.488113403320312, -28.658897399902344, -26.829679489135742, -25.00046157836914, -23.17124366760254, -21.342025756835938, -19.51280975341797, -17.683591842651367, -15.854373931884766, -14.02515697479248, -12.195940017700195, -10.366722106933594, -8.537504196166992, -6.708287239074707, -4.879069805145264, -3.0498523712158203, -1.2206344604492188, 0.6085824966430664, 2.4377994537353516, 4.267017364501953, 6.0962347984313965, 7.92545223236084, 9.754669189453125, 11.583887100219727, 13.413105010986328, 15.242321968078613, 17.0715389251709, 18.9007568359375, 20.7299747467041, 22.559192657470703, 24.388408660888672, 26.217626571655273, 28.046844482421875, 29.876060485839844, 31.705278396606445, 33.53449630737305, 35.363712310791016, 37.19293212890625, 39.02214813232422, 40.85136413574219, 42.68058395385742, 44.50979995727539, 46.339019775390625, 48.168235778808594]}, "gradients/decoder.transformer.h.22.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 6.0, 7.0, 8.0, 14.0, 9.0, 18.0, 19.0, 15.0, 22.0, 12.0, 17.0, 27.0, 39.0, 30.0, 25.0, 37.0, 39.0, 47.0, 49.0, 46.0, 43.0, 39.0, 46.0, 48.0, 45.0, 33.0, 41.0, 27.0, 37.0, 26.0, 28.0, 14.0, 16.0, 13.0, 11.0, 12.0, 13.0, 5.0, 7.0, 4.0, 3.0, 4.0, 3.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-5.8359375, -5.64849853515625, -5.4610595703125, -5.27362060546875, -5.086181640625, -4.89874267578125, -4.7113037109375, -4.52386474609375, -4.33642578125, -4.14898681640625, -3.9615478515625, -3.77410888671875, -3.586669921875, -3.39923095703125, -3.2117919921875, -3.02435302734375, -2.8369140625, -2.64947509765625, -2.4620361328125, -2.27459716796875, -2.087158203125, -1.89971923828125, -1.7122802734375, -1.52484130859375, -1.33740234375, -1.14996337890625, -0.9625244140625, -0.77508544921875, -0.587646484375, -0.40020751953125, -0.2127685546875, -0.02532958984375, 0.162109375, 0.34954833984375, 0.5369873046875, 0.72442626953125, 0.911865234375, 1.09930419921875, 1.2867431640625, 1.47418212890625, 1.66162109375, 1.84906005859375, 2.0364990234375, 2.22393798828125, 2.411376953125, 2.59881591796875, 2.7862548828125, 2.97369384765625, 3.1611328125, 3.34857177734375, 3.5360107421875, 3.72344970703125, 3.910888671875, 4.09832763671875, 4.2857666015625, 4.47320556640625, 4.66064453125, 4.84808349609375, 5.0355224609375, 5.22296142578125, 5.410400390625, 5.59783935546875, 5.7852783203125, 5.97271728515625, 6.16015625]}, "gradients/decoder.transformer.h.22.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 5.0, 1.0, 7.0, 11.0, 17.0, 22.0, 28.0, 18.0, 51.0, 61.0, 71.0, 153.0, 202.0, 311.0, 511.0, 983.0, 2141.0, 5165.0, 16270.0, 80013.0, 1317085.0, 2604971.0, 132096.0, 22108.0, 6581.0, 2589.0, 1198.0, 608.0, 335.0, 202.0, 142.0, 95.0, 62.0, 53.0, 32.0, 18.0, 20.0, 18.0, 10.0, 7.0, 7.0, 5.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-30.03125, -29.0, -27.96875, -26.9375, -25.90625, -24.875, -23.84375, -22.8125, -21.78125, -20.75, -19.71875, -18.6875, -17.65625, -16.625, -15.59375, -14.5625, -13.53125, -12.5, -11.46875, -10.4375, -9.40625, -8.375, -7.34375, -6.3125, -5.28125, -4.25, -3.21875, -2.1875, -1.15625, -0.125, 0.90625, 1.9375, 2.96875, 4.0, 5.03125, 6.0625, 7.09375, 8.125, 9.15625, 10.1875, 11.21875, 12.25, 13.28125, 14.3125, 15.34375, 16.375, 17.40625, 18.4375, 19.46875, 20.5, 21.53125, 22.5625, 23.59375, 24.625, 25.65625, 26.6875, 27.71875, 28.75, 29.78125, 30.8125, 31.84375, 32.875, 33.90625, 34.9375, 35.96875]}, "gradients/decoder.transformer.h.22.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 3.0, 5.0, 5.0, 7.0, 16.0, 17.0, 20.0, 41.0, 41.0, 66.0, 116.0, 156.0, 234.0, 361.0, 473.0, 688.0, 579.0, 353.0, 291.0, 181.0, 113.0, 113.0, 61.0, 44.0, 31.0, 21.0, 15.0, 15.0, 11.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.21875, -34.283203125, -33.34765625, -32.412109375, -31.4765625, -30.541015625, -29.60546875, -28.669921875, -27.734375, -26.798828125, -25.86328125, -24.927734375, -23.9921875, -23.056640625, -22.12109375, -21.185546875, -20.25, -19.314453125, -18.37890625, -17.443359375, -16.5078125, -15.572265625, -14.63671875, -13.701171875, -12.765625, -11.830078125, -10.89453125, -9.958984375, -9.0234375, -8.087890625, -7.15234375, -6.216796875, -5.28125, -4.345703125, -3.41015625, -2.474609375, -1.5390625, -0.603515625, 0.33203125, 1.267578125, 2.203125, 3.138671875, 4.07421875, 5.009765625, 5.9453125, 6.880859375, 7.81640625, 8.751953125, 9.6875, 10.623046875, 11.55859375, 12.494140625, 13.4296875, 14.365234375, 15.30078125, 16.236328125, 17.171875, 18.107421875, 19.04296875, 19.978515625, 20.9140625, 21.849609375, 22.78515625, 23.720703125, 24.65625]}, "gradients/decoder.transformer.h.22.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 9.0, 8.0, 11.0, 21.0, 26.0, 27.0, 57.0, 95.0, 122.0, 221.0, 578.0, 3514.0, 1549447.0, 2634858.0, 4157.0, 596.0, 189.0, 126.0, 74.0, 42.0, 37.0, 23.0, 14.0, 12.0, 9.0, 3.0, 1.0, 4.0, 3.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-96.4375, -92.0595703125, -87.681640625, -83.3037109375, -78.92578125, -74.5478515625, -70.169921875, -65.7919921875, -61.4140625, -57.0361328125, -52.658203125, -48.2802734375, -43.90234375, -39.5244140625, -35.146484375, -30.7685546875, -26.390625, -22.0126953125, -17.634765625, -13.2568359375, -8.87890625, -4.5009765625, -0.123046875, 4.2548828125, 8.6328125, 13.0107421875, 17.388671875, 21.7666015625, 26.14453125, 30.5224609375, 34.900390625, 39.2783203125, 43.65625, 48.0341796875, 52.412109375, 56.7900390625, 61.16796875, 65.5458984375, 69.923828125, 74.3017578125, 78.6796875, 83.0576171875, 87.435546875, 91.8134765625, 96.19140625, 100.5693359375, 104.947265625, 109.3251953125, 113.703125, 118.0810546875, 122.458984375, 126.8369140625, 131.21484375, 135.5927734375, 139.970703125, 144.3486328125, 148.7265625, 153.1044921875, 157.482421875, 161.8603515625, 166.23828125, 170.6162109375, 174.994140625, 179.3720703125, 183.75]}, "gradients/decoder.transformer.h.22.ln_2.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 21.0, 404.0, 560.0, 31.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-138.68788146972656, -123.40946197509766, -108.13104248046875, -92.85263061523438, -77.57421112060547, -62.29579162597656, -47.01737976074219, -31.73896026611328, -16.460540771484375, -1.1821231842041016, 14.096294403076172, 29.374710083007812, 44.65312957763672, 59.931549072265625, 75.2099609375, 90.4883804321289, 105.76679992675781, 121.04521942138672, 136.32363891601562, 151.60205078125, 166.88046264648438, 182.1588897705078, 197.4373016357422, 212.71572875976562, 227.994140625, 243.27255249023438, 258.55096435546875, 273.82940673828125, 289.1078186035156, 304.38623046875, 319.6646423339844, 334.94305419921875, 350.22149658203125, 365.4999084472656, 380.7783203125, 396.0567626953125, 411.3351745605469, 426.61358642578125, 441.8919982910156, 457.17041015625, 472.4488525390625, 487.7272644042969, 503.00567626953125, 518.2841186523438, 533.5625, 548.8409423828125, 564.119384765625, 579.3977661132812, 594.6761474609375, 609.95458984375, 625.2329711914062, 640.5114135742188, 655.789794921875, 671.0682373046875, 686.3466796875, 701.6250610351562, 716.9035034179688, 732.1819458007812, 747.4603271484375, 762.73876953125, 778.0171508789062, 793.2955932617188, 808.573974609375, 823.8524169921875, 839.130859375]}, "gradients/decoder.transformer.h.22.ln_2.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 5.0, 4.0, 6.0, 4.0, 7.0, 6.0, 13.0, 12.0, 13.0, 11.0, 7.0, 24.0, 26.0, 20.0, 28.0, 25.0, 27.0, 27.0, 45.0, 46.0, 43.0, 38.0, 41.0, 43.0, 44.0, 36.0, 42.0, 33.0, 32.0, 35.0, 32.0, 34.0, 20.0, 32.0, 29.0, 17.0, 12.0, 23.0, 15.0, 8.0, 9.0, 15.0, 6.0, 6.0, 4.0, 3.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.233245849609375, -60.78960418701172, -58.3459587097168, -55.902313232421875, -53.45867156982422, -51.01502990722656, -48.57138442993164, -46.12773895263672, -43.68409729003906, -41.240455627441406, -38.796810150146484, -36.35316467285156, -33.909523010253906, -31.465879440307617, -29.022235870361328, -26.57859230041504, -24.13494873046875, -21.69130516052246, -19.247661590576172, -16.804018020629883, -14.360374450683594, -11.916730880737305, -9.473087310791016, -7.029443740844727, -4.5858001708984375, -2.1421566009521484, 0.3014869689941406, 2.7451305389404297, 5.188774108886719, 7.632417678833008, 10.076061248779297, 12.519704818725586, 14.963340759277344, 17.406984329223633, 19.850627899169922, 22.29427146911621, 24.7379150390625, 27.18155860900879, 29.625202178955078, 32.06884765625, 34.512489318847656, 36.95613098144531, 39.399776458740234, 41.843421936035156, 44.28706359863281, 46.73070526123047, 49.17435073852539, 51.61799621582031, 54.06163787841797, 56.505279541015625, 58.94892501831055, 61.39257049560547, 63.836212158203125, 66.27985382080078, 68.72349548339844, 71.16714477539062, 73.61078643798828, 76.05442810058594, 78.49807739257812, 80.94171905517578, 83.38536071777344, 85.8290023803711, 88.27264404296875, 90.71629333496094, 93.1599349975586]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 7.0, 6.0, 11.0, 14.0, 18.0, 12.0, 21.0, 18.0, 20.0, 21.0, 19.0, 39.0, 37.0, 33.0, 43.0, 37.0, 34.0, 50.0, 38.0, 47.0, 32.0, 49.0, 50.0, 43.0, 47.0, 26.0, 19.0, 33.0, 23.0, 26.0, 19.0, 19.0, 19.0, 10.0, 15.0, 15.0, 4.0, 7.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.38671875, -5.20037841796875, -5.0140380859375, -4.82769775390625, -4.641357421875, -4.45501708984375, -4.2686767578125, -4.08233642578125, -3.89599609375, -3.70965576171875, -3.5233154296875, -3.33697509765625, -3.150634765625, -2.96429443359375, -2.7779541015625, -2.59161376953125, -2.4052734375, -2.21893310546875, -2.0325927734375, -1.84625244140625, -1.659912109375, -1.47357177734375, -1.2872314453125, -1.10089111328125, -0.91455078125, -0.72821044921875, -0.5418701171875, -0.35552978515625, -0.169189453125, 0.01715087890625, 0.2034912109375, 0.38983154296875, 0.576171875, 0.76251220703125, 0.9488525390625, 1.13519287109375, 1.321533203125, 1.50787353515625, 1.6942138671875, 1.88055419921875, 2.06689453125, 2.25323486328125, 2.4395751953125, 2.62591552734375, 2.812255859375, 2.99859619140625, 3.1849365234375, 3.37127685546875, 3.5576171875, 3.74395751953125, 3.9302978515625, 4.11663818359375, 4.302978515625, 4.48931884765625, 4.6756591796875, 4.86199951171875, 5.04833984375, 5.23468017578125, 5.4210205078125, 5.60736083984375, 5.793701171875, 5.98004150390625, 6.1663818359375, 6.35272216796875, 6.5390625]}, "gradients/decoder.transformer.h.22.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 14.0, 18.0, 22.0, 49.0, 58.0, 106.0, 144.0, 250.0, 429.0, 702.0, 1194.0, 2019.0, 3436.0, 6085.0, 10724.0, 19196.0, 35926.0, 69395.0, 140188.0, 266508.0, 239260.0, 121918.0, 59653.0, 31569.0, 17081.0, 9604.0, 5370.0, 3041.0, 1878.0, 1086.0, 631.0, 359.0, 213.0, 148.0, 92.0, 67.0, 44.0, 27.0, 14.0, 11.0, 5.0, 8.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.83935546875, -0.8103103637695312, -0.7812652587890625, -0.7522201538085938, -0.723175048828125, -0.6941299438476562, -0.6650848388671875, -0.6360397338867188, -0.60699462890625, -0.5779495239257812, -0.5489044189453125, -0.5198593139648438, -0.490814208984375, -0.46176910400390625, -0.4327239990234375, -0.40367889404296875, -0.3746337890625, -0.34558868408203125, -0.3165435791015625, -0.28749847412109375, -0.258453369140625, -0.22940826416015625, -0.2003631591796875, -0.17131805419921875, -0.14227294921875, -0.11322784423828125, -0.0841827392578125, -0.05513763427734375, -0.026092529296875, 0.00295257568359375, 0.0319976806640625, 0.06104278564453125, 0.090087890625, 0.11913299560546875, 0.1481781005859375, 0.17722320556640625, 0.206268310546875, 0.23531341552734375, 0.2643585205078125, 0.29340362548828125, 0.32244873046875, 0.35149383544921875, 0.3805389404296875, 0.40958404541015625, 0.438629150390625, 0.46767425537109375, 0.4967193603515625, 0.5257644653320312, 0.5548095703125, 0.5838546752929688, 0.6128997802734375, 0.6419448852539062, 0.670989990234375, 0.7000350952148438, 0.7290802001953125, 0.7581253051757812, 0.78717041015625, 0.8162155151367188, 0.8452606201171875, 0.8743057250976562, 0.903350830078125, 0.9323959350585938, 0.9614410400390625, 0.9904861450195312, 1.01953125]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 2.0, 9.0, 9.0, 6.0, 6.0, 10.0, 11.0, 11.0, 15.0, 16.0, 22.0, 19.0, 24.0, 37.0, 30.0, 34.0, 35.0, 36.0, 41.0, 47.0, 45.0, 40.0, 1067.0, 35.0, 44.0, 32.0, 33.0, 30.0, 37.0, 34.0, 29.0, 25.0, 29.0, 13.0, 20.0, 24.0, 12.0, 13.0, 12.0, 10.0, 4.0, 7.0, 6.0, 3.0, 2.0, 6.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.712890625, -3.59832763671875, -3.4837646484375, -3.36920166015625, -3.254638671875, -3.14007568359375, -3.0255126953125, -2.91094970703125, -2.79638671875, -2.68182373046875, -2.5672607421875, -2.45269775390625, -2.338134765625, -2.22357177734375, -2.1090087890625, -1.99444580078125, -1.8798828125, -1.76531982421875, -1.6507568359375, -1.53619384765625, -1.421630859375, -1.30706787109375, -1.1925048828125, -1.07794189453125, -0.96337890625, -0.84881591796875, -0.7342529296875, -0.61968994140625, -0.505126953125, -0.39056396484375, -0.2760009765625, -0.16143798828125, -0.046875, 0.06768798828125, 0.1822509765625, 0.29681396484375, 0.411376953125, 0.52593994140625, 0.6405029296875, 0.75506591796875, 0.86962890625, 0.98419189453125, 1.0987548828125, 1.21331787109375, 1.327880859375, 1.44244384765625, 1.5570068359375, 1.67156982421875, 1.7861328125, 1.90069580078125, 2.0152587890625, 2.12982177734375, 2.244384765625, 2.35894775390625, 2.4735107421875, 2.58807373046875, 2.70263671875, 2.81719970703125, 2.9317626953125, 3.04632568359375, 3.160888671875, 3.27545166015625, 3.3900146484375, 3.50457763671875, 3.619140625]}, "gradients/decoder.transformer.h.22.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 3.0, 7.0, 13.0, 13.0, 24.0, 34.0, 50.0, 84.0, 126.0, 176.0, 247.0, 314.0, 463.0, 687.0, 1034.0, 1365.0, 2007.0, 3059.0, 4324.0, 6586.0, 9809.0, 14620.0, 21944.0, 33136.0, 50023.0, 75197.0, 110131.0, 149738.0, 1201783.0, 131336.0, 92319.0, 61921.0, 41293.0, 27412.0, 18146.0, 12210.0, 8093.0, 5433.0, 3718.0, 2583.0, 1777.0, 1202.0, 855.0, 583.0, 400.0, 272.0, 177.0, 130.0, 100.0, 65.0, 41.0, 29.0, 19.0, 10.0, 17.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.39599609375, -0.383331298828125, -0.37066650390625, -0.358001708984375, -0.3453369140625, -0.332672119140625, -0.32000732421875, -0.307342529296875, -0.294677734375, -0.282012939453125, -0.26934814453125, -0.256683349609375, -0.2440185546875, -0.231353759765625, -0.21868896484375, -0.206024169921875, -0.193359375, -0.180694580078125, -0.16802978515625, -0.155364990234375, -0.1427001953125, -0.130035400390625, -0.11737060546875, -0.104705810546875, -0.092041015625, -0.079376220703125, -0.06671142578125, -0.054046630859375, -0.0413818359375, -0.028717041015625, -0.01605224609375, -0.003387451171875, 0.00927734375, 0.021942138671875, 0.03460693359375, 0.047271728515625, 0.0599365234375, 0.072601318359375, 0.08526611328125, 0.097930908203125, 0.110595703125, 0.123260498046875, 0.13592529296875, 0.148590087890625, 0.1612548828125, 0.173919677734375, 0.18658447265625, 0.199249267578125, 0.2119140625, 0.224578857421875, 0.23724365234375, 0.249908447265625, 0.2625732421875, 0.275238037109375, 0.28790283203125, 0.300567626953125, 0.313232421875, 0.325897216796875, 0.33856201171875, 0.351226806640625, 0.3638916015625, 0.376556396484375, 0.38922119140625, 0.401885986328125, 0.41455078125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 4.0, 2.0, 5.0, 4.0, 9.0, 10.0, 11.0, 18.0, 15.0, 16.0, 22.0, 29.0, 26.0, 36.0, 50.0, 62.0, 55.0, 78.0, 78.0, 89.0, 70.0, 69.0, 42.0, 52.0, 26.0, 27.0, 18.0, 20.0, 20.0, 12.0, 8.0, 6.0, 10.0, 3.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004657745361328125, -0.004519641399383545, -0.004381537437438965, -0.004243433475494385, -0.004105329513549805, -0.003967225551605225, -0.0038291215896606445, -0.0036910176277160645, -0.0035529136657714844, -0.0034148097038269043, -0.0032767057418823242, -0.003138601779937744, -0.003000497817993164, -0.002862393856048584, -0.002724289894104004, -0.002586185932159424, -0.0024480819702148438, -0.0023099780082702637, -0.0021718740463256836, -0.0020337700843811035, -0.0018956661224365234, -0.0017575621604919434, -0.0016194581985473633, -0.0014813542366027832, -0.0013432502746582031, -0.001205146312713623, -0.001067042350769043, -0.0009289383888244629, -0.0007908344268798828, -0.0006527304649353027, -0.0005146265029907227, -0.0003765225410461426, -0.0002384185791015625, -0.00010031461715698242, 3.7789344787597656e-05, 0.00017589330673217773, 0.0003139972686767578, 0.0004521012306213379, 0.000590205192565918, 0.000728309154510498, 0.0008664131164550781, 0.0010045170783996582, 0.0011426210403442383, 0.0012807250022888184, 0.0014188289642333984, 0.0015569329261779785, 0.0016950368881225586, 0.0018331408500671387, 0.0019712448120117188, 0.002109348773956299, 0.002247452735900879, 0.002385556697845459, 0.002523660659790039, 0.002661764621734619, 0.0027998685836791992, 0.0029379725456237793, 0.0030760765075683594, 0.0032141804695129395, 0.0033522844314575195, 0.0034903883934020996, 0.0036284923553466797, 0.0037665963172912598, 0.00390470027923584, 0.00404280424118042, 0.004180908203125]}, "gradients/decoder.transformer.h.22.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 4.0, 5.0, 9.0, 9.0, 8.0, 11.0, 13.0, 28.0, 23.0, 41.0, 47.0, 62.0, 73.0, 124.0, 215.0, 387.0, 1179.0, 997044.0, 47758.0, 645.0, 286.0, 153.0, 105.0, 85.0, 46.0, 42.0, 27.0, 23.0, 25.0, 12.0, 14.0, 10.0, 8.0, 8.0, 13.0, 2.0, 5.0, 4.0, 3.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0906982421875, -0.08765506744384766, -0.08461189270019531, -0.08156871795654297, -0.07852554321289062, -0.07548236846923828, -0.07243919372558594, -0.0693960189819336, -0.06635284423828125, -0.0633096694946289, -0.06026649475097656, -0.05722332000732422, -0.054180145263671875, -0.05113697052001953, -0.04809379577636719, -0.045050621032714844, -0.0420074462890625, -0.038964271545410156, -0.03592109680175781, -0.03287792205810547, -0.029834747314453125, -0.02679157257080078, -0.023748397827148438, -0.020705223083496094, -0.01766204833984375, -0.014618873596191406, -0.011575698852539062, -0.008532524108886719, -0.005489349365234375, -0.0024461746215820312, 0.0005970001220703125, 0.0036401748657226562, 0.006683349609375, 0.009726524353027344, 0.012769699096679688, 0.01581287384033203, 0.018856048583984375, 0.02189922332763672, 0.024942398071289062, 0.027985572814941406, 0.03102874755859375, 0.034071922302246094, 0.03711509704589844, 0.04015827178955078, 0.043201446533203125, 0.04624462127685547, 0.04928779602050781, 0.052330970764160156, 0.0553741455078125, 0.058417320251464844, 0.06146049499511719, 0.06450366973876953, 0.06754684448242188, 0.07059001922607422, 0.07363319396972656, 0.0766763687133789, 0.07971954345703125, 0.0827627182006836, 0.08580589294433594, 0.08884906768798828, 0.09189224243164062, 0.09493541717529297, 0.09797859191894531, 0.10102176666259766, 0.10406494140625]}, "gradients/decoder.transformer.h.22.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 342.0, 675.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0869641825556755, -0.08535484969615936, -0.08374552428722382, -0.08213619142770767, -0.08052685856819153, -0.07891753315925598, -0.07730820029973984, -0.0756988674402237, -0.07408954203128815, -0.072480209171772, -0.07087088376283646, -0.06926155090332031, -0.06765221804380417, -0.06604289263486862, -0.06443355977535248, -0.06282422691583633, -0.06121489778161049, -0.059605568647384644, -0.0579962357878685, -0.056386906653642654, -0.05477757751941681, -0.053168244659900665, -0.05155891552567482, -0.049949586391448975, -0.04834025353193283, -0.046730924397706985, -0.04512159153819084, -0.043512262403964996, -0.04190293326973915, -0.040293604135513306, -0.03868427127599716, -0.037074942141771317, -0.03546561300754547, -0.033856283873319626, -0.03224695101380348, -0.030637621879577637, -0.02902829274535179, -0.027418961748480797, -0.025809630751609802, -0.024200301617383957, -0.022590970620512962, -0.020981639623641968, -0.019372310489416122, -0.017762979492545128, -0.016153648495674133, -0.014544319361448288, -0.012934988364577293, -0.011325658299028873, -0.009716328233480453, -0.008106998167932034, -0.006497667636722326, -0.004888337105512619, -0.003279007039964199, -0.0016696769744157791, -6.0345977544784546e-05, 0.0015489840880036354, 0.0031583141535520554, 0.004767644219100475, 0.006376974750310183, 0.00798630528151989, 0.00959563534706831, 0.01120496541261673, 0.012814296409487724, 0.014423626475036144, 0.016032956540584564]}, "gradients/decoder.transformer.h.22.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 2.0, 4.0, 2.0, 3.0, 4.0, 7.0, 8.0, 14.0, 19.0, 15.0, 23.0, 27.0, 32.0, 25.0, 43.0, 26.0, 59.0, 38.0, 61.0, 60.0, 46.0, 44.0, 49.0, 51.0, 57.0, 43.0, 34.0, 37.0, 42.0, 24.0, 24.0, 25.0, 17.0, 12.0, 8.0, 10.0, 5.0, 3.0, 5.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0019191503524780273, -0.0018393006175756454, -0.0017594508826732635, -0.0016796011477708817, -0.0015997514128684998, -0.0015199016779661179, -0.001440051943063736, -0.001360202208161354, -0.0012803524732589722, -0.0012005027383565903, -0.0011206530034542084, -0.0010408032685518265, -0.0009609535336494446, -0.0008811037987470627, -0.0008012540638446808, -0.0007214043289422989, -0.000641554594039917, -0.0005617048591375351, -0.0004818551242351532, -0.0004020053893327713, -0.0003221556544303894, -0.0002423059195280075, -0.0001624561846256256, -8.260644972324371e-05, -2.7567148208618164e-06, 7.709302008152008e-05, 0.00015694275498390198, 0.00023679248988628387, 0.00031664222478866577, 0.00039649195969104767, 0.00047634169459342957, 0.0005561914294958115, 0.0006360411643981934, 0.0007158908993005753, 0.0007957406342029572, 0.000875590369105339, 0.000955440104007721, 0.0010352898389101028, 0.0011151395738124847, 0.0011949893087148666, 0.0012748390436172485, 0.0013546887785196304, 0.0014345385134220123, 0.0015143882483243942, 0.0015942379832267761, 0.001674087718129158, 0.00175393745303154, 0.0018337871879339218, 0.0019136369228363037, 0.0019934866577386856, 0.0020733363926410675, 0.0021531861275434494, 0.0022330358624458313, 0.002312885597348213, 0.002392735332250595, 0.002472585067152977, 0.002552434802055359, 0.002632284536957741, 0.0027121342718601227, 0.0027919840067625046, 0.0028718337416648865, 0.0029516834765672684, 0.0030315332114696503, 0.003111382946372032, 0.003191232681274414]}, "gradients/decoder.transformer.h.22.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 5.0, 3.0, 8.0, 7.0, 6.0, 11.0, 14.0, 18.0, 12.0, 21.0, 18.0, 20.0, 21.0, 19.0, 39.0, 38.0, 32.0, 43.0, 37.0, 34.0, 50.0, 38.0, 47.0, 32.0, 49.0, 50.0, 43.0, 47.0, 26.0, 19.0, 33.0, 23.0, 26.0, 19.0, 19.0, 19.0, 10.0, 15.0, 15.0, 4.0, 7.0, 4.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.38671875, -5.20037841796875, -5.0140380859375, -4.82769775390625, -4.641357421875, -4.45501708984375, -4.2686767578125, -4.08233642578125, -3.89599609375, -3.70965576171875, -3.5233154296875, -3.33697509765625, -3.150634765625, -2.96429443359375, -2.7779541015625, -2.59161376953125, -2.4052734375, -2.21893310546875, -2.0325927734375, -1.84625244140625, -1.659912109375, -1.47357177734375, -1.2872314453125, -1.10089111328125, -0.91455078125, -0.72821044921875, -0.5418701171875, -0.35552978515625, -0.169189453125, 0.01715087890625, 0.2034912109375, 0.38983154296875, 0.576171875, 0.76251220703125, 0.9488525390625, 1.13519287109375, 1.321533203125, 1.50787353515625, 1.6942138671875, 1.88055419921875, 2.06689453125, 2.25323486328125, 2.4395751953125, 2.62591552734375, 2.812255859375, 2.99859619140625, 3.1849365234375, 3.37127685546875, 3.5576171875, 3.74395751953125, 3.9302978515625, 4.11663818359375, 4.302978515625, 4.48931884765625, 4.6756591796875, 4.86199951171875, 5.04833984375, 5.23468017578125, 5.4210205078125, 5.60736083984375, 5.793701171875, 5.98004150390625, 6.1663818359375, 6.35272216796875, 6.5390625]}, "gradients/decoder.transformer.h.22.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 4.0, 1.0, 4.0, 3.0, 9.0, 10.0, 16.0, 13.0, 28.0, 35.0, 53.0, 73.0, 75.0, 130.0, 175.0, 234.0, 387.0, 608.0, 1024.0, 2140.0, 4943.0, 12995.0, 41319.0, 154431.0, 498681.0, 238970.0, 60972.0, 18542.0, 6543.0, 2739.0, 1309.0, 733.0, 420.0, 283.0, 191.0, 152.0, 78.0, 81.0, 38.0, 35.0, 28.0, 18.0, 17.0, 6.0, 1.0, 10.0, 2.0, 6.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.72265625, -5.52294921875, -5.3232421875, -5.12353515625, -4.923828125, -4.72412109375, -4.5244140625, -4.32470703125, -4.125, -3.92529296875, -3.7255859375, -3.52587890625, -3.326171875, -3.12646484375, -2.9267578125, -2.72705078125, -2.52734375, -2.32763671875, -2.1279296875, -1.92822265625, -1.728515625, -1.52880859375, -1.3291015625, -1.12939453125, -0.9296875, -0.72998046875, -0.5302734375, -0.33056640625, -0.130859375, 0.06884765625, 0.2685546875, 0.46826171875, 0.66796875, 0.86767578125, 1.0673828125, 1.26708984375, 1.466796875, 1.66650390625, 1.8662109375, 2.06591796875, 2.265625, 2.46533203125, 2.6650390625, 2.86474609375, 3.064453125, 3.26416015625, 3.4638671875, 3.66357421875, 3.86328125, 4.06298828125, 4.2626953125, 4.46240234375, 4.662109375, 4.86181640625, 5.0615234375, 5.26123046875, 5.4609375, 5.66064453125, 5.8603515625, 6.06005859375, 6.259765625, 6.45947265625, 6.6591796875, 6.85888671875, 7.05859375]}, "gradients/decoder.transformer.h.22.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 4.0, 0.0, 8.0, 7.0, 5.0, 13.0, 10.0, 13.0, 14.0, 15.0, 16.0, 26.0, 31.0, 38.0, 37.0, 37.0, 35.0, 39.0, 58.0, 58.0, 107.0, 1599.0, 361.0, 112.0, 57.0, 49.0, 31.0, 45.0, 34.0, 37.0, 20.0, 19.0, 22.0, 17.0, 18.0, 16.0, 6.0, 12.0, 13.0, 5.0, 5.0, 5.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.96875, -22.269775390625, -21.57080078125, -20.871826171875, -20.1728515625, -19.473876953125, -18.77490234375, -18.075927734375, -17.376953125, -16.677978515625, -15.97900390625, -15.280029296875, -14.5810546875, -13.882080078125, -13.18310546875, -12.484130859375, -11.78515625, -11.086181640625, -10.38720703125, -9.688232421875, -8.9892578125, -8.290283203125, -7.59130859375, -6.892333984375, -6.193359375, -5.494384765625, -4.79541015625, -4.096435546875, -3.3974609375, -2.698486328125, -1.99951171875, -1.300537109375, -0.6015625, 0.097412109375, 0.79638671875, 1.495361328125, 2.1943359375, 2.893310546875, 3.59228515625, 4.291259765625, 4.990234375, 5.689208984375, 6.38818359375, 7.087158203125, 7.7861328125, 8.485107421875, 9.18408203125, 9.883056640625, 10.58203125, 11.281005859375, 11.97998046875, 12.678955078125, 13.3779296875, 14.076904296875, 14.77587890625, 15.474853515625, 16.173828125, 16.872802734375, 17.57177734375, 18.270751953125, 18.9697265625, 19.668701171875, 20.36767578125, 21.066650390625, 21.765625]}, "gradients/decoder.transformer.h.22.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 6.0, 8.0, 11.0, 8.0, 10.0, 17.0, 23.0, 20.0, 21.0, 17.0, 48.0, 43.0, 57.0, 80.0, 130.0, 255.0, 673.0, 3172.0, 2897352.0, 240679.0, 1871.0, 467.0, 224.0, 103.0, 86.0, 69.0, 46.0, 39.0, 40.0, 18.0, 21.0, 17.0, 12.0, 11.0, 13.0, 10.0, 8.0, 5.0, 5.0, 2.0, 2.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-47.375, -45.7890625, -44.203125, -42.6171875, -41.03125, -39.4453125, -37.859375, -36.2734375, -34.6875, -33.1015625, -31.515625, -29.9296875, -28.34375, -26.7578125, -25.171875, -23.5859375, -22.0, -20.4140625, -18.828125, -17.2421875, -15.65625, -14.0703125, -12.484375, -10.8984375, -9.3125, -7.7265625, -6.140625, -4.5546875, -2.96875, -1.3828125, 0.203125, 1.7890625, 3.375, 4.9609375, 6.546875, 8.1328125, 9.71875, 11.3046875, 12.890625, 14.4765625, 16.0625, 17.6484375, 19.234375, 20.8203125, 22.40625, 23.9921875, 25.578125, 27.1640625, 28.75, 30.3359375, 31.921875, 33.5078125, 35.09375, 36.6796875, 38.265625, 39.8515625, 41.4375, 43.0234375, 44.609375, 46.1953125, 47.78125, 49.3671875, 50.953125, 52.5390625, 54.125]}, "gradients/decoder.transformer.h.22.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 141.0, 827.0, 39.0, 3.0], "bins": [-274.7508850097656, -270.2724609375, -265.7940673828125, -261.3156433105469, -256.83721923828125, -252.35882568359375, -247.88040161132812, -243.40199279785156, -238.923583984375, -234.44517517089844, -229.96676635742188, -225.48834228515625, -221.0099334716797, -216.53152465820312, -212.0531005859375, -207.57469177246094, -203.09628295898438, -198.6178741455078, -194.13946533203125, -189.66104125976562, -185.18263244628906, -180.7042236328125, -176.22579956054688, -171.7473907470703, -167.26898193359375, -162.7905731201172, -158.31216430664062, -153.833740234375, -149.35533142089844, -144.87692260742188, -140.39849853515625, -135.9200897216797, -131.44168090820312, -126.96327209472656, -122.48485565185547, -118.00643920898438, -113.52803039550781, -109.04962158203125, -104.57120513916016, -100.09278869628906, -95.61438751220703, -91.13597106933594, -86.65756225585938, -82.17915344238281, -77.70073699951172, -73.22232055664062, -68.74391174316406, -64.2655029296875, -59.787086486816406, -55.30867385864258, -50.83026123046875, -46.35184860229492, -41.873435974121094, -37.395023345947266, -32.91661071777344, -28.43819808959961, -23.95978546142578, -19.481372833251953, -15.002960205078125, -10.524547576904297, -6.046134948730469, -1.5677223205566406, 2.9106903076171875, 7.389102935791016, 11.86751651763916]}, "gradients/decoder.transformer.h.22.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 2.0, 3.0, 7.0, 3.0, 6.0, 5.0, 10.0, 7.0, 12.0, 25.0, 20.0, 31.0, 24.0, 26.0, 28.0, 29.0, 31.0, 27.0, 36.0, 34.0, 51.0, 32.0, 48.0, 32.0, 40.0, 46.0, 45.0, 33.0, 40.0, 35.0, 33.0, 27.0, 29.0, 26.0, 22.0, 13.0, 16.0, 12.0, 13.0, 5.0, 4.0, 10.0, 5.0, 8.0, 2.0, 4.0, 5.0, 1.0, 2.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-63.05537033081055, -61.02915954589844, -59.002952575683594, -56.976741790771484, -54.95053482055664, -52.92432403564453, -50.89811706542969, -48.87190628051758, -46.84569549560547, -44.81948471069336, -42.793277740478516, -40.767066955566406, -38.74085998535156, -36.71464920043945, -34.688438415527344, -32.6622314453125, -30.636024475097656, -28.60981559753418, -26.583606719970703, -24.557395935058594, -22.53118896484375, -20.50497817993164, -18.478769302368164, -16.452560424804688, -14.426351547241211, -12.400142669677734, -10.373933792114258, -8.347723960876465, -6.321515083312988, -4.295306205749512, -2.2690963745117188, -0.2428874969482422, 1.7833251953125, 3.8095343112945557, 5.835743427276611, 7.861952781677246, 9.888161659240723, 11.9143705368042, 13.940580368041992, 15.966789245605469, 17.992998123168945, 20.019207000732422, 22.0454158782959, 24.071624755859375, 26.097835540771484, 28.124042510986328, 30.150253295898438, 32.17646026611328, 34.20267105102539, 36.2288818359375, 38.255088806152344, 40.28129959106445, 42.3075065612793, 44.333717346191406, 46.35992431640625, 48.38613510131836, 50.41234588623047, 52.43855667114258, 54.46476364135742, 56.49097442626953, 58.517181396484375, 60.543392181396484, 62.569602966308594, 64.59580993652344, 66.62201690673828]}, "gradients/decoder.transformer.h.21.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 1.0, 6.0, 3.0, 6.0, 7.0, 7.0, 13.0, 15.0, 10.0, 16.0, 20.0, 17.0, 23.0, 18.0, 23.0, 31.0, 40.0, 40.0, 32.0, 40.0, 35.0, 45.0, 41.0, 44.0, 44.0, 52.0, 45.0, 40.0, 40.0, 41.0, 25.0, 24.0, 29.0, 18.0, 21.0, 17.0, 20.0, 14.0, 14.0, 10.0, 10.0, 5.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.51953125, -5.328857421875, -5.13818359375, -4.947509765625, -4.7568359375, -4.566162109375, -4.37548828125, -4.184814453125, -3.994140625, -3.803466796875, -3.61279296875, -3.422119140625, -3.2314453125, -3.040771484375, -2.85009765625, -2.659423828125, -2.46875, -2.278076171875, -2.08740234375, -1.896728515625, -1.7060546875, -1.515380859375, -1.32470703125, -1.134033203125, -0.943359375, -0.752685546875, -0.56201171875, -0.371337890625, -0.1806640625, 0.010009765625, 0.20068359375, 0.391357421875, 0.58203125, 0.772705078125, 0.96337890625, 1.154052734375, 1.3447265625, 1.535400390625, 1.72607421875, 1.916748046875, 2.107421875, 2.298095703125, 2.48876953125, 2.679443359375, 2.8701171875, 3.060791015625, 3.25146484375, 3.442138671875, 3.6328125, 3.823486328125, 4.01416015625, 4.204833984375, 4.3955078125, 4.586181640625, 4.77685546875, 4.967529296875, 5.158203125, 5.348876953125, 5.53955078125, 5.730224609375, 5.9208984375, 6.111572265625, 6.30224609375, 6.492919921875, 6.68359375]}, "gradients/decoder.transformer.h.21.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 8.0, 14.0, 18.0, 33.0, 22.0, 50.0, 52.0, 61.0, 95.0, 125.0, 275.0, 521.0, 1484.0, 5504.0, 32809.0, 371509.0, 3270178.0, 464894.0, 37625.0, 6182.0, 1520.0, 523.0, 233.0, 154.0, 93.0, 71.0, 54.0, 45.0, 34.0, 20.0, 11.0, 16.0, 12.0, 8.0, 2.0, 4.0, 8.0, 3.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.359375, -24.55517578125, -23.7509765625, -22.94677734375, -22.142578125, -21.33837890625, -20.5341796875, -19.72998046875, -18.92578125, -18.12158203125, -17.3173828125, -16.51318359375, -15.708984375, -14.90478515625, -14.1005859375, -13.29638671875, -12.4921875, -11.68798828125, -10.8837890625, -10.07958984375, -9.275390625, -8.47119140625, -7.6669921875, -6.86279296875, -6.05859375, -5.25439453125, -4.4501953125, -3.64599609375, -2.841796875, -2.03759765625, -1.2333984375, -0.42919921875, 0.375, 1.17919921875, 1.9833984375, 2.78759765625, 3.591796875, 4.39599609375, 5.2001953125, 6.00439453125, 6.80859375, 7.61279296875, 8.4169921875, 9.22119140625, 10.025390625, 10.82958984375, 11.6337890625, 12.43798828125, 13.2421875, 14.04638671875, 14.8505859375, 15.65478515625, 16.458984375, 17.26318359375, 18.0673828125, 18.87158203125, 19.67578125, 20.47998046875, 21.2841796875, 22.08837890625, 22.892578125, 23.69677734375, 24.5009765625, 25.30517578125, 26.109375]}, "gradients/decoder.transformer.h.21.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 12.0, 21.0, 34.0, 46.0, 76.0, 135.0, 235.0, 331.0, 531.0, 719.0, 707.0, 451.0, 310.0, 200.0, 112.0, 56.0, 42.0, 25.0, 17.0, 11.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-45.1875, -44.131103515625, -43.07470703125, -42.018310546875, -40.9619140625, -39.905517578125, -38.84912109375, -37.792724609375, -36.736328125, -35.679931640625, -34.62353515625, -33.567138671875, -32.5107421875, -31.454345703125, -30.39794921875, -29.341552734375, -28.28515625, -27.228759765625, -26.17236328125, -25.115966796875, -24.0595703125, -23.003173828125, -21.94677734375, -20.890380859375, -19.833984375, -18.777587890625, -17.72119140625, -16.664794921875, -15.6083984375, -14.552001953125, -13.49560546875, -12.439208984375, -11.3828125, -10.326416015625, -9.27001953125, -8.213623046875, -7.1572265625, -6.100830078125, -5.04443359375, -3.988037109375, -2.931640625, -1.875244140625, -0.81884765625, 0.237548828125, 1.2939453125, 2.350341796875, 3.40673828125, 4.463134765625, 5.51953125, 6.575927734375, 7.63232421875, 8.688720703125, 9.7451171875, 10.801513671875, 11.85791015625, 12.914306640625, 13.970703125, 15.027099609375, 16.08349609375, 17.139892578125, 18.1962890625, 19.252685546875, 20.30908203125, 21.365478515625, 22.421875]}, "gradients/decoder.transformer.h.21.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 5.0, 4.0, 9.0, 7.0, 14.0, 36.0, 62.0, 83.0, 170.0, 317.0, 917.0, 7901.0, 805732.0, 3356956.0, 19961.0, 1342.0, 353.0, 173.0, 101.0, 47.0, 36.0, 25.0, 14.0, 5.0, 7.0, 6.0, 1.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-71.375, -68.53515625, -65.6953125, -62.85546875, -60.015625, -57.17578125, -54.3359375, -51.49609375, -48.65625, -45.81640625, -42.9765625, -40.13671875, -37.296875, -34.45703125, -31.6171875, -28.77734375, -25.9375, -23.09765625, -20.2578125, -17.41796875, -14.578125, -11.73828125, -8.8984375, -6.05859375, -3.21875, -0.37890625, 2.4609375, 5.30078125, 8.140625, 10.98046875, 13.8203125, 16.66015625, 19.5, 22.33984375, 25.1796875, 28.01953125, 30.859375, 33.69921875, 36.5390625, 39.37890625, 42.21875, 45.05859375, 47.8984375, 50.73828125, 53.578125, 56.41796875, 59.2578125, 62.09765625, 64.9375, 67.77734375, 70.6171875, 73.45703125, 76.296875, 79.13671875, 81.9765625, 84.81640625, 87.65625, 90.49609375, 93.3359375, 96.17578125, 99.015625, 101.85546875, 104.6953125, 107.53515625, 110.375]}, "gradients/decoder.transformer.h.21.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 18.0, 73.0, 235.0, 365.0, 234.0, 72.0, 13.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-317.4837951660156, -309.6406555175781, -301.79754638671875, -293.95440673828125, -286.11126708984375, -278.2681579589844, -270.4250183105469, -262.5818786621094, -254.73875427246094, -246.8956298828125, -239.052490234375, -231.20936584472656, -223.36624145507812, -215.52310180664062, -207.6799774169922, -199.83685302734375, -191.99371337890625, -184.1505889892578, -176.3074493408203, -168.46432495117188, -160.62120056152344, -152.77806091308594, -144.9349365234375, -137.091796875, -129.24868774414062, -121.40555572509766, -113.56243133544922, -105.71929931640625, -97.87616729736328, -90.03303527832031, -82.18991088867188, -74.3467788696289, -66.50364685058594, -58.660518646240234, -50.817386627197266, -42.97425842285156, -35.131126403808594, -27.28799819946289, -19.444869995117188, -11.601737976074219, -3.7586097717285156, 4.084519863128662, 11.92764949798584, 19.77077865600586, 27.613908767700195, 35.45703887939453, 43.300167083740234, 51.1432991027832, 58.986427307128906, 66.82955932617188, 74.67268371582031, 82.51581573486328, 90.35894775390625, 98.20207214355469, 106.04520416259766, 113.88833618164062, 121.73146057128906, 129.5745849609375, 137.417724609375, 145.26084899902344, 153.10397338867188, 160.94711303710938, 168.7902374267578, 176.63336181640625, 184.47650146484375]}, "gradients/decoder.transformer.h.21.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 1.0, 5.0, 1.0, 6.0, 7.0, 6.0, 9.0, 16.0, 13.0, 22.0, 19.0, 16.0, 25.0, 29.0, 28.0, 30.0, 30.0, 28.0, 46.0, 39.0, 40.0, 48.0, 38.0, 35.0, 31.0, 42.0, 44.0, 46.0, 33.0, 34.0, 25.0, 31.0, 22.0, 28.0, 22.0, 27.0, 21.0, 19.0, 15.0, 11.0, 4.0, 7.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-68.70602416992188, -66.41228485107422, -64.11854553222656, -61.82481002807617, -59.531070709228516, -57.237335205078125, -54.94359588623047, -52.64985656738281, -50.356117248535156, -48.0623779296875, -45.76864242553711, -43.47490310668945, -41.1811637878418, -38.887428283691406, -36.59368896484375, -34.299949645996094, -32.0062141418457, -29.71247673034668, -27.418737411499023, -25.125, -22.831260681152344, -20.53752326965332, -18.243785858154297, -15.95004653930664, -13.656309127807617, -11.362570762634277, -9.068832397460938, -6.775094985961914, -4.481356620788574, -2.1876182556152344, 0.10611915588378906, 2.3998584747314453, 4.693595886230469, 6.987334251403809, 9.281072616577148, 11.574810028076172, 13.868548393249512, 16.16228675842285, 18.456024169921875, 20.74976348876953, 23.043500900268555, 25.337238311767578, 27.630977630615234, 29.924715042114258, 32.21845245361328, 34.51219177246094, 36.805931091308594, 39.09967041015625, 41.39340591430664, 43.6871452331543, 45.98088073730469, 48.274620056152344, 50.568359375, 52.862098693847656, 55.15583419799805, 57.4495735168457, 59.743309020996094, 62.03704833984375, 64.3307876586914, 66.62452697753906, 68.91825866699219, 71.21199798583984, 73.5057373046875, 75.79947662353516, 78.09321594238281]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 0.0, 6.0, 6.0, 12.0, 14.0, 16.0, 10.0, 15.0, 15.0, 14.0, 12.0, 23.0, 35.0, 25.0, 32.0, 30.0, 42.0, 42.0, 46.0, 52.0, 41.0, 46.0, 41.0, 38.0, 52.0, 44.0, 46.0, 38.0, 28.0, 30.0, 22.0, 26.0, 20.0, 18.0, 15.0, 14.0, 9.0, 12.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.40899658203125, -5.2086181640625, -5.00823974609375, -4.807861328125, -4.60748291015625, -4.4071044921875, -4.20672607421875, -4.00634765625, -3.80596923828125, -3.6055908203125, -3.40521240234375, -3.204833984375, -3.00445556640625, -2.8040771484375, -2.60369873046875, -2.4033203125, -2.20294189453125, -2.0025634765625, -1.80218505859375, -1.601806640625, -1.40142822265625, -1.2010498046875, -1.00067138671875, -0.80029296875, -0.59991455078125, -0.3995361328125, -0.19915771484375, 0.001220703125, 0.20159912109375, 0.4019775390625, 0.60235595703125, 0.802734375, 1.00311279296875, 1.2034912109375, 1.40386962890625, 1.604248046875, 1.80462646484375, 2.0050048828125, 2.20538330078125, 2.40576171875, 2.60614013671875, 2.8065185546875, 3.00689697265625, 3.207275390625, 3.40765380859375, 3.6080322265625, 3.80841064453125, 4.0087890625, 4.20916748046875, 4.4095458984375, 4.60992431640625, 4.810302734375, 5.01068115234375, 5.2110595703125, 5.41143798828125, 5.61181640625, 5.81219482421875, 6.0125732421875, 6.21295166015625, 6.413330078125, 6.61370849609375, 6.8140869140625, 7.01446533203125, 7.21484375]}, "gradients/decoder.transformer.h.21.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 20.0, 10.0, 29.0, 25.0, 46.0, 71.0, 91.0, 145.0, 221.0, 318.0, 499.0, 807.0, 1091.0, 1829.0, 2724.0, 4343.0, 6831.0, 10671.0, 17200.0, 28875.0, 49129.0, 86825.0, 152615.0, 227966.0, 189024.0, 111035.0, 62339.0, 35959.0, 21624.0, 13127.0, 8323.0, 5243.0, 3288.0, 2137.0, 1413.0, 873.0, 565.0, 423.0, 256.0, 187.0, 114.0, 86.0, 54.0, 29.0, 25.0, 21.0, 11.0, 9.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 2.0], "bins": [-0.76025390625, -0.7370147705078125, -0.713775634765625, -0.6905364990234375, -0.66729736328125, -0.6440582275390625, -0.620819091796875, -0.5975799560546875, -0.5743408203125, -0.5511016845703125, -0.527862548828125, -0.5046234130859375, -0.48138427734375, -0.4581451416015625, -0.434906005859375, -0.4116668701171875, -0.388427734375, -0.3651885986328125, -0.341949462890625, -0.3187103271484375, -0.29547119140625, -0.2722320556640625, -0.248992919921875, -0.2257537841796875, -0.2025146484375, -0.1792755126953125, -0.156036376953125, -0.1327972412109375, -0.10955810546875, -0.0863189697265625, -0.063079833984375, -0.0398406982421875, -0.0166015625, 0.0066375732421875, 0.029876708984375, 0.0531158447265625, 0.07635498046875, 0.0995941162109375, 0.122833251953125, 0.1460723876953125, 0.1693115234375, 0.1925506591796875, 0.215789794921875, 0.2390289306640625, 0.26226806640625, 0.2855072021484375, 0.308746337890625, 0.3319854736328125, 0.355224609375, 0.3784637451171875, 0.401702880859375, 0.4249420166015625, 0.44818115234375, 0.4714202880859375, 0.494659423828125, 0.5178985595703125, 0.5411376953125, 0.5643768310546875, 0.587615966796875, 0.6108551025390625, 0.63409423828125, 0.6573333740234375, 0.680572509765625, 0.7038116455078125, 0.72705078125]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 3.0, 2.0, 1.0, 1.0, 4.0, 8.0, 5.0, 12.0, 9.0, 7.0, 22.0, 16.0, 25.0, 19.0, 20.0, 29.0, 31.0, 24.0, 31.0, 43.0, 41.0, 55.0, 41.0, 1073.0, 41.0, 46.0, 35.0, 37.0, 57.0, 45.0, 35.0, 36.0, 23.0, 32.0, 28.0, 24.0, 14.0, 10.0, 15.0, 7.0, 9.0, 5.0, 0.0, 3.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.84765625, -4.71240234375, -4.5771484375, -4.44189453125, -4.306640625, -4.17138671875, -4.0361328125, -3.90087890625, -3.765625, -3.63037109375, -3.4951171875, -3.35986328125, -3.224609375, -3.08935546875, -2.9541015625, -2.81884765625, -2.68359375, -2.54833984375, -2.4130859375, -2.27783203125, -2.142578125, -2.00732421875, -1.8720703125, -1.73681640625, -1.6015625, -1.46630859375, -1.3310546875, -1.19580078125, -1.060546875, -0.92529296875, -0.7900390625, -0.65478515625, -0.51953125, -0.38427734375, -0.2490234375, -0.11376953125, 0.021484375, 0.15673828125, 0.2919921875, 0.42724609375, 0.5625, 0.69775390625, 0.8330078125, 0.96826171875, 1.103515625, 1.23876953125, 1.3740234375, 1.50927734375, 1.64453125, 1.77978515625, 1.9150390625, 2.05029296875, 2.185546875, 2.32080078125, 2.4560546875, 2.59130859375, 2.7265625, 2.86181640625, 2.9970703125, 3.13232421875, 3.267578125, 3.40283203125, 3.5380859375, 3.67333984375, 3.80859375]}, "gradients/decoder.transformer.h.21.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 1.0, 5.0, 6.0, 8.0, 11.0, 20.0, 17.0, 30.0, 47.0, 64.0, 111.0, 156.0, 191.0, 344.0, 490.0, 667.0, 1004.0, 1349.0, 2116.0, 3130.0, 5018.0, 7467.0, 11443.0, 17777.0, 27569.0, 42806.0, 67801.0, 105005.0, 149725.0, 1218863.0, 147335.0, 102012.0, 65616.0, 42005.0, 27168.0, 17164.0, 11030.0, 7179.0, 4705.0, 3137.0, 2084.0, 1460.0, 949.0, 700.0, 472.0, 289.0, 190.0, 120.0, 82.0, 62.0, 46.0, 29.0, 23.0, 17.0, 12.0, 7.0, 4.0, 3.0, 1.0, 0.0, 3.0], "bins": [-0.466064453125, -0.4517097473144531, -0.43735504150390625, -0.4230003356933594, -0.4086456298828125, -0.3942909240722656, -0.37993621826171875, -0.3655815124511719, -0.351226806640625, -0.3368721008300781, -0.32251739501953125, -0.3081626892089844, -0.2938079833984375, -0.2794532775878906, -0.26509857177734375, -0.2507438659667969, -0.23638916015625, -0.22203445434570312, -0.20767974853515625, -0.19332504272460938, -0.1789703369140625, -0.16461563110351562, -0.15026092529296875, -0.13590621948242188, -0.121551513671875, -0.10719680786132812, -0.09284210205078125, -0.07848739624023438, -0.0641326904296875, -0.049777984619140625, -0.03542327880859375, -0.021068572998046875, -0.0067138671875, 0.007640838623046875, 0.02199554443359375, 0.036350250244140625, 0.0507049560546875, 0.06505966186523438, 0.07941436767578125, 0.09376907348632812, 0.108123779296875, 0.12247848510742188, 0.13683319091796875, 0.15118789672851562, 0.1655426025390625, 0.17989730834960938, 0.19425201416015625, 0.20860671997070312, 0.22296142578125, 0.23731613159179688, 0.25167083740234375, 0.2660255432128906, 0.2803802490234375, 0.2947349548339844, 0.30908966064453125, 0.3234443664550781, 0.337799072265625, 0.3521537780761719, 0.36650848388671875, 0.3808631896972656, 0.3952178955078125, 0.4095726013183594, 0.42392730712890625, 0.4382820129394531, 0.45263671875]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 3.0, 2.0, 2.0, 3.0, 5.0, 5.0, 6.0, 4.0, 5.0, 12.0, 11.0, 13.0, 14.0, 12.0, 24.0, 37.0, 47.0, 58.0, 64.0, 91.0, 96.0, 83.0, 81.0, 77.0, 59.0, 35.0, 33.0, 27.0, 26.0, 16.0, 10.0, 9.0, 8.0, 3.0, 3.0, 6.0, 4.0, 4.0, 3.0, 1.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.007099151611328125, -0.00690990686416626, -0.0067206621170043945, -0.006531417369842529, -0.006342172622680664, -0.006152927875518799, -0.005963683128356934, -0.005774438381195068, -0.005585193634033203, -0.005395948886871338, -0.005206704139709473, -0.005017459392547607, -0.004828214645385742, -0.004638969898223877, -0.004449725151062012, -0.0042604804039001465, -0.004071235656738281, -0.003881990909576416, -0.0036927461624145508, -0.0035035014152526855, -0.0033142566680908203, -0.003125011920928955, -0.00293576717376709, -0.0027465224266052246, -0.0025572776794433594, -0.002368032932281494, -0.002178788185119629, -0.0019895434379577637, -0.0018002986907958984, -0.0016110539436340332, -0.001421809196472168, -0.0012325644493103027, -0.0010433197021484375, -0.0008540749549865723, -0.000664830207824707, -0.0004755854606628418, -0.00028634071350097656, -9.709596633911133e-05, 9.21487808227539e-05, 0.00028139352798461914, 0.0004706382751464844, 0.0006598830223083496, 0.0008491277694702148, 0.00103837251663208, 0.0012276172637939453, 0.0014168620109558105, 0.0016061067581176758, 0.001795351505279541, 0.0019845962524414062, 0.0021738409996032715, 0.0023630857467651367, 0.002552330493927002, 0.002741575241088867, 0.0029308199882507324, 0.0031200647354125977, 0.003309309482574463, 0.003498554229736328, 0.0036877989768981934, 0.0038770437240600586, 0.004066288471221924, 0.004255533218383789, 0.004444777965545654, 0.0046340227127075195, 0.004823267459869385, 0.00501251220703125]}, "gradients/decoder.transformer.h.21.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 5.0, 3.0, 1.0, 2.0, 5.0, 9.0, 3.0, 5.0, 5.0, 11.0, 25.0, 19.0, 33.0, 41.0, 45.0, 67.0, 123.0, 197.0, 299.0, 805.0, 744363.0, 300888.0, 731.0, 318.0, 171.0, 129.0, 65.0, 43.0, 31.0, 27.0, 18.0, 16.0, 11.0, 12.0, 3.0, 5.0, 6.0, 7.0, 3.0, 4.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.10943603515625, -0.1053762435913086, -0.10131645202636719, -0.09725666046142578, -0.09319686889648438, -0.08913707733154297, -0.08507728576660156, -0.08101749420166016, -0.07695770263671875, -0.07289791107177734, -0.06883811950683594, -0.06477832794189453, -0.060718536376953125, -0.05665874481201172, -0.05259895324707031, -0.048539161682128906, -0.0444793701171875, -0.040419578552246094, -0.03635978698730469, -0.03229999542236328, -0.028240203857421875, -0.02418041229248047, -0.020120620727539062, -0.016060829162597656, -0.01200103759765625, -0.007941246032714844, -0.0038814544677734375, 0.00017833709716796875, 0.004238128662109375, 0.008297920227050781, 0.012357711791992188, 0.016417503356933594, 0.020477294921875, 0.024537086486816406, 0.028596878051757812, 0.03265666961669922, 0.036716461181640625, 0.04077625274658203, 0.04483604431152344, 0.048895835876464844, 0.05295562744140625, 0.057015419006347656, 0.06107521057128906, 0.06513500213623047, 0.06919479370117188, 0.07325458526611328, 0.07731437683105469, 0.0813741683959961, 0.0854339599609375, 0.0894937515258789, 0.09355354309082031, 0.09761333465576172, 0.10167312622070312, 0.10573291778564453, 0.10979270935058594, 0.11385250091552734, 0.11791229248046875, 0.12197208404541016, 0.12603187561035156, 0.13009166717529297, 0.13415145874023438, 0.13821125030517578, 0.1422710418701172, 0.1463308334350586, 0.150390625]}, "gradients/decoder.transformer.h.21.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 518.0, 498.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03060906007885933, -0.029217127710580826, -0.027825195342302322, -0.02643326297402382, -0.025041330605745316, -0.023649398237466812, -0.022257467731833458, -0.020865535363554955, -0.01947360299527645, -0.018081670626997948, -0.016689738258719444, -0.015297806821763515, -0.013905874453485012, -0.012513942085206509, -0.01112201064825058, -0.009730078279972076, -0.008338145911693573, -0.00694621354341507, -0.0055542816407978535, -0.004162349738180637, -0.002770417369902134, -0.0013784850016236305, 1.3446435332298279e-05, 0.0014053788036108017, 0.002797311171889305, 0.0041892435401678085, 0.005581175442785025, 0.006973107345402241, 0.008365039713680744, 0.009756972081959248, 0.011148903518915176, 0.01254083588719368, 0.013932771980762482, 0.015324704349040985, 0.01671663671731949, 0.018108569085597992, 0.019500501453876495, 0.020892433822155, 0.022284364327788353, 0.023676296696066856, 0.02506822906434536, 0.026460161432623863, 0.027852093800902367, 0.02924402430653572, 0.030635956674814224, 0.03202788904309273, 0.03341982141137123, 0.034811753779649734, 0.03620368614792824, 0.03759561851620674, 0.038987550884485245, 0.04037948325276375, 0.04177141562104225, 0.043163347989320755, 0.04455527663230896, 0.04594720900058746, 0.04733914136886597, 0.04873107373714447, 0.050123006105422974, 0.05151493847370148, 0.05290687084197998, 0.054298803210258484, 0.05569073557853699, 0.05708266794681549, 0.058474600315093994]}, "gradients/decoder.transformer.h.21.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 1.0, 4.0, 10.0, 19.0, 21.0, 22.0, 25.0, 36.0, 52.0, 53.0, 46.0, 71.0, 75.0, 74.0, 70.0, 79.0, 75.0, 63.0, 44.0, 38.0, 31.0, 27.0, 25.0, 11.0, 13.0, 10.0, 5.0, 7.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003817319869995117, -0.003658144734799862, -0.0034989695996046066, -0.0033397944644093513, -0.003180619329214096, -0.003021444194018841, -0.0028622690588235855, -0.0027030939236283302, -0.002543918788433075, -0.0023847436532378197, -0.0022255685180425644, -0.002066393382847309, -0.0019072182476520538, -0.0017480431124567986, -0.0015888679772615433, -0.001429692842066288, -0.0012705177068710327, -0.0011113425716757774, -0.0009521674364805222, -0.0007929923012852669, -0.0006338171660900116, -0.0004746420308947563, -0.00031546689569950104, -0.00015629176050424576, 2.8833746910095215e-06, 0.0001620585098862648, 0.0003212336450815201, 0.00048040878027677536, 0.0006395839154720306, 0.0007987590506672859, 0.0009579341858625412, 0.0011171093210577965, 0.0012762844562530518, 0.001435459591448307, 0.0015946347266435623, 0.0017538098618388176, 0.0019129849970340729, 0.002072160132229328, 0.0022313352674245834, 0.0023905104026198387, 0.002549685537815094, 0.0027088606730103493, 0.0028680358082056046, 0.00302721094340086, 0.003186386078596115, 0.0033455612137913704, 0.0035047363489866257, 0.003663911484181881, 0.0038230866193771362, 0.0039822617545723915, 0.004141436889767647, 0.004300612024962902, 0.004459787160158157, 0.004618962295353413, 0.004778137430548668, 0.004937312565743923, 0.0050964877009391785, 0.005255662836134434, 0.005414837971329689, 0.005574013106524944, 0.0057331882417202, 0.005892363376915455, 0.00605153851211071, 0.006210713647305965, 0.006369888782501221]}, "gradients/decoder.transformer.h.21.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 3.0, 1.0, 5.0, 0.0, 6.0, 6.0, 12.0, 14.0, 16.0, 10.0, 15.0, 15.0, 14.0, 12.0, 23.0, 35.0, 25.0, 32.0, 30.0, 42.0, 42.0, 46.0, 52.0, 41.0, 46.0, 41.0, 38.0, 52.0, 44.0, 46.0, 38.0, 28.0, 30.0, 22.0, 26.0, 20.0, 18.0, 15.0, 14.0, 9.0, 12.0, 7.0, 3.0, 4.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.609375, -5.40899658203125, -5.2086181640625, -5.00823974609375, -4.807861328125, -4.60748291015625, -4.4071044921875, -4.20672607421875, -4.00634765625, -3.80596923828125, -3.6055908203125, -3.40521240234375, -3.204833984375, -3.00445556640625, -2.8040771484375, -2.60369873046875, -2.4033203125, -2.20294189453125, -2.0025634765625, -1.80218505859375, -1.601806640625, -1.40142822265625, -1.2010498046875, -1.00067138671875, -0.80029296875, -0.59991455078125, -0.3995361328125, -0.19915771484375, 0.001220703125, 0.20159912109375, 0.4019775390625, 0.60235595703125, 0.802734375, 1.00311279296875, 1.2034912109375, 1.40386962890625, 1.604248046875, 1.80462646484375, 2.0050048828125, 2.20538330078125, 2.40576171875, 2.60614013671875, 2.8065185546875, 3.00689697265625, 3.207275390625, 3.40765380859375, 3.6080322265625, 3.80841064453125, 4.0087890625, 4.20916748046875, 4.4095458984375, 4.60992431640625, 4.810302734375, 5.01068115234375, 5.2110595703125, 5.41143798828125, 5.61181640625, 5.81219482421875, 6.0125732421875, 6.21295166015625, 6.413330078125, 6.61370849609375, 6.8140869140625, 7.01446533203125, 7.21484375]}, "gradients/decoder.transformer.h.21.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 3.0, 11.0, 3.0, 18.0, 20.0, 27.0, 30.0, 64.0, 61.0, 110.0, 163.0, 209.0, 322.0, 481.0, 652.0, 1016.0, 1472.0, 2172.0, 3611.0, 5713.0, 10487.0, 21862.0, 53988.0, 174399.0, 475187.0, 188554.0, 57360.0, 23016.0, 10785.0, 6053.0, 3733.0, 2279.0, 1475.0, 1027.0, 680.0, 472.0, 317.0, 215.0, 148.0, 111.0, 68.0, 56.0, 38.0, 29.0, 21.0, 13.0, 4.0, 9.0, 3.0, 9.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0], "bins": [-5.5234375, -5.3536376953125, -5.183837890625, -5.0140380859375, -4.84423828125, -4.6744384765625, -4.504638671875, -4.3348388671875, -4.1650390625, -3.9952392578125, -3.825439453125, -3.6556396484375, -3.48583984375, -3.3160400390625, -3.146240234375, -2.9764404296875, -2.806640625, -2.6368408203125, -2.467041015625, -2.2972412109375, -2.12744140625, -1.9576416015625, -1.787841796875, -1.6180419921875, -1.4482421875, -1.2784423828125, -1.108642578125, -0.9388427734375, -0.76904296875, -0.5992431640625, -0.429443359375, -0.2596435546875, -0.08984375, 0.0799560546875, 0.249755859375, 0.4195556640625, 0.58935546875, 0.7591552734375, 0.928955078125, 1.0987548828125, 1.2685546875, 1.4383544921875, 1.608154296875, 1.7779541015625, 1.94775390625, 2.1175537109375, 2.287353515625, 2.4571533203125, 2.626953125, 2.7967529296875, 2.966552734375, 3.1363525390625, 3.30615234375, 3.4759521484375, 3.645751953125, 3.8155517578125, 3.9853515625, 4.1551513671875, 4.324951171875, 4.4947509765625, 4.66455078125, 4.8343505859375, 5.004150390625, 5.1739501953125, 5.34375]}, "gradients/decoder.transformer.h.21.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 2.0, 5.0, 3.0, 8.0, 7.0, 5.0, 4.0, 13.0, 9.0, 15.0, 14.0, 12.0, 23.0, 16.0, 28.0, 28.0, 25.0, 38.0, 28.0, 31.0, 39.0, 49.0, 44.0, 58.0, 107.0, 1634.0, 272.0, 76.0, 42.0, 51.0, 38.0, 33.0, 36.0, 43.0, 34.0, 28.0, 26.0, 15.0, 20.0, 17.0, 16.0, 10.0, 9.0, 9.0, 2.0, 7.0, 8.0, 8.0, 6.0, 6.0, 3.0, 2.0, 2.0, 1.0], "bins": [-22.328125, -21.7041015625, -21.080078125, -20.4560546875, -19.83203125, -19.2080078125, -18.583984375, -17.9599609375, -17.3359375, -16.7119140625, -16.087890625, -15.4638671875, -14.83984375, -14.2158203125, -13.591796875, -12.9677734375, -12.34375, -11.7197265625, -11.095703125, -10.4716796875, -9.84765625, -9.2236328125, -8.599609375, -7.9755859375, -7.3515625, -6.7275390625, -6.103515625, -5.4794921875, -4.85546875, -4.2314453125, -3.607421875, -2.9833984375, -2.359375, -1.7353515625, -1.111328125, -0.4873046875, 0.13671875, 0.7607421875, 1.384765625, 2.0087890625, 2.6328125, 3.2568359375, 3.880859375, 4.5048828125, 5.12890625, 5.7529296875, 6.376953125, 7.0009765625, 7.625, 8.2490234375, 8.873046875, 9.4970703125, 10.12109375, 10.7451171875, 11.369140625, 11.9931640625, 12.6171875, 13.2412109375, 13.865234375, 14.4892578125, 15.11328125, 15.7373046875, 16.361328125, 16.9853515625, 17.609375]}, "gradients/decoder.transformer.h.21.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 10.0, 5.0, 9.0, 13.0, 5.0, 5.0, 12.0, 12.0, 21.0, 20.0, 26.0, 36.0, 45.0, 68.0, 112.0, 147.0, 232.0, 515.0, 1280.0, 5140.0, 86813.0, 3008965.0, 36580.0, 3505.0, 1018.0, 389.0, 218.0, 130.0, 87.0, 49.0, 50.0, 45.0, 27.0, 20.0, 19.0, 23.0, 15.0, 14.0, 5.0, 5.0, 9.0, 7.0, 4.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-39.1875, -37.9775390625, -36.767578125, -35.5576171875, -34.34765625, -33.1376953125, -31.927734375, -30.7177734375, -29.5078125, -28.2978515625, -27.087890625, -25.8779296875, -24.66796875, -23.4580078125, -22.248046875, -21.0380859375, -19.828125, -18.6181640625, -17.408203125, -16.1982421875, -14.98828125, -13.7783203125, -12.568359375, -11.3583984375, -10.1484375, -8.9384765625, -7.728515625, -6.5185546875, -5.30859375, -4.0986328125, -2.888671875, -1.6787109375, -0.46875, 0.7412109375, 1.951171875, 3.1611328125, 4.37109375, 5.5810546875, 6.791015625, 8.0009765625, 9.2109375, 10.4208984375, 11.630859375, 12.8408203125, 14.05078125, 15.2607421875, 16.470703125, 17.6806640625, 18.890625, 20.1005859375, 21.310546875, 22.5205078125, 23.73046875, 24.9404296875, 26.150390625, 27.3603515625, 28.5703125, 29.7802734375, 30.990234375, 32.2001953125, 33.41015625, 34.6201171875, 35.830078125, 37.0400390625, 38.25]}, "gradients/decoder.transformer.h.21.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 30.0, 209.0, 393.0, 294.0, 64.0, 15.0, 2.0, 1.0, 0.0, 2.0], "bins": [-164.3690948486328, -161.46563720703125, -158.56216430664062, -155.65870666503906, -152.7552490234375, -149.85177612304688, -146.9483184814453, -144.04486083984375, -141.1414031982422, -138.23794555664062, -135.33447265625, -132.43101501464844, -129.52755737304688, -126.62409210205078, -123.72062683105469, -120.81716918945312, -117.9136962890625, -115.0102310180664, -112.10677337646484, -109.20330810546875, -106.29985046386719, -103.3963851928711, -100.492919921875, -97.58946228027344, -94.68600463867188, -91.78253936767578, -88.87908172607422, -85.97561645507812, -83.07215881347656, -80.16869354248047, -77.26522827148438, -74.36177062988281, -71.45829772949219, -68.5548324584961, -65.65137481689453, -62.74790954589844, -59.84444808959961, -56.94098663330078, -54.03752517700195, -51.134063720703125, -48.2306022644043, -45.32714080810547, -42.42367935180664, -39.52021789550781, -36.61675262451172, -33.71329116821289, -30.809829711914062, -27.9063663482666, -25.002904891967773, -22.099443435668945, -19.195980072021484, -16.292518615722656, -13.389056205749512, -10.485593795776367, -7.582132339477539, -4.678668975830078, -1.77520751953125, 1.1282546520233154, 4.031716823577881, 6.935178756713867, 9.838641166687012, 12.742103576660156, 15.645565032958984, 18.549028396606445, 21.452489852905273]}, "gradients/decoder.transformer.h.21.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 7.0, 7.0, 11.0, 12.0, 13.0, 20.0, 20.0, 32.0, 28.0, 18.0, 32.0, 38.0, 34.0, 33.0, 30.0, 52.0, 44.0, 54.0, 39.0, 45.0, 52.0, 35.0, 34.0, 39.0, 38.0, 32.0, 27.0, 26.0, 20.0, 27.0, 16.0, 9.0, 15.0, 12.0, 6.0, 7.0, 5.0, 3.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.67668914794922, -70.34230041503906, -68.0079116821289, -65.67352294921875, -63.339134216308594, -61.00474548339844, -58.67036056518555, -56.33597183227539, -54.001583099365234, -51.66719436645508, -49.33280563354492, -46.998416900634766, -44.664031982421875, -42.32964324951172, -39.99525451660156, -37.660865783691406, -35.32647705078125, -32.992088317871094, -30.657699584960938, -28.323312759399414, -25.988924026489258, -23.6545352935791, -21.320148468017578, -18.985759735107422, -16.651371002197266, -14.31698226928711, -11.98259449005127, -9.64820671081543, -7.313817977905273, -4.979429244995117, -2.6450414657592773, -0.3106536865234375, 2.0237350463867188, 4.358123302459717, 6.692511558532715, 9.026899337768555, 11.361288070678711, 13.695676803588867, 16.03006362915039, 18.364452362060547, 20.698841094970703, 23.03322982788086, 25.367618560791016, 27.70200538635254, 30.036394119262695, 32.37078094482422, 34.705169677734375, 37.03955841064453, 39.37394714355469, 41.708335876464844, 44.042724609375, 46.377113342285156, 48.71150207519531, 51.04589080810547, 53.38027572631836, 55.714664459228516, 58.04905319213867, 60.38344192504883, 62.717830657958984, 65.05221557617188, 67.38660430908203, 69.72099304199219, 72.05538177490234, 74.3897705078125, 76.72415924072266]}, "gradients/decoder.transformer.h.20.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 4.0, 1.0, 1.0, 5.0, 8.0, 6.0, 12.0, 11.0, 11.0, 9.0, 15.0, 14.0, 19.0, 19.0, 19.0, 27.0, 27.0, 32.0, 29.0, 41.0, 43.0, 45.0, 45.0, 45.0, 38.0, 54.0, 37.0, 38.0, 48.0, 48.0, 43.0, 37.0, 27.0, 12.0, 35.0, 14.0, 26.0, 13.0, 14.0, 11.0, 6.0, 7.0, 10.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.77734375, -5.5726318359375, -5.367919921875, -5.1632080078125, -4.95849609375, -4.7537841796875, -4.549072265625, -4.3443603515625, -4.1396484375, -3.9349365234375, -3.730224609375, -3.5255126953125, -3.32080078125, -3.1160888671875, -2.911376953125, -2.7066650390625, -2.501953125, -2.2972412109375, -2.092529296875, -1.8878173828125, -1.68310546875, -1.4783935546875, -1.273681640625, -1.0689697265625, -0.8642578125, -0.6595458984375, -0.454833984375, -0.2501220703125, -0.04541015625, 0.1593017578125, 0.364013671875, 0.5687255859375, 0.7734375, 0.9781494140625, 1.182861328125, 1.3875732421875, 1.59228515625, 1.7969970703125, 2.001708984375, 2.2064208984375, 2.4111328125, 2.6158447265625, 2.820556640625, 3.0252685546875, 3.22998046875, 3.4346923828125, 3.639404296875, 3.8441162109375, 4.048828125, 4.2535400390625, 4.458251953125, 4.6629638671875, 4.86767578125, 5.0723876953125, 5.277099609375, 5.4818115234375, 5.6865234375, 5.8912353515625, 6.095947265625, 6.3006591796875, 6.50537109375, 6.7100830078125, 6.914794921875, 7.1195068359375, 7.32421875]}, "gradients/decoder.transformer.h.20.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 4.0, 1.0, 5.0, 2.0, 8.0, 5.0, 8.0, 8.0, 8.0, 19.0, 10.0, 13.0, 12.0, 21.0, 18.0, 33.0, 23.0, 55.0, 63.0, 102.0, 140.0, 360.0, 1224.0, 6391.0, 56401.0, 1578791.0, 2453833.0, 85374.0, 8827.0, 1513.0, 430.0, 183.0, 98.0, 65.0, 49.0, 31.0, 27.0, 26.0, 18.0, 17.0, 16.0, 13.0, 10.0, 7.0, 11.0, 6.0, 5.0, 2.0, 3.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-28.875, -27.9150390625, -26.955078125, -25.9951171875, -25.03515625, -24.0751953125, -23.115234375, -22.1552734375, -21.1953125, -20.2353515625, -19.275390625, -18.3154296875, -17.35546875, -16.3955078125, -15.435546875, -14.4755859375, -13.515625, -12.5556640625, -11.595703125, -10.6357421875, -9.67578125, -8.7158203125, -7.755859375, -6.7958984375, -5.8359375, -4.8759765625, -3.916015625, -2.9560546875, -1.99609375, -1.0361328125, -0.076171875, 0.8837890625, 1.84375, 2.8037109375, 3.763671875, 4.7236328125, 5.68359375, 6.6435546875, 7.603515625, 8.5634765625, 9.5234375, 10.4833984375, 11.443359375, 12.4033203125, 13.36328125, 14.3232421875, 15.283203125, 16.2431640625, 17.203125, 18.1630859375, 19.123046875, 20.0830078125, 21.04296875, 22.0029296875, 22.962890625, 23.9228515625, 24.8828125, 25.8427734375, 26.802734375, 27.7626953125, 28.72265625, 29.6826171875, 30.642578125, 31.6025390625, 32.5625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 6.0, 2.0, 10.0, 8.0, 15.0, 38.0, 35.0, 64.0, 78.0, 128.0, 157.0, 248.0, 316.0, 466.0, 581.0, 556.0, 398.0, 294.0, 214.0, 147.0, 112.0, 64.0, 54.0, 29.0, 22.0, 9.0, 8.0, 13.0, 8.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.328125, -22.56884765625, -21.8095703125, -21.05029296875, -20.291015625, -19.53173828125, -18.7724609375, -18.01318359375, -17.25390625, -16.49462890625, -15.7353515625, -14.97607421875, -14.216796875, -13.45751953125, -12.6982421875, -11.93896484375, -11.1796875, -10.42041015625, -9.6611328125, -8.90185546875, -8.142578125, -7.38330078125, -6.6240234375, -5.86474609375, -5.10546875, -4.34619140625, -3.5869140625, -2.82763671875, -2.068359375, -1.30908203125, -0.5498046875, 0.20947265625, 0.96875, 1.72802734375, 2.4873046875, 3.24658203125, 4.005859375, 4.76513671875, 5.5244140625, 6.28369140625, 7.04296875, 7.80224609375, 8.5615234375, 9.32080078125, 10.080078125, 10.83935546875, 11.5986328125, 12.35791015625, 13.1171875, 13.87646484375, 14.6357421875, 15.39501953125, 16.154296875, 16.91357421875, 17.6728515625, 18.43212890625, 19.19140625, 19.95068359375, 20.7099609375, 21.46923828125, 22.228515625, 22.98779296875, 23.7470703125, 24.50634765625, 25.265625]}, "gradients/decoder.transformer.h.20.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 5.0, 12.0, 12.0, 16.0, 29.0, 55.0, 84.0, 126.0, 253.0, 551.0, 3183.0, 325979.0, 3843746.0, 18476.0, 973.0, 372.0, 183.0, 97.0, 63.0, 34.0, 16.0, 9.0, 6.0, 5.0, 6.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-112.625, -109.3359375, -106.046875, -102.7578125, -99.46875, -96.1796875, -92.890625, -89.6015625, -86.3125, -83.0234375, -79.734375, -76.4453125, -73.15625, -69.8671875, -66.578125, -63.2890625, -60.0, -56.7109375, -53.421875, -50.1328125, -46.84375, -43.5546875, -40.265625, -36.9765625, -33.6875, -30.3984375, -27.109375, -23.8203125, -20.53125, -17.2421875, -13.953125, -10.6640625, -7.375, -4.0859375, -0.796875, 2.4921875, 5.78125, 9.0703125, 12.359375, 15.6484375, 18.9375, 22.2265625, 25.515625, 28.8046875, 32.09375, 35.3828125, 38.671875, 41.9609375, 45.25, 48.5390625, 51.828125, 55.1171875, 58.40625, 61.6953125, 64.984375, 68.2734375, 71.5625, 74.8515625, 78.140625, 81.4296875, 84.71875, 88.0078125, 91.296875, 94.5859375, 97.875]}, "gradients/decoder.transformer.h.20.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 5.0, 14.0, 23.0, 26.0, 40.0, 52.0, 56.0, 71.0, 89.0, 99.0, 110.0, 85.0, 83.0, 70.0, 61.0, 35.0, 31.0, 15.0, 10.0, 12.0, 7.0, 6.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0], "bins": [-84.47265625, -82.25282287597656, -80.03298950195312, -77.81315612792969, -75.59332275390625, -73.37348937988281, -71.15365600585938, -68.93382263183594, -66.7139892578125, -64.49415588378906, -62.274322509765625, -60.05448913574219, -57.83465576171875, -55.61482238769531, -53.394989013671875, -51.17515563964844, -48.955322265625, -46.73548889160156, -44.515655517578125, -42.29582214355469, -40.07598876953125, -37.85615539550781, -35.636322021484375, -33.41648864746094, -31.1966552734375, -28.976821899414062, -26.756988525390625, -24.537155151367188, -22.31732177734375, -20.097488403320312, -17.877655029296875, -15.657821655273438, -13.43798828125, -11.218154907226562, -8.998321533203125, -6.7784881591796875, -4.55865478515625, -2.3388214111328125, -0.118988037109375, 2.1008453369140625, 4.3206787109375, 6.5405120849609375, 8.760345458984375, 10.980178833007812, 13.20001220703125, 15.419845581054688, 17.639678955078125, 19.859512329101562, 22.079345703125, 24.299179077148438, 26.519012451171875, 28.738845825195312, 30.95867919921875, 33.17851257324219, 35.398345947265625, 37.61817932128906, 39.8380126953125, 42.05784606933594, 44.277679443359375, 46.49751281738281, 48.71734619140625, 50.93717956542969, 53.157012939453125, 55.37684631347656, 57.5966796875]}, "gradients/decoder.transformer.h.20.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 5.0, 4.0, 6.0, 11.0, 11.0, 11.0, 9.0, 18.0, 18.0, 30.0, 19.0, 41.0, 32.0, 33.0, 30.0, 37.0, 48.0, 45.0, 36.0, 50.0, 44.0, 38.0, 28.0, 36.0, 44.0, 35.0, 39.0, 25.0, 36.0, 25.0, 24.0, 13.0, 28.0, 21.0, 17.0, 17.0, 6.0, 12.0, 6.0, 5.0, 6.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-58.01872253417969, -55.890869140625, -53.76301193237305, -51.63515853881836, -49.507301330566406, -47.37944793701172, -45.25159454345703, -43.123741149902344, -40.99588394165039, -38.8680305480957, -36.74017333984375, -34.61231994628906, -32.484466552734375, -30.356609344482422, -28.228755950927734, -26.100900650024414, -23.973045349121094, -21.845190048217773, -19.717334747314453, -17.589481353759766, -15.461626052856445, -13.333770751953125, -11.205916404724121, -9.078062057495117, -6.950206756591797, -4.822351932525635, -2.6944971084594727, -0.5666422843933105, 1.5612125396728516, 3.689067840576172, 5.816922187805176, 7.94477653503418, 10.0726318359375, 12.20048713684082, 14.328341484069824, 16.456195831298828, 18.58405113220215, 20.71190643310547, 22.839759826660156, 24.967615127563477, 27.095470428466797, 29.223325729370117, 31.351181030273438, 33.479034423828125, 35.60688781738281, 37.734745025634766, 39.86259841918945, 41.990455627441406, 44.118309020996094, 46.24616241455078, 48.374019622802734, 50.50187301635742, 52.629730224609375, 54.75758361816406, 56.88543701171875, 59.01329040527344, 61.14114761352539, 63.26900100708008, 65.39685821533203, 67.52471160888672, 69.6525650024414, 71.78042602539062, 73.90827941894531, 76.0361328125, 78.16398620605469]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 11.0, 5.0, 5.0, 13.0, 14.0, 21.0, 12.0, 24.0, 31.0, 23.0, 32.0, 35.0, 25.0, 42.0, 41.0, 43.0, 56.0, 31.0, 46.0, 43.0, 44.0, 49.0, 52.0, 41.0, 30.0, 36.0, 23.0, 24.0, 28.0, 17.0, 21.0, 12.0, 18.0, 9.0, 13.0, 10.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.25390625, -6.04058837890625, -5.8272705078125, -5.61395263671875, -5.400634765625, -5.18731689453125, -4.9739990234375, -4.76068115234375, -4.54736328125, -4.33404541015625, -4.1207275390625, -3.90740966796875, -3.694091796875, -3.48077392578125, -3.2674560546875, -3.05413818359375, -2.8408203125, -2.62750244140625, -2.4141845703125, -2.20086669921875, -1.987548828125, -1.77423095703125, -1.5609130859375, -1.34759521484375, -1.13427734375, -0.92095947265625, -0.7076416015625, -0.49432373046875, -0.281005859375, -0.06768798828125, 0.1456298828125, 0.35894775390625, 0.572265625, 0.78558349609375, 0.9989013671875, 1.21221923828125, 1.425537109375, 1.63885498046875, 1.8521728515625, 2.06549072265625, 2.27880859375, 2.49212646484375, 2.7054443359375, 2.91876220703125, 3.132080078125, 3.34539794921875, 3.5587158203125, 3.77203369140625, 3.9853515625, 4.19866943359375, 4.4119873046875, 4.62530517578125, 4.838623046875, 5.05194091796875, 5.2652587890625, 5.47857666015625, 5.69189453125, 5.90521240234375, 6.1185302734375, 6.33184814453125, 6.545166015625, 6.75848388671875, 6.9718017578125, 7.18511962890625, 7.3984375]}, "gradients/decoder.transformer.h.20.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 2.0, 4.0, 7.0, 7.0, 9.0, 24.0, 24.0, 52.0, 66.0, 93.0, 105.0, 175.0, 219.0, 327.0, 485.0, 704.0, 995.0, 1535.0, 2092.0, 3117.0, 4390.0, 6494.0, 9510.0, 14421.0, 21593.0, 32194.0, 50279.0, 79541.0, 122758.0, 171893.0, 172444.0, 123024.0, 79819.0, 50904.0, 32789.0, 21496.0, 14147.0, 9693.0, 6615.0, 4453.0, 3114.0, 2119.0, 1441.0, 1043.0, 712.0, 522.0, 356.0, 250.0, 146.0, 112.0, 79.0, 60.0, 39.0, 21.0, 20.0, 17.0, 9.0, 6.0, 2.0, 4.0, 0.0, 0.0, 2.0], "bins": [-0.62451171875, -0.6043701171875, -0.584228515625, -0.5640869140625, -0.5439453125, -0.5238037109375, -0.503662109375, -0.4835205078125, -0.46337890625, -0.4432373046875, -0.423095703125, -0.4029541015625, -0.3828125, -0.3626708984375, -0.342529296875, -0.3223876953125, -0.30224609375, -0.2821044921875, -0.261962890625, -0.2418212890625, -0.2216796875, -0.2015380859375, -0.181396484375, -0.1612548828125, -0.14111328125, -0.1209716796875, -0.100830078125, -0.0806884765625, -0.060546875, -0.0404052734375, -0.020263671875, -0.0001220703125, 0.02001953125, 0.0401611328125, 0.060302734375, 0.0804443359375, 0.1005859375, 0.1207275390625, 0.140869140625, 0.1610107421875, 0.18115234375, 0.2012939453125, 0.221435546875, 0.2415771484375, 0.26171875, 0.2818603515625, 0.302001953125, 0.3221435546875, 0.34228515625, 0.3624267578125, 0.382568359375, 0.4027099609375, 0.4228515625, 0.4429931640625, 0.463134765625, 0.4832763671875, 0.50341796875, 0.5235595703125, 0.543701171875, 0.5638427734375, 0.583984375, 0.6041259765625, 0.624267578125, 0.6444091796875, 0.66455078125]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 2.0, 2.0, 2.0, 10.0, 10.0, 9.0, 13.0, 14.0, 12.0, 16.0, 18.0, 23.0, 33.0, 40.0, 24.0, 39.0, 46.0, 39.0, 49.0, 40.0, 55.0, 1069.0, 48.0, 43.0, 42.0, 30.0, 42.0, 32.0, 31.0, 35.0, 30.0, 20.0, 24.0, 22.0, 11.0, 11.0, 11.0, 6.0, 9.0, 3.0, 7.0, 4.0, 4.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.82421875, -4.68267822265625, -4.5411376953125, -4.39959716796875, -4.258056640625, -4.11651611328125, -3.9749755859375, -3.83343505859375, -3.69189453125, -3.55035400390625, -3.4088134765625, -3.26727294921875, -3.125732421875, -2.98419189453125, -2.8426513671875, -2.70111083984375, -2.5595703125, -2.41802978515625, -2.2764892578125, -2.13494873046875, -1.993408203125, -1.85186767578125, -1.7103271484375, -1.56878662109375, -1.42724609375, -1.28570556640625, -1.1441650390625, -1.00262451171875, -0.861083984375, -0.71954345703125, -0.5780029296875, -0.43646240234375, -0.294921875, -0.15338134765625, -0.0118408203125, 0.12969970703125, 0.271240234375, 0.41278076171875, 0.5543212890625, 0.69586181640625, 0.83740234375, 0.97894287109375, 1.1204833984375, 1.26202392578125, 1.403564453125, 1.54510498046875, 1.6866455078125, 1.82818603515625, 1.9697265625, 2.11126708984375, 2.2528076171875, 2.39434814453125, 2.535888671875, 2.67742919921875, 2.8189697265625, 2.96051025390625, 3.10205078125, 3.24359130859375, 3.3851318359375, 3.52667236328125, 3.668212890625, 3.80975341796875, 3.9512939453125, 4.09283447265625, 4.234375]}, "gradients/decoder.transformer.h.20.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 4.0, 3.0, 1.0, 9.0, 10.0, 19.0, 31.0, 28.0, 70.0, 65.0, 129.0, 189.0, 238.0, 362.0, 518.0, 737.0, 1037.0, 1496.0, 2090.0, 3090.0, 4504.0, 6483.0, 9598.0, 14245.0, 20959.0, 31325.0, 45951.0, 69671.0, 99227.0, 134643.0, 1200392.0, 134786.0, 100637.0, 69514.0, 46725.0, 31715.0, 21165.0, 14273.0, 9753.0, 6609.0, 4528.0, 3082.0, 2217.0, 1509.0, 1092.0, 752.0, 528.0, 338.0, 256.0, 177.0, 128.0, 86.0, 54.0, 35.0, 20.0, 15.0, 13.0, 8.0, 1.0, 3.0, 3.0, 0.0, 3.0], "bins": [-0.426513671875, -0.4129791259765625, -0.399444580078125, -0.3859100341796875, -0.37237548828125, -0.3588409423828125, -0.345306396484375, -0.3317718505859375, -0.3182373046875, -0.3047027587890625, -0.291168212890625, -0.2776336669921875, -0.26409912109375, -0.2505645751953125, -0.237030029296875, -0.2234954833984375, -0.2099609375, -0.1964263916015625, -0.182891845703125, -0.1693572998046875, -0.15582275390625, -0.1422882080078125, -0.128753662109375, -0.1152191162109375, -0.1016845703125, -0.0881500244140625, -0.074615478515625, -0.0610809326171875, -0.04754638671875, -0.0340118408203125, -0.020477294921875, -0.0069427490234375, 0.006591796875, 0.0201263427734375, 0.033660888671875, 0.0471954345703125, 0.06072998046875, 0.0742645263671875, 0.087799072265625, 0.1013336181640625, 0.1148681640625, 0.1284027099609375, 0.141937255859375, 0.1554718017578125, 0.16900634765625, 0.1825408935546875, 0.196075439453125, 0.2096099853515625, 0.22314453125, 0.2366790771484375, 0.250213623046875, 0.2637481689453125, 0.27728271484375, 0.2908172607421875, 0.304351806640625, 0.3178863525390625, 0.3314208984375, 0.3449554443359375, 0.358489990234375, 0.3720245361328125, 0.38555908203125, 0.3990936279296875, 0.412628173828125, 0.4261627197265625, 0.439697265625]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 5.0, 3.0, 3.0, 1.0, 6.0, 8.0, 4.0, 7.0, 4.0, 7.0, 11.0, 18.0, 23.0, 21.0, 16.0, 33.0, 44.0, 42.0, 62.0, 53.0, 64.0, 53.0, 59.0, 52.0, 51.0, 51.0, 52.0, 39.0, 37.0, 33.0, 23.0, 16.0, 23.0, 18.0, 12.0, 8.0, 11.0, 10.0, 3.0, 10.0, 3.0, 4.0, 7.0, 0.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.0032291412353515625, -0.0031062662601470947, -0.002983391284942627, -0.002860516309738159, -0.0027376413345336914, -0.0026147663593292236, -0.002491891384124756, -0.002369016408920288, -0.0022461414337158203, -0.0021232664585113525, -0.0020003914833068848, -0.001877516508102417, -0.0017546415328979492, -0.0016317665576934814, -0.0015088915824890137, -0.001386016607284546, -0.0012631416320800781, -0.0011402666568756104, -0.0010173916816711426, -0.0008945167064666748, -0.000771641731262207, -0.0006487667560577393, -0.0005258917808532715, -0.0004030168056488037, -0.00028014183044433594, -0.00015726685523986816, -3.439188003540039e-05, 8.848309516906738e-05, 0.00021135807037353516, 0.00033423304557800293, 0.0004571080207824707, 0.0005799829959869385, 0.0007028579711914062, 0.000825732946395874, 0.0009486079216003418, 0.0010714828968048096, 0.0011943578720092773, 0.0013172328472137451, 0.0014401078224182129, 0.0015629827976226807, 0.0016858577728271484, 0.0018087327480316162, 0.001931607723236084, 0.0020544826984405518, 0.0021773576736450195, 0.0023002326488494873, 0.002423107624053955, 0.002545982599258423, 0.0026688575744628906, 0.0027917325496673584, 0.002914607524871826, 0.003037482500076294, 0.0031603574752807617, 0.0032832324504852295, 0.0034061074256896973, 0.003528982400894165, 0.003651857376098633, 0.0037747323513031006, 0.0038976073265075684, 0.004020482301712036, 0.004143357276916504, 0.004266232252120972, 0.0043891072273254395, 0.004511982202529907, 0.004634857177734375]}, "gradients/decoder.transformer.h.20.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 4.0, 3.0, 5.0, 13.0, 4.0, 10.0, 10.0, 11.0, 12.0, 21.0, 23.0, 34.0, 47.0, 61.0, 75.0, 112.0, 203.0, 387.0, 897.0, 101873.0, 940781.0, 2701.0, 464.0, 230.0, 163.0, 100.0, 103.0, 45.0, 29.0, 31.0, 28.0, 11.0, 13.0, 8.0, 7.0, 5.0, 6.0, 6.0, 3.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.1004638671875, -0.09768867492675781, -0.09491348266601562, -0.09213829040527344, -0.08936309814453125, -0.08658790588378906, -0.08381271362304688, -0.08103752136230469, -0.0782623291015625, -0.07548713684082031, -0.07271194458007812, -0.06993675231933594, -0.06716156005859375, -0.06438636779785156, -0.061611175537109375, -0.05883598327636719, -0.056060791015625, -0.05328559875488281, -0.050510406494140625, -0.04773521423339844, -0.04496002197265625, -0.04218482971191406, -0.039409637451171875, -0.03663444519042969, -0.0338592529296875, -0.031084060668945312, -0.028308868408203125, -0.025533676147460938, -0.02275848388671875, -0.019983291625976562, -0.017208099365234375, -0.014432907104492188, -0.01165771484375, -0.008882522583007812, -0.006107330322265625, -0.0033321380615234375, -0.00055694580078125, 0.0022182464599609375, 0.004993438720703125, 0.0077686309814453125, 0.0105438232421875, 0.013319015502929688, 0.016094207763671875, 0.018869400024414062, 0.02164459228515625, 0.024419784545898438, 0.027194976806640625, 0.029970169067382812, 0.032745361328125, 0.03552055358886719, 0.038295745849609375, 0.04107093811035156, 0.04384613037109375, 0.04662132263183594, 0.049396514892578125, 0.05217170715332031, 0.0549468994140625, 0.05772209167480469, 0.060497283935546875, 0.06327247619628906, 0.06604766845703125, 0.06882286071777344, 0.07159805297851562, 0.07437324523925781, 0.0771484375]}, "gradients/decoder.transformer.h.20.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 897.0, 122.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.10068836063146591, -0.09885051101446152, -0.09701266884803772, -0.09517481923103333, -0.09333697706460953, -0.09149912744760513, -0.08966128528118134, -0.08782343566417694, -0.08598558604717255, -0.08414773643016815, -0.08230989426374435, -0.08047204464673996, -0.07863420248031616, -0.07679635286331177, -0.07495850324630737, -0.07312066107988358, -0.07128281891345978, -0.06944496929645538, -0.06760712713003159, -0.06576927751302719, -0.0639314353466034, -0.062093585729599, -0.0602557398378849, -0.05841789394617081, -0.05658004432916641, -0.054742198437452316, -0.05290435254573822, -0.051066502928733826, -0.04922865703701973, -0.047390811145305634, -0.04555296525359154, -0.04371511936187744, -0.04187726974487305, -0.04003942385315895, -0.038201577961444855, -0.03636372834444046, -0.034525882452726364, -0.03268803656101227, -0.030850190669298172, -0.029012344777584076, -0.02717449888586998, -0.025336652994155884, -0.02349880523979664, -0.021660959348082542, -0.019823113456368446, -0.0179852657020092, -0.016147419810295105, -0.014309573918581009, -0.012471728026866913, -0.010633881203830242, -0.008796035312116146, -0.006958188489079475, -0.005120342131704092, -0.0032824957743287086, -0.001444648951292038, 0.0003931969404220581, 0.002231043763458729, 0.004068890120834112, 0.0059067364782094955, 0.007744583301246166, 0.009582430124282837, 0.011420276015996933, 0.013258122839033604, 0.0150959687307477, 0.01693381555378437]}, "gradients/decoder.transformer.h.20.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 6.0, 8.0, 11.0, 19.0, 15.0, 20.0, 23.0, 39.0, 35.0, 41.0, 43.0, 39.0, 56.0, 59.0, 57.0, 55.0, 58.0, 49.0, 54.0, 57.0, 55.0, 33.0, 30.0, 39.0, 32.0, 12.0, 18.0, 12.0, 9.0, 12.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0021790266036987305, -0.002082289196550846, -0.0019855517894029617, -0.0018888143822550774, -0.001792076975107193, -0.0016953395679593086, -0.0015986021608114243, -0.0015018647536635399, -0.0014051273465156555, -0.0013083899393677711, -0.0012116525322198868, -0.0011149151250720024, -0.001018177717924118, -0.0009214403107762337, -0.0008247029036283493, -0.0007279654964804649, -0.0006312280893325806, -0.0005344906821846962, -0.00043775327503681183, -0.00034101586788892746, -0.0002442784607410431, -0.00014754105359315872, -5.080364644527435e-05, 4.5933760702610016e-05, 0.00014267116785049438, 0.00023940857499837875, 0.0003361459821462631, 0.0004328833892941475, 0.0005296207964420319, 0.0006263582035899162, 0.0007230956107378006, 0.000819833017885685, 0.0009165704250335693, 0.0010133078321814537, 0.001110045239329338, 0.0012067826464772224, 0.0013035200536251068, 0.0014002574607729912, 0.0014969948679208755, 0.00159373227506876, 0.0016904696822166443, 0.0017872070893645287, 0.001883944496512413, 0.0019806819036602974, 0.0020774193108081818, 0.002174156717956066, 0.0022708941251039505, 0.002367631532251835, 0.0024643689393997192, 0.0025611063465476036, 0.002657843753695488, 0.0027545811608433723, 0.0028513185679912567, 0.002948055975139141, 0.0030447933822870255, 0.00314153078943491, 0.003238268196582794, 0.0033350056037306786, 0.003431743010878563, 0.0035284804180264473, 0.0036252178251743317, 0.003721955232322216, 0.0038186926394701004, 0.003915430046617985, 0.004012167453765869]}, "gradients/decoder.transformer.h.20.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 4.0, 7.0, 11.0, 5.0, 5.0, 13.0, 14.0, 21.0, 12.0, 24.0, 31.0, 23.0, 32.0, 35.0, 25.0, 42.0, 41.0, 43.0, 56.0, 31.0, 46.0, 43.0, 44.0, 50.0, 51.0, 41.0, 30.0, 36.0, 23.0, 23.0, 29.0, 17.0, 21.0, 12.0, 18.0, 9.0, 13.0, 10.0, 5.0, 4.0, 4.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.25390625, -6.04058837890625, -5.8272705078125, -5.61395263671875, -5.400634765625, -5.18731689453125, -4.9739990234375, -4.76068115234375, -4.54736328125, -4.33404541015625, -4.1207275390625, -3.90740966796875, -3.694091796875, -3.48077392578125, -3.2674560546875, -3.05413818359375, -2.8408203125, -2.62750244140625, -2.4141845703125, -2.20086669921875, -1.987548828125, -1.77423095703125, -1.5609130859375, -1.34759521484375, -1.13427734375, -0.92095947265625, -0.7076416015625, -0.49432373046875, -0.281005859375, -0.06768798828125, 0.1456298828125, 0.35894775390625, 0.572265625, 0.78558349609375, 0.9989013671875, 1.21221923828125, 1.425537109375, 1.63885498046875, 1.8521728515625, 2.06549072265625, 2.27880859375, 2.49212646484375, 2.7054443359375, 2.91876220703125, 3.132080078125, 3.34539794921875, 3.5587158203125, 3.77203369140625, 3.9853515625, 4.19866943359375, 4.4119873046875, 4.62530517578125, 4.838623046875, 5.05194091796875, 5.2652587890625, 5.47857666015625, 5.69189453125, 5.90521240234375, 6.1185302734375, 6.33184814453125, 6.545166015625, 6.75848388671875, 6.9718017578125, 7.18511962890625, 7.3984375]}, "gradients/decoder.transformer.h.20.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 4.0, 0.0, 3.0, 1.0, 7.0, 7.0, 18.0, 15.0, 30.0, 43.0, 74.0, 107.0, 165.0, 257.0, 445.0, 843.0, 1608.0, 3523.0, 9369.0, 32464.0, 183876.0, 632891.0, 141505.0, 26655.0, 8009.0, 3202.0, 1578.0, 768.0, 440.0, 229.0, 138.0, 100.0, 73.0, 38.0, 30.0, 18.0, 9.0, 8.0, 4.0, 4.0, 4.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1015625, -5.8707275390625, -5.639892578125, -5.4090576171875, -5.17822265625, -4.9473876953125, -4.716552734375, -4.4857177734375, -4.2548828125, -4.0240478515625, -3.793212890625, -3.5623779296875, -3.33154296875, -3.1007080078125, -2.869873046875, -2.6390380859375, -2.408203125, -2.1773681640625, -1.946533203125, -1.7156982421875, -1.48486328125, -1.2540283203125, -1.023193359375, -0.7923583984375, -0.5615234375, -0.3306884765625, -0.099853515625, 0.1309814453125, 0.36181640625, 0.5926513671875, 0.823486328125, 1.0543212890625, 1.28515625, 1.5159912109375, 1.746826171875, 1.9776611328125, 2.20849609375, 2.4393310546875, 2.670166015625, 2.9010009765625, 3.1318359375, 3.3626708984375, 3.593505859375, 3.8243408203125, 4.05517578125, 4.2860107421875, 4.516845703125, 4.7476806640625, 4.978515625, 5.2093505859375, 5.440185546875, 5.6710205078125, 5.90185546875, 6.1326904296875, 6.363525390625, 6.5943603515625, 6.8251953125, 7.0560302734375, 7.286865234375, 7.5177001953125, 7.74853515625, 7.9793701171875, 8.210205078125, 8.4410400390625, 8.671875]}, "gradients/decoder.transformer.h.20.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 7.0, 5.0, 5.0, 4.0, 5.0, 3.0, 5.0, 5.0, 7.0, 7.0, 11.0, 14.0, 13.0, 22.0, 18.0, 18.0, 26.0, 27.0, 32.0, 50.0, 40.0, 35.0, 48.0, 58.0, 100.0, 1491.0, 462.0, 99.0, 53.0, 52.0, 44.0, 35.0, 32.0, 42.0, 23.0, 28.0, 22.0, 20.0, 18.0, 6.0, 9.0, 9.0, 10.0, 11.0, 3.0, 6.0, 5.0, 5.0, 4.0, 3.0, 3.0, 3.0, 0.0, 2.0, 1.0, 1.0], "bins": [-23.828125, -23.127197265625, -22.42626953125, -21.725341796875, -21.0244140625, -20.323486328125, -19.62255859375, -18.921630859375, -18.220703125, -17.519775390625, -16.81884765625, -16.117919921875, -15.4169921875, -14.716064453125, -14.01513671875, -13.314208984375, -12.61328125, -11.912353515625, -11.21142578125, -10.510498046875, -9.8095703125, -9.108642578125, -8.40771484375, -7.706787109375, -7.005859375, -6.304931640625, -5.60400390625, -4.903076171875, -4.2021484375, -3.501220703125, -2.80029296875, -2.099365234375, -1.3984375, -0.697509765625, 0.00341796875, 0.704345703125, 1.4052734375, 2.106201171875, 2.80712890625, 3.508056640625, 4.208984375, 4.909912109375, 5.61083984375, 6.311767578125, 7.0126953125, 7.713623046875, 8.41455078125, 9.115478515625, 9.81640625, 10.517333984375, 11.21826171875, 11.919189453125, 12.6201171875, 13.321044921875, 14.02197265625, 14.722900390625, 15.423828125, 16.124755859375, 16.82568359375, 17.526611328125, 18.2275390625, 18.928466796875, 19.62939453125, 20.330322265625, 21.03125]}, "gradients/decoder.transformer.h.20.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 7.0, 5.0, 11.0, 8.0, 9.0, 13.0, 7.0, 8.0, 23.0, 24.0, 32.0, 42.0, 45.0, 80.0, 95.0, 156.0, 260.0, 550.0, 1794.0, 12871.0, 2804063.0, 317413.0, 5810.0, 1160.0, 429.0, 214.0, 149.0, 92.0, 77.0, 54.0, 39.0, 24.0, 23.0, 21.0, 15.0, 9.0, 17.0, 7.0, 6.0, 6.0, 6.0, 2.0, 7.0, 5.0, 3.0, 7.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-33.8125, -32.6796875, -31.546875, -30.4140625, -29.28125, -28.1484375, -27.015625, -25.8828125, -24.75, -23.6171875, -22.484375, -21.3515625, -20.21875, -19.0859375, -17.953125, -16.8203125, -15.6875, -14.5546875, -13.421875, -12.2890625, -11.15625, -10.0234375, -8.890625, -7.7578125, -6.625, -5.4921875, -4.359375, -3.2265625, -2.09375, -0.9609375, 0.171875, 1.3046875, 2.4375, 3.5703125, 4.703125, 5.8359375, 6.96875, 8.1015625, 9.234375, 10.3671875, 11.5, 12.6328125, 13.765625, 14.8984375, 16.03125, 17.1640625, 18.296875, 19.4296875, 20.5625, 21.6953125, 22.828125, 23.9609375, 25.09375, 26.2265625, 27.359375, 28.4921875, 29.625, 30.7578125, 31.890625, 33.0234375, 34.15625, 35.2890625, 36.421875, 37.5546875, 38.6875]}, "gradients/decoder.transformer.h.20.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 314.0, 685.0, 17.0], "bins": [-401.2157287597656, -394.7601623535156, -388.3045654296875, -381.8489990234375, -375.3934326171875, -368.9378356933594, -362.4822692871094, -356.0267028808594, -349.57110595703125, -343.11553955078125, -336.6599426269531, -330.2043762207031, -323.7488098144531, -317.293212890625, -310.837646484375, -304.382080078125, -297.926513671875, -291.470947265625, -285.0153503417969, -278.5597839355469, -272.1042175292969, -265.64862060546875, -259.19305419921875, -252.73748779296875, -246.28189086914062, -239.82630920410156, -233.37074279785156, -226.9151611328125, -220.45957946777344, -214.00401306152344, -207.54843139648438, -201.09286499023438, -194.63729858398438, -188.1817169189453, -181.7261505126953, -175.27056884765625, -168.8149871826172, -162.3594207763672, -155.90383911132812, -149.44827270507812, -142.99267578125, -136.53709411621094, -130.08152770996094, -123.62594604492188, -117.17037200927734, -110.71479797363281, -104.25921630859375, -97.80364227294922, -91.34806823730469, -84.89249420166016, -78.4369125366211, -71.98133850097656, -65.52576446533203, -59.070186614990234, -52.61460876464844, -46.159034729003906, -39.703460693359375, -33.24788284301758, -26.792308807373047, -20.33673095703125, -13.881155014038086, -7.425579071044922, -0.970001220703125, 5.485572814941406, 11.94115161895752]}, "gradients/decoder.transformer.h.20.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 5.0, 2.0, 6.0, 5.0, 6.0, 7.0, 10.0, 9.0, 13.0, 11.0, 19.0, 15.0, 18.0, 25.0, 27.0, 23.0, 29.0, 28.0, 38.0, 29.0, 32.0, 24.0, 36.0, 39.0, 46.0, 52.0, 44.0, 44.0, 29.0, 29.0, 38.0, 32.0, 24.0, 20.0, 24.0, 17.0, 14.0, 21.0, 19.0, 17.0, 16.0, 6.0, 15.0, 8.0, 6.0, 10.0, 7.0, 3.0, 3.0, 3.0, 3.0, 3.0, 0.0, 1.0, 2.0], "bins": [-71.29705810546875, -69.14692687988281, -66.9968032836914, -64.84667205810547, -62.6965446472168, -60.546417236328125, -58.39628601074219, -56.246158599853516, -54.096031188964844, -51.94590377807617, -49.795772552490234, -47.64564514160156, -45.49551773071289, -43.34539031982422, -41.19525909423828, -39.04513168334961, -36.89500045776367, -34.744873046875, -32.59474182128906, -30.44461441040039, -28.29448699951172, -26.144357681274414, -23.99422836303711, -21.844100952148438, -19.693971633911133, -17.543842315673828, -15.393714904785156, -13.243585586547852, -11.093457221984863, -8.943328857421875, -6.79319953918457, -4.643071174621582, -2.4929428100585938, -0.34281420707702637, 1.807314395904541, 3.9574432373046875, 6.107571601867676, 8.257699966430664, 10.407829284667969, 12.557957649230957, 14.708086013793945, 16.85821533203125, 19.008342742919922, 21.158472061157227, 23.30860137939453, 25.458728790283203, 27.608858108520508, 29.758987426757812, 31.909114837646484, 34.059242248535156, 36.209373474121094, 38.359500885009766, 40.50962829589844, 42.659759521484375, 44.80988693237305, 46.96001434326172, 49.110145568847656, 51.26027297973633, 53.410404205322266, 55.56053161621094, 57.71065902709961, 59.86078643798828, 62.01091766357422, 64.16104888916016, 66.31117248535156]}, "gradients/decoder.transformer.h.19.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 2.0, 8.0, 10.0, 4.0, 7.0, 7.0, 8.0, 16.0, 26.0, 13.0, 27.0, 23.0, 30.0, 29.0, 39.0, 31.0, 33.0, 49.0, 47.0, 35.0, 34.0, 47.0, 46.0, 41.0, 53.0, 36.0, 39.0, 40.0, 35.0, 23.0, 21.0, 30.0, 21.0, 22.0, 13.0, 11.0, 13.0, 10.0, 13.0, 5.0, 4.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2109375, -5.99774169921875, -5.7845458984375, -5.57135009765625, -5.358154296875, -5.14495849609375, -4.9317626953125, -4.71856689453125, -4.50537109375, -4.29217529296875, -4.0789794921875, -3.86578369140625, -3.652587890625, -3.43939208984375, -3.2261962890625, -3.01300048828125, -2.7998046875, -2.58660888671875, -2.3734130859375, -2.16021728515625, -1.947021484375, -1.73382568359375, -1.5206298828125, -1.30743408203125, -1.09423828125, -0.88104248046875, -0.6678466796875, -0.45465087890625, -0.241455078125, -0.02825927734375, 0.1849365234375, 0.39813232421875, 0.611328125, 0.82452392578125, 1.0377197265625, 1.25091552734375, 1.464111328125, 1.67730712890625, 1.8905029296875, 2.10369873046875, 2.31689453125, 2.53009033203125, 2.7432861328125, 2.95648193359375, 3.169677734375, 3.38287353515625, 3.5960693359375, 3.80926513671875, 4.0224609375, 4.23565673828125, 4.4488525390625, 4.66204833984375, 4.875244140625, 5.08843994140625, 5.3016357421875, 5.51483154296875, 5.72802734375, 5.94122314453125, 6.1544189453125, 6.36761474609375, 6.580810546875, 6.79400634765625, 7.0072021484375, 7.22039794921875, 7.43359375]}, "gradients/decoder.transformer.h.19.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 6.0, 5.0, 6.0, 7.0, 11.0, 17.0, 22.0, 25.0, 33.0, 37.0, 81.0, 110.0, 183.0, 431.0, 924.0, 2655.0, 9065.0, 36056.0, 190296.0, 1730874.0, 1943737.0, 224659.0, 40120.0, 10049.0, 2912.0, 973.0, 416.0, 210.0, 117.0, 61.0, 45.0, 40.0, 27.0, 20.0, 15.0, 14.0, 13.0, 6.0, 7.0, 4.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.1328125, -14.5731201171875, -14.013427734375, -13.4537353515625, -12.89404296875, -12.3343505859375, -11.774658203125, -11.2149658203125, -10.6552734375, -10.0955810546875, -9.535888671875, -8.9761962890625, -8.41650390625, -7.8568115234375, -7.297119140625, -6.7374267578125, -6.177734375, -5.6180419921875, -5.058349609375, -4.4986572265625, -3.93896484375, -3.3792724609375, -2.819580078125, -2.2598876953125, -1.7001953125, -1.1405029296875, -0.580810546875, -0.0211181640625, 0.53857421875, 1.0982666015625, 1.657958984375, 2.2176513671875, 2.77734375, 3.3370361328125, 3.896728515625, 4.4564208984375, 5.01611328125, 5.5758056640625, 6.135498046875, 6.6951904296875, 7.2548828125, 7.8145751953125, 8.374267578125, 8.9339599609375, 9.49365234375, 10.0533447265625, 10.613037109375, 11.1727294921875, 11.732421875, 12.2921142578125, 12.851806640625, 13.4114990234375, 13.97119140625, 14.5308837890625, 15.090576171875, 15.6502685546875, 16.2099609375, 16.7696533203125, 17.329345703125, 17.8890380859375, 18.44873046875, 19.0084228515625, 19.568115234375, 20.1278076171875, 20.6875]}, "gradients/decoder.transformer.h.19.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 3.0, 10.0, 10.0, 14.0, 28.0, 30.0, 52.0, 64.0, 84.0, 121.0, 150.0, 227.0, 284.0, 406.0, 477.0, 504.0, 440.0, 314.0, 245.0, 172.0, 129.0, 92.0, 72.0, 41.0, 40.0, 22.0, 8.0, 13.0, 7.0, 3.0, 6.0, 4.0, 6.0, 2.0, 2.0, 1.0], "bins": [-28.515625, -27.854248046875, -27.19287109375, -26.531494140625, -25.8701171875, -25.208740234375, -24.54736328125, -23.885986328125, -23.224609375, -22.563232421875, -21.90185546875, -21.240478515625, -20.5791015625, -19.917724609375, -19.25634765625, -18.594970703125, -17.93359375, -17.272216796875, -16.61083984375, -15.949462890625, -15.2880859375, -14.626708984375, -13.96533203125, -13.303955078125, -12.642578125, -11.981201171875, -11.31982421875, -10.658447265625, -9.9970703125, -9.335693359375, -8.67431640625, -8.012939453125, -7.3515625, -6.690185546875, -6.02880859375, -5.367431640625, -4.7060546875, -4.044677734375, -3.38330078125, -2.721923828125, -2.060546875, -1.399169921875, -0.73779296875, -0.076416015625, 0.5849609375, 1.246337890625, 1.90771484375, 2.569091796875, 3.23046875, 3.891845703125, 4.55322265625, 5.214599609375, 5.8759765625, 6.537353515625, 7.19873046875, 7.860107421875, 8.521484375, 9.182861328125, 9.84423828125, 10.505615234375, 11.1669921875, 11.828369140625, 12.48974609375, 13.151123046875, 13.8125]}, "gradients/decoder.transformer.h.19.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 8.0, 9.0, 14.0, 16.0, 20.0, 32.0, 56.0, 77.0, 128.0, 220.0, 461.0, 1963.0, 42221.0, 3772571.0, 369068.0, 5884.0, 800.0, 300.0, 154.0, 92.0, 71.0, 37.0, 33.0, 19.0, 13.0, 10.0, 4.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-71.3125, -68.740234375, -66.16796875, -63.595703125, -61.0234375, -58.451171875, -55.87890625, -53.306640625, -50.734375, -48.162109375, -45.58984375, -43.017578125, -40.4453125, -37.873046875, -35.30078125, -32.728515625, -30.15625, -27.583984375, -25.01171875, -22.439453125, -19.8671875, -17.294921875, -14.72265625, -12.150390625, -9.578125, -7.005859375, -4.43359375, -1.861328125, 0.7109375, 3.283203125, 5.85546875, 8.427734375, 11.0, 13.572265625, 16.14453125, 18.716796875, 21.2890625, 23.861328125, 26.43359375, 29.005859375, 31.578125, 34.150390625, 36.72265625, 39.294921875, 41.8671875, 44.439453125, 47.01171875, 49.583984375, 52.15625, 54.728515625, 57.30078125, 59.873046875, 62.4453125, 65.017578125, 67.58984375, 70.162109375, 72.734375, 75.306640625, 77.87890625, 80.451171875, 83.0234375, 85.595703125, 88.16796875, 90.740234375, 93.3125]}, "gradients/decoder.transformer.h.19.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 19.0, 36.0, 89.0, 207.0, 202.0, 205.0, 147.0, 66.0, 23.0, 12.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-103.1478500366211, -97.66360473632812, -92.17935943603516, -86.69511413574219, -81.21086883544922, -75.72662353515625, -70.24238586425781, -64.75813293457031, -59.27389144897461, -53.78964614868164, -48.30540084838867, -42.82115936279297, -37.3369140625, -31.8526668548584, -26.368423461914062, -20.884178161621094, -15.399932861328125, -9.915687561035156, -4.431443214416504, 1.0528011322021484, 6.537046432495117, 12.021291732788086, 17.505535125732422, 22.98978042602539, 28.47402572631836, 33.95827102661133, 39.4425163269043, 44.9267578125, 50.41100311279297, 55.89524841308594, 61.379493713378906, 66.86373901367188, 72.34797668457031, 77.83222198486328, 83.31646728515625, 88.80071258544922, 94.28495788574219, 99.76920318603516, 105.25344848632812, 110.73768615722656, 116.22193908691406, 121.70618438720703, 127.1904296875, 132.67466735839844, 138.15892028808594, 143.64315795898438, 149.12741088867188, 154.6116485595703, 160.09588623046875, 165.5801239013672, 171.0643768310547, 176.54861450195312, 182.03286743164062, 187.51710510253906, 193.00135803222656, 198.485595703125, 203.9698486328125, 209.45408630371094, 214.93833923339844, 220.42257690429688, 225.90682983398438, 231.3910675048828, 236.8753204345703, 242.35955810546875, 247.84381103515625]}, "gradients/decoder.transformer.h.19.ln_2.bias": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 2.0, 1.0, 5.0, 4.0, 10.0, 5.0, 6.0, 9.0, 11.0, 16.0, 5.0, 23.0, 15.0, 19.0, 18.0, 19.0, 29.0, 31.0, 29.0, 38.0, 33.0, 27.0, 32.0, 35.0, 39.0, 30.0, 37.0, 50.0, 36.0, 36.0, 34.0, 41.0, 33.0, 26.0, 32.0, 24.0, 21.0, 19.0, 19.0, 16.0, 13.0, 15.0, 10.0, 14.0, 4.0, 9.0, 9.0, 5.0, 5.0, 5.0, 3.0, 2.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-52.90128707885742, -51.10117721557617, -49.30106735229492, -47.50095748901367, -45.70085144042969, -43.90074157714844, -42.10063171386719, -40.30052185058594, -38.50041198730469, -36.70030212402344, -34.90019226074219, -33.10008239746094, -31.29997444152832, -29.49986457824707, -27.699756622314453, -25.899646759033203, -24.099536895751953, -22.299427032470703, -20.499317169189453, -18.699209213256836, -16.899099349975586, -15.098989486694336, -13.298880577087402, -11.498771667480469, -9.698661804199219, -7.898552417755127, -6.098443031311035, -4.298333644866943, -2.4982242584228516, -0.6981143951416016, 1.101994514465332, 2.9021034240722656, 4.70220947265625, 6.502318859100342, 8.302428245544434, 10.102537155151367, 11.902647018432617, 13.702756881713867, 15.5028657913208, 17.302974700927734, 19.103084564208984, 20.903194427490234, 22.703304290771484, 24.5034122467041, 26.30352210998535, 28.1036319732666, 29.90373992919922, 31.70384979248047, 33.50395965576172, 35.30406951904297, 37.10417938232422, 38.90428924560547, 40.70439910888672, 42.50450897216797, 44.30461502075195, 46.1047248840332, 47.90483474731445, 49.7049446105957, 51.50505447387695, 53.3051643371582, 55.10527038574219, 56.90538024902344, 58.70549011230469, 60.50559997558594, 62.30570983886719]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 10.0, 17.0, 11.0, 21.0, 17.0, 25.0, 26.0, 25.0, 26.0, 33.0, 37.0, 28.0, 42.0, 47.0, 41.0, 54.0, 41.0, 44.0, 49.0, 39.0, 34.0, 45.0, 38.0, 31.0, 29.0, 22.0, 31.0, 19.0, 21.0, 16.0, 19.0, 15.0, 12.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.12890625, -6.90179443359375, -6.6746826171875, -6.44757080078125, -6.220458984375, -5.99334716796875, -5.7662353515625, -5.53912353515625, -5.31201171875, -5.08489990234375, -4.8577880859375, -4.63067626953125, -4.403564453125, -4.17645263671875, -3.9493408203125, -3.72222900390625, -3.4951171875, -3.26800537109375, -3.0408935546875, -2.81378173828125, -2.586669921875, -2.35955810546875, -2.1324462890625, -1.90533447265625, -1.67822265625, -1.45111083984375, -1.2239990234375, -0.99688720703125, -0.769775390625, -0.54266357421875, -0.3155517578125, -0.08843994140625, 0.138671875, 0.36578369140625, 0.5928955078125, 0.82000732421875, 1.047119140625, 1.27423095703125, 1.5013427734375, 1.72845458984375, 1.95556640625, 2.18267822265625, 2.4097900390625, 2.63690185546875, 2.864013671875, 3.09112548828125, 3.3182373046875, 3.54534912109375, 3.7724609375, 3.99957275390625, 4.2266845703125, 4.45379638671875, 4.680908203125, 4.90802001953125, 5.1351318359375, 5.36224365234375, 5.58935546875, 5.81646728515625, 6.0435791015625, 6.27069091796875, 6.497802734375, 6.72491455078125, 6.9520263671875, 7.17913818359375, 7.40625]}, "gradients/decoder.transformer.h.19.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 5.0, 4.0, 15.0, 14.0, 28.0, 29.0, 43.0, 64.0, 85.0, 147.0, 194.0, 252.0, 370.0, 570.0, 789.0, 1136.0, 1626.0, 2366.0, 3314.0, 5020.0, 7114.0, 10343.0, 15360.0, 22925.0, 34565.0, 52553.0, 82022.0, 124878.0, 174092.0, 166674.0, 117031.0, 76451.0, 49317.0, 32087.0, 21303.0, 14448.0, 9514.0, 6642.0, 4600.0, 3193.0, 2248.0, 1556.0, 1081.0, 753.0, 488.0, 374.0, 262.0, 200.0, 138.0, 85.0, 72.0, 49.0, 26.0, 15.0, 12.0, 12.0, 6.0, 5.0, 3.0, 1.0, 1.0], "bins": [-0.662109375, -0.6413650512695312, -0.6206207275390625, -0.5998764038085938, -0.579132080078125, -0.5583877563476562, -0.5376434326171875, -0.5168991088867188, -0.49615478515625, -0.47541046142578125, -0.4546661376953125, -0.43392181396484375, -0.413177490234375, -0.39243316650390625, -0.3716888427734375, -0.35094451904296875, -0.3302001953125, -0.30945587158203125, -0.2887115478515625, -0.26796722412109375, -0.247222900390625, -0.22647857666015625, -0.2057342529296875, -0.18498992919921875, -0.16424560546875, -0.14350128173828125, -0.1227569580078125, -0.10201263427734375, -0.081268310546875, -0.06052398681640625, -0.0397796630859375, -0.01903533935546875, 0.001708984375, 0.02245330810546875, 0.0431976318359375, 0.06394195556640625, 0.084686279296875, 0.10543060302734375, 0.1261749267578125, 0.14691925048828125, 0.16766357421875, 0.18840789794921875, 0.2091522216796875, 0.22989654541015625, 0.250640869140625, 0.27138519287109375, 0.2921295166015625, 0.31287384033203125, 0.3336181640625, 0.35436248779296875, 0.3751068115234375, 0.39585113525390625, 0.416595458984375, 0.43733978271484375, 0.4580841064453125, 0.47882843017578125, 0.49957275390625, 0.5203170776367188, 0.5410614013671875, 0.5618057250976562, 0.582550048828125, 0.6032943725585938, 0.6240386962890625, 0.6447830200195312, 0.66552734375]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 4.0, 1.0, 6.0, 1.0, 3.0, 8.0, 9.0, 7.0, 13.0, 23.0, 10.0, 15.0, 22.0, 17.0, 34.0, 25.0, 33.0, 30.0, 41.0, 34.0, 37.0, 45.0, 39.0, 35.0, 1061.0, 40.0, 51.0, 45.0, 29.0, 33.0, 34.0, 27.0, 28.0, 25.0, 28.0, 21.0, 21.0, 18.0, 16.0, 16.0, 18.0, 3.0, 2.0, 3.0, 10.0, 6.0, 5.0, 3.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.0859375, -3.95458984375, -3.8232421875, -3.69189453125, -3.560546875, -3.42919921875, -3.2978515625, -3.16650390625, -3.03515625, -2.90380859375, -2.7724609375, -2.64111328125, -2.509765625, -2.37841796875, -2.2470703125, -2.11572265625, -1.984375, -1.85302734375, -1.7216796875, -1.59033203125, -1.458984375, -1.32763671875, -1.1962890625, -1.06494140625, -0.93359375, -0.80224609375, -0.6708984375, -0.53955078125, -0.408203125, -0.27685546875, -0.1455078125, -0.01416015625, 0.1171875, 0.24853515625, 0.3798828125, 0.51123046875, 0.642578125, 0.77392578125, 0.9052734375, 1.03662109375, 1.16796875, 1.29931640625, 1.4306640625, 1.56201171875, 1.693359375, 1.82470703125, 1.9560546875, 2.08740234375, 2.21875, 2.35009765625, 2.4814453125, 2.61279296875, 2.744140625, 2.87548828125, 3.0068359375, 3.13818359375, 3.26953125, 3.40087890625, 3.5322265625, 3.66357421875, 3.794921875, 3.92626953125, 4.0576171875, 4.18896484375, 4.3203125]}, "gradients/decoder.transformer.h.19.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 7.0, 6.0, 11.0, 20.0, 40.0, 42.0, 57.0, 70.0, 127.0, 153.0, 224.0, 307.0, 401.0, 607.0, 843.0, 1222.0, 1760.0, 2506.0, 3647.0, 5086.0, 7499.0, 11108.0, 16284.0, 23783.0, 35481.0, 51968.0, 76150.0, 107098.0, 143895.0, 1187481.0, 125030.0, 92278.0, 64516.0, 43837.0, 29578.0, 20075.0, 13475.0, 9375.0, 6472.0, 4434.0, 3116.0, 2105.0, 1418.0, 1038.0, 717.0, 528.0, 369.0, 248.0, 187.0, 145.0, 89.0, 58.0, 53.0, 41.0, 18.0, 23.0, 13.0, 10.0, 11.0, 2.0, 5.0, 3.0], "bins": [-0.41552734375, -0.4022407531738281, -0.38895416259765625, -0.3756675720214844, -0.3623809814453125, -0.3490943908691406, -0.33580780029296875, -0.3225212097167969, -0.309234619140625, -0.2959480285644531, -0.28266143798828125, -0.2693748474121094, -0.2560882568359375, -0.24280166625976562, -0.22951507568359375, -0.21622848510742188, -0.20294189453125, -0.18965530395507812, -0.17636871337890625, -0.16308212280273438, -0.1497955322265625, -0.13650894165039062, -0.12322235107421875, -0.10993576049804688, -0.096649169921875, -0.08336257934570312, -0.07007598876953125, -0.056789398193359375, -0.0435028076171875, -0.030216217041015625, -0.01692962646484375, -0.003643035888671875, 0.0096435546875, 0.022930145263671875, 0.03621673583984375, 0.049503326416015625, 0.0627899169921875, 0.07607650756835938, 0.08936309814453125, 0.10264968872070312, 0.115936279296875, 0.12922286987304688, 0.14250946044921875, 0.15579605102539062, 0.1690826416015625, 0.18236923217773438, 0.19565582275390625, 0.20894241333007812, 0.22222900390625, 0.23551559448242188, 0.24880218505859375, 0.2620887756347656, 0.2753753662109375, 0.2886619567871094, 0.30194854736328125, 0.3152351379394531, 0.328521728515625, 0.3418083190917969, 0.35509490966796875, 0.3683815002441406, 0.3816680908203125, 0.3949546813964844, 0.40824127197265625, 0.4215278625488281, 0.434814453125]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 1.0, 5.0, 8.0, 6.0, 9.0, 6.0, 12.0, 9.0, 21.0, 24.0, 26.0, 34.0, 34.0, 33.0, 37.0, 40.0, 46.0, 57.0, 56.0, 61.0, 55.0, 54.0, 50.0, 46.0, 42.0, 30.0, 41.0, 35.0, 20.0, 19.0, 11.0, 15.0, 15.0, 9.0, 7.0, 5.0, 4.0, 9.0, 4.0, 1.0, 4.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00415802001953125, -0.0040076375007629395, -0.003857254981994629, -0.0037068724632263184, -0.003556489944458008, -0.0034061074256896973, -0.0032557249069213867, -0.003105342388153076, -0.0029549598693847656, -0.002804577350616455, -0.0026541948318481445, -0.002503812313079834, -0.0023534297943115234, -0.002203047275543213, -0.0020526647567749023, -0.0019022822380065918, -0.0017518997192382812, -0.0016015172004699707, -0.0014511346817016602, -0.0013007521629333496, -0.001150369644165039, -0.0009999871253967285, -0.000849604606628418, -0.0006992220878601074, -0.0005488395690917969, -0.00039845705032348633, -0.0002480745315551758, -9.769201278686523e-05, 5.269050598144531e-05, 0.00020307302474975586, 0.0003534555435180664, 0.000503838062286377, 0.0006542205810546875, 0.000804603099822998, 0.0009549856185913086, 0.0011053681373596191, 0.0012557506561279297, 0.0014061331748962402, 0.0015565156936645508, 0.0017068982124328613, 0.0018572807312011719, 0.0020076632499694824, 0.002158045768737793, 0.0023084282875061035, 0.002458810806274414, 0.0026091933250427246, 0.002759575843811035, 0.0029099583625793457, 0.0030603408813476562, 0.003210723400115967, 0.0033611059188842773, 0.003511488437652588, 0.0036618709564208984, 0.003812253475189209, 0.0039626359939575195, 0.00411301851272583, 0.004263401031494141, 0.004413783550262451, 0.004564166069030762, 0.004714548587799072, 0.004864931106567383, 0.005015313625335693, 0.005165696144104004, 0.0053160786628723145, 0.005466461181640625]}, "gradients/decoder.transformer.h.19.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 7.0, 5.0, 5.0, 7.0, 9.0, 15.0, 13.0, 22.0, 22.0, 19.0, 41.0, 42.0, 81.0, 102.0, 163.0, 270.0, 407.0, 1215.0, 189964.0, 852609.0, 2158.0, 480.0, 270.0, 165.0, 129.0, 82.0, 65.0, 42.0, 28.0, 29.0, 14.0, 17.0, 15.0, 8.0, 13.0, 7.0, 4.0, 6.0, 1.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.119873046875, -0.11655521392822266, -0.11323738098144531, -0.10991954803466797, -0.10660171508789062, -0.10328388214111328, -0.09996604919433594, -0.0966482162475586, -0.09333038330078125, -0.0900125503540039, -0.08669471740722656, -0.08337688446044922, -0.08005905151367188, -0.07674121856689453, -0.07342338562011719, -0.07010555267333984, -0.0667877197265625, -0.06346988677978516, -0.06015205383300781, -0.05683422088623047, -0.053516387939453125, -0.05019855499267578, -0.04688072204589844, -0.043562889099121094, -0.04024505615234375, -0.036927223205566406, -0.03360939025878906, -0.03029155731201172, -0.026973724365234375, -0.02365589141845703, -0.020338058471679688, -0.017020225524902344, -0.013702392578125, -0.010384559631347656, -0.0070667266845703125, -0.0037488937377929688, -0.000431060791015625, 0.0028867721557617188, 0.0062046051025390625, 0.009522438049316406, 0.01284027099609375, 0.016158103942871094, 0.019475936889648438, 0.02279376983642578, 0.026111602783203125, 0.02942943572998047, 0.03274726867675781, 0.036065101623535156, 0.0393829345703125, 0.042700767517089844, 0.04601860046386719, 0.04933643341064453, 0.052654266357421875, 0.05597209930419922, 0.05928993225097656, 0.0626077651977539, 0.06592559814453125, 0.0692434310913086, 0.07256126403808594, 0.07587909698486328, 0.07919692993164062, 0.08251476287841797, 0.08583259582519531, 0.08915042877197266, 0.09246826171875]}, "gradients/decoder.transformer.h.19.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 326.0, 655.0, 26.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03520818427205086, -0.03423449769616127, -0.03326081112027168, -0.032287124544382095, -0.03131343796849251, -0.03033974952995777, -0.029366062954068184, -0.028392376378178596, -0.02741868793964386, -0.026445001363754272, -0.025471314787864685, -0.024497628211975098, -0.02352393977344036, -0.022550253197550774, -0.021576566621661186, -0.0206028800457716, -0.01962919346988201, -0.018655506893992424, -0.017681820318102837, -0.0167081318795681, -0.015734445303678513, -0.014760758727788925, -0.013787072151899338, -0.01281338557600975, -0.011839698068797588, -0.010866011492908001, -0.009892323985695839, -0.008918637409806252, -0.007944950833916664, -0.006971263326704502, -0.005997576750814915, -0.00502388970926404, -0.0040502045303583145, -0.00307651748880744, -0.0021028306800872087, -0.0011291438713669777, -0.00015545682981610298, 0.0008182302117347717, 0.0017919167876243591, 0.002765603829175234, 0.0037392908707261086, 0.004712977912276983, 0.005686664953827858, 0.006660351529717445, 0.00763403857126832, 0.008607725612819195, 0.009581412188708782, 0.010555099695920944, 0.011528786271810532, 0.012502472847700119, 0.013476160354912281, 0.014449846930801868, 0.01542353443801403, 0.016397221013903618, 0.017370907589793205, 0.018344594165682793, 0.01931828260421753, 0.020291969180107117, 0.021265655755996704, 0.02223934233188629, 0.023213030770421028, 0.024186717346310616, 0.025160403922200203, 0.02613409049808979, 0.027107777073979378]}, "gradients/decoder.transformer.h.19.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 2.0, 6.0, 15.0, 13.0, 15.0, 14.0, 11.0, 17.0, 21.0, 28.0, 19.0, 31.0, 27.0, 36.0, 36.0, 38.0, 39.0, 39.0, 47.0, 48.0, 46.0, 41.0, 33.0, 47.0, 39.0, 33.0, 42.0, 26.0, 21.0, 31.0, 13.0, 14.0, 19.0, 23.0, 14.0, 13.0, 11.0, 10.0, 3.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 1.0], "bins": [-0.0027774572372436523, -0.002688334323465824, -0.002599211409687996, -0.0025100884959101677, -0.0024209655821323395, -0.0023318426683545113, -0.002242719754576683, -0.002153596840798855, -0.0020644739270210266, -0.0019753510132431984, -0.0018862280994653702, -0.001797105185687542, -0.0017079822719097137, -0.0016188593581318855, -0.0015297364443540573, -0.001440613530576229, -0.0013514906167984009, -0.0012623677030205727, -0.0011732447892427444, -0.0010841218754649162, -0.000994998961687088, -0.0009058760479092598, -0.0008167531341314316, -0.0007276302203536034, -0.0006385073065757751, -0.0005493843927979469, -0.0004602614790201187, -0.0003711385652422905, -0.0002820156514644623, -0.00019289273768663406, -0.00010376982390880585, -1.464691013097763e-05, 7.447600364685059e-05, 0.0001635989174246788, 0.000252721831202507, 0.00034184474498033524, 0.00043096765875816345, 0.0005200905725359917, 0.0006092134863138199, 0.0006983364000916481, 0.0007874593138694763, 0.0008765822276473045, 0.0009657051414251328, 0.001054828055202961, 0.0011439509689807892, 0.0012330738827586174, 0.0013221967965364456, 0.0014113197103142738, 0.001500442624092102, 0.0015895655378699303, 0.0016786884516477585, 0.0017678113654255867, 0.001856934279203415, 0.0019460571929812431, 0.0020351801067590714, 0.0021243030205368996, 0.002213425934314728, 0.002302548848092556, 0.002391671761870384, 0.0024807946756482124, 0.0025699175894260406, 0.002659040503203869, 0.002748163416981697, 0.0028372863307595253, 0.0029264092445373535]}, "gradients/decoder.transformer.h.19.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 5.0, 1.0, 1.0, 4.0, 2.0, 4.0, 9.0, 10.0, 17.0, 11.0, 21.0, 17.0, 25.0, 26.0, 25.0, 26.0, 33.0, 37.0, 28.0, 42.0, 47.0, 41.0, 54.0, 41.0, 44.0, 49.0, 39.0, 34.0, 45.0, 38.0, 31.0, 29.0, 22.0, 31.0, 19.0, 21.0, 16.0, 19.0, 15.0, 12.0, 8.0, 5.0, 2.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.12890625, -6.90179443359375, -6.6746826171875, -6.44757080078125, -6.220458984375, -5.99334716796875, -5.7662353515625, -5.53912353515625, -5.31201171875, -5.08489990234375, -4.8577880859375, -4.63067626953125, -4.403564453125, -4.17645263671875, -3.9493408203125, -3.72222900390625, -3.4951171875, -3.26800537109375, -3.0408935546875, -2.81378173828125, -2.586669921875, -2.35955810546875, -2.1324462890625, -1.90533447265625, -1.67822265625, -1.45111083984375, -1.2239990234375, -0.99688720703125, -0.769775390625, -0.54266357421875, -0.3155517578125, -0.08843994140625, 0.138671875, 0.36578369140625, 0.5928955078125, 0.82000732421875, 1.047119140625, 1.27423095703125, 1.5013427734375, 1.72845458984375, 1.95556640625, 2.18267822265625, 2.4097900390625, 2.63690185546875, 2.864013671875, 3.09112548828125, 3.3182373046875, 3.54534912109375, 3.7724609375, 3.99957275390625, 4.2266845703125, 4.45379638671875, 4.680908203125, 4.90802001953125, 5.1351318359375, 5.36224365234375, 5.58935546875, 5.81646728515625, 6.0435791015625, 6.27069091796875, 6.497802734375, 6.72491455078125, 6.9520263671875, 7.17913818359375, 7.40625]}, "gradients/decoder.transformer.h.19.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 11.0, 16.0, 15.0, 17.0, 22.0, 41.0, 47.0, 71.0, 103.0, 119.0, 185.0, 216.0, 312.0, 383.0, 537.0, 654.0, 919.0, 1300.0, 1907.0, 3176.0, 5488.0, 10844.0, 24223.0, 65177.0, 215318.0, 433600.0, 181612.0, 56227.0, 21580.0, 9909.0, 5071.0, 2916.0, 1788.0, 1233.0, 911.0, 601.0, 523.0, 387.0, 262.0, 226.0, 159.0, 126.0, 97.0, 77.0, 48.0, 30.0, 29.0, 16.0, 15.0, 5.0, 10.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.86328125, -4.70855712890625, -4.5538330078125, -4.39910888671875, -4.244384765625, -4.08966064453125, -3.9349365234375, -3.78021240234375, -3.62548828125, -3.47076416015625, -3.3160400390625, -3.16131591796875, -3.006591796875, -2.85186767578125, -2.6971435546875, -2.54241943359375, -2.3876953125, -2.23297119140625, -2.0782470703125, -1.92352294921875, -1.768798828125, -1.61407470703125, -1.4593505859375, -1.30462646484375, -1.14990234375, -0.99517822265625, -0.8404541015625, -0.68572998046875, -0.531005859375, -0.37628173828125, -0.2215576171875, -0.06683349609375, 0.087890625, 0.24261474609375, 0.3973388671875, 0.55206298828125, 0.706787109375, 0.86151123046875, 1.0162353515625, 1.17095947265625, 1.32568359375, 1.48040771484375, 1.6351318359375, 1.78985595703125, 1.944580078125, 2.09930419921875, 2.2540283203125, 2.40875244140625, 2.5634765625, 2.71820068359375, 2.8729248046875, 3.02764892578125, 3.182373046875, 3.33709716796875, 3.4918212890625, 3.64654541015625, 3.80126953125, 3.95599365234375, 4.1107177734375, 4.26544189453125, 4.420166015625, 4.57489013671875, 4.7296142578125, 4.88433837890625, 5.0390625]}, "gradients/decoder.transformer.h.19.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 4.0, 4.0, 4.0, 3.0, 8.0, 9.0, 12.0, 14.0, 11.0, 21.0, 16.0, 16.0, 17.0, 30.0, 19.0, 30.0, 32.0, 29.0, 47.0, 40.0, 41.0, 63.0, 117.0, 1590.0, 306.0, 122.0, 59.0, 54.0, 36.0, 47.0, 45.0, 25.0, 24.0, 26.0, 20.0, 14.0, 17.0, 7.0, 10.0, 14.0, 9.0, 8.0, 6.0, 6.0, 2.0, 10.0, 5.0, 1.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0], "bins": [-21.640625, -20.916015625, -20.19140625, -19.466796875, -18.7421875, -18.017578125, -17.29296875, -16.568359375, -15.84375, -15.119140625, -14.39453125, -13.669921875, -12.9453125, -12.220703125, -11.49609375, -10.771484375, -10.046875, -9.322265625, -8.59765625, -7.873046875, -7.1484375, -6.423828125, -5.69921875, -4.974609375, -4.25, -3.525390625, -2.80078125, -2.076171875, -1.3515625, -0.626953125, 0.09765625, 0.822265625, 1.546875, 2.271484375, 2.99609375, 3.720703125, 4.4453125, 5.169921875, 5.89453125, 6.619140625, 7.34375, 8.068359375, 8.79296875, 9.517578125, 10.2421875, 10.966796875, 11.69140625, 12.416015625, 13.140625, 13.865234375, 14.58984375, 15.314453125, 16.0390625, 16.763671875, 17.48828125, 18.212890625, 18.9375, 19.662109375, 20.38671875, 21.111328125, 21.8359375, 22.560546875, 23.28515625, 24.009765625, 24.734375]}, "gradients/decoder.transformer.h.19.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 8.0, 2.0, 5.0, 5.0, 10.0, 7.0, 13.0, 15.0, 8.0, 13.0, 24.0, 25.0, 39.0, 58.0, 64.0, 85.0, 127.0, 169.0, 316.0, 729.0, 3181.0, 52417.0, 3039508.0, 44375.0, 2819.0, 672.0, 310.0, 181.0, 112.0, 88.0, 71.0, 43.0, 40.0, 26.0, 21.0, 15.0, 20.0, 18.0, 11.0, 18.0, 8.0, 7.0, 4.0, 4.0, 4.0, 4.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0], "bins": [-41.5, -40.29638671875, -39.0927734375, -37.88916015625, -36.685546875, -35.48193359375, -34.2783203125, -33.07470703125, -31.87109375, -30.66748046875, -29.4638671875, -28.26025390625, -27.056640625, -25.85302734375, -24.6494140625, -23.44580078125, -22.2421875, -21.03857421875, -19.8349609375, -18.63134765625, -17.427734375, -16.22412109375, -15.0205078125, -13.81689453125, -12.61328125, -11.40966796875, -10.2060546875, -9.00244140625, -7.798828125, -6.59521484375, -5.3916015625, -4.18798828125, -2.984375, -1.78076171875, -0.5771484375, 0.62646484375, 1.830078125, 3.03369140625, 4.2373046875, 5.44091796875, 6.64453125, 7.84814453125, 9.0517578125, 10.25537109375, 11.458984375, 12.66259765625, 13.8662109375, 15.06982421875, 16.2734375, 17.47705078125, 18.6806640625, 19.88427734375, 21.087890625, 22.29150390625, 23.4951171875, 24.69873046875, 25.90234375, 27.10595703125, 28.3095703125, 29.51318359375, 30.716796875, 31.92041015625, 33.1240234375, 34.32763671875, 35.53125]}, "gradients/decoder.transformer.h.19.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 9.0, 53.0, 205.0, 418.0, 262.0, 62.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-64.32811737060547, -61.589595794677734, -58.851070404052734, -56.112548828125, -53.3740234375, -50.635501861572266, -47.89698028564453, -45.15845489501953, -42.4199333190918, -39.68141174316406, -36.94288635253906, -34.20436477661133, -31.46584129333496, -28.727317810058594, -25.98879623413086, -23.250272750854492, -20.511749267578125, -17.773225784301758, -15.034703254699707, -12.296180725097656, -9.557657241821289, -6.819133758544922, -4.0806121826171875, -1.3420886993408203, 1.3964347839355469, 4.134957790374756, 6.873480796813965, 9.612003326416016, 12.350526809692383, 15.08905029296875, 17.827571868896484, 20.56609535217285, 23.30461883544922, 26.043142318725586, 28.781665802001953, 31.520187377929688, 34.25871276855469, 36.99723434448242, 39.735755920410156, 42.474281311035156, 45.21280288696289, 47.951324462890625, 50.689849853515625, 53.42837142944336, 56.166893005371094, 58.905418395996094, 61.64393997192383, 64.38246154785156, 67.12098693847656, 69.85951232910156, 72.59803009033203, 75.33655548095703, 78.07508087158203, 80.8135986328125, 83.5521240234375, 86.2906494140625, 89.0291748046875, 91.7677001953125, 94.50621795654297, 97.24474334716797, 99.98326873779297, 102.72178649902344, 105.46031188964844, 108.19883728027344, 110.9373550415039]}, "gradients/decoder.transformer.h.19.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 1.0, 4.0, 3.0, 6.0, 7.0, 7.0, 17.0, 11.0, 14.0, 21.0, 21.0, 21.0, 29.0, 26.0, 29.0, 40.0, 35.0, 43.0, 42.0, 38.0, 41.0, 43.0, 37.0, 52.0, 38.0, 47.0, 37.0, 33.0, 26.0, 29.0, 35.0, 23.0, 24.0, 15.0, 22.0, 16.0, 12.0, 11.0, 12.0, 9.0, 4.0, 7.0, 8.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0], "bins": [-92.89500427246094, -90.39706420898438, -87.89911651611328, -85.40117645263672, -82.90323638916016, -80.40528869628906, -77.9073486328125, -75.40940856933594, -72.91146850585938, -70.41352844238281, -67.91558074951172, -65.41764068603516, -62.919700622558594, -60.421756744384766, -57.92381286621094, -55.425872802734375, -52.92792510986328, -50.42998123168945, -47.93204116821289, -45.43409729003906, -42.9361572265625, -40.43821334838867, -37.940269470214844, -35.44232940673828, -32.94438552856445, -30.446443557739258, -27.948501586914062, -25.450557708740234, -22.95261573791504, -20.454673767089844, -17.956729888916016, -15.45878791809082, -12.960853576660156, -10.462911605834961, -7.964968681335449, -5.467026233673096, -2.969083786010742, -0.4711418151855469, 2.026801109313965, 4.524744033813477, 7.022686004638672, 9.520627975463867, 12.018570899963379, 14.51651382446289, 17.014455795288086, 19.51239776611328, 22.01034164428711, 24.508283615112305, 27.0062255859375, 29.504167556762695, 32.00210952758789, 34.50005340576172, 36.99799346923828, 39.49593734741211, 41.99388122558594, 44.4918212890625, 46.98976516723633, 49.487709045410156, 51.98564910888672, 54.48359298706055, 56.981536865234375, 59.47947692871094, 61.977420806884766, 64.4753646850586, 66.97330474853516]}, "gradients/decoder.transformer.h.18.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 2.0, 3.0, 3.0, 8.0, 12.0, 12.0, 10.0, 13.0, 27.0, 22.0, 26.0, 26.0, 30.0, 28.0, 24.0, 36.0, 42.0, 43.0, 46.0, 49.0, 46.0, 48.0, 47.0, 38.0, 36.0, 39.0, 34.0, 45.0, 28.0, 26.0, 27.0, 21.0, 20.0, 16.0, 19.0, 16.0, 15.0, 8.0, 4.0, 5.0, 0.0, 3.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.6171875, -7.384521484375, -7.15185546875, -6.919189453125, -6.6865234375, -6.453857421875, -6.22119140625, -5.988525390625, -5.755859375, -5.523193359375, -5.29052734375, -5.057861328125, -4.8251953125, -4.592529296875, -4.35986328125, -4.127197265625, -3.89453125, -3.661865234375, -3.42919921875, -3.196533203125, -2.9638671875, -2.731201171875, -2.49853515625, -2.265869140625, -2.033203125, -1.800537109375, -1.56787109375, -1.335205078125, -1.1025390625, -0.869873046875, -0.63720703125, -0.404541015625, -0.171875, 0.060791015625, 0.29345703125, 0.526123046875, 0.7587890625, 0.991455078125, 1.22412109375, 1.456787109375, 1.689453125, 1.922119140625, 2.15478515625, 2.387451171875, 2.6201171875, 2.852783203125, 3.08544921875, 3.318115234375, 3.55078125, 3.783447265625, 4.01611328125, 4.248779296875, 4.4814453125, 4.714111328125, 4.94677734375, 5.179443359375, 5.412109375, 5.644775390625, 5.87744140625, 6.110107421875, 6.3427734375, 6.575439453125, 6.80810546875, 7.040771484375, 7.2734375]}, "gradients/decoder.transformer.h.18.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 5.0, 5.0, 4.0, 9.0, 15.0, 21.0, 18.0, 28.0, 19.0, 37.0, 60.0, 82.0, 168.0, 345.0, 880.0, 3064.0, 13595.0, 82454.0, 1033398.0, 2737716.0, 279121.0, 33819.0, 6527.0, 1715.0, 542.0, 252.0, 92.0, 81.0, 45.0, 40.0, 34.0, 14.0, 22.0, 16.0, 11.0, 6.0, 8.0, 9.0, 2.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.953125, -22.24169921875, -21.5302734375, -20.81884765625, -20.107421875, -19.39599609375, -18.6845703125, -17.97314453125, -17.26171875, -16.55029296875, -15.8388671875, -15.12744140625, -14.416015625, -13.70458984375, -12.9931640625, -12.28173828125, -11.5703125, -10.85888671875, -10.1474609375, -9.43603515625, -8.724609375, -8.01318359375, -7.3017578125, -6.59033203125, -5.87890625, -5.16748046875, -4.4560546875, -3.74462890625, -3.033203125, -2.32177734375, -1.6103515625, -0.89892578125, -0.1875, 0.52392578125, 1.2353515625, 1.94677734375, 2.658203125, 3.36962890625, 4.0810546875, 4.79248046875, 5.50390625, 6.21533203125, 6.9267578125, 7.63818359375, 8.349609375, 9.06103515625, 9.7724609375, 10.48388671875, 11.1953125, 11.90673828125, 12.6181640625, 13.32958984375, 14.041015625, 14.75244140625, 15.4638671875, 16.17529296875, 16.88671875, 17.59814453125, 18.3095703125, 19.02099609375, 19.732421875, 20.44384765625, 21.1552734375, 21.86669921875, 22.578125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 9.0, 6.0, 4.0, 7.0, 6.0, 16.0, 43.0, 32.0, 68.0, 101.0, 144.0, 233.0, 311.0, 478.0, 609.0, 602.0, 453.0, 278.0, 224.0, 172.0, 99.0, 79.0, 36.0, 23.0, 21.0, 13.0, 4.0, 5.0, 4.0, 4.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-33.40625, -32.568603515625, -31.73095703125, -30.893310546875, -30.0556640625, -29.218017578125, -28.38037109375, -27.542724609375, -26.705078125, -25.867431640625, -25.02978515625, -24.192138671875, -23.3544921875, -22.516845703125, -21.67919921875, -20.841552734375, -20.00390625, -19.166259765625, -18.32861328125, -17.490966796875, -16.6533203125, -15.815673828125, -14.97802734375, -14.140380859375, -13.302734375, -12.465087890625, -11.62744140625, -10.789794921875, -9.9521484375, -9.114501953125, -8.27685546875, -7.439208984375, -6.6015625, -5.763916015625, -4.92626953125, -4.088623046875, -3.2509765625, -2.413330078125, -1.57568359375, -0.738037109375, 0.099609375, 0.937255859375, 1.77490234375, 2.612548828125, 3.4501953125, 4.287841796875, 5.12548828125, 5.963134765625, 6.80078125, 7.638427734375, 8.47607421875, 9.313720703125, 10.1513671875, 10.989013671875, 11.82666015625, 12.664306640625, 13.501953125, 14.339599609375, 15.17724609375, 16.014892578125, 16.8525390625, 17.690185546875, 18.52783203125, 19.365478515625, 20.203125]}, "gradients/decoder.transformer.h.18.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 5.0, 1.0, 3.0, 3.0, 4.0, 8.0, 18.0, 17.0, 23.0, 37.0, 44.0, 64.0, 92.0, 159.0, 235.0, 427.0, 847.0, 3156.0, 33052.0, 1442390.0, 2654526.0, 52888.0, 4088.0, 1024.0, 452.0, 236.0, 154.0, 96.0, 68.0, 56.0, 36.0, 22.0, 17.0, 7.0, 12.0, 9.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-52.65625, -50.78076171875, -48.9052734375, -47.02978515625, -45.154296875, -43.27880859375, -41.4033203125, -39.52783203125, -37.65234375, -35.77685546875, -33.9013671875, -32.02587890625, -30.150390625, -28.27490234375, -26.3994140625, -24.52392578125, -22.6484375, -20.77294921875, -18.8974609375, -17.02197265625, -15.146484375, -13.27099609375, -11.3955078125, -9.52001953125, -7.64453125, -5.76904296875, -3.8935546875, -2.01806640625, -0.142578125, 1.73291015625, 3.6083984375, 5.48388671875, 7.359375, 9.23486328125, 11.1103515625, 12.98583984375, 14.861328125, 16.73681640625, 18.6123046875, 20.48779296875, 22.36328125, 24.23876953125, 26.1142578125, 27.98974609375, 29.865234375, 31.74072265625, 33.6162109375, 35.49169921875, 37.3671875, 39.24267578125, 41.1181640625, 42.99365234375, 44.869140625, 46.74462890625, 48.6201171875, 50.49560546875, 52.37109375, 54.24658203125, 56.1220703125, 57.99755859375, 59.873046875, 61.74853515625, 63.6240234375, 65.49951171875, 67.375]}, "gradients/decoder.transformer.h.18.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 9.0, 12.0, 24.0, 81.0, 123.0, 200.0, 211.0, 164.0, 102.0, 52.0, 19.0, 11.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-77.49533081054688, -72.02521514892578, -66.55509185791016, -61.08497619628906, -55.61486053466797, -50.14474105834961, -44.67462158203125, -39.204505920410156, -33.7343864440918, -28.26426887512207, -22.794151306152344, -17.324031829833984, -11.853914260864258, -6.383796691894531, -0.9136772155761719, 4.556438446044922, 10.026557922363281, 15.496675491333008, 20.966793060302734, 26.436912536621094, 31.90703010559082, 37.37714767456055, 42.847267150878906, 48.3173828125, 53.78750228881836, 59.25762176513672, 64.72773742675781, 70.19786071777344, 75.66797637939453, 81.13809204101562, 86.60821533203125, 92.07832336425781, 97.54844665527344, 103.01856231689453, 108.48868560791016, 113.95880126953125, 119.42891693115234, 124.89903259277344, 130.36915588378906, 135.83926391601562, 141.30938720703125, 146.77951049804688, 152.24961853027344, 157.71974182128906, 163.1898651123047, 168.65997314453125, 174.13009643554688, 179.6002197265625, 185.07034301757812, 190.54046630859375, 196.0105743408203, 201.48069763183594, 206.95082092285156, 212.42092895507812, 217.89105224609375, 223.36117553710938, 228.83128356933594, 234.30140686035156, 239.77151489257812, 245.24163818359375, 250.71176147460938, 256.181884765625, 261.6519775390625, 267.1221008300781, 272.59222412109375]}, "gradients/decoder.transformer.h.18.ln_2.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 4.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 2.0, 2.0, 8.0, 2.0, 5.0, 10.0, 13.0, 12.0, 16.0, 14.0, 25.0, 22.0, 27.0, 29.0, 22.0, 42.0, 32.0, 24.0, 34.0, 43.0, 35.0, 36.0, 40.0, 30.0, 39.0, 43.0, 41.0, 46.0, 37.0, 41.0, 37.0, 28.0, 22.0, 17.0, 17.0, 19.0, 10.0, 14.0, 7.0, 7.0, 11.0, 5.0, 4.0, 7.0, 3.0, 7.0, 5.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0], "bins": [-66.65666961669922, -64.62848663330078, -62.600303649902344, -60.57212448120117, -58.543941497802734, -56.5157585144043, -54.487579345703125, -52.45939636230469, -50.43121337890625, -48.40303039550781, -46.374847412109375, -44.3466682434082, -42.318485260009766, -40.29030227661133, -38.262123107910156, -36.23394012451172, -34.20575714111328, -32.177574157714844, -30.14939308166504, -28.121212005615234, -26.093029022216797, -24.06484603881836, -22.036664962768555, -20.00848388671875, -17.980300903320312, -15.952118873596191, -13.92393684387207, -11.89575481414795, -9.867572784423828, -7.839390754699707, -5.811208724975586, -3.783026695251465, -1.7548370361328125, 0.2733449935913086, 2.3015270233154297, 4.329709053039551, 6.357891082763672, 8.386073112487793, 10.414255142211914, 12.442437171936035, 14.470619201660156, 16.498802185058594, 18.5269832611084, 20.555164337158203, 22.58334732055664, 24.611530303955078, 26.639711380004883, 28.667892456054688, 30.696075439453125, 32.72425842285156, 34.75244140625, 36.78062057495117, 38.80880355834961, 40.83698654174805, 42.86516571044922, 44.893348693847656, 46.921531677246094, 48.94971466064453, 50.97789764404297, 53.00607681274414, 55.03425979614258, 57.062442779541016, 59.09062194824219, 61.118804931640625, 63.14698791503906]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 8.0, 6.0, 14.0, 13.0, 17.0, 13.0, 18.0, 18.0, 28.0, 37.0, 34.0, 33.0, 53.0, 39.0, 35.0, 41.0, 42.0, 47.0, 35.0, 38.0, 51.0, 40.0, 40.0, 35.0, 41.0, 31.0, 21.0, 31.0, 26.0, 22.0, 20.0, 18.0, 14.0, 7.0, 11.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.9754638671875, -7.732177734375, -7.4888916015625, -7.24560546875, -7.0023193359375, -6.759033203125, -6.5157470703125, -6.2724609375, -6.0291748046875, -5.785888671875, -5.5426025390625, -5.29931640625, -5.0560302734375, -4.812744140625, -4.5694580078125, -4.326171875, -4.0828857421875, -3.839599609375, -3.5963134765625, -3.35302734375, -3.1097412109375, -2.866455078125, -2.6231689453125, -2.3798828125, -2.1365966796875, -1.893310546875, -1.6500244140625, -1.40673828125, -1.1634521484375, -0.920166015625, -0.6768798828125, -0.43359375, -0.1903076171875, 0.052978515625, 0.2962646484375, 0.53955078125, 0.7828369140625, 1.026123046875, 1.2694091796875, 1.5126953125, 1.7559814453125, 1.999267578125, 2.2425537109375, 2.48583984375, 2.7291259765625, 2.972412109375, 3.2156982421875, 3.458984375, 3.7022705078125, 3.945556640625, 4.1888427734375, 4.43212890625, 4.6754150390625, 4.918701171875, 5.1619873046875, 5.4052734375, 5.6485595703125, 5.891845703125, 6.1351318359375, 6.37841796875, 6.6217041015625, 6.864990234375, 7.1082763671875, 7.3515625]}, "gradients/decoder.transformer.h.18.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 5.0, 3.0, 5.0, 7.0, 13.0, 22.0, 29.0, 50.0, 73.0, 98.0, 138.0, 247.0, 293.0, 490.0, 717.0, 1041.0, 1540.0, 2235.0, 3302.0, 4867.0, 7267.0, 10847.0, 16722.0, 25282.0, 39954.0, 63906.0, 101821.0, 157668.0, 191560.0, 150813.0, 97050.0, 60457.0, 37655.0, 24601.0, 15854.0, 10466.0, 6833.0, 4804.0, 3116.0, 2137.0, 1439.0, 1011.0, 671.0, 447.0, 308.0, 259.0, 140.0, 105.0, 65.0, 50.0, 27.0, 22.0, 17.0, 14.0, 5.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.72021484375, -0.6973114013671875, -0.674407958984375, -0.6515045166015625, -0.62860107421875, -0.6056976318359375, -0.582794189453125, -0.5598907470703125, -0.5369873046875, -0.5140838623046875, -0.491180419921875, -0.4682769775390625, -0.44537353515625, -0.4224700927734375, -0.399566650390625, -0.3766632080078125, -0.353759765625, -0.3308563232421875, -0.307952880859375, -0.2850494384765625, -0.26214599609375, -0.2392425537109375, -0.216339111328125, -0.1934356689453125, -0.1705322265625, -0.1476287841796875, -0.124725341796875, -0.1018218994140625, -0.07891845703125, -0.0560150146484375, -0.033111572265625, -0.0102081298828125, 0.0126953125, 0.0355987548828125, 0.058502197265625, 0.0814056396484375, 0.10430908203125, 0.1272125244140625, 0.150115966796875, 0.1730194091796875, 0.1959228515625, 0.2188262939453125, 0.241729736328125, 0.2646331787109375, 0.28753662109375, 0.3104400634765625, 0.333343505859375, 0.3562469482421875, 0.379150390625, 0.4020538330078125, 0.424957275390625, 0.4478607177734375, 0.47076416015625, 0.4936676025390625, 0.516571044921875, 0.5394744873046875, 0.5623779296875, 0.5852813720703125, 0.608184814453125, 0.6310882568359375, 0.65399169921875, 0.6768951416015625, 0.699798583984375, 0.7227020263671875, 0.74560546875]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 3.0, 5.0, 2.0, 8.0, 5.0, 3.0, 12.0, 17.0, 13.0, 5.0, 18.0, 18.0, 13.0, 22.0, 20.0, 35.0, 29.0, 20.0, 24.0, 30.0, 38.0, 40.0, 24.0, 32.0, 36.0, 1061.0, 35.0, 38.0, 36.0, 32.0, 34.0, 32.0, 32.0, 25.0, 26.0, 24.0, 25.0, 16.0, 27.0, 21.0, 16.0, 12.0, 11.0, 9.0, 10.0, 6.0, 8.0, 7.0, 4.0, 3.0, 6.0, 0.0, 4.0, 2.0, 3.0, 0.0, 3.0], "bins": [-3.87890625, -3.7586669921875, -3.638427734375, -3.5181884765625, -3.39794921875, -3.2777099609375, -3.157470703125, -3.0372314453125, -2.9169921875, -2.7967529296875, -2.676513671875, -2.5562744140625, -2.43603515625, -2.3157958984375, -2.195556640625, -2.0753173828125, -1.955078125, -1.8348388671875, -1.714599609375, -1.5943603515625, -1.47412109375, -1.3538818359375, -1.233642578125, -1.1134033203125, -0.9931640625, -0.8729248046875, -0.752685546875, -0.6324462890625, -0.51220703125, -0.3919677734375, -0.271728515625, -0.1514892578125, -0.03125, 0.0889892578125, 0.209228515625, 0.3294677734375, 0.44970703125, 0.5699462890625, 0.690185546875, 0.8104248046875, 0.9306640625, 1.0509033203125, 1.171142578125, 1.2913818359375, 1.41162109375, 1.5318603515625, 1.652099609375, 1.7723388671875, 1.892578125, 2.0128173828125, 2.133056640625, 2.2532958984375, 2.37353515625, 2.4937744140625, 2.614013671875, 2.7342529296875, 2.8544921875, 2.9747314453125, 3.094970703125, 3.2152099609375, 3.33544921875, 3.4556884765625, 3.575927734375, 3.6961669921875, 3.81640625]}, "gradients/decoder.transformer.h.18.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 8.0, 6.0, 8.0, 20.0, 32.0, 35.0, 54.0, 92.0, 123.0, 191.0, 267.0, 424.0, 612.0, 833.0, 1288.0, 2057.0, 2995.0, 4609.0, 7050.0, 11078.0, 16974.0, 26217.0, 40987.0, 63878.0, 98141.0, 139641.0, 1211834.0, 153716.0, 109753.0, 72951.0, 46870.0, 29834.0, 19130.0, 11984.0, 8017.0, 5165.0, 3343.0, 2243.0, 1490.0, 1006.0, 681.0, 472.0, 339.0, 220.0, 127.0, 121.0, 72.0, 43.0, 32.0, 24.0, 22.0, 9.0, 10.0, 8.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.515625, -0.4998283386230469, -0.48403167724609375, -0.4682350158691406, -0.4524383544921875, -0.4366416931152344, -0.42084503173828125, -0.4050483703613281, -0.389251708984375, -0.3734550476074219, -0.35765838623046875, -0.3418617248535156, -0.3260650634765625, -0.3102684020996094, -0.29447174072265625, -0.2786750793457031, -0.26287841796875, -0.24708175659179688, -0.23128509521484375, -0.21548843383789062, -0.1996917724609375, -0.18389511108398438, -0.16809844970703125, -0.15230178833007812, -0.136505126953125, -0.12070846557617188, -0.10491180419921875, -0.08911514282226562, -0.0733184814453125, -0.057521820068359375, -0.04172515869140625, -0.025928497314453125, -0.0101318359375, 0.005664825439453125, 0.02146148681640625, 0.037258148193359375, 0.0530548095703125, 0.06885147094726562, 0.08464813232421875, 0.10044479370117188, 0.116241455078125, 0.13203811645507812, 0.14783477783203125, 0.16363143920898438, 0.1794281005859375, 0.19522476196289062, 0.21102142333984375, 0.22681808471679688, 0.24261474609375, 0.2584114074707031, 0.27420806884765625, 0.2900047302246094, 0.3058013916015625, 0.3215980529785156, 0.33739471435546875, 0.3531913757324219, 0.368988037109375, 0.3847846984863281, 0.40058135986328125, 0.4163780212402344, 0.4321746826171875, 0.4479713439941406, 0.46376800537109375, 0.4795646667480469, 0.495361328125]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 11.0, 5.0, 8.0, 12.0, 32.0, 39.0, 65.0, 89.0, 92.0, 126.0, 136.0, 101.0, 77.0, 57.0, 30.0, 23.0, 22.0, 17.0, 11.0, 7.0, 2.0, 5.0, 1.0, 6.0, 4.0, 6.0, 0.0, 4.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.010711669921875, -0.010397553443908691, -0.010083436965942383, -0.009769320487976074, -0.009455204010009766, -0.009141087532043457, -0.008826971054077148, -0.00851285457611084, -0.008198738098144531, -0.007884621620178223, -0.007570505142211914, -0.0072563886642456055, -0.006942272186279297, -0.006628155708312988, -0.00631403923034668, -0.005999922752380371, -0.0056858062744140625, -0.005371689796447754, -0.005057573318481445, -0.004743456840515137, -0.004429340362548828, -0.0041152238845825195, -0.003801107406616211, -0.0034869909286499023, -0.0031728744506835938, -0.002858757972717285, -0.0025446414947509766, -0.002230525016784668, -0.0019164085388183594, -0.0016022920608520508, -0.0012881755828857422, -0.0009740591049194336, -0.000659942626953125, -0.0003458261489868164, -3.170967102050781e-05, 0.0002824068069458008, 0.0005965232849121094, 0.000910639762878418, 0.0012247562408447266, 0.0015388727188110352, 0.0018529891967773438, 0.0021671056747436523, 0.002481222152709961, 0.0027953386306762695, 0.003109455108642578, 0.0034235715866088867, 0.0037376880645751953, 0.004051804542541504, 0.0043659210205078125, 0.004680037498474121, 0.00499415397644043, 0.005308270454406738, 0.005622386932373047, 0.0059365034103393555, 0.006250619888305664, 0.006564736366271973, 0.006878852844238281, 0.00719296932220459, 0.0075070858001708984, 0.007821202278137207, 0.008135318756103516, 0.008449435234069824, 0.008763551712036133, 0.009077668190002441, 0.00939178466796875]}, "gradients/decoder.transformer.h.18.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 7.0, 5.0, 2.0, 6.0, 6.0, 18.0, 13.0, 22.0, 22.0, 56.0, 98.0, 162.0, 473.0, 4612.0, 1040739.0, 1545.0, 356.0, 167.0, 90.0, 68.0, 31.0, 19.0, 10.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.219482421875, -0.21226119995117188, -0.20503997802734375, -0.19781875610351562, -0.1905975341796875, -0.18337631225585938, -0.17615509033203125, -0.16893386840820312, -0.161712646484375, -0.15449142456054688, -0.14727020263671875, -0.14004898071289062, -0.1328277587890625, -0.12560653686523438, -0.11838531494140625, -0.11116409301757812, -0.10394287109375, -0.09672164916992188, -0.08950042724609375, -0.08227920532226562, -0.0750579833984375, -0.06783676147460938, -0.06061553955078125, -0.053394317626953125, -0.046173095703125, -0.038951873779296875, -0.03173065185546875, -0.024509429931640625, -0.0172882080078125, -0.010066986083984375, -0.00284576416015625, 0.004375457763671875, 0.0115966796875, 0.018817901611328125, 0.02603912353515625, 0.033260345458984375, 0.0404815673828125, 0.047702789306640625, 0.05492401123046875, 0.062145233154296875, 0.069366455078125, 0.07658767700195312, 0.08380889892578125, 0.09103012084960938, 0.0982513427734375, 0.10547256469726562, 0.11269378662109375, 0.11991500854492188, 0.12713623046875, 0.13435745239257812, 0.14157867431640625, 0.14879989624023438, 0.1560211181640625, 0.16324234008789062, 0.17046356201171875, 0.17768478393554688, 0.184906005859375, 0.19212722778320312, 0.19934844970703125, 0.20656967163085938, 0.2137908935546875, 0.22101211547851562, 0.22823333740234375, 0.23545455932617188, 0.24267578125]}, "gradients/decoder.transformer.h.18.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 14.0, 65.0, 202.0, 339.0, 255.0, 105.0, 19.0, 6.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0027733028400689363, -0.0024084763135761023, -0.002043650019913912, -0.0016788234934210777, -0.0013139970833435655, -0.0009491706732660532, -0.0005843441467732191, -0.00021951785311102867, 0.00014530867338180542, 0.0005101350834593177, 0.0008749615517444909, 0.001239788020029664, 0.0016046144301071763, 0.0019694408401846886, 0.0023342673666775227, 0.002699093660339713, 0.003063920186832547, 0.0034287467133253813, 0.0037935730069875717, 0.004158399533480406, 0.00452322605997324, 0.004888052120804787, 0.005252879112958908, 0.005617705173790455, 0.005982531700283289, 0.006347358226776123, 0.006712184753268957, 0.007077011279761791, 0.007441837340593338, 0.007806663867086172, 0.008171490393579006, 0.008536316454410553, 0.0089011425152421, 0.009265968576073647, 0.009630795568227768, 0.009995621629059315, 0.010360448621213436, 0.010725274682044983, 0.011090101674199104, 0.011454927735030651, 0.011819753795862198, 0.012184579856693745, 0.012549406848847866, 0.012914232909679413, 0.013279059901833534, 0.013643885962665081, 0.014008712023496628, 0.01437353901565075, 0.01473836600780487, 0.015103192068636417, 0.015468019060790539, 0.015832845121622086, 0.016197672113776207, 0.01656249910593033, 0.0169273242354393, 0.017292151227593422, 0.017656976357102394, 0.018021803349256516, 0.018386628478765488, 0.01875145547091961, 0.01911628246307373, 0.019481107592582703, 0.019845934584736824, 0.020210761576890945, 0.020575588569045067]}, "gradients/decoder.transformer.h.18.ln_cross_attn.bias": {"_type": "histogram", "values": [7.0, 2.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 6.0, 4.0, 11.0, 8.0, 9.0, 8.0, 14.0, 10.0, 18.0, 20.0, 20.0, 13.0, 30.0, 30.0, 31.0, 45.0, 33.0, 41.0, 32.0, 47.0, 27.0, 39.0, 47.0, 33.0, 34.0, 29.0, 38.0, 38.0, 31.0, 42.0, 21.0, 19.0, 25.0, 17.0, 21.0, 17.0, 19.0, 12.0, 14.0, 13.0, 6.0, 6.0, 3.0, 4.0, 5.0, 2.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.0037806034088134766, -0.0036630742251873016, -0.0035455450415611267, -0.0034280158579349518, -0.003310486674308777, -0.003192957490682602, -0.003075428307056427, -0.002957899123430252, -0.002840369939804077, -0.0027228407561779022, -0.0026053115725517273, -0.0024877823889255524, -0.0023702532052993774, -0.0022527240216732025, -0.0021351948380470276, -0.0020176656544208527, -0.0019001364707946777, -0.0017826072871685028, -0.0016650781035423279, -0.001547548919916153, -0.001430019736289978, -0.001312490552663803, -0.0011949613690376282, -0.0010774321854114532, -0.0009599030017852783, -0.0008423738181591034, -0.0007248446345329285, -0.0006073154509067535, -0.0004897862672805786, -0.0003722570836544037, -0.00025472790002822876, -0.00013719871640205383, -1.9669532775878906e-05, 9.785965085029602e-05, 0.00021538883447647095, 0.0003329180181026459, 0.0004504472017288208, 0.0005679763853549957, 0.0006855055689811707, 0.0008030347526073456, 0.0009205639362335205, 0.0010380931198596954, 0.0011556223034858704, 0.0012731514871120453, 0.0013906806707382202, 0.0015082098543643951, 0.00162573903799057, 0.001743268221616745, 0.00186079740524292, 0.001978326588869095, 0.0020958557724952698, 0.0022133849561214447, 0.0023309141397476196, 0.0024484433233737946, 0.0025659725069999695, 0.0026835016906261444, 0.0028010308742523193, 0.0029185600578784943, 0.003036089241504669, 0.003153618425130844, 0.003271147608757019, 0.003388676792383194, 0.003506205976009369, 0.003623735159635544, 0.0037412643432617188]}, "gradients/decoder.transformer.h.18.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 5.0, 4.0, 5.0, 8.0, 6.0, 14.0, 13.0, 17.0, 13.0, 18.0, 18.0, 28.0, 37.0, 34.0, 33.0, 53.0, 39.0, 35.0, 41.0, 42.0, 47.0, 35.0, 38.0, 51.0, 40.0, 40.0, 35.0, 41.0, 31.0, 21.0, 31.0, 26.0, 22.0, 20.0, 18.0, 14.0, 7.0, 11.0, 4.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-8.21875, -7.9754638671875, -7.732177734375, -7.4888916015625, -7.24560546875, -7.0023193359375, -6.759033203125, -6.5157470703125, -6.2724609375, -6.0291748046875, -5.785888671875, -5.5426025390625, -5.29931640625, -5.0560302734375, -4.812744140625, -4.5694580078125, -4.326171875, -4.0828857421875, -3.839599609375, -3.5963134765625, -3.35302734375, -3.1097412109375, -2.866455078125, -2.6231689453125, -2.3798828125, -2.1365966796875, -1.893310546875, -1.6500244140625, -1.40673828125, -1.1634521484375, -0.920166015625, -0.6768798828125, -0.43359375, -0.1903076171875, 0.052978515625, 0.2962646484375, 0.53955078125, 0.7828369140625, 1.026123046875, 1.2694091796875, 1.5126953125, 1.7559814453125, 1.999267578125, 2.2425537109375, 2.48583984375, 2.7291259765625, 2.972412109375, 3.2156982421875, 3.458984375, 3.7022705078125, 3.945556640625, 4.1888427734375, 4.43212890625, 4.6754150390625, 4.918701171875, 5.1619873046875, 5.4052734375, 5.6485595703125, 5.891845703125, 6.1351318359375, 6.37841796875, 6.6217041015625, 6.864990234375, 7.1082763671875, 7.3515625]}, "gradients/decoder.transformer.h.18.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 1.0, 2.0, 10.0, 4.0, 10.0, 14.0, 13.0, 36.0, 35.0, 53.0, 67.0, 88.0, 135.0, 219.0, 348.0, 609.0, 949.0, 1506.0, 2740.0, 4801.0, 8982.0, 18507.0, 50851.0, 228677.0, 563860.0, 106434.0, 30748.0, 12989.0, 6798.0, 3711.0, 2071.0, 1223.0, 711.0, 435.0, 291.0, 186.0, 123.0, 87.0, 71.0, 48.0, 29.0, 16.0, 16.0, 13.0, 12.0, 7.0, 3.0, 5.0, 7.0, 1.0, 2.0, 0.0, 2.0, 2.0], "bins": [-9.71875, -9.4351806640625, -9.151611328125, -8.8680419921875, -8.58447265625, -8.3009033203125, -8.017333984375, -7.7337646484375, -7.4501953125, -7.1666259765625, -6.883056640625, -6.5994873046875, -6.31591796875, -6.0323486328125, -5.748779296875, -5.4652099609375, -5.181640625, -4.8980712890625, -4.614501953125, -4.3309326171875, -4.04736328125, -3.7637939453125, -3.480224609375, -3.1966552734375, -2.9130859375, -2.6295166015625, -2.345947265625, -2.0623779296875, -1.77880859375, -1.4952392578125, -1.211669921875, -0.9281005859375, -0.64453125, -0.3609619140625, -0.077392578125, 0.2061767578125, 0.48974609375, 0.7733154296875, 1.056884765625, 1.3404541015625, 1.6240234375, 1.9075927734375, 2.191162109375, 2.4747314453125, 2.75830078125, 3.0418701171875, 3.325439453125, 3.6090087890625, 3.892578125, 4.1761474609375, 4.459716796875, 4.7432861328125, 5.02685546875, 5.3104248046875, 5.593994140625, 5.8775634765625, 6.1611328125, 6.4447021484375, 6.728271484375, 7.0118408203125, 7.29541015625, 7.5789794921875, 7.862548828125, 8.1461181640625, 8.4296875]}, "gradients/decoder.transformer.h.18.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 7.0, 9.0, 5.0, 8.0, 14.0, 11.0, 14.0, 12.0, 17.0, 16.0, 32.0, 28.0, 21.0, 30.0, 32.0, 38.0, 41.0, 41.0, 69.0, 119.0, 1513.0, 404.0, 106.0, 69.0, 47.0, 35.0, 50.0, 20.0, 31.0, 25.0, 20.0, 17.0, 20.0, 21.0, 25.0, 18.0, 14.0, 7.0, 9.0, 6.0, 2.0, 4.0, 4.0, 4.0, 2.0, 1.0, 0.0, 5.0, 1.0, 0.0, 1.0], "bins": [-25.96875, -25.203857421875, -24.43896484375, -23.674072265625, -22.9091796875, -22.144287109375, -21.37939453125, -20.614501953125, -19.849609375, -19.084716796875, -18.31982421875, -17.554931640625, -16.7900390625, -16.025146484375, -15.26025390625, -14.495361328125, -13.73046875, -12.965576171875, -12.20068359375, -11.435791015625, -10.6708984375, -9.906005859375, -9.14111328125, -8.376220703125, -7.611328125, -6.846435546875, -6.08154296875, -5.316650390625, -4.5517578125, -3.786865234375, -3.02197265625, -2.257080078125, -1.4921875, -0.727294921875, 0.03759765625, 0.802490234375, 1.5673828125, 2.332275390625, 3.09716796875, 3.862060546875, 4.626953125, 5.391845703125, 6.15673828125, 6.921630859375, 7.6865234375, 8.451416015625, 9.21630859375, 9.981201171875, 10.74609375, 11.510986328125, 12.27587890625, 13.040771484375, 13.8056640625, 14.570556640625, 15.33544921875, 16.100341796875, 16.865234375, 17.630126953125, 18.39501953125, 19.159912109375, 19.9248046875, 20.689697265625, 21.45458984375, 22.219482421875, 22.984375]}, "gradients/decoder.transformer.h.18.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 9.0, 8.0, 8.0, 3.0, 15.0, 17.0, 30.0, 31.0, 39.0, 42.0, 90.0, 116.0, 219.0, 380.0, 1055.0, 12153.0, 2995597.0, 131145.0, 3330.0, 580.0, 274.0, 163.0, 105.0, 84.0, 54.0, 38.0, 29.0, 19.0, 18.0, 10.0, 9.0, 12.0, 11.0, 2.0, 2.0, 3.0, 5.0, 1.0, 2.0, 0.0, 2.0, 0.0, 2.0, 1.0], "bins": [-71.0625, -69.1298828125, -67.197265625, -65.2646484375, -63.33203125, -61.3994140625, -59.466796875, -57.5341796875, -55.6015625, -53.6689453125, -51.736328125, -49.8037109375, -47.87109375, -45.9384765625, -44.005859375, -42.0732421875, -40.140625, -38.2080078125, -36.275390625, -34.3427734375, -32.41015625, -30.4775390625, -28.544921875, -26.6123046875, -24.6796875, -22.7470703125, -20.814453125, -18.8818359375, -16.94921875, -15.0166015625, -13.083984375, -11.1513671875, -9.21875, -7.2861328125, -5.353515625, -3.4208984375, -1.48828125, 0.4443359375, 2.376953125, 4.3095703125, 6.2421875, 8.1748046875, 10.107421875, 12.0400390625, 13.97265625, 15.9052734375, 17.837890625, 19.7705078125, 21.703125, 23.6357421875, 25.568359375, 27.5009765625, 29.43359375, 31.3662109375, 33.298828125, 35.2314453125, 37.1640625, 39.0966796875, 41.029296875, 42.9619140625, 44.89453125, 46.8271484375, 48.759765625, 50.6923828125, 52.625]}, "gradients/decoder.transformer.h.18.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 9.0, 34.0, 117.0, 264.0, 316.0, 193.0, 58.0, 17.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-74.61109924316406, -72.0590591430664, -69.50702667236328, -66.95498657226562, -64.4029541015625, -61.850914001464844, -59.29887771606445, -56.74684143066406, -54.194801330566406, -51.642765045166016, -49.090728759765625, -46.53868865966797, -43.98665237426758, -41.43461608886719, -38.8825798034668, -36.330543518066406, -33.778507232666016, -31.226470947265625, -28.6744327545166, -26.12239646911621, -23.570358276367188, -21.018321990966797, -18.466285705566406, -15.914247512817383, -13.362211227416992, -10.810173988342285, -8.258136749267578, -5.7061004638671875, -3.1540632247924805, -0.6020259857177734, 1.9500102996826172, 4.502048492431641, 7.054084777832031, 9.606122016906738, 12.158159255981445, 14.710195541381836, 17.26223373413086, 19.81427001953125, 22.36630630493164, 24.918344497680664, 27.470380783081055, 30.022417068481445, 32.57445526123047, 35.12649154663086, 37.67852783203125, 40.230567932128906, 42.78260040283203, 45.33464050292969, 47.88667678833008, 50.43871307373047, 52.99074935913086, 55.54278564453125, 58.094825744628906, 60.6468620300293, 63.19889831542969, 65.75093841552734, 68.30297088623047, 70.85501098632812, 73.40704345703125, 75.9590835571289, 78.51111602783203, 81.06315612792969, 83.61518859863281, 86.16722869873047, 88.71926879882812]}, "gradients/decoder.transformer.h.18.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 5.0, 6.0, 4.0, 7.0, 9.0, 10.0, 8.0, 15.0, 14.0, 13.0, 19.0, 22.0, 25.0, 23.0, 34.0, 36.0, 38.0, 33.0, 40.0, 39.0, 33.0, 34.0, 41.0, 50.0, 44.0, 36.0, 36.0, 38.0, 35.0, 27.0, 43.0, 27.0, 29.0, 17.0, 15.0, 18.0, 15.0, 5.0, 14.0, 8.0, 4.0, 4.0, 5.0, 7.0, 7.0, 4.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-75.21470642089844, -72.8707275390625, -70.52674865722656, -68.1827621459961, -65.83878326416016, -63.49480438232422, -61.15082550048828, -58.806846618652344, -56.46286392211914, -54.1188850402832, -51.77490234375, -49.43092346191406, -47.086944580078125, -44.74296188354492, -42.398983001708984, -40.05500030517578, -37.711021423339844, -35.367042541503906, -33.0230598449707, -30.679080963134766, -28.335100173950195, -25.991119384765625, -23.647140502929688, -21.303159713745117, -18.959178924560547, -16.615198135375977, -14.271218299865723, -11.927238464355469, -9.583257675170898, -7.239276885986328, -4.895297050476074, -2.5513172149658203, -0.20733642578125, 2.136643886566162, 4.480624198913574, 6.824604511260986, 9.168584823608398, 11.512565612792969, 13.856545448303223, 16.200525283813477, 18.544506072998047, 20.888486862182617, 23.232467651367188, 25.576446533203125, 27.920427322387695, 30.264408111572266, 32.6083869934082, 34.952369689941406, 37.296348571777344, 39.64032745361328, 41.984310150146484, 44.32828903198242, 46.672271728515625, 49.01625061035156, 51.3602294921875, 53.70420837402344, 56.04819107055664, 58.39216995239258, 60.73615264892578, 63.08013153076172, 65.42411041259766, 67.76809692382812, 70.11207580566406, 72.4560546875, 74.80003356933594]}, "gradients/decoder.transformer.h.17.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 6.0, 6.0, 6.0, 3.0, 6.0, 12.0, 13.0, 11.0, 22.0, 18.0, 21.0, 26.0, 27.0, 34.0, 42.0, 38.0, 47.0, 38.0, 44.0, 41.0, 43.0, 42.0, 40.0, 45.0, 37.0, 58.0, 36.0, 42.0, 21.0, 21.0, 31.0, 22.0, 25.0, 23.0, 19.0, 8.0, 10.0, 8.0, 5.0, 4.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-8.5859375, -8.33270263671875, -8.0794677734375, -7.82623291015625, -7.572998046875, -7.31976318359375, -7.0665283203125, -6.81329345703125, -6.56005859375, -6.30682373046875, -6.0535888671875, -5.80035400390625, -5.547119140625, -5.29388427734375, -5.0406494140625, -4.78741455078125, -4.5341796875, -4.28094482421875, -4.0277099609375, -3.77447509765625, -3.521240234375, -3.26800537109375, -3.0147705078125, -2.76153564453125, -2.50830078125, -2.25506591796875, -2.0018310546875, -1.74859619140625, -1.495361328125, -1.24212646484375, -0.9888916015625, -0.73565673828125, -0.482421875, -0.22918701171875, 0.0240478515625, 0.27728271484375, 0.530517578125, 0.78375244140625, 1.0369873046875, 1.29022216796875, 1.54345703125, 1.79669189453125, 2.0499267578125, 2.30316162109375, 2.556396484375, 2.80963134765625, 3.0628662109375, 3.31610107421875, 3.5693359375, 3.82257080078125, 4.0758056640625, 4.32904052734375, 4.582275390625, 4.83551025390625, 5.0887451171875, 5.34197998046875, 5.59521484375, 5.84844970703125, 6.1016845703125, 6.35491943359375, 6.608154296875, 6.86138916015625, 7.1146240234375, 7.36785888671875, 7.62109375]}, "gradients/decoder.transformer.h.17.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 6.0, 4.0, 3.0, 9.0, 13.0, 33.0, 34.0, 33.0, 60.0, 91.0, 103.0, 179.0, 290.0, 472.0, 768.0, 1304.0, 2362.0, 4516.0, 9140.0, 19413.0, 42492.0, 106678.0, 321233.0, 969719.0, 1489848.0, 805481.0, 259347.0, 89560.0, 36932.0, 16807.0, 7969.0, 4059.0, 2161.0, 1192.0, 679.0, 446.0, 278.0, 168.0, 123.0, 75.0, 67.0, 43.0, 30.0, 20.0, 15.0, 16.0, 6.0, 6.0, 7.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-9.1015625, -8.811767578125, -8.52197265625, -8.232177734375, -7.9423828125, -7.652587890625, -7.36279296875, -7.072998046875, -6.783203125, -6.493408203125, -6.20361328125, -5.913818359375, -5.6240234375, -5.334228515625, -5.04443359375, -4.754638671875, -4.46484375, -4.175048828125, -3.88525390625, -3.595458984375, -3.3056640625, -3.015869140625, -2.72607421875, -2.436279296875, -2.146484375, -1.856689453125, -1.56689453125, -1.277099609375, -0.9873046875, -0.697509765625, -0.40771484375, -0.117919921875, 0.171875, 0.461669921875, 0.75146484375, 1.041259765625, 1.3310546875, 1.620849609375, 1.91064453125, 2.200439453125, 2.490234375, 2.780029296875, 3.06982421875, 3.359619140625, 3.6494140625, 3.939208984375, 4.22900390625, 4.518798828125, 4.80859375, 5.098388671875, 5.38818359375, 5.677978515625, 5.9677734375, 6.257568359375, 6.54736328125, 6.837158203125, 7.126953125, 7.416748046875, 7.70654296875, 7.996337890625, 8.2861328125, 8.575927734375, 8.86572265625, 9.155517578125, 9.4453125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 5.0, 3.0, 3.0, 4.0, 11.0, 15.0, 16.0, 23.0, 14.0, 45.0, 51.0, 82.0, 98.0, 148.0, 187.0, 276.0, 340.0, 416.0, 464.0, 459.0, 414.0, 297.0, 206.0, 138.0, 108.0, 73.0, 54.0, 35.0, 30.0, 29.0, 11.0, 7.0, 9.0, 9.0, 5.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.03125, -25.35693359375, -24.6826171875, -24.00830078125, -23.333984375, -22.65966796875, -21.9853515625, -21.31103515625, -20.63671875, -19.96240234375, -19.2880859375, -18.61376953125, -17.939453125, -17.26513671875, -16.5908203125, -15.91650390625, -15.2421875, -14.56787109375, -13.8935546875, -13.21923828125, -12.544921875, -11.87060546875, -11.1962890625, -10.52197265625, -9.84765625, -9.17333984375, -8.4990234375, -7.82470703125, -7.150390625, -6.47607421875, -5.8017578125, -5.12744140625, -4.453125, -3.77880859375, -3.1044921875, -2.43017578125, -1.755859375, -1.08154296875, -0.4072265625, 0.26708984375, 0.94140625, 1.61572265625, 2.2900390625, 2.96435546875, 3.638671875, 4.31298828125, 4.9873046875, 5.66162109375, 6.3359375, 7.01025390625, 7.6845703125, 8.35888671875, 9.033203125, 9.70751953125, 10.3818359375, 11.05615234375, 11.73046875, 12.40478515625, 13.0791015625, 13.75341796875, 14.427734375, 15.10205078125, 15.7763671875, 16.45068359375, 17.125]}, "gradients/decoder.transformer.h.17.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 5.0, 6.0, 8.0, 4.0, 15.0, 11.0, 19.0, 27.0, 38.0, 59.0, 68.0, 109.0, 160.0, 297.0, 582.0, 1896.0, 15669.0, 467614.0, 3579306.0, 119661.0, 6431.0, 1153.0, 440.0, 240.0, 134.0, 82.0, 61.0, 42.0, 41.0, 29.0, 21.0, 19.0, 12.0, 7.0, 11.0, 2.0, 3.0, 4.0, 2.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-49.78125, -47.89013671875, -45.9990234375, -44.10791015625, -42.216796875, -40.32568359375, -38.4345703125, -36.54345703125, -34.65234375, -32.76123046875, -30.8701171875, -28.97900390625, -27.087890625, -25.19677734375, -23.3056640625, -21.41455078125, -19.5234375, -17.63232421875, -15.7412109375, -13.85009765625, -11.958984375, -10.06787109375, -8.1767578125, -6.28564453125, -4.39453125, -2.50341796875, -0.6123046875, 1.27880859375, 3.169921875, 5.06103515625, 6.9521484375, 8.84326171875, 10.734375, 12.62548828125, 14.5166015625, 16.40771484375, 18.298828125, 20.18994140625, 22.0810546875, 23.97216796875, 25.86328125, 27.75439453125, 29.6455078125, 31.53662109375, 33.427734375, 35.31884765625, 37.2099609375, 39.10107421875, 40.9921875, 42.88330078125, 44.7744140625, 46.66552734375, 48.556640625, 50.44775390625, 52.3388671875, 54.22998046875, 56.12109375, 58.01220703125, 59.9033203125, 61.79443359375, 63.685546875, 65.57666015625, 67.4677734375, 69.35888671875, 71.25]}, "gradients/decoder.transformer.h.17.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 10.0, 33.0, 71.0, 127.0, 204.0, 226.0, 178.0, 87.0, 50.0, 19.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-164.1261444091797, -158.10586547851562, -152.0855712890625, -146.06529235839844, -140.04501342773438, -134.02471923828125, -128.0044403076172, -121.9841537475586, -115.9638671875, -109.9435806274414, -103.92329406738281, -97.90301513671875, -91.88272857666016, -85.86244201660156, -79.8421630859375, -73.8218765258789, -67.80158996582031, -61.78130340576172, -55.76102066040039, -49.74073791503906, -43.72045135498047, -37.700164794921875, -31.679882049560547, -25.65959930419922, -19.639312744140625, -13.619028091430664, -7.598743438720703, -1.5784587860107422, 4.441825866699219, 10.46211051940918, 16.48239517211914, 22.50267791748047, 28.52294921875, 34.543235778808594, 40.56351852416992, 46.58380126953125, 52.604087829589844, 58.62437438964844, 64.6446533203125, 70.6649398803711, 76.68522644042969, 82.70551300048828, 88.72579956054688, 94.74607849121094, 100.76636505126953, 106.78665161132812, 112.80693054199219, 118.82721710205078, 124.84750366210938, 130.86778259277344, 136.88807678222656, 142.90835571289062, 148.92864990234375, 154.9489288330078, 160.96920776367188, 166.989501953125, 173.00978088378906, 179.03005981445312, 185.05035400390625, 191.0706329345703, 197.09091186523438, 203.1112060546875, 209.13148498535156, 215.15176391601562, 221.17205810546875]}, "gradients/decoder.transformer.h.17.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 10.0, 7.0, 12.0, 12.0, 13.0, 25.0, 17.0, 28.0, 24.0, 31.0, 33.0, 42.0, 37.0, 43.0, 43.0, 54.0, 46.0, 39.0, 30.0, 50.0, 44.0, 42.0, 36.0, 27.0, 25.0, 40.0, 25.0, 31.0, 22.0, 18.0, 17.0, 15.0, 16.0, 12.0, 5.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-69.18965911865234, -66.94194030761719, -64.69422149658203, -62.44649887084961, -60.19877624511719, -57.95105743408203, -55.703338623046875, -53.45561981201172, -51.2078971862793, -48.96017837524414, -46.71245574951172, -44.46473693847656, -42.217018127441406, -39.969295501708984, -37.72157669067383, -35.473854064941406, -33.22613525390625, -30.97841453552246, -28.730693817138672, -26.482975006103516, -24.235254287719727, -21.987533569335938, -19.73981475830078, -17.492094039916992, -15.244373321533203, -12.996652603149414, -10.748932838439941, -8.501213073730469, -6.25349235534668, -4.005771636962891, -1.758051872253418, 0.4896678924560547, 2.7373809814453125, 4.985101222991943, 7.232821464538574, 9.480541229248047, 11.728261947631836, 13.975982666015625, 16.22370147705078, 18.47142219543457, 20.71914291381836, 22.96686363220215, 25.214584350585938, 27.462303161621094, 29.710023880004883, 31.957744598388672, 34.20546340942383, 36.45318603515625, 38.700904846191406, 40.94862365722656, 43.196346282958984, 45.44406509399414, 47.69178771972656, 49.93950653076172, 52.187225341796875, 54.43494415283203, 56.68266677856445, 58.93038558959961, 61.17810821533203, 63.42582702636719, 65.67354583740234, 67.9212646484375, 70.16899108886719, 72.41670989990234, 74.6644287109375]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 4.0, 4.0, 4.0, 10.0, 12.0, 16.0, 11.0, 19.0, 23.0, 26.0, 19.0, 32.0, 43.0, 33.0, 37.0, 49.0, 43.0, 53.0, 47.0, 38.0, 36.0, 51.0, 42.0, 52.0, 35.0, 43.0, 35.0, 31.0, 28.0, 26.0, 22.0, 18.0, 13.0, 13.0, 5.0, 12.0, 7.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.234375, -8.9580078125, -8.681640625, -8.4052734375, -8.12890625, -7.8525390625, -7.576171875, -7.2998046875, -7.0234375, -6.7470703125, -6.470703125, -6.1943359375, -5.91796875, -5.6416015625, -5.365234375, -5.0888671875, -4.8125, -4.5361328125, -4.259765625, -3.9833984375, -3.70703125, -3.4306640625, -3.154296875, -2.8779296875, -2.6015625, -2.3251953125, -2.048828125, -1.7724609375, -1.49609375, -1.2197265625, -0.943359375, -0.6669921875, -0.390625, -0.1142578125, 0.162109375, 0.4384765625, 0.71484375, 0.9912109375, 1.267578125, 1.5439453125, 1.8203125, 2.0966796875, 2.373046875, 2.6494140625, 2.92578125, 3.2021484375, 3.478515625, 3.7548828125, 4.03125, 4.3076171875, 4.583984375, 4.8603515625, 5.13671875, 5.4130859375, 5.689453125, 5.9658203125, 6.2421875, 6.5185546875, 6.794921875, 7.0712890625, 7.34765625, 7.6240234375, 7.900390625, 8.1767578125, 8.453125]}, "gradients/decoder.transformer.h.17.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 9.0, 9.0, 14.0, 15.0, 24.0, 36.0, 57.0, 88.0, 141.0, 205.0, 307.0, 432.0, 621.0, 973.0, 1403.0, 2082.0, 3234.0, 5036.0, 7650.0, 11759.0, 18017.0, 28369.0, 45294.0, 72635.0, 115618.0, 170101.0, 186474.0, 137736.0, 88202.0, 55403.0, 34447.0, 21636.0, 13951.0, 9221.0, 5854.0, 3792.0, 2588.0, 1733.0, 1099.0, 738.0, 501.0, 331.0, 250.0, 148.0, 122.0, 74.0, 46.0, 35.0, 20.0, 8.0, 11.0, 8.0, 6.0, 4.0, 2.0, 1.0], "bins": [-0.81005859375, -0.786376953125, -0.7626953125, -0.739013671875, -0.71533203125, -0.691650390625, -0.66796875, -0.644287109375, -0.62060546875, -0.596923828125, -0.5732421875, -0.549560546875, -0.52587890625, -0.502197265625, -0.478515625, -0.454833984375, -0.43115234375, -0.407470703125, -0.3837890625, -0.360107421875, -0.33642578125, -0.312744140625, -0.2890625, -0.265380859375, -0.24169921875, -0.218017578125, -0.1943359375, -0.170654296875, -0.14697265625, -0.123291015625, -0.099609375, -0.075927734375, -0.05224609375, -0.028564453125, -0.0048828125, 0.018798828125, 0.04248046875, 0.066162109375, 0.08984375, 0.113525390625, 0.13720703125, 0.160888671875, 0.1845703125, 0.208251953125, 0.23193359375, 0.255615234375, 0.279296875, 0.302978515625, 0.32666015625, 0.350341796875, 0.3740234375, 0.397705078125, 0.42138671875, 0.445068359375, 0.46875, 0.492431640625, 0.51611328125, 0.539794921875, 0.5634765625, 0.587158203125, 0.61083984375, 0.634521484375, 0.658203125, 0.681884765625, 0.70556640625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 2.0, 7.0, 11.0, 12.0, 7.0, 6.0, 26.0, 24.0, 22.0, 26.0, 31.0, 27.0, 31.0, 36.0, 39.0, 37.0, 35.0, 46.0, 57.0, 1072.0, 38.0, 38.0, 35.0, 43.0, 33.0, 41.0, 37.0, 29.0, 27.0, 29.0, 18.0, 23.0, 14.0, 21.0, 16.0, 9.0, 6.0, 5.0, 3.0, 2.0, 2.0, 5.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.859375, -4.69403076171875, -4.5286865234375, -4.36334228515625, -4.197998046875, -4.03265380859375, -3.8673095703125, -3.70196533203125, -3.53662109375, -3.37127685546875, -3.2059326171875, -3.04058837890625, -2.875244140625, -2.70989990234375, -2.5445556640625, -2.37921142578125, -2.2138671875, -2.04852294921875, -1.8831787109375, -1.71783447265625, -1.552490234375, -1.38714599609375, -1.2218017578125, -1.05645751953125, -0.89111328125, -0.72576904296875, -0.5604248046875, -0.39508056640625, -0.229736328125, -0.06439208984375, 0.1009521484375, 0.26629638671875, 0.431640625, 0.59698486328125, 0.7623291015625, 0.92767333984375, 1.093017578125, 1.25836181640625, 1.4237060546875, 1.58905029296875, 1.75439453125, 1.91973876953125, 2.0850830078125, 2.25042724609375, 2.415771484375, 2.58111572265625, 2.7464599609375, 2.91180419921875, 3.0771484375, 3.24249267578125, 3.4078369140625, 3.57318115234375, 3.738525390625, 3.90386962890625, 4.0692138671875, 4.23455810546875, 4.39990234375, 4.56524658203125, 4.7305908203125, 4.89593505859375, 5.061279296875, 5.22662353515625, 5.3919677734375, 5.55731201171875, 5.72265625]}, "gradients/decoder.transformer.h.17.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 4.0, 5.0, 17.0, 15.0, 17.0, 30.0, 45.0, 68.0, 98.0, 128.0, 207.0, 331.0, 439.0, 701.0, 1047.0, 1662.0, 2572.0, 3944.0, 6391.0, 10044.0, 16119.0, 26182.0, 42490.0, 68222.0, 107141.0, 154744.0, 1225516.0, 151094.0, 103377.0, 65780.0, 40907.0, 25236.0, 15517.0, 9988.0, 6031.0, 3973.0, 2492.0, 1645.0, 986.0, 671.0, 458.0, 251.0, 177.0, 113.0, 97.0, 54.0, 33.0, 26.0, 13.0, 11.0, 10.0, 8.0, 4.0, 5.0, 1.0, 1.0, 3.0], "bins": [-0.609375, -0.5911636352539062, -0.5729522705078125, -0.5547409057617188, -0.536529541015625, -0.5183181762695312, -0.5001068115234375, -0.48189544677734375, -0.46368408203125, -0.44547271728515625, -0.4272613525390625, -0.40904998779296875, -0.390838623046875, -0.37262725830078125, -0.3544158935546875, -0.33620452880859375, -0.3179931640625, -0.29978179931640625, -0.2815704345703125, -0.26335906982421875, -0.245147705078125, -0.22693634033203125, -0.2087249755859375, -0.19051361083984375, -0.17230224609375, -0.15409088134765625, -0.1358795166015625, -0.11766815185546875, -0.099456787109375, -0.08124542236328125, -0.0630340576171875, -0.04482269287109375, -0.026611328125, -0.00839996337890625, 0.0098114013671875, 0.02802276611328125, 0.046234130859375, 0.06444549560546875, 0.0826568603515625, 0.10086822509765625, 0.11907958984375, 0.13729095458984375, 0.1555023193359375, 0.17371368408203125, 0.191925048828125, 0.21013641357421875, 0.2283477783203125, 0.24655914306640625, 0.2647705078125, 0.28298187255859375, 0.3011932373046875, 0.31940460205078125, 0.337615966796875, 0.35582733154296875, 0.3740386962890625, 0.39225006103515625, 0.41046142578125, 0.42867279052734375, 0.4468841552734375, 0.46509552001953125, 0.483306884765625, 0.5015182495117188, 0.5197296142578125, 0.5379409790039062, 0.55615234375]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 3.0, 8.0, 14.0, 12.0, 15.0, 13.0, 13.0, 27.0, 29.0, 26.0, 31.0, 45.0, 42.0, 62.0, 79.0, 74.0, 85.0, 59.0, 75.0, 42.0, 52.0, 33.0, 24.0, 22.0, 29.0, 16.0, 15.0, 9.0, 10.0, 12.0, 7.0, 7.0, 1.0, 3.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.008758544921875, -0.008516490459442139, -0.008274435997009277, -0.008032381534576416, -0.007790327072143555, -0.007548272609710693, -0.007306218147277832, -0.007064163684844971, -0.006822109222412109, -0.006580054759979248, -0.006338000297546387, -0.006095945835113525, -0.005853891372680664, -0.005611836910247803, -0.005369782447814941, -0.00512772798538208, -0.004885673522949219, -0.004643619060516357, -0.004401564598083496, -0.004159510135650635, -0.0039174556732177734, -0.003675401210784912, -0.0034333467483520508, -0.0031912922859191895, -0.002949237823486328, -0.002707183361053467, -0.0024651288986206055, -0.002223074436187744, -0.001981019973754883, -0.0017389655113220215, -0.0014969110488891602, -0.0012548565864562988, -0.0010128021240234375, -0.0007707476615905762, -0.0005286931991577148, -0.0002866387367248535, -4.458427429199219e-05, 0.00019747018814086914, 0.00043952465057373047, 0.0006815791130065918, 0.0009236335754394531, 0.0011656880378723145, 0.0014077425003051758, 0.0016497969627380371, 0.0018918514251708984, 0.0021339058876037598, 0.002375960350036621, 0.0026180148124694824, 0.0028600692749023438, 0.003102123737335205, 0.0033441781997680664, 0.0035862326622009277, 0.003828287124633789, 0.00407034158706665, 0.004312396049499512, 0.004554450511932373, 0.004796504974365234, 0.005038559436798096, 0.005280613899230957, 0.005522668361663818, 0.00576472282409668, 0.006006777286529541, 0.006248831748962402, 0.006490886211395264, 0.006732940673828125]}, "gradients/decoder.transformer.h.17.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 9.0, 12.0, 9.0, 15.0, 15.0, 26.0, 27.0, 48.0, 65.0, 104.0, 170.0, 261.0, 456.0, 1501.0, 554642.0, 488418.0, 1533.0, 462.0, 269.0, 145.0, 101.0, 72.0, 49.0, 43.0, 16.0, 22.0, 9.0, 14.0, 12.0, 7.0, 9.0, 0.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.132568359375, -0.1276569366455078, -0.12274551391601562, -0.11783409118652344, -0.11292266845703125, -0.10801124572753906, -0.10309982299804688, -0.09818840026855469, -0.0932769775390625, -0.08836555480957031, -0.08345413208007812, -0.07854270935058594, -0.07363128662109375, -0.06871986389160156, -0.06380844116210938, -0.05889701843261719, -0.053985595703125, -0.04907417297363281, -0.044162750244140625, -0.03925132751464844, -0.03433990478515625, -0.029428482055664062, -0.024517059326171875, -0.019605636596679688, -0.0146942138671875, -0.009782791137695312, -0.004871368408203125, 4.00543212890625e-05, 0.00495147705078125, 0.009862899780273438, 0.014774322509765625, 0.019685745239257812, 0.02459716796875, 0.029508590698242188, 0.034420013427734375, 0.03933143615722656, 0.04424285888671875, 0.04915428161621094, 0.054065704345703125, 0.05897712707519531, 0.0638885498046875, 0.06879997253417969, 0.07371139526367188, 0.07862281799316406, 0.08353424072265625, 0.08844566345214844, 0.09335708618164062, 0.09826850891113281, 0.103179931640625, 0.10809135437011719, 0.11300277709960938, 0.11791419982910156, 0.12282562255859375, 0.12773704528808594, 0.13264846801757812, 0.1375598907470703, 0.1424713134765625, 0.1473827362060547, 0.15229415893554688, 0.15720558166503906, 0.16211700439453125, 0.16702842712402344, 0.17193984985351562, 0.1768512725830078, 0.1817626953125]}, "gradients/decoder.transformer.h.17.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 16.0, 144.0, 530.0, 273.0, 40.0, 9.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0026666298508644104, -0.00194618571549654, -0.0012257416965439916, -0.0005052976775914431, 0.00021514645777642727, 0.0009355905931442976, 0.0016560344956815243, 0.0023764786310493946, 0.003096922766417265, 0.0038173669017851353, 0.004537811037153006, 0.005258254706859589, 0.005978698842227459, 0.006699142977595329, 0.0074195871129632, 0.00814003124833107, 0.00886047538369894, 0.00958091951906681, 0.010301363654434681, 0.011021807789802551, 0.011742251925170422, 0.012462696060538292, 0.013183139264583588, 0.013903584331274033, 0.014624027535319328, 0.015344471670687199, 0.01606491580605507, 0.016785359010100365, 0.01750580407679081, 0.018226247280836105, 0.01894669234752655, 0.019667135551571846, 0.02038758061826229, 0.021108023822307587, 0.02182846888899803, 0.022548912093043327, 0.023269357159733772, 0.023989800363779068, 0.024710245430469513, 0.02543068863451481, 0.026151133701205254, 0.02687157690525055, 0.027592021971940994, 0.02831246517598629, 0.029032910242676735, 0.02975335344672203, 0.030473798513412476, 0.03119424171745777, 0.03191468492150307, 0.03263512998819351, 0.03335557132959366, 0.0340760163962841, 0.03479646146297455, 0.03551690652966499, 0.03623734787106514, 0.036957792937755585, 0.03767823800444603, 0.038398683071136475, 0.03911912441253662, 0.039839569479227066, 0.04056001454591751, 0.041280459612607956, 0.0420009009540081, 0.04272134602069855, 0.04344179108738899]}, "gradients/decoder.transformer.h.17.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 3.0, 0.0, 8.0, 7.0, 10.0, 10.0, 8.0, 25.0, 12.0, 23.0, 19.0, 18.0, 37.0, 34.0, 34.0, 43.0, 48.0, 36.0, 49.0, 48.0, 54.0, 51.0, 46.0, 31.0, 43.0, 32.0, 38.0, 27.0, 35.0, 26.0, 25.0, 24.0, 19.0, 16.0, 18.0, 13.0, 10.0, 8.0, 7.0, 6.0, 6.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004884064197540283, -0.004735061898827553, -0.004586059600114822, -0.004437057301402092, -0.004288055002689362, -0.004139052703976631, -0.003990050405263901, -0.0038410481065511703, -0.00369204580783844, -0.0035430435091257095, -0.003394041210412979, -0.0032450389117002487, -0.0030960366129875183, -0.002947034314274788, -0.0027980320155620575, -0.002649029716849327, -0.0025000274181365967, -0.0023510251194238663, -0.002202022820711136, -0.0020530205219984055, -0.001904018223285675, -0.0017550159245729446, -0.0016060136258602142, -0.0014570113271474838, -0.0013080090284347534, -0.001159006729722023, -0.0010100044310092926, -0.0008610021322965622, -0.0007119998335838318, -0.0005629975348711014, -0.00041399523615837097, -0.00026499293744564056, -0.00011599063873291016, 3.301165997982025e-05, 0.00018201395869255066, 0.00033101625740528107, 0.0004800185561180115, 0.0006290208548307419, 0.0007780231535434723, 0.0009270254522562027, 0.001076027750968933, 0.0012250300496816635, 0.001374032348394394, 0.0015230346471071243, 0.0016720369458198547, 0.0018210392445325851, 0.0019700415432453156, 0.002119043841958046, 0.0022680461406707764, 0.0024170484393835068, 0.002566050738096237, 0.0027150530368089676, 0.002864055335521698, 0.0030130576342344284, 0.003162059932947159, 0.0033110622316598892, 0.0034600645303726196, 0.00360906682908535, 0.0037580691277980804, 0.003907071426510811, 0.004056073725223541, 0.004205076023936272, 0.004354078322649002, 0.0045030806213617325, 0.004652082920074463]}, "gradients/decoder.transformer.h.17.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 6.0, 4.0, 4.0, 4.0, 10.0, 12.0, 16.0, 11.0, 19.0, 23.0, 26.0, 19.0, 32.0, 43.0, 33.0, 37.0, 49.0, 43.0, 53.0, 47.0, 38.0, 36.0, 51.0, 42.0, 52.0, 35.0, 43.0, 35.0, 31.0, 28.0, 26.0, 21.0, 19.0, 13.0, 13.0, 5.0, 12.0, 7.0, 5.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.234375, -8.9580078125, -8.681640625, -8.4052734375, -8.12890625, -7.8525390625, -7.576171875, -7.2998046875, -7.0234375, -6.7470703125, -6.470703125, -6.1943359375, -5.91796875, -5.6416015625, -5.365234375, -5.0888671875, -4.8125, -4.5361328125, -4.259765625, -3.9833984375, -3.70703125, -3.4306640625, -3.154296875, -2.8779296875, -2.6015625, -2.3251953125, -2.048828125, -1.7724609375, -1.49609375, -1.2197265625, -0.943359375, -0.6669921875, -0.390625, -0.1142578125, 0.162109375, 0.4384765625, 0.71484375, 0.9912109375, 1.267578125, 1.5439453125, 1.8203125, 2.0966796875, 2.373046875, 2.6494140625, 2.92578125, 3.2021484375, 3.478515625, 3.7548828125, 4.03125, 4.3076171875, 4.583984375, 4.8603515625, 5.13671875, 5.4130859375, 5.689453125, 5.9658203125, 6.2421875, 6.5185546875, 6.794921875, 7.0712890625, 7.34765625, 7.6240234375, 7.900390625, 8.1767578125, 8.453125]}, "gradients/decoder.transformer.h.17.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 5.0, 5.0, 7.0, 11.0, 19.0, 31.0, 24.0, 65.0, 93.0, 150.0, 237.0, 404.0, 615.0, 1076.0, 1864.0, 3283.0, 5965.0, 11154.0, 24065.0, 66724.0, 259832.0, 471205.0, 127770.0, 38976.0, 16466.0, 8180.0, 4449.0, 2410.0, 1384.0, 787.0, 496.0, 299.0, 169.0, 115.0, 60.0, 47.0, 43.0, 31.0, 15.0, 11.0, 5.0, 6.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.96875, -7.7291259765625, -7.489501953125, -7.2498779296875, -7.01025390625, -6.7706298828125, -6.531005859375, -6.2913818359375, -6.0517578125, -5.8121337890625, -5.572509765625, -5.3328857421875, -5.09326171875, -4.8536376953125, -4.614013671875, -4.3743896484375, -4.134765625, -3.8951416015625, -3.655517578125, -3.4158935546875, -3.17626953125, -2.9366455078125, -2.697021484375, -2.4573974609375, -2.2177734375, -1.9781494140625, -1.738525390625, -1.4989013671875, -1.25927734375, -1.0196533203125, -0.780029296875, -0.5404052734375, -0.30078125, -0.0611572265625, 0.178466796875, 0.4180908203125, 0.65771484375, 0.8973388671875, 1.136962890625, 1.3765869140625, 1.6162109375, 1.8558349609375, 2.095458984375, 2.3350830078125, 2.57470703125, 2.8143310546875, 3.053955078125, 3.2935791015625, 3.533203125, 3.7728271484375, 4.012451171875, 4.2520751953125, 4.49169921875, 4.7313232421875, 4.970947265625, 5.2105712890625, 5.4501953125, 5.6898193359375, 5.929443359375, 6.1690673828125, 6.40869140625, 6.6483154296875, 6.887939453125, 7.1275634765625, 7.3671875]}, "gradients/decoder.transformer.h.17.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 4.0, 1.0, 3.0, 5.0, 6.0, 9.0, 4.0, 9.0, 20.0, 16.0, 15.0, 25.0, 30.0, 42.0, 36.0, 34.0, 52.0, 55.0, 68.0, 76.0, 189.0, 1582.0, 222.0, 94.0, 76.0, 53.0, 56.0, 44.0, 38.0, 29.0, 34.0, 24.0, 26.0, 10.0, 15.0, 16.0, 13.0, 10.0, 8.0, 5.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-35.96875, -34.958740234375, -33.94873046875, -32.938720703125, -31.9287109375, -30.918701171875, -29.90869140625, -28.898681640625, -27.888671875, -26.878662109375, -25.86865234375, -24.858642578125, -23.8486328125, -22.838623046875, -21.82861328125, -20.818603515625, -19.80859375, -18.798583984375, -17.78857421875, -16.778564453125, -15.7685546875, -14.758544921875, -13.74853515625, -12.738525390625, -11.728515625, -10.718505859375, -9.70849609375, -8.698486328125, -7.6884765625, -6.678466796875, -5.66845703125, -4.658447265625, -3.6484375, -2.638427734375, -1.62841796875, -0.618408203125, 0.3916015625, 1.401611328125, 2.41162109375, 3.421630859375, 4.431640625, 5.441650390625, 6.45166015625, 7.461669921875, 8.4716796875, 9.481689453125, 10.49169921875, 11.501708984375, 12.51171875, 13.521728515625, 14.53173828125, 15.541748046875, 16.5517578125, 17.561767578125, 18.57177734375, 19.581787109375, 20.591796875, 21.601806640625, 22.61181640625, 23.621826171875, 24.6318359375, 25.641845703125, 26.65185546875, 27.661865234375, 28.671875]}, "gradients/decoder.transformer.h.17.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 5.0, 0.0, 2.0, 2.0, 14.0, 15.0, 12.0, 30.0, 18.0, 44.0, 49.0, 56.0, 104.0, 137.0, 222.0, 325.0, 884.0, 5865.0, 2809686.0, 323370.0, 3280.0, 682.0, 297.0, 176.0, 113.0, 94.0, 61.0, 45.0, 29.0, 26.0, 21.0, 14.0, 11.0, 4.0, 8.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-73.6875, -71.2216796875, -68.755859375, -66.2900390625, -63.82421875, -61.3583984375, -58.892578125, -56.4267578125, -53.9609375, -51.4951171875, -49.029296875, -46.5634765625, -44.09765625, -41.6318359375, -39.166015625, -36.7001953125, -34.234375, -31.7685546875, -29.302734375, -26.8369140625, -24.37109375, -21.9052734375, -19.439453125, -16.9736328125, -14.5078125, -12.0419921875, -9.576171875, -7.1103515625, -4.64453125, -2.1787109375, 0.287109375, 2.7529296875, 5.21875, 7.6845703125, 10.150390625, 12.6162109375, 15.08203125, 17.5478515625, 20.013671875, 22.4794921875, 24.9453125, 27.4111328125, 29.876953125, 32.3427734375, 34.80859375, 37.2744140625, 39.740234375, 42.2060546875, 44.671875, 47.1376953125, 49.603515625, 52.0693359375, 54.53515625, 57.0009765625, 59.466796875, 61.9326171875, 64.3984375, 66.8642578125, 69.330078125, 71.7958984375, 74.26171875, 76.7275390625, 79.193359375, 81.6591796875, 84.125]}, "gradients/decoder.transformer.h.17.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 9.0, 87.0, 459.0, 376.0, 79.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-220.84524536132812, -215.80874633789062, -210.77224731445312, -205.73574829101562, -200.69923400878906, -195.66273498535156, -190.62623596191406, -185.58973693847656, -180.55323791503906, -175.51673889160156, -170.48023986816406, -165.4437255859375, -160.4072265625, -155.3707275390625, -150.334228515625, -145.2977294921875, -140.26123046875, -135.2247314453125, -130.188232421875, -125.15172576904297, -120.11522674560547, -115.07872009277344, -110.04222106933594, -105.00572204589844, -99.96920776367188, -94.93270874023438, -89.89620208740234, -84.85970306396484, -79.82320404052734, -74.78669738769531, -69.75019836425781, -64.71369934082031, -59.67720031738281, -54.64069747924805, -49.60419845581055, -44.56769561767578, -39.53119659423828, -34.494693756103516, -29.45819091796875, -24.42169189453125, -19.385189056396484, -14.348688125610352, -9.312186241149902, -4.275684356689453, 0.7608165740966797, 5.7973175048828125, 10.833820343017578, 15.870319366455078, 20.906822204589844, 25.943323135375977, 30.97982406616211, 36.016326904296875, 41.052825927734375, 46.08932876586914, 51.125831604003906, 56.162330627441406, 61.19883346557617, 66.23533630371094, 71.27183532714844, 76.30833435058594, 81.34484100341797, 86.38134002685547, 91.4178466796875, 96.454345703125, 101.4908447265625]}, "gradients/decoder.transformer.h.17.ln_1.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 6.0, 8.0, 11.0, 11.0, 11.0, 16.0, 17.0, 24.0, 23.0, 28.0, 33.0, 31.0, 29.0, 30.0, 41.0, 43.0, 39.0, 39.0, 37.0, 45.0, 28.0, 44.0, 51.0, 22.0, 30.0, 37.0, 34.0, 29.0, 29.0, 24.0, 24.0, 19.0, 10.0, 12.0, 18.0, 12.0, 11.0, 9.0, 10.0, 8.0, 3.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-66.06924438476562, -63.86018753051758, -61.6511344909668, -59.44207763671875, -57.23302459716797, -55.02396774291992, -52.814910888671875, -50.605857849121094, -48.39680099487305, -46.187744140625, -43.97869110107422, -41.76963424682617, -39.560577392578125, -37.351524353027344, -35.1424674987793, -32.93341064453125, -30.72435760498047, -28.515302658081055, -26.30624771118164, -24.097190856933594, -21.88813591003418, -19.679080963134766, -17.47002410888672, -15.260969161987305, -13.05191421508789, -10.842859268188477, -8.633803367614746, -6.424747943878174, -4.215692520141602, -2.0066375732421875, 0.20241832733154297, 2.4114742279052734, 4.6205291748046875, 6.82958459854126, 9.038640022277832, 11.247695922851562, 13.456750869750977, 15.66580581665039, 17.874862670898438, 20.08391761779785, 22.292972564697266, 24.50202751159668, 26.711082458496094, 28.92013931274414, 31.129194259643555, 33.33824920654297, 35.547306060791016, 37.75636291503906, 39.965415954589844, 42.17447280883789, 44.38352584838867, 46.59258270263672, 48.8016357421875, 51.01069259643555, 53.219749450683594, 55.428802490234375, 57.63785934448242, 59.84691619873047, 62.05596923828125, 64.26502227783203, 66.47408294677734, 68.68313598632812, 70.8921890258789, 73.10124969482422, 75.310302734375]}, "gradients/decoder.transformer.h.16.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 4.0, 8.0, 5.0, 11.0, 12.0, 20.0, 17.0, 27.0, 17.0, 27.0, 33.0, 41.0, 39.0, 35.0, 46.0, 38.0, 51.0, 44.0, 52.0, 41.0, 36.0, 50.0, 39.0, 39.0, 45.0, 41.0, 33.0, 24.0, 25.0, 17.0, 23.0, 18.0, 10.0, 8.0, 9.0, 5.0, 4.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.5546875, -9.26904296875, -8.9833984375, -8.69775390625, -8.412109375, -8.12646484375, -7.8408203125, -7.55517578125, -7.26953125, -6.98388671875, -6.6982421875, -6.41259765625, -6.126953125, -5.84130859375, -5.5556640625, -5.27001953125, -4.984375, -4.69873046875, -4.4130859375, -4.12744140625, -3.841796875, -3.55615234375, -3.2705078125, -2.98486328125, -2.69921875, -2.41357421875, -2.1279296875, -1.84228515625, -1.556640625, -1.27099609375, -0.9853515625, -0.69970703125, -0.4140625, -0.12841796875, 0.1572265625, 0.44287109375, 0.728515625, 1.01416015625, 1.2998046875, 1.58544921875, 1.87109375, 2.15673828125, 2.4423828125, 2.72802734375, 3.013671875, 3.29931640625, 3.5849609375, 3.87060546875, 4.15625, 4.44189453125, 4.7275390625, 5.01318359375, 5.298828125, 5.58447265625, 5.8701171875, 6.15576171875, 6.44140625, 6.72705078125, 7.0126953125, 7.29833984375, 7.583984375, 7.86962890625, 8.1552734375, 8.44091796875, 8.7265625]}, "gradients/decoder.transformer.h.16.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 3.0, 1.0, 7.0, 9.0, 8.0, 9.0, 6.0, 16.0, 20.0, 19.0, 31.0, 32.0, 46.0, 46.0, 61.0, 68.0, 87.0, 173.0, 452.0, 2323.0, 23269.0, 772379.0, 3275575.0, 110864.0, 6989.0, 993.0, 256.0, 121.0, 77.0, 59.0, 46.0, 51.0, 48.0, 32.0, 22.0, 19.0, 14.0, 13.0, 11.0, 7.0, 7.0, 7.0, 8.0, 0.0, 1.0, 2.0, 1.0, 3.0, 0.0, 0.0, 2.0], "bins": [-42.625, -41.416015625, -40.20703125, -38.998046875, -37.7890625, -36.580078125, -35.37109375, -34.162109375, -32.953125, -31.744140625, -30.53515625, -29.326171875, -28.1171875, -26.908203125, -25.69921875, -24.490234375, -23.28125, -22.072265625, -20.86328125, -19.654296875, -18.4453125, -17.236328125, -16.02734375, -14.818359375, -13.609375, -12.400390625, -11.19140625, -9.982421875, -8.7734375, -7.564453125, -6.35546875, -5.146484375, -3.9375, -2.728515625, -1.51953125, -0.310546875, 0.8984375, 2.107421875, 3.31640625, 4.525390625, 5.734375, 6.943359375, 8.15234375, 9.361328125, 10.5703125, 11.779296875, 12.98828125, 14.197265625, 15.40625, 16.615234375, 17.82421875, 19.033203125, 20.2421875, 21.451171875, 22.66015625, 23.869140625, 25.078125, 26.287109375, 27.49609375, 28.705078125, 29.9140625, 31.123046875, 32.33203125, 33.541015625, 34.75]}, "gradients/decoder.transformer.h.16.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 2.0, 4.0, 9.0, 8.0, 13.0, 25.0, 33.0, 43.0, 69.0, 88.0, 121.0, 185.0, 280.0, 321.0, 500.0, 558.0, 512.0, 379.0, 253.0, 207.0, 128.0, 115.0, 58.0, 56.0, 39.0, 20.0, 19.0, 9.0, 9.0, 5.0, 3.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.3125, -25.552734375, -24.79296875, -24.033203125, -23.2734375, -22.513671875, -21.75390625, -20.994140625, -20.234375, -19.474609375, -18.71484375, -17.955078125, -17.1953125, -16.435546875, -15.67578125, -14.916015625, -14.15625, -13.396484375, -12.63671875, -11.876953125, -11.1171875, -10.357421875, -9.59765625, -8.837890625, -8.078125, -7.318359375, -6.55859375, -5.798828125, -5.0390625, -4.279296875, -3.51953125, -2.759765625, -2.0, -1.240234375, -0.48046875, 0.279296875, 1.0390625, 1.798828125, 2.55859375, 3.318359375, 4.078125, 4.837890625, 5.59765625, 6.357421875, 7.1171875, 7.876953125, 8.63671875, 9.396484375, 10.15625, 10.916015625, 11.67578125, 12.435546875, 13.1953125, 13.955078125, 14.71484375, 15.474609375, 16.234375, 16.994140625, 17.75390625, 18.513671875, 19.2734375, 20.033203125, 20.79296875, 21.552734375, 22.3125]}, "gradients/decoder.transformer.h.16.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 8.0, 5.0, 10.0, 20.0, 22.0, 29.0, 34.0, 39.0, 74.0, 90.0, 104.0, 150.0, 259.0, 457.0, 1075.0, 4572.0, 96603.0, 3668524.0, 408865.0, 10260.0, 1531.0, 535.0, 294.0, 197.0, 139.0, 93.0, 82.0, 72.0, 42.0, 20.0, 20.0, 11.0, 16.0, 7.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-62.65625, -60.54443359375, -58.4326171875, -56.32080078125, -54.208984375, -52.09716796875, -49.9853515625, -47.87353515625, -45.76171875, -43.64990234375, -41.5380859375, -39.42626953125, -37.314453125, -35.20263671875, -33.0908203125, -30.97900390625, -28.8671875, -26.75537109375, -24.6435546875, -22.53173828125, -20.419921875, -18.30810546875, -16.1962890625, -14.08447265625, -11.97265625, -9.86083984375, -7.7490234375, -5.63720703125, -3.525390625, -1.41357421875, 0.6982421875, 2.81005859375, 4.921875, 7.03369140625, 9.1455078125, 11.25732421875, 13.369140625, 15.48095703125, 17.5927734375, 19.70458984375, 21.81640625, 23.92822265625, 26.0400390625, 28.15185546875, 30.263671875, 32.37548828125, 34.4873046875, 36.59912109375, 38.7109375, 40.82275390625, 42.9345703125, 45.04638671875, 47.158203125, 49.27001953125, 51.3818359375, 53.49365234375, 55.60546875, 57.71728515625, 59.8291015625, 61.94091796875, 64.052734375, 66.16455078125, 68.2763671875, 70.38818359375, 72.5]}, "gradients/decoder.transformer.h.16.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 8.0, 25.0, 70.0, 183.0, 291.0, 232.0, 126.0, 55.0, 16.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-66.56511688232422, -59.006038665771484, -51.44696044921875, -43.88787841796875, -36.32880401611328, -28.76972198486328, -21.210643768310547, -13.651565551757812, -6.092487335205078, 1.4665913581848145, 9.025670051574707, 16.584749221801758, 24.143827438354492, 31.70290756225586, 39.261985778808594, 46.82106399536133, 54.38014221191406, 61.9392204284668, 69.49829864501953, 77.05738067626953, 84.616455078125, 92.175537109375, 99.734619140625, 107.29369354248047, 114.85276794433594, 122.41184997558594, 129.97093200683594, 137.52999877929688, 145.08908081054688, 152.64816284179688, 160.20724487304688, 167.76632690429688, 175.3253936767578, 182.8844757080078, 190.4435577392578, 198.00262451171875, 205.56170654296875, 213.12078857421875, 220.67987060546875, 228.23895263671875, 235.7980194091797, 243.3571014404297, 250.9161834716797, 258.4752502441406, 266.0343322753906, 273.5934143066406, 281.1524963378906, 288.7115783691406, 296.2706604003906, 303.8297424316406, 311.3888244628906, 318.9479064941406, 326.5069885253906, 334.0660400390625, 341.6251220703125, 349.1842041015625, 356.7432861328125, 364.3023681640625, 371.8614501953125, 379.4205322265625, 386.9796142578125, 394.5386962890625, 402.0977478027344, 409.6568298339844, 417.2159118652344]}, "gradients/decoder.transformer.h.16.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 3.0, 6.0, 2.0, 8.0, 7.0, 9.0, 12.0, 20.0, 16.0, 22.0, 20.0, 19.0, 26.0, 31.0, 37.0, 33.0, 32.0, 31.0, 31.0, 34.0, 37.0, 34.0, 29.0, 39.0, 32.0, 31.0, 35.0, 31.0, 29.0, 39.0, 44.0, 20.0, 31.0, 20.0, 24.0, 16.0, 18.0, 14.0, 14.0, 11.0, 14.0, 9.0, 9.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 2.0, 0.0, 1.0], "bins": [-63.25408935546875, -61.28107452392578, -59.30805587768555, -57.33504104614258, -55.36202621459961, -53.389007568359375, -51.415992736816406, -49.44297790527344, -47.4699592590332, -45.496944427490234, -43.52392578125, -41.55091094970703, -39.57789611816406, -37.60487747192383, -35.63186264038086, -33.658843994140625, -31.68583106994629, -29.712814331054688, -27.73979949951172, -25.766782760620117, -23.793766021728516, -21.820751190185547, -19.847734451293945, -17.874717712402344, -15.901701927185059, -13.928686141967773, -11.955669403076172, -9.982653617858887, -8.009637832641602, -6.03662109375, -4.063605308532715, -2.0905885696411133, -0.11757278442382812, 1.8554433584213257, 3.8284595012664795, 5.801475524902344, 7.774491786956787, 9.74750804901123, 11.720523834228516, 13.693540573120117, 15.666556358337402, 17.639572143554688, 19.61258888244629, 21.58560562133789, 23.55862045288086, 25.53163719177246, 27.504653930664062, 29.47766876220703, 31.450685501098633, 33.423702239990234, 35.3967170715332, 37.36973571777344, 39.342750549316406, 41.315765380859375, 43.288780212402344, 45.26179885864258, 47.23481369018555, 49.207828521728516, 51.18084716796875, 53.15386199951172, 55.12687683105469, 57.09989547729492, 59.07291030883789, 61.045928955078125, 63.018943786621094]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 8.0, 12.0, 11.0, 17.0, 13.0, 18.0, 20.0, 28.0, 33.0, 29.0, 37.0, 36.0, 39.0, 47.0, 38.0, 56.0, 44.0, 43.0, 44.0, 44.0, 41.0, 46.0, 38.0, 34.0, 29.0, 33.0, 38.0, 16.0, 26.0, 13.0, 13.0, 12.0, 15.0, 1.0, 12.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.578125, -10.29266357421875, -10.0072021484375, -9.72174072265625, -9.436279296875, -9.15081787109375, -8.8653564453125, -8.57989501953125, -8.29443359375, -8.00897216796875, -7.7235107421875, -7.43804931640625, -7.152587890625, -6.86712646484375, -6.5816650390625, -6.29620361328125, -6.0107421875, -5.72528076171875, -5.4398193359375, -5.15435791015625, -4.868896484375, -4.58343505859375, -4.2979736328125, -4.01251220703125, -3.72705078125, -3.44158935546875, -3.1561279296875, -2.87066650390625, -2.585205078125, -2.29974365234375, -2.0142822265625, -1.72882080078125, -1.443359375, -1.15789794921875, -0.8724365234375, -0.58697509765625, -0.301513671875, -0.01605224609375, 0.2694091796875, 0.55487060546875, 0.84033203125, 1.12579345703125, 1.4112548828125, 1.69671630859375, 1.982177734375, 2.26763916015625, 2.5531005859375, 2.83856201171875, 3.1240234375, 3.40948486328125, 3.6949462890625, 3.98040771484375, 4.265869140625, 4.55133056640625, 4.8367919921875, 5.12225341796875, 5.40771484375, 5.69317626953125, 5.9786376953125, 6.26409912109375, 6.549560546875, 6.83502197265625, 7.1204833984375, 7.40594482421875, 7.69140625]}, "gradients/decoder.transformer.h.16.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 6.0, 4.0, 6.0, 19.0, 18.0, 29.0, 45.0, 68.0, 84.0, 119.0, 162.0, 249.0, 379.0, 541.0, 773.0, 1007.0, 1407.0, 2083.0, 2961.0, 4174.0, 5983.0, 8947.0, 12906.0, 19205.0, 28821.0, 43712.0, 67340.0, 100891.0, 142180.0, 165626.0, 141544.0, 99622.0, 65642.0, 43179.0, 28329.0, 18868.0, 12960.0, 8741.0, 5959.0, 4125.0, 2930.0, 2071.0, 1428.0, 988.0, 703.0, 523.0, 378.0, 272.0, 179.0, 127.0, 88.0, 48.0, 37.0, 36.0, 17.0, 23.0, 8.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.72314453125, -0.7008819580078125, -0.678619384765625, -0.6563568115234375, -0.63409423828125, -0.6118316650390625, -0.589569091796875, -0.5673065185546875, -0.5450439453125, -0.5227813720703125, -0.500518798828125, -0.4782562255859375, -0.45599365234375, -0.4337310791015625, -0.411468505859375, -0.3892059326171875, -0.366943359375, -0.3446807861328125, -0.322418212890625, -0.3001556396484375, -0.27789306640625, -0.2556304931640625, -0.233367919921875, -0.2111053466796875, -0.1888427734375, -0.1665802001953125, -0.144317626953125, -0.1220550537109375, -0.09979248046875, -0.0775299072265625, -0.055267333984375, -0.0330047607421875, -0.0107421875, 0.0115203857421875, 0.033782958984375, 0.0560455322265625, 0.07830810546875, 0.1005706787109375, 0.122833251953125, 0.1450958251953125, 0.1673583984375, 0.1896209716796875, 0.211883544921875, 0.2341461181640625, 0.25640869140625, 0.2786712646484375, 0.300933837890625, 0.3231964111328125, 0.345458984375, 0.3677215576171875, 0.389984130859375, 0.4122467041015625, 0.43450927734375, 0.4567718505859375, 0.479034423828125, 0.5012969970703125, 0.5235595703125, 0.5458221435546875, 0.568084716796875, 0.5903472900390625, 0.61260986328125, 0.6348724365234375, 0.657135009765625, 0.6793975830078125, 0.70166015625]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 4.0, 5.0, 4.0, 4.0, 7.0, 9.0, 6.0, 4.0, 3.0, 14.0, 14.0, 16.0, 10.0, 15.0, 23.0, 26.0, 28.0, 42.0, 38.0, 37.0, 46.0, 37.0, 25.0, 32.0, 45.0, 1059.0, 43.0, 38.0, 49.0, 28.0, 40.0, 38.0, 24.0, 24.0, 23.0, 42.0, 26.0, 17.0, 18.0, 14.0, 10.0, 14.0, 13.0, 11.0, 8.0, 3.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.19140625, -5.02154541015625, -4.8516845703125, -4.68182373046875, -4.511962890625, -4.34210205078125, -4.1722412109375, -4.00238037109375, -3.83251953125, -3.66265869140625, -3.4927978515625, -3.32293701171875, -3.153076171875, -2.98321533203125, -2.8133544921875, -2.64349365234375, -2.4736328125, -2.30377197265625, -2.1339111328125, -1.96405029296875, -1.794189453125, -1.62432861328125, -1.4544677734375, -1.28460693359375, -1.11474609375, -0.94488525390625, -0.7750244140625, -0.60516357421875, -0.435302734375, -0.26544189453125, -0.0955810546875, 0.07427978515625, 0.244140625, 0.41400146484375, 0.5838623046875, 0.75372314453125, 0.923583984375, 1.09344482421875, 1.2633056640625, 1.43316650390625, 1.60302734375, 1.77288818359375, 1.9427490234375, 2.11260986328125, 2.282470703125, 2.45233154296875, 2.6221923828125, 2.79205322265625, 2.9619140625, 3.13177490234375, 3.3016357421875, 3.47149658203125, 3.641357421875, 3.81121826171875, 3.9810791015625, 4.15093994140625, 4.32080078125, 4.49066162109375, 4.6605224609375, 4.83038330078125, 5.000244140625, 5.17010498046875, 5.3399658203125, 5.50982666015625, 5.6796875]}, "gradients/decoder.transformer.h.16.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 4.0, 4.0, 13.0, 21.0, 19.0, 42.0, 73.0, 86.0, 139.0, 195.0, 293.0, 422.0, 629.0, 930.0, 1396.0, 2038.0, 3047.0, 4692.0, 7108.0, 10791.0, 17192.0, 25741.0, 39999.0, 62246.0, 94193.0, 134769.0, 1205681.0, 156573.0, 113055.0, 75194.0, 49072.0, 31893.0, 20788.0, 13376.0, 8588.0, 5629.0, 3703.0, 2504.0, 1655.0, 1124.0, 748.0, 469.0, 327.0, 201.0, 144.0, 105.0, 75.0, 46.0, 32.0, 24.0, 20.0, 9.0, 7.0, 6.0, 6.0, 1.0, 0.0, 2.0], "bins": [-0.57568359375, -0.5580978393554688, -0.5405120849609375, -0.5229263305664062, -0.505340576171875, -0.48775482177734375, -0.4701690673828125, -0.45258331298828125, -0.43499755859375, -0.41741180419921875, -0.3998260498046875, -0.38224029541015625, -0.364654541015625, -0.34706878662109375, -0.3294830322265625, -0.31189727783203125, -0.2943115234375, -0.27672576904296875, -0.2591400146484375, -0.24155426025390625, -0.223968505859375, -0.20638275146484375, -0.1887969970703125, -0.17121124267578125, -0.15362548828125, -0.13603973388671875, -0.1184539794921875, -0.10086822509765625, -0.083282470703125, -0.06569671630859375, -0.0481109619140625, -0.03052520751953125, -0.012939453125, 0.00464630126953125, 0.0222320556640625, 0.03981781005859375, 0.057403564453125, 0.07498931884765625, 0.0925750732421875, 0.11016082763671875, 0.12774658203125, 0.14533233642578125, 0.1629180908203125, 0.18050384521484375, 0.198089599609375, 0.21567535400390625, 0.2332611083984375, 0.25084686279296875, 0.2684326171875, 0.28601837158203125, 0.3036041259765625, 0.32118988037109375, 0.338775634765625, 0.35636138916015625, 0.3739471435546875, 0.39153289794921875, 0.40911865234375, 0.42670440673828125, 0.4442901611328125, 0.46187591552734375, 0.479461669921875, 0.49704742431640625, 0.5146331787109375, 0.5322189331054688, 0.5498046875]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 4.0, 5.0, 8.0, 3.0, 3.0, 4.0, 4.0, 10.0, 13.0, 27.0, 30.0, 32.0, 45.0, 35.0, 53.0, 52.0, 70.0, 79.0, 67.0, 82.0, 76.0, 57.0, 46.0, 45.0, 28.0, 22.0, 24.0, 14.0, 12.0, 12.0, 10.0, 9.0, 1.0, 4.0, 6.0, 3.0, 3.0, 4.0, 0.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0], "bins": [-0.0088958740234375, -0.008635938167572021, -0.008376002311706543, -0.008116066455841064, -0.007856130599975586, -0.007596194744110107, -0.007336258888244629, -0.00707632303237915, -0.006816387176513672, -0.006556451320648193, -0.006296515464782715, -0.006036579608917236, -0.005776643753051758, -0.005516707897186279, -0.005256772041320801, -0.004996836185455322, -0.004736900329589844, -0.004476964473724365, -0.004217028617858887, -0.003957092761993408, -0.0036971569061279297, -0.003437221050262451, -0.0031772851943969727, -0.002917349338531494, -0.0026574134826660156, -0.002397477626800537, -0.0021375417709350586, -0.00187760591506958, -0.0016176700592041016, -0.001357734203338623, -0.0010977983474731445, -0.000837862491607666, -0.0005779266357421875, -0.000317990779876709, -5.805492401123047e-05, 0.00020188093185424805, 0.00046181678771972656, 0.0007217526435852051, 0.0009816884994506836, 0.0012416243553161621, 0.0015015602111816406, 0.0017614960670471191, 0.0020214319229125977, 0.002281367778778076, 0.0025413036346435547, 0.002801239490509033, 0.0030611753463745117, 0.0033211112022399902, 0.0035810470581054688, 0.0038409829139709473, 0.004100918769836426, 0.004360854625701904, 0.004620790481567383, 0.004880726337432861, 0.00514066219329834, 0.005400598049163818, 0.005660533905029297, 0.005920469760894775, 0.006180405616760254, 0.006440341472625732, 0.006700277328491211, 0.0069602131843566895, 0.007220149040222168, 0.0074800848960876465, 0.007740020751953125]}, "gradients/decoder.transformer.h.16.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 1.0, 10.0, 5.0, 2.0, 7.0, 13.0, 14.0, 20.0, 27.0, 18.0, 47.0, 62.0, 101.0, 182.0, 335.0, 1319.0, 717410.0, 327098.0, 1054.0, 344.0, 153.0, 104.0, 51.0, 46.0, 38.0, 25.0, 18.0, 11.0, 6.0, 6.0, 1.0, 3.0, 7.0, 5.0, 1.0, 5.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.17333984375, -0.16735267639160156, -0.16136550903320312, -0.1553783416748047, -0.14939117431640625, -0.1434040069580078, -0.13741683959960938, -0.13142967224121094, -0.1254425048828125, -0.11945533752441406, -0.11346817016601562, -0.10748100280761719, -0.10149383544921875, -0.09550666809082031, -0.08951950073242188, -0.08353233337402344, -0.077545166015625, -0.07155799865722656, -0.06557083129882812, -0.05958366394042969, -0.05359649658203125, -0.04760932922363281, -0.041622161865234375, -0.03563499450683594, -0.0296478271484375, -0.023660659790039062, -0.017673492431640625, -0.011686325073242188, -0.00569915771484375, 0.0002880096435546875, 0.006275177001953125, 0.012262344360351562, 0.01824951171875, 0.024236679077148438, 0.030223846435546875, 0.03621101379394531, 0.04219818115234375, 0.04818534851074219, 0.054172515869140625, 0.06015968322753906, 0.0661468505859375, 0.07213401794433594, 0.07812118530273438, 0.08410835266113281, 0.09009552001953125, 0.09608268737792969, 0.10206985473632812, 0.10805702209472656, 0.114044189453125, 0.12003135681152344, 0.12601852416992188, 0.1320056915283203, 0.13799285888671875, 0.1439800262451172, 0.14996719360351562, 0.15595436096191406, 0.1619415283203125, 0.16792869567871094, 0.17391586303710938, 0.1799030303955078, 0.18589019775390625, 0.1918773651123047, 0.19786453247070312, 0.20385169982910156, 0.2098388671875]}, "gradients/decoder.transformer.h.16.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 5.0, 176.0, 801.0, 32.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004977295640856028, -0.0034739633556455374, -0.001970631070435047, -0.0004672990180552006, 0.0010360334999859333, 0.002539366018027067, 0.0040426976047456264, 0.00554603012278676, 0.007049362640827894, 0.00855269469320774, 0.010056027211248875, 0.011559359729290009, 0.013062691316008568, 0.014566024765372276, 0.016069356352090836, 0.017572687938809395, 0.019076021388173103, 0.020579352974891663, 0.02208268642425537, 0.02358601801097393, 0.02508934959769249, 0.026592683047056198, 0.028096014633774757, 0.029599346220493317, 0.031102679669857025, 0.032606013119220734, 0.034109342843294144, 0.03561267629265785, 0.03711600974202156, 0.03861933946609497, 0.04012267291545868, 0.04162600636482239, 0.043129339814186096, 0.044632673263549805, 0.046136002987623215, 0.04763933643698692, 0.04914266988635063, 0.05064599961042404, 0.05214933305978775, 0.05365266650915146, 0.05515599995851517, 0.056659333407878876, 0.058162663131952286, 0.059665996581315994, 0.0611693300306797, 0.06267265975475311, 0.06417599320411682, 0.06567932665348053, 0.06718266010284424, 0.06868599355220795, 0.07018932700157166, 0.07169266045093536, 0.07319598644971848, 0.07469931989908218, 0.07620265334844589, 0.0777059867978096, 0.07920931279659271, 0.08071264624595642, 0.08221597969532013, 0.08371931314468384, 0.08522263914346695, 0.08672597259283066, 0.08822930604219437, 0.08973263949155807, 0.09123597294092178]}, "gradients/decoder.transformer.h.16.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 1.0, 7.0, 3.0, 6.0, 8.0, 12.0, 10.0, 14.0, 12.0, 16.0, 28.0, 29.0, 22.0, 26.0, 32.0, 24.0, 45.0, 40.0, 24.0, 42.0, 49.0, 60.0, 34.0, 39.0, 41.0, 36.0, 49.0, 41.0, 43.0, 35.0, 34.0, 25.0, 25.0, 20.0, 13.0, 17.0, 13.0, 8.0, 9.0, 3.0, 6.0, 3.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.004888296127319336, -0.004735466092824936, -0.004582636058330536, -0.004429806023836136, -0.004276975989341736, -0.004124145954847336, -0.003971315920352936, -0.0038184858858585358, -0.0036656558513641357, -0.0035128258168697357, -0.0033599957823753357, -0.0032071657478809357, -0.0030543357133865356, -0.0029015056788921356, -0.0027486756443977356, -0.0025958456099033356, -0.0024430155754089355, -0.0022901855409145355, -0.0021373555064201355, -0.0019845254719257355, -0.0018316954374313354, -0.0016788654029369354, -0.0015260353684425354, -0.0013732053339481354, -0.0012203752994537354, -0.0010675452649593353, -0.0009147152304649353, -0.0007618851959705353, -0.0006090551614761353, -0.00045622512698173523, -0.0003033950924873352, -0.00015056505799293518, 2.2649765014648438e-06, 0.00015509501099586487, 0.0003079250454902649, 0.0004607550799846649, 0.0006135851144790649, 0.000766415148973465, 0.000919245183467865, 0.001072075217962265, 0.001224905252456665, 0.001377735286951065, 0.001530565321445465, 0.0016833953559398651, 0.0018362253904342651, 0.001989055424928665, 0.002141885459423065, 0.002294715493917465, 0.0024475455284118652, 0.0026003755629062653, 0.0027532055974006653, 0.0029060356318950653, 0.0030588656663894653, 0.0032116957008838654, 0.0033645257353782654, 0.0035173557698726654, 0.0036701858043670654, 0.0038230158388614655, 0.0039758458733558655, 0.0041286759078502655, 0.0042815059423446655, 0.0044343359768390656, 0.004587166011333466, 0.004739996045827866, 0.004892826080322266]}, "gradients/decoder.transformer.h.16.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 3.0, 6.0, 4.0, 8.0, 12.0, 11.0, 17.0, 13.0, 18.0, 20.0, 28.0, 33.0, 29.0, 37.0, 36.0, 39.0, 47.0, 39.0, 55.0, 44.0, 43.0, 44.0, 44.0, 41.0, 46.0, 39.0, 33.0, 29.0, 33.0, 38.0, 17.0, 25.0, 13.0, 13.0, 12.0, 15.0, 1.0, 12.0, 1.0, 4.0, 1.0, 2.0, 2.0, 0.0, 2.0, 1.0, 2.0], "bins": [-10.578125, -10.2926025390625, -10.007080078125, -9.7215576171875, -9.43603515625, -9.1505126953125, -8.864990234375, -8.5794677734375, -8.2939453125, -8.0084228515625, -7.722900390625, -7.4373779296875, -7.15185546875, -6.8663330078125, -6.580810546875, -6.2952880859375, -6.009765625, -5.7242431640625, -5.438720703125, -5.1531982421875, -4.86767578125, -4.5821533203125, -4.296630859375, -4.0111083984375, -3.7255859375, -3.4400634765625, -3.154541015625, -2.8690185546875, -2.58349609375, -2.2979736328125, -2.012451171875, -1.7269287109375, -1.44140625, -1.1558837890625, -0.870361328125, -0.5848388671875, -0.29931640625, -0.0137939453125, 0.271728515625, 0.5572509765625, 0.8427734375, 1.1282958984375, 1.413818359375, 1.6993408203125, 1.98486328125, 2.2703857421875, 2.555908203125, 2.8414306640625, 3.126953125, 3.4124755859375, 3.697998046875, 3.9835205078125, 4.26904296875, 4.5545654296875, 4.840087890625, 5.1256103515625, 5.4111328125, 5.6966552734375, 5.982177734375, 6.2677001953125, 6.55322265625, 6.8387451171875, 7.124267578125, 7.4097900390625, 7.6953125]}, "gradients/decoder.transformer.h.16.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 1.0, 6.0, 4.0, 6.0, 14.0, 19.0, 36.0, 46.0, 65.0, 89.0, 152.0, 218.0, 319.0, 455.0, 756.0, 1077.0, 1767.0, 2769.0, 4494.0, 7299.0, 12175.0, 21927.0, 42083.0, 95232.0, 317072.0, 340171.0, 101357.0, 43605.0, 22724.0, 12669.0, 7383.0, 4590.0, 2877.0, 1750.0, 1138.0, 735.0, 505.0, 292.0, 236.0, 174.0, 91.0, 67.0, 42.0, 31.0, 22.0, 15.0, 9.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.20703125, -5.02764892578125, -4.8482666015625, -4.66888427734375, -4.489501953125, -4.31011962890625, -4.1307373046875, -3.95135498046875, -3.77197265625, -3.59259033203125, -3.4132080078125, -3.23382568359375, -3.054443359375, -2.87506103515625, -2.6956787109375, -2.51629638671875, -2.3369140625, -2.15753173828125, -1.9781494140625, -1.79876708984375, -1.619384765625, -1.44000244140625, -1.2606201171875, -1.08123779296875, -0.90185546875, -0.72247314453125, -0.5430908203125, -0.36370849609375, -0.184326171875, -0.00494384765625, 0.1744384765625, 0.35382080078125, 0.533203125, 0.71258544921875, 0.8919677734375, 1.07135009765625, 1.250732421875, 1.43011474609375, 1.6094970703125, 1.78887939453125, 1.96826171875, 2.14764404296875, 2.3270263671875, 2.50640869140625, 2.685791015625, 2.86517333984375, 3.0445556640625, 3.22393798828125, 3.4033203125, 3.58270263671875, 3.7620849609375, 3.94146728515625, 4.120849609375, 4.30023193359375, 4.4796142578125, 4.65899658203125, 4.83837890625, 5.01776123046875, 5.1971435546875, 5.37652587890625, 5.555908203125, 5.73529052734375, 5.9146728515625, 6.09405517578125, 6.2734375]}, "gradients/decoder.transformer.h.16.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 4.0, 0.0, 6.0, 3.0, 5.0, 5.0, 7.0, 6.0, 7.0, 10.0, 16.0, 10.0, 27.0, 31.0, 32.0, 37.0, 31.0, 46.0, 48.0, 58.0, 61.0, 83.0, 344.0, 1612.0, 111.0, 56.0, 70.0, 43.0, 39.0, 43.0, 34.0, 31.0, 21.0, 27.0, 20.0, 11.0, 17.0, 9.0, 13.0, 7.0, 6.0, 5.0, 4.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-29.546875, -28.455810546875, -27.36474609375, -26.273681640625, -25.1826171875, -24.091552734375, -23.00048828125, -21.909423828125, -20.818359375, -19.727294921875, -18.63623046875, -17.545166015625, -16.4541015625, -15.363037109375, -14.27197265625, -13.180908203125, -12.08984375, -10.998779296875, -9.90771484375, -8.816650390625, -7.7255859375, -6.634521484375, -5.54345703125, -4.452392578125, -3.361328125, -2.270263671875, -1.17919921875, -0.088134765625, 1.0029296875, 2.093994140625, 3.18505859375, 4.276123046875, 5.3671875, 6.458251953125, 7.54931640625, 8.640380859375, 9.7314453125, 10.822509765625, 11.91357421875, 13.004638671875, 14.095703125, 15.186767578125, 16.27783203125, 17.368896484375, 18.4599609375, 19.551025390625, 20.64208984375, 21.733154296875, 22.82421875, 23.915283203125, 25.00634765625, 26.097412109375, 27.1884765625, 28.279541015625, 29.37060546875, 30.461669921875, 31.552734375, 32.643798828125, 33.73486328125, 34.825927734375, 35.9169921875, 37.008056640625, 38.09912109375, 39.190185546875, 40.28125]}, "gradients/decoder.transformer.h.16.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 6.0, 18.0, 18.0, 33.0, 36.0, 60.0, 78.0, 139.0, 233.0, 482.0, 1903.0, 1044489.0, 2095138.0, 1911.0, 492.0, 228.0, 156.0, 91.0, 47.0, 45.0, 29.0, 22.0, 15.0, 6.0, 6.0, 1.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.125, -90.640625, -87.15625, -83.671875, -80.1875, -76.703125, -73.21875, -69.734375, -66.25, -62.765625, -59.28125, -55.796875, -52.3125, -48.828125, -45.34375, -41.859375, -38.375, -34.890625, -31.40625, -27.921875, -24.4375, -20.953125, -17.46875, -13.984375, -10.5, -7.015625, -3.53125, -0.046875, 3.4375, 6.921875, 10.40625, 13.890625, 17.375, 20.859375, 24.34375, 27.828125, 31.3125, 34.796875, 38.28125, 41.765625, 45.25, 48.734375, 52.21875, 55.703125, 59.1875, 62.671875, 66.15625, 69.640625, 73.125, 76.609375, 80.09375, 83.578125, 87.0625, 90.546875, 94.03125, 97.515625, 101.0, 104.484375, 107.96875, 111.453125, 114.9375, 118.421875, 121.90625, 125.390625, 128.875]}, "gradients/decoder.transformer.h.16.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 6.0, 966.0, 47.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.23606491088867, -44.301368713378906, -27.366668701171875, -10.43197250366211, 6.502727508544922, 23.437427520751953, 40.37211990356445, 57.306819915771484, 74.24151611328125, 91.17621612548828, 108.11091613769531, 125.04560852050781, 141.98031616210938, 158.91500854492188, 175.84970092773438, 192.78439331054688, 209.71910095214844, 226.65379333496094, 243.5885009765625, 260.523193359375, 277.4578857421875, 294.392578125, 311.3272705078125, 328.2619934082031, 345.1966857910156, 362.1313781738281, 379.0660705566406, 396.00079345703125, 412.93548583984375, 429.87017822265625, 446.80487060546875, 463.73956298828125, 480.67431640625, 497.6090087890625, 514.543701171875, 531.4783935546875, 548.4130859375, 565.3477783203125, 582.282470703125, 599.2172241210938, 616.1519165039062, 633.0866088867188, 650.0213012695312, 666.9559936523438, 683.8906860351562, 700.825439453125, 717.7601318359375, 734.69482421875, 751.6295166015625, 768.564208984375, 785.4989013671875, 802.43359375, 819.3682861328125, 836.302978515625, 853.2376708984375, 870.1724243164062, 887.1070556640625, 904.041748046875, 920.9764404296875, 937.9111328125, 954.8458251953125, 971.780517578125, 988.7152099609375, 1005.6499633789062, 1022.5846557617188]}, "gradients/decoder.transformer.h.16.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 2.0, 4.0, 5.0, 8.0, 8.0, 7.0, 7.0, 13.0, 13.0, 15.0, 22.0, 26.0, 29.0, 31.0, 28.0, 33.0, 19.0, 43.0, 45.0, 39.0, 43.0, 44.0, 39.0, 44.0, 39.0, 51.0, 40.0, 40.0, 37.0, 20.0, 26.0, 32.0, 21.0, 23.0, 15.0, 16.0, 21.0, 14.0, 8.0, 9.0, 2.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-96.8150863647461, -93.96878051757812, -91.12248229980469, -88.27617645263672, -85.42987823486328, -82.58357238769531, -79.73727416992188, -76.8909683227539, -74.04466247558594, -71.19835662841797, -68.35205841064453, -65.50575256347656, -62.659454345703125, -59.813148498535156, -56.96684646606445, -54.12054443359375, -51.27424621582031, -48.42794418334961, -45.581642150878906, -42.73533630371094, -39.8890380859375, -37.04273223876953, -34.19643020629883, -31.350128173828125, -28.503826141357422, -25.65752410888672, -22.811222076416016, -19.96491813659668, -17.118616104125977, -14.272314071655273, -11.426010131835938, -8.579708099365234, -5.7333984375, -2.8870959281921387, -0.040793418884277344, 2.805509567260742, 5.651811599731445, 8.498113632202148, 11.344417572021484, 14.190719604492188, 17.03702163696289, 19.883323669433594, 22.729625701904297, 25.575929641723633, 28.422231674194336, 31.26853370666504, 34.114837646484375, 36.96113967895508, 39.80744171142578, 42.653743743896484, 45.50004577636719, 48.346351623535156, 51.192649841308594, 54.03895568847656, 56.885257720947266, 59.73155975341797, 62.57786178588867, 65.42416381835938, 68.27046966552734, 71.11676788330078, 73.96307373046875, 76.80937194824219, 79.65567779541016, 82.50198364257812, 85.34828186035156]}, "gradients/decoder.transformer.h.15.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 3.0, 8.0, 6.0, 7.0, 11.0, 11.0, 18.0, 14.0, 22.0, 17.0, 27.0, 38.0, 31.0, 34.0, 32.0, 42.0, 47.0, 45.0, 50.0, 36.0, 44.0, 51.0, 48.0, 40.0, 47.0, 30.0, 36.0, 31.0, 32.0, 27.0, 23.0, 23.0, 15.0, 12.0, 11.0, 13.0, 3.0, 12.0, 4.0, 1.0, 2.0, 2.0, 0.0, 3.0, 2.0, 1.0, 1.0], "bins": [-11.0, -10.7020263671875, -10.404052734375, -10.1060791015625, -9.80810546875, -9.5101318359375, -9.212158203125, -8.9141845703125, -8.6162109375, -8.3182373046875, -8.020263671875, -7.7222900390625, -7.42431640625, -7.1263427734375, -6.828369140625, -6.5303955078125, -6.232421875, -5.9344482421875, -5.636474609375, -5.3385009765625, -5.04052734375, -4.7425537109375, -4.444580078125, -4.1466064453125, -3.8486328125, -3.5506591796875, -3.252685546875, -2.9547119140625, -2.65673828125, -2.3587646484375, -2.060791015625, -1.7628173828125, -1.46484375, -1.1668701171875, -0.868896484375, -0.5709228515625, -0.27294921875, 0.0250244140625, 0.322998046875, 0.6209716796875, 0.9189453125, 1.2169189453125, 1.514892578125, 1.8128662109375, 2.11083984375, 2.4088134765625, 2.706787109375, 3.0047607421875, 3.302734375, 3.6007080078125, 3.898681640625, 4.1966552734375, 4.49462890625, 4.7926025390625, 5.090576171875, 5.3885498046875, 5.6865234375, 5.9844970703125, 6.282470703125, 6.5804443359375, 6.87841796875, 7.1763916015625, 7.474365234375, 7.7723388671875, 8.0703125]}, "gradients/decoder.transformer.h.15.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 7.0, 4.0, 8.0, 6.0, 14.0, 16.0, 17.0, 21.0, 22.0, 23.0, 35.0, 47.0, 73.0, 93.0, 164.0, 241.0, 449.0, 993.0, 2211.0, 6010.0, 18933.0, 73045.0, 393824.0, 1759644.0, 1537479.0, 313770.0, 61722.0, 16271.0, 5243.0, 1922.0, 838.0, 409.0, 231.0, 145.0, 84.0, 63.0, 62.0, 32.0, 23.0, 24.0, 16.0, 18.0, 8.0, 10.0, 2.0, 6.0, 4.0, 4.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-16.359375, -15.8626708984375, -15.365966796875, -14.8692626953125, -14.37255859375, -13.8758544921875, -13.379150390625, -12.8824462890625, -12.3857421875, -11.8890380859375, -11.392333984375, -10.8956298828125, -10.39892578125, -9.9022216796875, -9.405517578125, -8.9088134765625, -8.412109375, -7.9154052734375, -7.418701171875, -6.9219970703125, -6.42529296875, -5.9285888671875, -5.431884765625, -4.9351806640625, -4.4384765625, -3.9417724609375, -3.445068359375, -2.9483642578125, -2.45166015625, -1.9549560546875, -1.458251953125, -0.9615478515625, -0.46484375, 0.0318603515625, 0.528564453125, 1.0252685546875, 1.52197265625, 2.0186767578125, 2.515380859375, 3.0120849609375, 3.5087890625, 4.0054931640625, 4.502197265625, 4.9989013671875, 5.49560546875, 5.9923095703125, 6.489013671875, 6.9857177734375, 7.482421875, 7.9791259765625, 8.475830078125, 8.9725341796875, 9.46923828125, 9.9659423828125, 10.462646484375, 10.9593505859375, 11.4560546875, 11.9527587890625, 12.449462890625, 12.9461669921875, 13.44287109375, 13.9395751953125, 14.436279296875, 14.9329833984375, 15.4296875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 11.0, 26.0, 30.0, 58.0, 93.0, 149.0, 252.0, 445.0, 696.0, 788.0, 608.0, 403.0, 228.0, 120.0, 77.0, 43.0, 28.0, 9.0, 7.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-40.75, -39.628173828125, -38.50634765625, -37.384521484375, -36.2626953125, -35.140869140625, -34.01904296875, -32.897216796875, -31.775390625, -30.653564453125, -29.53173828125, -28.409912109375, -27.2880859375, -26.166259765625, -25.04443359375, -23.922607421875, -22.80078125, -21.678955078125, -20.55712890625, -19.435302734375, -18.3134765625, -17.191650390625, -16.06982421875, -14.947998046875, -13.826171875, -12.704345703125, -11.58251953125, -10.460693359375, -9.3388671875, -8.217041015625, -7.09521484375, -5.973388671875, -4.8515625, -3.729736328125, -2.60791015625, -1.486083984375, -0.3642578125, 0.757568359375, 1.87939453125, 3.001220703125, 4.123046875, 5.244873046875, 6.36669921875, 7.488525390625, 8.6103515625, 9.732177734375, 10.85400390625, 11.975830078125, 13.09765625, 14.219482421875, 15.34130859375, 16.463134765625, 17.5849609375, 18.706787109375, 19.82861328125, 20.950439453125, 22.072265625, 23.194091796875, 24.31591796875, 25.437744140625, 26.5595703125, 27.681396484375, 28.80322265625, 29.925048828125, 31.046875]}, "gradients/decoder.transformer.h.15.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 4.0, 4.0, 13.0, 11.0, 13.0, 19.0, 20.0, 37.0, 42.0, 58.0, 111.0, 182.0, 314.0, 616.0, 2099.0, 44834.0, 3535166.0, 600384.0, 8171.0, 1054.0, 457.0, 238.0, 134.0, 94.0, 64.0, 43.0, 37.0, 29.0, 17.0, 4.0, 7.0, 4.0, 6.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-70.5625, -68.26953125, -65.9765625, -63.68359375, -61.390625, -59.09765625, -56.8046875, -54.51171875, -52.21875, -49.92578125, -47.6328125, -45.33984375, -43.046875, -40.75390625, -38.4609375, -36.16796875, -33.875, -31.58203125, -29.2890625, -26.99609375, -24.703125, -22.41015625, -20.1171875, -17.82421875, -15.53125, -13.23828125, -10.9453125, -8.65234375, -6.359375, -4.06640625, -1.7734375, 0.51953125, 2.8125, 5.10546875, 7.3984375, 9.69140625, 11.984375, 14.27734375, 16.5703125, 18.86328125, 21.15625, 23.44921875, 25.7421875, 28.03515625, 30.328125, 32.62109375, 34.9140625, 37.20703125, 39.5, 41.79296875, 44.0859375, 46.37890625, 48.671875, 50.96484375, 53.2578125, 55.55078125, 57.84375, 60.13671875, 62.4296875, 64.72265625, 67.015625, 69.30859375, 71.6015625, 73.89453125, 76.1875]}, "gradients/decoder.transformer.h.15.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 6.0, 18.0, 41.0, 64.0, 105.0, 143.0, 166.0, 155.0, 137.0, 85.0, 48.0, 17.0, 17.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-132.06883239746094, -127.63428497314453, -123.19974517822266, -118.76519775390625, -114.33065795898438, -109.89611053466797, -105.46156311035156, -101.02702331542969, -96.59247589111328, -92.15792846679688, -87.723388671875, -83.2888412475586, -78.85429382324219, -74.41975402832031, -69.9852066040039, -65.5506591796875, -61.116119384765625, -56.681575775146484, -52.247032165527344, -47.81248474121094, -43.3779411315918, -38.943397521972656, -34.50885009765625, -30.07430648803711, -25.63976287841797, -21.205219268798828, -16.770673751831055, -12.336129188537598, -7.901584625244141, -3.467041015625, 0.9675045013427734, 5.402050018310547, 9.836578369140625, 14.271122932434082, 18.70566749572754, 23.140213012695312, 27.574756622314453, 32.009300231933594, 36.44384765625, 40.87839126586914, 45.31293487548828, 49.74747848510742, 54.18202209472656, 58.61656951904297, 63.05111312866211, 67.48565673828125, 71.92020416259766, 76.35475158691406, 80.78929138183594, 85.22383880615234, 89.65837860107422, 94.09292602539062, 98.5274658203125, 102.9620132446289, 107.39656066894531, 111.83110046386719, 116.2656478881836, 120.7001953125, 125.13473510742188, 129.56927490234375, 134.0038299560547, 138.43836975097656, 142.87290954589844, 147.30746459960938, 151.74200439453125]}, "gradients/decoder.transformer.h.15.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 3.0, 8.0, 14.0, 12.0, 14.0, 16.0, 12.0, 12.0, 21.0, 28.0, 26.0, 25.0, 21.0, 37.0, 33.0, 35.0, 50.0, 43.0, 31.0, 47.0, 36.0, 45.0, 46.0, 41.0, 39.0, 27.0, 33.0, 32.0, 29.0, 29.0, 19.0, 20.0, 24.0, 16.0, 11.0, 16.0, 12.0, 6.0, 7.0, 8.0, 6.0, 4.0, 5.0, 1.0, 0.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-63.7955322265625, -61.680599212646484, -59.56566619873047, -57.45073318481445, -55.33580017089844, -53.22086715698242, -51.105934143066406, -48.990997314453125, -46.876068115234375, -44.76113510131836, -42.646202087402344, -40.53126907348633, -38.41633605957031, -36.3014030456543, -34.18647003173828, -32.071533203125, -29.956600189208984, -27.84166717529297, -25.726734161376953, -23.611801147460938, -21.496868133544922, -19.381935119628906, -17.267000198364258, -15.152067184448242, -13.037134170532227, -10.922201156616211, -8.807268142700195, -6.692334175109863, -4.577401161193848, -2.462468147277832, -0.3475341796875, 1.7673988342285156, 3.8823318481445312, 5.997264862060547, 8.112197875976562, 10.227131843566895, 12.34206485748291, 14.456997871398926, 16.571931838989258, 18.686864852905273, 20.80179786682129, 22.916730880737305, 25.03166389465332, 27.14659881591797, 29.261531829833984, 31.37646484375, 33.491397857666016, 35.60633087158203, 37.72126388549805, 39.83619689941406, 41.95112991333008, 44.066062927246094, 46.18099594116211, 48.295928955078125, 50.410865783691406, 52.525794982910156, 54.64073181152344, 56.75566482543945, 58.87059783935547, 60.985530853271484, 63.1004638671875, 65.21540069580078, 67.33032989501953, 69.44526672363281, 71.56019592285156]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 3.0, 10.0, 2.0, 7.0, 11.0, 12.0, 15.0, 14.0, 17.0, 28.0, 29.0, 30.0, 33.0, 24.0, 25.0, 32.0, 36.0, 43.0, 37.0, 46.0, 43.0, 38.0, 48.0, 52.0, 42.0, 41.0, 27.0, 31.0, 30.0, 29.0, 22.0, 22.0, 20.0, 18.0, 17.0, 11.0, 16.0, 7.0, 5.0, 7.0, 6.0, 7.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.6640625, -9.38720703125, -9.1103515625, -8.83349609375, -8.556640625, -8.27978515625, -8.0029296875, -7.72607421875, -7.44921875, -7.17236328125, -6.8955078125, -6.61865234375, -6.341796875, -6.06494140625, -5.7880859375, -5.51123046875, -5.234375, -4.95751953125, -4.6806640625, -4.40380859375, -4.126953125, -3.85009765625, -3.5732421875, -3.29638671875, -3.01953125, -2.74267578125, -2.4658203125, -2.18896484375, -1.912109375, -1.63525390625, -1.3583984375, -1.08154296875, -0.8046875, -0.52783203125, -0.2509765625, 0.02587890625, 0.302734375, 0.57958984375, 0.8564453125, 1.13330078125, 1.41015625, 1.68701171875, 1.9638671875, 2.24072265625, 2.517578125, 2.79443359375, 3.0712890625, 3.34814453125, 3.625, 3.90185546875, 4.1787109375, 4.45556640625, 4.732421875, 5.00927734375, 5.2861328125, 5.56298828125, 5.83984375, 6.11669921875, 6.3935546875, 6.67041015625, 6.947265625, 7.22412109375, 7.5009765625, 7.77783203125, 8.0546875]}, "gradients/decoder.transformer.h.15.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 3.0, 3.0, 6.0, 7.0, 21.0, 23.0, 33.0, 35.0, 84.0, 109.0, 142.0, 215.0, 296.0, 478.0, 669.0, 922.0, 1316.0, 1906.0, 2713.0, 3899.0, 5557.0, 8137.0, 11909.0, 17467.0, 25740.0, 38232.0, 55682.0, 82217.0, 120125.0, 159956.0, 155250.0, 112833.0, 77377.0, 52881.0, 35654.0, 23955.0, 16280.0, 11339.0, 7611.0, 5377.0, 3611.0, 2581.0, 1744.0, 1305.0, 820.0, 649.0, 432.0, 321.0, 195.0, 154.0, 106.0, 63.0, 48.0, 30.0, 13.0, 19.0, 8.0, 7.0, 3.0, 1.0, 4.0], "bins": [-0.76904296875, -0.7456817626953125, -0.722320556640625, -0.6989593505859375, -0.67559814453125, -0.6522369384765625, -0.628875732421875, -0.6055145263671875, -0.5821533203125, -0.5587921142578125, -0.535430908203125, -0.5120697021484375, -0.48870849609375, -0.4653472900390625, -0.441986083984375, -0.4186248779296875, -0.395263671875, -0.3719024658203125, -0.348541259765625, -0.3251800537109375, -0.30181884765625, -0.2784576416015625, -0.255096435546875, -0.2317352294921875, -0.2083740234375, -0.1850128173828125, -0.161651611328125, -0.1382904052734375, -0.11492919921875, -0.0915679931640625, -0.068206787109375, -0.0448455810546875, -0.021484375, 0.0018768310546875, 0.025238037109375, 0.0485992431640625, 0.07196044921875, 0.0953216552734375, 0.118682861328125, 0.1420440673828125, 0.1654052734375, 0.1887664794921875, 0.212127685546875, 0.2354888916015625, 0.25885009765625, 0.2822113037109375, 0.305572509765625, 0.3289337158203125, 0.352294921875, 0.3756561279296875, 0.399017333984375, 0.4223785400390625, 0.44573974609375, 0.4691009521484375, 0.492462158203125, 0.5158233642578125, 0.5391845703125, 0.5625457763671875, 0.585906982421875, 0.6092681884765625, 0.63262939453125, 0.6559906005859375, 0.679351806640625, 0.7027130126953125, 0.72607421875]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 5.0, 3.0, 2.0, 3.0, 4.0, 8.0, 5.0, 6.0, 10.0, 11.0, 10.0, 13.0, 20.0, 22.0, 20.0, 19.0, 30.0, 24.0, 32.0, 39.0, 41.0, 34.0, 18.0, 39.0, 38.0, 1062.0, 50.0, 46.0, 33.0, 48.0, 45.0, 40.0, 24.0, 26.0, 23.0, 23.0, 22.0, 23.0, 21.0, 15.0, 11.0, 12.0, 14.0, 8.0, 8.0, 5.0, 5.0, 2.0, 4.0, 9.0, 4.0, 2.0, 2.0], "bins": [-6.09765625, -5.931640625, -5.765625, -5.599609375, -5.43359375, -5.267578125, -5.1015625, -4.935546875, -4.76953125, -4.603515625, -4.4375, -4.271484375, -4.10546875, -3.939453125, -3.7734375, -3.607421875, -3.44140625, -3.275390625, -3.109375, -2.943359375, -2.77734375, -2.611328125, -2.4453125, -2.279296875, -2.11328125, -1.947265625, -1.78125, -1.615234375, -1.44921875, -1.283203125, -1.1171875, -0.951171875, -0.78515625, -0.619140625, -0.453125, -0.287109375, -0.12109375, 0.044921875, 0.2109375, 0.376953125, 0.54296875, 0.708984375, 0.875, 1.041015625, 1.20703125, 1.373046875, 1.5390625, 1.705078125, 1.87109375, 2.037109375, 2.203125, 2.369140625, 2.53515625, 2.701171875, 2.8671875, 3.033203125, 3.19921875, 3.365234375, 3.53125, 3.697265625, 3.86328125, 4.029296875, 4.1953125, 4.361328125, 4.52734375]}, "gradients/decoder.transformer.h.15.crossattention.c_attn.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 5.0, 4.0, 12.0, 11.0, 16.0, 24.0, 46.0, 61.0, 113.0, 122.0, 200.0, 298.0, 435.0, 639.0, 972.0, 1463.0, 2106.0, 3088.0, 4844.0, 7312.0, 10596.0, 15910.0, 23907.0, 36166.0, 53153.0, 78028.0, 111366.0, 156806.0, 1184877.0, 124881.0, 90663.0, 62223.0, 41838.0, 27977.0, 18850.0, 12538.0, 8466.0, 5636.0, 3816.0, 2594.0, 1671.0, 1104.0, 777.0, 517.0, 322.0, 235.0, 155.0, 103.0, 69.0, 38.0, 26.0, 26.0, 19.0, 6.0, 5.0, 1.0, 3.0, 2.0, 0.0, 3.0, 2.0], "bins": [-0.54150390625, -0.5241470336914062, -0.5067901611328125, -0.48943328857421875, -0.472076416015625, -0.45471954345703125, -0.4373626708984375, -0.42000579833984375, -0.40264892578125, -0.38529205322265625, -0.3679351806640625, -0.35057830810546875, -0.333221435546875, -0.31586456298828125, -0.2985076904296875, -0.28115081787109375, -0.2637939453125, -0.24643707275390625, -0.2290802001953125, -0.21172332763671875, -0.194366455078125, -0.17700958251953125, -0.1596527099609375, -0.14229583740234375, -0.12493896484375, -0.10758209228515625, -0.0902252197265625, -0.07286834716796875, -0.055511474609375, -0.03815460205078125, -0.0207977294921875, -0.00344085693359375, 0.013916015625, 0.03127288818359375, 0.0486297607421875, 0.06598663330078125, 0.083343505859375, 0.10070037841796875, 0.1180572509765625, 0.13541412353515625, 0.15277099609375, 0.17012786865234375, 0.1874847412109375, 0.20484161376953125, 0.222198486328125, 0.23955535888671875, 0.2569122314453125, 0.27426910400390625, 0.2916259765625, 0.30898284912109375, 0.3263397216796875, 0.34369659423828125, 0.361053466796875, 0.37841033935546875, 0.3957672119140625, 0.41312408447265625, 0.43048095703125, 0.44783782958984375, 0.4651947021484375, 0.48255157470703125, 0.499908447265625, 0.5172653198242188, 0.5346221923828125, 0.5519790649414062, 0.5693359375]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 3.0, 7.0, 5.0, 10.0, 12.0, 19.0, 13.0, 31.0, 49.0, 57.0, 59.0, 93.0, 84.0, 89.0, 79.0, 72.0, 73.0, 73.0, 42.0, 30.0, 31.0, 14.0, 12.0, 8.0, 6.0, 6.0, 1.0, 2.0, 4.0, 0.0, 2.0, 3.0, 3.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.00937652587890625, -0.00907886028289795, -0.008781194686889648, -0.008483529090881348, -0.008185863494873047, -0.007888197898864746, -0.007590532302856445, -0.0072928667068481445, -0.006995201110839844, -0.006697535514831543, -0.006399869918823242, -0.006102204322814941, -0.005804538726806641, -0.00550687313079834, -0.005209207534790039, -0.004911541938781738, -0.0046138763427734375, -0.004316210746765137, -0.004018545150756836, -0.003720879554748535, -0.0034232139587402344, -0.0031255483627319336, -0.002827882766723633, -0.002530217170715332, -0.0022325515747070312, -0.0019348859786987305, -0.0016372203826904297, -0.001339554786682129, -0.0010418891906738281, -0.0007442235946655273, -0.00044655799865722656, -0.00014889240264892578, 0.000148773193359375, 0.0004464387893676758, 0.0007441043853759766, 0.0010417699813842773, 0.0013394355773925781, 0.001637101173400879, 0.0019347667694091797, 0.0022324323654174805, 0.0025300979614257812, 0.002827763557434082, 0.003125429153442383, 0.0034230947494506836, 0.0037207603454589844, 0.004018425941467285, 0.004316091537475586, 0.004613757133483887, 0.0049114227294921875, 0.005209088325500488, 0.005506753921508789, 0.00580441951751709, 0.006102085113525391, 0.006399750709533691, 0.006697416305541992, 0.006995081901550293, 0.007292747497558594, 0.0075904130935668945, 0.007888078689575195, 0.008185744285583496, 0.008483409881591797, 0.008781075477600098, 0.009078741073608398, 0.0093764066696167, 0.009674072265625]}, "gradients/decoder.transformer.h.15.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 4.0, 2.0, 5.0, 5.0, 5.0, 8.0, 10.0, 19.0, 32.0, 35.0, 45.0, 86.0, 141.0, 237.0, 623.0, 24439.0, 1019114.0, 2825.0, 414.0, 175.0, 103.0, 66.0, 48.0, 26.0, 27.0, 15.0, 11.0, 7.0, 7.0, 6.0, 2.0, 2.0, 4.0, 2.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.2076416015625, -0.2012176513671875, -0.194793701171875, -0.1883697509765625, -0.18194580078125, -0.1755218505859375, -0.169097900390625, -0.1626739501953125, -0.15625, -0.1498260498046875, -0.143402099609375, -0.1369781494140625, -0.13055419921875, -0.1241302490234375, -0.117706298828125, -0.1112823486328125, -0.1048583984375, -0.0984344482421875, -0.092010498046875, -0.0855865478515625, -0.07916259765625, -0.0727386474609375, -0.066314697265625, -0.0598907470703125, -0.053466796875, -0.0470428466796875, -0.040618896484375, -0.0341949462890625, -0.02777099609375, -0.0213470458984375, -0.014923095703125, -0.0084991455078125, -0.0020751953125, 0.0043487548828125, 0.010772705078125, 0.0171966552734375, 0.02362060546875, 0.0300445556640625, 0.036468505859375, 0.0428924560546875, 0.04931640625, 0.0557403564453125, 0.062164306640625, 0.0685882568359375, 0.07501220703125, 0.0814361572265625, 0.087860107421875, 0.0942840576171875, 0.1007080078125, 0.1071319580078125, 0.113555908203125, 0.1199798583984375, 0.12640380859375, 0.1328277587890625, 0.139251708984375, 0.1456756591796875, 0.152099609375, 0.1585235595703125, 0.164947509765625, 0.1713714599609375, 0.17779541015625, 0.1842193603515625, 0.190643310546875, 0.1970672607421875, 0.2034912109375]}, "gradients/decoder.transformer.h.15.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 14.0, 57.0, 252.0, 494.0, 162.0, 29.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.028306107968091965, -0.02752826176583767, -0.026750413700938225, -0.02597256749868393, -0.025194719433784485, -0.02441687323153019, -0.023639027029275894, -0.02286117896437645, -0.022083330899477005, -0.02130548469722271, -0.020527636632323265, -0.01974979043006897, -0.018971942365169525, -0.01819409616291523, -0.017416249960660934, -0.01663840189576149, -0.015860555693507195, -0.015082708559930325, -0.014304861426353455, -0.01352701522409916, -0.012749167159199715, -0.01197132095694542, -0.01119347382336855, -0.01041562668979168, -0.00963777955621481, -0.00885993242263794, -0.00808208528906107, -0.007304238621145487, -0.006526391487568617, -0.005748544353991747, -0.004970697686076164, -0.004192850552499294, -0.0034150034189224243, -0.0026371562853455544, -0.001859309384599328, -0.0010814624838531017, -0.00030361535027623177, 0.0004742317833006382, 0.0012520784512162209, 0.002029925584793091, 0.002807772718369961, 0.0035856198519468307, 0.004363466985523701, 0.005141313653439283, 0.005919160787016153, 0.006697007920593023, 0.007474854588508606, 0.008252701722085476, 0.009030548855662346, 0.009808395989239216, 0.010586243122816086, 0.011364089325070381, 0.012141937389969826, 0.012919783592224121, 0.013697630725800991, 0.014475477859377861, 0.015253324992954731, 0.0160311721265316, 0.016809018328785896, 0.01758686639368534, 0.018364712595939636, 0.01914256066083908, 0.019920406863093376, 0.02069825306534767, 0.021476101130247116]}, "gradients/decoder.transformer.h.15.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 6.0, 3.0, 8.0, 7.0, 9.0, 10.0, 3.0, 7.0, 14.0, 18.0, 15.0, 13.0, 37.0, 27.0, 24.0, 33.0, 30.0, 43.0, 35.0, 42.0, 41.0, 40.0, 38.0, 39.0, 47.0, 38.0, 45.0, 47.0, 35.0, 34.0, 32.0, 28.0, 22.0, 31.0, 14.0, 17.0, 13.0, 15.0, 15.0, 6.0, 8.0, 7.0, 4.0, 6.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.004151046276092529, -0.003997752442955971, -0.0038444586098194122, -0.0036911647766828537, -0.003537870943546295, -0.0033845771104097366, -0.003231283277273178, -0.0030779894441366196, -0.002924695611000061, -0.0027714017778635025, -0.002618107944726944, -0.0024648141115903854, -0.002311520278453827, -0.0021582264453172684, -0.00200493261218071, -0.0018516387790441513, -0.0016983449459075928, -0.0015450511127710342, -0.0013917572796344757, -0.0012384634464979172, -0.0010851696133613586, -0.0009318757802248001, -0.0007785819470882416, -0.000625288113951683, -0.0004719942808151245, -0.000318700447678566, -0.00016540661454200745, -1.2112781405448914e-05, 0.00014118105173110962, 0.00029447488486766815, 0.0004477687180042267, 0.0006010625511407852, 0.0007543563842773438, 0.0009076502174139023, 0.0010609440505504608, 0.0012142378836870193, 0.0013675317168235779, 0.0015208255499601364, 0.001674119383096695, 0.0018274132162332535, 0.001980707049369812, 0.0021340008825063705, 0.002287294715642929, 0.0024405885487794876, 0.002593882381916046, 0.0027471762150526047, 0.002900470048189163, 0.0030537638813257217, 0.0032070577144622803, 0.003360351547598839, 0.0035136453807353973, 0.003666939213871956, 0.0038202330470085144, 0.003973526880145073, 0.0041268207132816315, 0.00428011454641819, 0.0044334083795547485, 0.004586702212691307, 0.004739996045827866, 0.004893289878964424, 0.005046583712100983, 0.005199877545237541, 0.0053531713783741, 0.005506465211510658, 0.005659759044647217]}, "gradients/decoder.transformer.h.15.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 2.0, 3.0, 10.0, 2.0, 7.0, 11.0, 12.0, 15.0, 14.0, 17.0, 28.0, 29.0, 30.0, 33.0, 24.0, 25.0, 32.0, 36.0, 43.0, 37.0, 46.0, 43.0, 38.0, 48.0, 51.0, 43.0, 41.0, 27.0, 31.0, 30.0, 29.0, 22.0, 22.0, 20.0, 18.0, 17.0, 12.0, 15.0, 7.0, 5.0, 7.0, 6.0, 7.0, 6.0, 1.0, 1.0, 3.0, 1.0, 2.0, 0.0, 2.0], "bins": [-9.6640625, -9.38720703125, -9.1103515625, -8.83349609375, -8.556640625, -8.27978515625, -8.0029296875, -7.72607421875, -7.44921875, -7.17236328125, -6.8955078125, -6.61865234375, -6.341796875, -6.06494140625, -5.7880859375, -5.51123046875, -5.234375, -4.95751953125, -4.6806640625, -4.40380859375, -4.126953125, -3.85009765625, -3.5732421875, -3.29638671875, -3.01953125, -2.74267578125, -2.4658203125, -2.18896484375, -1.912109375, -1.63525390625, -1.3583984375, -1.08154296875, -0.8046875, -0.52783203125, -0.2509765625, 0.02587890625, 0.302734375, 0.57958984375, 0.8564453125, 1.13330078125, 1.41015625, 1.68701171875, 1.9638671875, 2.24072265625, 2.517578125, 2.79443359375, 3.0712890625, 3.34814453125, 3.625, 3.90185546875, 4.1787109375, 4.45556640625, 4.732421875, 5.00927734375, 5.2861328125, 5.56298828125, 5.83984375, 6.11669921875, 6.3935546875, 6.67041015625, 6.947265625, 7.22412109375, 7.5009765625, 7.77783203125, 8.0546875]}, "gradients/decoder.transformer.h.15.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 4.0, 6.0, 8.0, 13.0, 22.0, 20.0, 29.0, 41.0, 57.0, 84.0, 142.0, 197.0, 272.0, 442.0, 689.0, 1164.0, 1857.0, 3343.0, 5874.0, 10440.0, 19868.0, 38904.0, 80115.0, 169600.0, 301658.0, 211169.0, 100549.0, 48128.0, 24287.0, 12716.0, 6862.0, 3972.0, 2303.0, 1383.0, 845.0, 514.0, 311.0, 205.0, 131.0, 106.0, 75.0, 37.0, 38.0, 19.0, 17.0, 10.0, 8.0, 10.0, 2.0, 2.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0], "bins": [-5.76953125, -5.59283447265625, -5.4161376953125, -5.23944091796875, -5.062744140625, -4.88604736328125, -4.7093505859375, -4.53265380859375, -4.35595703125, -4.17926025390625, -4.0025634765625, -3.82586669921875, -3.649169921875, -3.47247314453125, -3.2957763671875, -3.11907958984375, -2.9423828125, -2.76568603515625, -2.5889892578125, -2.41229248046875, -2.235595703125, -2.05889892578125, -1.8822021484375, -1.70550537109375, -1.52880859375, -1.35211181640625, -1.1754150390625, -0.99871826171875, -0.822021484375, -0.64532470703125, -0.4686279296875, -0.29193115234375, -0.115234375, 0.06146240234375, 0.2381591796875, 0.41485595703125, 0.591552734375, 0.76824951171875, 0.9449462890625, 1.12164306640625, 1.29833984375, 1.47503662109375, 1.6517333984375, 1.82843017578125, 2.005126953125, 2.18182373046875, 2.3585205078125, 2.53521728515625, 2.7119140625, 2.88861083984375, 3.0653076171875, 3.24200439453125, 3.418701171875, 3.59539794921875, 3.7720947265625, 3.94879150390625, 4.12548828125, 4.30218505859375, 4.4788818359375, 4.65557861328125, 4.832275390625, 5.00897216796875, 5.1856689453125, 5.36236572265625, 5.5390625]}, "gradients/decoder.transformer.h.15.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 1.0, 3.0, 3.0, 2.0, 5.0, 4.0, 7.0, 8.0, 10.0, 18.0, 19.0, 21.0, 28.0, 39.0, 31.0, 40.0, 46.0, 58.0, 65.0, 163.0, 1702.0, 278.0, 83.0, 63.0, 59.0, 55.0, 55.0, 36.0, 47.0, 16.0, 22.0, 15.0, 10.0, 11.0, 9.0, 6.0, 4.0, 4.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-46.0, -44.67236328125, -43.3447265625, -42.01708984375, -40.689453125, -39.36181640625, -38.0341796875, -36.70654296875, -35.37890625, -34.05126953125, -32.7236328125, -31.39599609375, -30.068359375, -28.74072265625, -27.4130859375, -26.08544921875, -24.7578125, -23.43017578125, -22.1025390625, -20.77490234375, -19.447265625, -18.11962890625, -16.7919921875, -15.46435546875, -14.13671875, -12.80908203125, -11.4814453125, -10.15380859375, -8.826171875, -7.49853515625, -6.1708984375, -4.84326171875, -3.515625, -2.18798828125, -0.8603515625, 0.46728515625, 1.794921875, 3.12255859375, 4.4501953125, 5.77783203125, 7.10546875, 8.43310546875, 9.7607421875, 11.08837890625, 12.416015625, 13.74365234375, 15.0712890625, 16.39892578125, 17.7265625, 19.05419921875, 20.3818359375, 21.70947265625, 23.037109375, 24.36474609375, 25.6923828125, 27.02001953125, 28.34765625, 29.67529296875, 31.0029296875, 32.33056640625, 33.658203125, 34.98583984375, 36.3134765625, 37.64111328125, 38.96875]}, "gradients/decoder.transformer.h.15.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 5.0, 2.0, 3.0, 9.0, 6.0, 15.0, 11.0, 17.0, 22.0, 29.0, 37.0, 71.0, 88.0, 130.0, 154.0, 262.0, 447.0, 1214.0, 48586.0, 3087238.0, 5700.0, 654.0, 333.0, 190.0, 141.0, 87.0, 61.0, 55.0, 43.0, 32.0, 23.0, 13.0, 7.0, 5.0, 6.0, 4.0, 3.0, 4.0, 3.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-87.1875, -84.2119140625, -81.236328125, -78.2607421875, -75.28515625, -72.3095703125, -69.333984375, -66.3583984375, -63.3828125, -60.4072265625, -57.431640625, -54.4560546875, -51.48046875, -48.5048828125, -45.529296875, -42.5537109375, -39.578125, -36.6025390625, -33.626953125, -30.6513671875, -27.67578125, -24.7001953125, -21.724609375, -18.7490234375, -15.7734375, -12.7978515625, -9.822265625, -6.8466796875, -3.87109375, -0.8955078125, 2.080078125, 5.0556640625, 8.03125, 11.0068359375, 13.982421875, 16.9580078125, 19.93359375, 22.9091796875, 25.884765625, 28.8603515625, 31.8359375, 34.8115234375, 37.787109375, 40.7626953125, 43.73828125, 46.7138671875, 49.689453125, 52.6650390625, 55.640625, 58.6162109375, 61.591796875, 64.5673828125, 67.54296875, 70.5185546875, 73.494140625, 76.4697265625, 79.4453125, 82.4208984375, 85.396484375, 88.3720703125, 91.34765625, 94.3232421875, 97.298828125, 100.2744140625, 103.25]}, "gradients/decoder.transformer.h.15.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 26.0, 132.0, 345.0, 346.0, 132.0, 24.0, 5.0, 2.0, 0.0, 1.0], "bins": [-210.7089080810547, -207.01072692871094, -203.3125457763672, -199.6143798828125, -195.91619873046875, -192.218017578125, -188.51983642578125, -184.8216552734375, -181.1234893798828, -177.42530822753906, -173.7271270751953, -170.02896118164062, -166.33078002929688, -162.63259887695312, -158.93441772460938, -155.23623657226562, -151.53805541992188, -147.83987426757812, -144.14169311523438, -140.4435272216797, -136.74534606933594, -133.0471649169922, -129.34898376464844, -125.65081024169922, -121.95263671875, -118.25445556640625, -114.55628204345703, -110.85810089111328, -107.15992736816406, -103.46174621582031, -99.76356506347656, -96.06539154052734, -92.36721801757812, -88.66903686523438, -84.97086334228516, -81.2726821899414, -77.57450866699219, -73.87632751464844, -70.17814636230469, -66.47997283935547, -62.78179931640625, -59.083621978759766, -55.38544464111328, -51.68726348876953, -47.98908996582031, -44.29090881347656, -40.59273147583008, -36.894554138183594, -33.19637680053711, -29.498199462890625, -25.80002212524414, -22.101842880249023, -18.40366554260254, -14.705488204956055, -11.007308959960938, -7.309131622314453, -3.6109542846679688, 0.08722352981567383, 3.7854013442993164, 7.483579635620117, 11.181756973266602, 14.879934310913086, 18.578113555908203, 22.276290893554688, 25.974468231201172]}, "gradients/decoder.transformer.h.15.ln_1.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 2.0, 3.0, 7.0, 7.0, 7.0, 7.0, 9.0, 19.0, 16.0, 11.0, 14.0, 22.0, 35.0, 28.0, 22.0, 24.0, 33.0, 37.0, 26.0, 35.0, 31.0, 44.0, 45.0, 45.0, 33.0, 47.0, 26.0, 38.0, 40.0, 38.0, 24.0, 34.0, 31.0, 19.0, 15.0, 18.0, 21.0, 17.0, 20.0, 8.0, 15.0, 8.0, 7.0, 5.0, 2.0, 2.0, 2.0, 1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0], "bins": [-76.93017578125, -74.37652587890625, -71.82288360595703, -69.26923370361328, -66.71559143066406, -64.16194152832031, -61.60829544067383, -59.054649353027344, -56.50100326538086, -53.947357177734375, -51.39371109008789, -48.840065002441406, -46.286415100097656, -43.73277282714844, -41.17912292480469, -38.6254768371582, -36.07183074951172, -33.518184661865234, -30.96453857421875, -28.410890579223633, -25.85724449157715, -23.303598403930664, -20.749950408935547, -18.196304321289062, -15.642658233642578, -13.089012145996094, -10.535365104675293, -7.98171854019165, -5.428071975708008, -2.8744258880615234, -0.32077884674072266, 2.232868194580078, 4.7865142822265625, 7.340160846710205, 9.893807411193848, 12.447454452514648, 15.001100540161133, 17.554746627807617, 20.108394622802734, 22.66204071044922, 25.215686798095703, 27.769332885742188, 30.322978973388672, 32.876625061035156, 35.430274963378906, 37.983917236328125, 40.537567138671875, 43.09121322631836, 45.644859313964844, 48.19850540161133, 50.75215148925781, 53.3057975769043, 55.85944366455078, 58.41309356689453, 60.966739654541016, 63.5203857421875, 66.07403564453125, 68.627685546875, 71.18132781982422, 73.73497772216797, 76.28861999511719, 78.84226989746094, 81.39591217041016, 83.9495620727539, 86.50320434570312]}, "gradients/decoder.transformer.h.14.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 2.0, 3.0, 5.0, 5.0, 11.0, 8.0, 8.0, 20.0, 11.0, 14.0, 27.0, 25.0, 37.0, 21.0, 23.0, 36.0, 28.0, 34.0, 30.0, 47.0, 39.0, 42.0, 43.0, 38.0, 46.0, 45.0, 38.0, 37.0, 34.0, 27.0, 32.0, 24.0, 28.0, 24.0, 16.0, 16.0, 16.0, 11.0, 13.0, 9.0, 5.0, 6.0, 7.0, 7.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0], "bins": [-9.6484375, -9.3685302734375, -9.088623046875, -8.8087158203125, -8.52880859375, -8.2489013671875, -7.968994140625, -7.6890869140625, -7.4091796875, -7.1292724609375, -6.849365234375, -6.5694580078125, -6.28955078125, -6.0096435546875, -5.729736328125, -5.4498291015625, -5.169921875, -4.8900146484375, -4.610107421875, -4.3302001953125, -4.05029296875, -3.7703857421875, -3.490478515625, -3.2105712890625, -2.9306640625, -2.6507568359375, -2.370849609375, -2.0909423828125, -1.81103515625, -1.5311279296875, -1.251220703125, -0.9713134765625, -0.69140625, -0.4114990234375, -0.131591796875, 0.1483154296875, 0.42822265625, 0.7081298828125, 0.988037109375, 1.2679443359375, 1.5478515625, 1.8277587890625, 2.107666015625, 2.3875732421875, 2.66748046875, 2.9473876953125, 3.227294921875, 3.5072021484375, 3.787109375, 4.0670166015625, 4.346923828125, 4.6268310546875, 4.90673828125, 5.1866455078125, 5.466552734375, 5.7464599609375, 6.0263671875, 6.3062744140625, 6.586181640625, 6.8660888671875, 7.14599609375, 7.4259033203125, 7.705810546875, 7.9857177734375, 8.265625]}, "gradients/decoder.transformer.h.14.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 8.0, 7.0, 4.0, 4.0, 4.0, 7.0, 6.0, 10.0, 13.0, 18.0, 23.0, 21.0, 32.0, 29.0, 24.0, 28.0, 38.0, 95.0, 217.0, 827.0, 4725.0, 49027.0, 1382790.0, 2628957.0, 117226.0, 8170.0, 1288.0, 304.0, 100.0, 50.0, 28.0, 28.0, 27.0, 22.0, 19.0, 21.0, 19.0, 14.0, 11.0, 14.0, 6.0, 9.0, 6.0, 9.0, 0.0, 5.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-37.65625, -36.584716796875, -35.51318359375, -34.441650390625, -33.3701171875, -32.298583984375, -31.22705078125, -30.155517578125, -29.083984375, -28.012451171875, -26.94091796875, -25.869384765625, -24.7978515625, -23.726318359375, -22.65478515625, -21.583251953125, -20.51171875, -19.440185546875, -18.36865234375, -17.297119140625, -16.2255859375, -15.154052734375, -14.08251953125, -13.010986328125, -11.939453125, -10.867919921875, -9.79638671875, -8.724853515625, -7.6533203125, -6.581787109375, -5.51025390625, -4.438720703125, -3.3671875, -2.295654296875, -1.22412109375, -0.152587890625, 0.9189453125, 1.990478515625, 3.06201171875, 4.133544921875, 5.205078125, 6.276611328125, 7.34814453125, 8.419677734375, 9.4912109375, 10.562744140625, 11.63427734375, 12.705810546875, 13.77734375, 14.848876953125, 15.92041015625, 16.991943359375, 18.0634765625, 19.135009765625, 20.20654296875, 21.278076171875, 22.349609375, 23.421142578125, 24.49267578125, 25.564208984375, 26.6357421875, 27.707275390625, 28.77880859375, 29.850341796875, 30.921875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 8.0, 11.0, 16.0, 24.0, 48.0, 60.0, 115.0, 160.0, 241.0, 362.0, 513.0, 601.0, 601.0, 467.0, 276.0, 209.0, 118.0, 81.0, 45.0, 31.0, 26.0, 25.0, 16.0, 12.0, 5.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-34.625, -33.731689453125, -32.83837890625, -31.945068359375, -31.0517578125, -30.158447265625, -29.26513671875, -28.371826171875, -27.478515625, -26.585205078125, -25.69189453125, -24.798583984375, -23.9052734375, -23.011962890625, -22.11865234375, -21.225341796875, -20.33203125, -19.438720703125, -18.54541015625, -17.652099609375, -16.7587890625, -15.865478515625, -14.97216796875, -14.078857421875, -13.185546875, -12.292236328125, -11.39892578125, -10.505615234375, -9.6123046875, -8.718994140625, -7.82568359375, -6.932373046875, -6.0390625, -5.145751953125, -4.25244140625, -3.359130859375, -2.4658203125, -1.572509765625, -0.67919921875, 0.214111328125, 1.107421875, 2.000732421875, 2.89404296875, 3.787353515625, 4.6806640625, 5.573974609375, 6.46728515625, 7.360595703125, 8.25390625, 9.147216796875, 10.04052734375, 10.933837890625, 11.8271484375, 12.720458984375, 13.61376953125, 14.507080078125, 15.400390625, 16.293701171875, 17.18701171875, 18.080322265625, 18.9736328125, 19.866943359375, 20.76025390625, 21.653564453125, 22.546875]}, "gradients/decoder.transformer.h.14.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 3.0, 5.0, 11.0, 11.0, 17.0, 34.0, 43.0, 50.0, 70.0, 112.0, 145.0, 278.0, 599.0, 2081.0, 65468.0, 3963047.0, 157925.0, 2885.0, 690.0, 283.0, 187.0, 105.0, 74.0, 49.0, 36.0, 27.0, 18.0, 12.0, 7.0, 8.0, 3.0, 4.0, 1.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-90.3125, -87.623046875, -84.93359375, -82.244140625, -79.5546875, -76.865234375, -74.17578125, -71.486328125, -68.796875, -66.107421875, -63.41796875, -60.728515625, -58.0390625, -55.349609375, -52.66015625, -49.970703125, -47.28125, -44.591796875, -41.90234375, -39.212890625, -36.5234375, -33.833984375, -31.14453125, -28.455078125, -25.765625, -23.076171875, -20.38671875, -17.697265625, -15.0078125, -12.318359375, -9.62890625, -6.939453125, -4.25, -1.560546875, 1.12890625, 3.818359375, 6.5078125, 9.197265625, 11.88671875, 14.576171875, 17.265625, 19.955078125, 22.64453125, 25.333984375, 28.0234375, 30.712890625, 33.40234375, 36.091796875, 38.78125, 41.470703125, 44.16015625, 46.849609375, 49.5390625, 52.228515625, 54.91796875, 57.607421875, 60.296875, 62.986328125, 65.67578125, 68.365234375, 71.0546875, 73.744140625, 76.43359375, 79.123046875, 81.8125]}, "gradients/decoder.transformer.h.14.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 14.0, 45.0, 88.0, 156.0, 194.0, 244.0, 135.0, 74.0, 47.0, 11.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-171.202392578125, -165.27557373046875, -159.3487548828125, -153.4219512939453, -147.49513244628906, -141.5683135986328, -135.64149475097656, -129.71469116210938, -123.78787231445312, -117.86105346679688, -111.93424224853516, -106.0074234008789, -100.08061218261719, -94.15379333496094, -88.22697448730469, -82.30016326904297, -76.37334442138672, -70.44652557373047, -64.51971435546875, -58.5928955078125, -52.66608428955078, -46.73926544189453, -40.81245040893555, -34.88563537597656, -28.958820343017578, -23.032005310058594, -17.10519027709961, -11.178373336791992, -5.251558303833008, 0.6752567291259766, 6.602073669433594, 12.528888702392578, 18.455703735351562, 24.382518768310547, 30.30933380126953, 36.23615264892578, 42.1629638671875, 48.08978271484375, 54.016597747802734, 59.94341278076172, 65.87022399902344, 71.79704284667969, 77.7238540649414, 83.65067291259766, 89.57748413085938, 95.50430297851562, 101.43112182617188, 107.3579330444336, 113.28475189208984, 119.2115707397461, 125.13838195800781, 131.06520080566406, 136.9920196533203, 142.9188232421875, 148.84564208984375, 154.7724609375, 160.69927978515625, 166.6260986328125, 172.55291748046875, 178.47972106933594, 184.4065399169922, 190.33335876464844, 196.2601776123047, 202.18698120117188, 208.11380004882812]}, "gradients/decoder.transformer.h.14.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 7.0, 1.0, 7.0, 3.0, 6.0, 13.0, 12.0, 6.0, 16.0, 11.0, 12.0, 14.0, 22.0, 19.0, 21.0, 29.0, 26.0, 31.0, 44.0, 19.0, 43.0, 29.0, 38.0, 43.0, 34.0, 27.0, 43.0, 40.0, 38.0, 48.0, 37.0, 38.0, 30.0, 23.0, 23.0, 20.0, 18.0, 18.0, 19.0, 15.0, 18.0, 13.0, 7.0, 11.0, 7.0, 3.0, 3.0, 1.0, 5.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-56.4300537109375, -54.341880798339844, -52.25370788574219, -50.16553497314453, -48.077362060546875, -45.98918914794922, -43.90101623535156, -41.812843322753906, -39.72467041015625, -37.636497497558594, -35.54832458496094, -33.46015167236328, -31.371978759765625, -29.28380584716797, -27.195632934570312, -25.107460021972656, -23.019287109375, -20.931114196777344, -18.842941284179688, -16.75476837158203, -14.666595458984375, -12.578422546386719, -10.490249633789062, -8.402076721191406, -6.31390380859375, -4.225730895996094, -2.1375579833984375, -0.04938507080078125, 2.038787841796875, 4.126960754394531, 6.2151336669921875, 8.303306579589844, 10.3914794921875, 12.479652404785156, 14.567825317382812, 16.65599822998047, 18.744171142578125, 20.83234405517578, 22.920516967773438, 25.008689880371094, 27.09686279296875, 29.185035705566406, 31.273208618164062, 33.36138153076172, 35.449554443359375, 37.53772735595703, 39.62590026855469, 41.714073181152344, 43.80224609375, 45.890419006347656, 47.97859191894531, 50.06676483154297, 52.154937744140625, 54.24311065673828, 56.33128356933594, 58.419456481933594, 60.50762939453125, 62.595802307128906, 64.68397521972656, 66.77214813232422, 68.86032104492188, 70.94849395751953, 73.03666687011719, 75.12483978271484, 77.2130126953125]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 9.0, 17.0, 13.0, 16.0, 18.0, 20.0, 16.0, 27.0, 39.0, 25.0, 29.0, 34.0, 32.0, 37.0, 34.0, 37.0, 43.0, 36.0, 39.0, 38.0, 48.0, 36.0, 40.0, 39.0, 25.0, 31.0, 26.0, 27.0, 17.0, 25.0, 20.0, 17.0, 17.0, 11.0, 9.0, 7.0, 10.0, 8.0, 1.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6875, -8.4144287109375, -8.141357421875, -7.8682861328125, -7.59521484375, -7.3221435546875, -7.049072265625, -6.7760009765625, -6.5029296875, -6.2298583984375, -5.956787109375, -5.6837158203125, -5.41064453125, -5.1375732421875, -4.864501953125, -4.5914306640625, -4.318359375, -4.0452880859375, -3.772216796875, -3.4991455078125, -3.22607421875, -2.9530029296875, -2.679931640625, -2.4068603515625, -2.1337890625, -1.8607177734375, -1.587646484375, -1.3145751953125, -1.04150390625, -0.7684326171875, -0.495361328125, -0.2222900390625, 0.05078125, 0.3238525390625, 0.596923828125, 0.8699951171875, 1.14306640625, 1.4161376953125, 1.689208984375, 1.9622802734375, 2.2353515625, 2.5084228515625, 2.781494140625, 3.0545654296875, 3.32763671875, 3.6007080078125, 3.873779296875, 4.1468505859375, 4.419921875, 4.6929931640625, 4.966064453125, 5.2391357421875, 5.51220703125, 5.7852783203125, 6.058349609375, 6.3314208984375, 6.6044921875, 6.8775634765625, 7.150634765625, 7.4237060546875, 7.69677734375, 7.9698486328125, 8.242919921875, 8.5159912109375, 8.7890625]}, "gradients/decoder.transformer.h.14.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 2.0, 2.0, 9.0, 7.0, 11.0, 18.0, 34.0, 38.0, 66.0, 97.0, 128.0, 186.0, 303.0, 405.0, 569.0, 846.0, 1233.0, 1806.0, 2724.0, 3994.0, 6004.0, 9300.0, 14247.0, 22228.0, 34446.0, 54242.0, 84153.0, 128026.0, 172214.0, 166816.0, 121291.0, 79023.0, 51003.0, 32600.0, 20929.0, 13491.0, 8797.0, 5585.0, 3755.0, 2577.0, 1730.0, 1107.0, 823.0, 503.0, 378.0, 259.0, 171.0, 135.0, 82.0, 59.0, 29.0, 30.0, 21.0, 12.0, 8.0, 9.0, 4.0, 2.0, 2.0, 0.0, 1.0], "bins": [-0.87451171875, -0.8471221923828125, -0.819732666015625, -0.7923431396484375, -0.76495361328125, -0.7375640869140625, -0.710174560546875, -0.6827850341796875, -0.6553955078125, -0.6280059814453125, -0.600616455078125, -0.5732269287109375, -0.54583740234375, -0.5184478759765625, -0.491058349609375, -0.4636688232421875, -0.436279296875, -0.4088897705078125, -0.381500244140625, -0.3541107177734375, -0.32672119140625, -0.2993316650390625, -0.271942138671875, -0.2445526123046875, -0.2171630859375, -0.1897735595703125, -0.162384033203125, -0.1349945068359375, -0.10760498046875, -0.0802154541015625, -0.052825927734375, -0.0254364013671875, 0.001953125, 0.0293426513671875, 0.056732177734375, 0.0841217041015625, 0.11151123046875, 0.1389007568359375, 0.166290283203125, 0.1936798095703125, 0.2210693359375, 0.2484588623046875, 0.275848388671875, 0.3032379150390625, 0.33062744140625, 0.3580169677734375, 0.385406494140625, 0.4127960205078125, 0.440185546875, 0.4675750732421875, 0.494964599609375, 0.5223541259765625, 0.54974365234375, 0.5771331787109375, 0.604522705078125, 0.6319122314453125, 0.6593017578125, 0.6866912841796875, 0.714080810546875, 0.7414703369140625, 0.76885986328125, 0.7962493896484375, 0.823638916015625, 0.8510284423828125, 0.87841796875]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 4.0, 4.0, 4.0, 9.0, 9.0, 5.0, 8.0, 7.0, 15.0, 10.0, 15.0, 22.0, 25.0, 31.0, 34.0, 38.0, 32.0, 45.0, 49.0, 44.0, 46.0, 40.0, 1060.0, 30.0, 54.0, 44.0, 49.0, 35.0, 37.0, 27.0, 30.0, 36.0, 29.0, 23.0, 22.0, 12.0, 17.0, 5.0, 6.0, 9.0, 2.0, 3.0, 5.0, 1.0, 2.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.46484375, -6.2701416015625, -6.075439453125, -5.8807373046875, -5.68603515625, -5.4913330078125, -5.296630859375, -5.1019287109375, -4.9072265625, -4.7125244140625, -4.517822265625, -4.3231201171875, -4.12841796875, -3.9337158203125, -3.739013671875, -3.5443115234375, -3.349609375, -3.1549072265625, -2.960205078125, -2.7655029296875, -2.57080078125, -2.3760986328125, -2.181396484375, -1.9866943359375, -1.7919921875, -1.5972900390625, -1.402587890625, -1.2078857421875, -1.01318359375, -0.8184814453125, -0.623779296875, -0.4290771484375, -0.234375, -0.0396728515625, 0.155029296875, 0.3497314453125, 0.54443359375, 0.7391357421875, 0.933837890625, 1.1285400390625, 1.3232421875, 1.5179443359375, 1.712646484375, 1.9073486328125, 2.10205078125, 2.2967529296875, 2.491455078125, 2.6861572265625, 2.880859375, 3.0755615234375, 3.270263671875, 3.4649658203125, 3.65966796875, 3.8543701171875, 4.049072265625, 4.2437744140625, 4.4384765625, 4.6331787109375, 4.827880859375, 5.0225830078125, 5.21728515625, 5.4119873046875, 5.606689453125, 5.8013916015625, 5.99609375]}, "gradients/decoder.transformer.h.14.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 2.0, 4.0, 2.0, 7.0, 10.0, 16.0, 21.0, 28.0, 62.0, 72.0, 110.0, 151.0, 196.0, 324.0, 473.0, 710.0, 1067.0, 1591.0, 2248.0, 3343.0, 5333.0, 7968.0, 12231.0, 19250.0, 29620.0, 46246.0, 72228.0, 108004.0, 147190.0, 1208993.0, 139916.0, 101452.0, 67031.0, 43032.0, 27269.0, 17653.0, 11319.0, 7437.0, 4908.0, 3149.0, 2063.0, 1336.0, 902.0, 704.0, 442.0, 316.0, 215.0, 166.0, 112.0, 56.0, 48.0, 38.0, 27.0, 12.0, 14.0, 10.0, 7.0, 3.0, 4.0, 4.0, 1.0, 2.0], "bins": [-0.59814453125, -0.5791015625, -0.56005859375, -0.541015625, -0.52197265625, -0.5029296875, -0.48388671875, -0.46484375, -0.44580078125, -0.4267578125, -0.40771484375, -0.388671875, -0.36962890625, -0.3505859375, -0.33154296875, -0.3125, -0.29345703125, -0.2744140625, -0.25537109375, -0.236328125, -0.21728515625, -0.1982421875, -0.17919921875, -0.16015625, -0.14111328125, -0.1220703125, -0.10302734375, -0.083984375, -0.06494140625, -0.0458984375, -0.02685546875, -0.0078125, 0.01123046875, 0.0302734375, 0.04931640625, 0.068359375, 0.08740234375, 0.1064453125, 0.12548828125, 0.14453125, 0.16357421875, 0.1826171875, 0.20166015625, 0.220703125, 0.23974609375, 0.2587890625, 0.27783203125, 0.296875, 0.31591796875, 0.3349609375, 0.35400390625, 0.373046875, 0.39208984375, 0.4111328125, 0.43017578125, 0.44921875, 0.46826171875, 0.4873046875, 0.50634765625, 0.525390625, 0.54443359375, 0.5634765625, 0.58251953125, 0.6015625, 0.62060546875]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 2.0, 5.0, 5.0, 4.0, 4.0, 4.0, 9.0, 11.0, 11.0, 15.0, 24.0, 39.0, 42.0, 49.0, 70.0, 66.0, 95.0, 85.0, 77.0, 84.0, 68.0, 62.0, 55.0, 33.0, 20.0, 20.0, 8.0, 11.0, 6.0, 4.0, 4.0, 4.0, 2.0, 3.0, 3.0, 0.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.011077880859375, -0.010755538940429688, -0.010433197021484375, -0.010110855102539062, -0.00978851318359375, -0.009466171264648438, -0.009143829345703125, -0.008821487426757812, -0.0084991455078125, -0.008176803588867188, -0.007854461669921875, -0.0075321197509765625, -0.00720977783203125, -0.0068874359130859375, -0.006565093994140625, -0.0062427520751953125, -0.00592041015625, -0.0055980682373046875, -0.005275726318359375, -0.0049533843994140625, -0.00463104248046875, -0.0043087005615234375, -0.003986358642578125, -0.0036640167236328125, -0.0033416748046875, -0.0030193328857421875, -0.002696990966796875, -0.0023746490478515625, -0.00205230712890625, -0.0017299652099609375, -0.001407623291015625, -0.0010852813720703125, -0.000762939453125, -0.0004405975341796875, -0.000118255615234375, 0.0002040863037109375, 0.00052642822265625, 0.0008487701416015625, 0.001171112060546875, 0.0014934539794921875, 0.0018157958984375, 0.0021381378173828125, 0.002460479736328125, 0.0027828216552734375, 0.00310516357421875, 0.0034275054931640625, 0.003749847412109375, 0.0040721893310546875, 0.00439453125, 0.0047168731689453125, 0.005039215087890625, 0.0053615570068359375, 0.00568389892578125, 0.0060062408447265625, 0.006328582763671875, 0.0066509246826171875, 0.0069732666015625, 0.0072956085205078125, 0.007617950439453125, 0.007940292358398438, 0.00826263427734375, 0.008584976196289062, 0.008907318115234375, 0.009229660034179688, 0.009552001953125]}, "gradients/decoder.transformer.h.14.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 0.0, 0.0, 4.0, 5.0, 1.0, 6.0, 3.0, 9.0, 4.0, 14.0, 12.0, 35.0, 29.0, 60.0, 83.0, 121.0, 239.0, 836.0, 79156.0, 965590.0, 1596.0, 331.0, 152.0, 65.0, 60.0, 34.0, 23.0, 28.0, 14.0, 15.0, 5.0, 7.0, 4.0, 7.0, 2.0, 5.0, 2.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.21533203125, -0.20819854736328125, -0.2010650634765625, -0.19393157958984375, -0.186798095703125, -0.17966461181640625, -0.1725311279296875, -0.16539764404296875, -0.15826416015625, -0.15113067626953125, -0.1439971923828125, -0.13686370849609375, -0.129730224609375, -0.12259674072265625, -0.1154632568359375, -0.10832977294921875, -0.1011962890625, -0.09406280517578125, -0.0869293212890625, -0.07979583740234375, -0.072662353515625, -0.06552886962890625, -0.0583953857421875, -0.05126190185546875, -0.04412841796875, -0.03699493408203125, -0.0298614501953125, -0.02272796630859375, -0.015594482421875, -0.00846099853515625, -0.0013275146484375, 0.00580596923828125, 0.012939453125, 0.02007293701171875, 0.0272064208984375, 0.03433990478515625, 0.041473388671875, 0.04860687255859375, 0.0557403564453125, 0.06287384033203125, 0.07000732421875, 0.07714080810546875, 0.0842742919921875, 0.09140777587890625, 0.098541259765625, 0.10567474365234375, 0.1128082275390625, 0.11994171142578125, 0.1270751953125, 0.13420867919921875, 0.1413421630859375, 0.14847564697265625, 0.155609130859375, 0.16274261474609375, 0.1698760986328125, 0.17700958251953125, 0.18414306640625, 0.19127655029296875, 0.1984100341796875, 0.20554351806640625, 0.212677001953125, 0.21981048583984375, 0.2269439697265625, 0.23407745361328125, 0.2412109375]}, "gradients/decoder.transformer.h.14.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 4.0, 8.0, 18.0, 56.0, 132.0, 275.0, 266.0, 151.0, 62.0, 24.0, 12.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006108611822128296, -0.005644149612635374, -0.005179687403142452, -0.004715224727988243, -0.004250762518495321, -0.0037863003090023994, -0.003321837866678834, -0.0028573754243552685, -0.0023929132148623466, -0.001928450888954103, -0.0014639885630458593, -0.0009995262371376157, -0.000535063911229372, -7.06017017364502e-05, 0.0003938607405871153, 0.0008583231829106808, 0.0013227853924036026, 0.0017872477183118463, 0.00225171004422009, 0.0027161724865436554, 0.0031806346960365772, 0.003645096905529499, 0.004109559580683708, 0.00457402179017663, 0.005038483999669552, 0.005502946209162474, 0.0059674084186553955, 0.006431871093809605, 0.0068963333033025265, 0.007360795512795448, 0.007825258187949657, 0.008289720863103867, 0.008754182606935501, 0.00921864528208971, 0.009683107025921345, 0.010147569701075554, 0.010612031444907188, 0.011076494120061398, 0.011540956795215607, 0.012005418539047241, 0.01246988121420145, 0.01293434388935566, 0.013398805633187294, 0.013863268308341503, 0.014327730983495712, 0.014792192727327347, 0.015256655402481556, 0.015721118077635765, 0.0161855798214674, 0.016650041565299034, 0.017114505171775818, 0.017578966915607452, 0.018043428659439087, 0.01850789040327072, 0.018972354009747505, 0.01943681575357914, 0.019901279360055923, 0.020365741103887558, 0.020830204710364342, 0.021294666454195976, 0.02175912819802761, 0.022223591804504395, 0.02268805354833603, 0.023152515292167664, 0.023616977035999298]}, "gradients/decoder.transformer.h.14.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 3.0, 2.0, 4.0, 7.0, 5.0, 7.0, 11.0, 18.0, 13.0, 29.0, 25.0, 31.0, 33.0, 38.0, 31.0, 40.0, 54.0, 41.0, 49.0, 38.0, 49.0, 52.0, 45.0, 45.0, 46.0, 38.0, 37.0, 33.0, 33.0, 34.0, 25.0, 20.0, 25.0, 11.0, 9.0, 10.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 2.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005811810493469238, -0.005631326697766781, -0.005450842902064323, -0.005270359106361866, -0.005089875310659409, -0.004909391514956951, -0.004728907719254494, -0.004548423923552036, -0.004367940127849579, -0.004187456332147121, -0.004006972536444664, -0.0038264887407422066, -0.003646004945039749, -0.0034655211493372917, -0.0032850373536348343, -0.003104553557932377, -0.0029240697622299194, -0.002743585966527462, -0.0025631021708250046, -0.002382618375122547, -0.0022021345794200897, -0.0020216507837176323, -0.0018411669880151749, -0.0016606831923127174, -0.00148019939661026, -0.0012997156009078026, -0.0011192318052053452, -0.0009387480095028877, -0.0007582642138004303, -0.0005777804180979729, -0.00039729662239551544, -0.00021681282669305801, -3.6329030990600586e-05, 0.00014415476471185684, 0.00032463856041431427, 0.0005051223561167717, 0.0006856061518192291, 0.0008660899475216866, 0.001046573743224144, 0.0012270575389266014, 0.0014075413346290588, 0.0015880251303315163, 0.0017685089260339737, 0.0019489927217364311, 0.0021294765174388885, 0.002309960313141346, 0.0024904441088438034, 0.002670927904546261, 0.0028514117002487183, 0.0030318954959511757, 0.003212379291653633, 0.0033928630873560905, 0.003573346883058548, 0.0037538306787610054, 0.003934314474463463, 0.00411479827016592, 0.004295282065868378, 0.004475765861570835, 0.0046562496572732925, 0.00483673345297575, 0.005017217248678207, 0.005197701044380665, 0.005378184840083122, 0.00555866863578558, 0.005739152431488037]}, "gradients/decoder.transformer.h.14.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 3.0, 7.0, 7.0, 9.0, 17.0, 13.0, 16.0, 18.0, 20.0, 16.0, 27.0, 39.0, 25.0, 29.0, 34.0, 32.0, 37.0, 34.0, 37.0, 43.0, 36.0, 39.0, 38.0, 48.0, 36.0, 40.0, 39.0, 25.0, 31.0, 26.0, 27.0, 17.0, 25.0, 20.0, 17.0, 16.0, 12.0, 9.0, 7.0, 10.0, 8.0, 1.0, 6.0, 3.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-8.6875, -8.4144287109375, -8.141357421875, -7.8682861328125, -7.59521484375, -7.3221435546875, -7.049072265625, -6.7760009765625, -6.5029296875, -6.2298583984375, -5.956787109375, -5.6837158203125, -5.41064453125, -5.1375732421875, -4.864501953125, -4.5914306640625, -4.318359375, -4.0452880859375, -3.772216796875, -3.4991455078125, -3.22607421875, -2.9530029296875, -2.679931640625, -2.4068603515625, -2.1337890625, -1.8607177734375, -1.587646484375, -1.3145751953125, -1.04150390625, -0.7684326171875, -0.495361328125, -0.2222900390625, 0.05078125, 0.3238525390625, 0.596923828125, 0.8699951171875, 1.14306640625, 1.4161376953125, 1.689208984375, 1.9622802734375, 2.2353515625, 2.5084228515625, 2.781494140625, 3.0545654296875, 3.32763671875, 3.6007080078125, 3.873779296875, 4.1468505859375, 4.419921875, 4.6929931640625, 4.966064453125, 5.2391357421875, 5.51220703125, 5.7852783203125, 6.058349609375, 6.3314208984375, 6.6044921875, 6.8775634765625, 7.150634765625, 7.4237060546875, 7.69677734375, 7.9698486328125, 8.242919921875, 8.5159912109375, 8.7890625]}, "gradients/decoder.transformer.h.14.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 0.0, 5.0, 3.0, 7.0, 10.0, 21.0, 32.0, 36.0, 57.0, 77.0, 130.0, 186.0, 283.0, 442.0, 683.0, 1041.0, 1702.0, 2937.0, 4825.0, 8338.0, 14985.0, 28162.0, 55509.0, 117268.0, 337990.0, 266436.0, 100505.0, 49144.0, 25338.0, 13534.0, 7575.0, 4293.0, 2715.0, 1586.0, 946.0, 562.0, 387.0, 253.0, 181.0, 112.0, 90.0, 59.0, 37.0, 25.0, 18.0, 13.0, 8.0, 8.0, 3.0, 6.0, 1.0, 2.0], "bins": [-7.4453125, -7.24359130859375, -7.0418701171875, -6.84014892578125, -6.638427734375, -6.43670654296875, -6.2349853515625, -6.03326416015625, -5.83154296875, -5.62982177734375, -5.4281005859375, -5.22637939453125, -5.024658203125, -4.82293701171875, -4.6212158203125, -4.41949462890625, -4.2177734375, -4.01605224609375, -3.8143310546875, -3.61260986328125, -3.410888671875, -3.20916748046875, -3.0074462890625, -2.80572509765625, -2.60400390625, -2.40228271484375, -2.2005615234375, -1.99884033203125, -1.797119140625, -1.59539794921875, -1.3936767578125, -1.19195556640625, -0.990234375, -0.78851318359375, -0.5867919921875, -0.38507080078125, -0.183349609375, 0.01837158203125, 0.2200927734375, 0.42181396484375, 0.62353515625, 0.82525634765625, 1.0269775390625, 1.22869873046875, 1.430419921875, 1.63214111328125, 1.8338623046875, 2.03558349609375, 2.2373046875, 2.43902587890625, 2.6407470703125, 2.84246826171875, 3.044189453125, 3.24591064453125, 3.4476318359375, 3.64935302734375, 3.85107421875, 4.05279541015625, 4.2545166015625, 4.45623779296875, 4.657958984375, 4.85968017578125, 5.0614013671875, 5.26312255859375, 5.46484375]}, "gradients/decoder.transformer.h.14.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 4.0, 4.0, 3.0, 2.0, 6.0, 4.0, 8.0, 11.0, 17.0, 17.0, 12.0, 16.0, 25.0, 26.0, 25.0, 27.0, 29.0, 51.0, 35.0, 49.0, 54.0, 90.0, 197.0, 1623.0, 212.0, 92.0, 48.0, 38.0, 38.0, 48.0, 32.0, 40.0, 22.0, 33.0, 20.0, 17.0, 10.0, 14.0, 9.0, 10.0, 11.0, 2.0, 4.0, 7.0, 5.0, 7.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0], "bins": [-31.640625, -30.695068359375, -29.74951171875, -28.803955078125, -27.8583984375, -26.912841796875, -25.96728515625, -25.021728515625, -24.076171875, -23.130615234375, -22.18505859375, -21.239501953125, -20.2939453125, -19.348388671875, -18.40283203125, -17.457275390625, -16.51171875, -15.566162109375, -14.62060546875, -13.675048828125, -12.7294921875, -11.783935546875, -10.83837890625, -9.892822265625, -8.947265625, -8.001708984375, -7.05615234375, -6.110595703125, -5.1650390625, -4.219482421875, -3.27392578125, -2.328369140625, -1.3828125, -0.437255859375, 0.50830078125, 1.453857421875, 2.3994140625, 3.344970703125, 4.29052734375, 5.236083984375, 6.181640625, 7.127197265625, 8.07275390625, 9.018310546875, 9.9638671875, 10.909423828125, 11.85498046875, 12.800537109375, 13.74609375, 14.691650390625, 15.63720703125, 16.582763671875, 17.5283203125, 18.473876953125, 19.41943359375, 20.364990234375, 21.310546875, 22.256103515625, 23.20166015625, 24.147216796875, 25.0927734375, 26.038330078125, 26.98388671875, 27.929443359375, 28.875]}, "gradients/decoder.transformer.h.14.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 8.0, 12.0, 7.0, 8.0, 10.0, 19.0, 28.0, 21.0, 48.0, 71.0, 85.0, 154.0, 199.0, 281.0, 452.0, 1984.0, 214476.0, 2921967.0, 4186.0, 655.0, 321.0, 223.0, 140.0, 92.0, 71.0, 57.0, 31.0, 35.0, 20.0, 14.0, 12.0, 3.0, 6.0, 6.0, 4.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-108.75, -105.8994140625, -103.048828125, -100.1982421875, -97.34765625, -94.4970703125, -91.646484375, -88.7958984375, -85.9453125, -83.0947265625, -80.244140625, -77.3935546875, -74.54296875, -71.6923828125, -68.841796875, -65.9912109375, -63.140625, -60.2900390625, -57.439453125, -54.5888671875, -51.73828125, -48.8876953125, -46.037109375, -43.1865234375, -40.3359375, -37.4853515625, -34.634765625, -31.7841796875, -28.93359375, -26.0830078125, -23.232421875, -20.3818359375, -17.53125, -14.6806640625, -11.830078125, -8.9794921875, -6.12890625, -3.2783203125, -0.427734375, 2.4228515625, 5.2734375, 8.1240234375, 10.974609375, 13.8251953125, 16.67578125, 19.5263671875, 22.376953125, 25.2275390625, 28.078125, 30.9287109375, 33.779296875, 36.6298828125, 39.48046875, 42.3310546875, 45.181640625, 48.0322265625, 50.8828125, 53.7333984375, 56.583984375, 59.4345703125, 62.28515625, 65.1357421875, 67.986328125, 70.8369140625, 73.6875]}, "gradients/decoder.transformer.h.14.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 76.0, 887.0, 56.0], "bins": [-794.597900390625, -781.8685913085938, -769.1393432617188, -756.4100341796875, -743.6807250976562, -730.951416015625, -718.22216796875, -705.4928588867188, -692.7635498046875, -680.0342407226562, -667.3049926757812, -654.57568359375, -641.8463745117188, -629.1170654296875, -616.3878173828125, -603.6585083007812, -590.92919921875, -578.1998901367188, -565.4706420898438, -552.7413330078125, -540.0120239257812, -527.28271484375, -514.553466796875, -501.82415771484375, -489.09490966796875, -476.3656311035156, -463.6363220214844, -450.90704345703125, -438.177734375, -425.4484558105469, -412.71917724609375, -399.9898681640625, -387.26055908203125, -374.5312805175781, -361.8019714355469, -349.07269287109375, -336.3433837890625, -323.6141052246094, -310.88482666015625, -298.155517578125, -285.4262390136719, -272.69696044921875, -259.9676513671875, -247.23837280273438, -234.50906372070312, -221.77978515625, -209.0504913330078, -196.32119750976562, -183.59190368652344, -170.86260986328125, -158.13331604003906, -145.40402221679688, -132.67474365234375, -119.94544219970703, -107.21615600585938, -94.48686218261719, -81.757568359375, -69.02827453613281, -56.29898452758789, -43.56969451904297, -30.84040069580078, -18.111106872558594, -5.3818206787109375, 7.34747314453125, 20.07676887512207]}, "gradients/decoder.transformer.h.14.ln_1.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 6.0, 3.0, 4.0, 5.0, 8.0, 6.0, 11.0, 7.0, 16.0, 22.0, 22.0, 19.0, 29.0, 20.0, 29.0, 31.0, 42.0, 39.0, 36.0, 48.0, 47.0, 51.0, 36.0, 40.0, 39.0, 48.0, 36.0, 42.0, 35.0, 31.0, 26.0, 28.0, 26.0, 21.0, 27.0, 12.0, 8.0, 10.0, 12.0, 6.0, 8.0, 4.0, 3.0, 6.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-85.42178344726562, -82.57671356201172, -79.73163604736328, -76.88656616210938, -74.04149627685547, -71.19642639160156, -68.35134887695312, -65.50627899169922, -62.66120910644531, -59.81613540649414, -56.971065521240234, -54.12599182128906, -51.280921936035156, -48.435848236083984, -45.59077453613281, -42.745704650878906, -39.900630950927734, -37.05555725097656, -34.210487365722656, -31.365413665771484, -28.520343780517578, -25.675270080566406, -22.830198287963867, -19.985126495361328, -17.14005470275879, -14.29498291015625, -11.449911117553711, -8.604838371276855, -5.759766578674316, -2.9146947860717773, -0.06962203979492188, 2.775449752807617, 5.620521545410156, 8.465593338012695, 11.310665130615234, 14.15573787689209, 17.000808715820312, 19.845882415771484, 22.690954208374023, 25.536026000976562, 28.3810977935791, 31.22616958618164, 34.07124328613281, 36.91631317138672, 39.76138687133789, 42.6064567565918, 45.45153045654297, 48.296600341796875, 51.14167404174805, 53.98674774169922, 56.831817626953125, 59.6768913269043, 62.5219612121582, 65.36703491210938, 68.21210479736328, 71.05717468261719, 73.90225219726562, 76.74732208251953, 79.59239959716797, 82.43746948242188, 85.28253936767578, 88.12760925292969, 90.97268676757812, 93.81775665283203, 96.66282653808594]}, "gradients/decoder.transformer.h.13.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 5.0, 5.0, 4.0, 10.0, 16.0, 15.0, 20.0, 11.0, 19.0, 24.0, 19.0, 24.0, 29.0, 29.0, 35.0, 44.0, 21.0, 35.0, 44.0, 42.0, 34.0, 41.0, 42.0, 40.0, 36.0, 43.0, 39.0, 32.0, 25.0, 31.0, 24.0, 17.0, 25.0, 21.0, 17.0, 9.0, 12.0, 15.0, 9.0, 9.0, 6.0, 6.0, 7.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.09375, -8.810302734375, -8.52685546875, -8.243408203125, -7.9599609375, -7.676513671875, -7.39306640625, -7.109619140625, -6.826171875, -6.542724609375, -6.25927734375, -5.975830078125, -5.6923828125, -5.408935546875, -5.12548828125, -4.842041015625, -4.55859375, -4.275146484375, -3.99169921875, -3.708251953125, -3.4248046875, -3.141357421875, -2.85791015625, -2.574462890625, -2.291015625, -2.007568359375, -1.72412109375, -1.440673828125, -1.1572265625, -0.873779296875, -0.59033203125, -0.306884765625, -0.0234375, 0.260009765625, 0.54345703125, 0.826904296875, 1.1103515625, 1.393798828125, 1.67724609375, 1.960693359375, 2.244140625, 2.527587890625, 2.81103515625, 3.094482421875, 3.3779296875, 3.661376953125, 3.94482421875, 4.228271484375, 4.51171875, 4.795166015625, 5.07861328125, 5.362060546875, 5.6455078125, 5.928955078125, 6.21240234375, 6.495849609375, 6.779296875, 7.062744140625, 7.34619140625, 7.629638671875, 7.9130859375, 8.196533203125, 8.47998046875, 8.763427734375, 9.046875]}, "gradients/decoder.transformer.h.13.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 5.0, 2.0, 2.0, 8.0, 6.0, 6.0, 13.0, 7.0, 7.0, 10.0, 19.0, 14.0, 16.0, 20.0, 25.0, 24.0, 29.0, 35.0, 66.0, 145.0, 275.0, 781.0, 3489.0, 21147.0, 264430.0, 2790658.0, 1045280.0, 58333.0, 7078.0, 1459.0, 400.0, 167.0, 76.0, 41.0, 32.0, 22.0, 14.0, 24.0, 19.0, 18.0, 11.0, 17.0, 15.0, 10.0, 7.0, 2.0, 8.0, 6.0, 8.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-29.03125, -28.1162109375, -27.201171875, -26.2861328125, -25.37109375, -24.4560546875, -23.541015625, -22.6259765625, -21.7109375, -20.7958984375, -19.880859375, -18.9658203125, -18.05078125, -17.1357421875, -16.220703125, -15.3056640625, -14.390625, -13.4755859375, -12.560546875, -11.6455078125, -10.73046875, -9.8154296875, -8.900390625, -7.9853515625, -7.0703125, -6.1552734375, -5.240234375, -4.3251953125, -3.41015625, -2.4951171875, -1.580078125, -0.6650390625, 0.25, 1.1650390625, 2.080078125, 2.9951171875, 3.91015625, 4.8251953125, 5.740234375, 6.6552734375, 7.5703125, 8.4853515625, 9.400390625, 10.3154296875, 11.23046875, 12.1455078125, 13.060546875, 13.9755859375, 14.890625, 15.8056640625, 16.720703125, 17.6357421875, 18.55078125, 19.4658203125, 20.380859375, 21.2958984375, 22.2109375, 23.1259765625, 24.041015625, 24.9560546875, 25.87109375, 26.7861328125, 27.701171875, 28.6162109375, 29.53125]}, "gradients/decoder.transformer.h.13.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 2.0, 4.0, 9.0, 7.0, 13.0, 13.0, 23.0, 33.0, 48.0, 58.0, 59.0, 68.0, 113.0, 137.0, 187.0, 235.0, 334.0, 374.0, 419.0, 389.0, 377.0, 276.0, 230.0, 174.0, 128.0, 86.0, 61.0, 51.0, 42.0, 32.0, 25.0, 18.0, 13.0, 10.0, 7.0, 3.0, 5.0, 6.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.3125, -18.723388671875, -18.13427734375, -17.545166015625, -16.9560546875, -16.366943359375, -15.77783203125, -15.188720703125, -14.599609375, -14.010498046875, -13.42138671875, -12.832275390625, -12.2431640625, -11.654052734375, -11.06494140625, -10.475830078125, -9.88671875, -9.297607421875, -8.70849609375, -8.119384765625, -7.5302734375, -6.941162109375, -6.35205078125, -5.762939453125, -5.173828125, -4.584716796875, -3.99560546875, -3.406494140625, -2.8173828125, -2.228271484375, -1.63916015625, -1.050048828125, -0.4609375, 0.128173828125, 0.71728515625, 1.306396484375, 1.8955078125, 2.484619140625, 3.07373046875, 3.662841796875, 4.251953125, 4.841064453125, 5.43017578125, 6.019287109375, 6.6083984375, 7.197509765625, 7.78662109375, 8.375732421875, 8.96484375, 9.553955078125, 10.14306640625, 10.732177734375, 11.3212890625, 11.910400390625, 12.49951171875, 13.088623046875, 13.677734375, 14.266845703125, 14.85595703125, 15.445068359375, 16.0341796875, 16.623291015625, 17.21240234375, 17.801513671875, 18.390625]}, "gradients/decoder.transformer.h.13.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 2.0, 3.0, 7.0, 7.0, 11.0, 16.0, 17.0, 18.0, 23.0, 30.0, 48.0, 58.0, 68.0, 83.0, 128.0, 158.0, 215.0, 338.0, 588.0, 2523.0, 50452.0, 3441446.0, 684614.0, 10741.0, 1131.0, 421.0, 250.0, 194.0, 142.0, 109.0, 104.0, 93.0, 57.0, 54.0, 31.0, 19.0, 29.0, 23.0, 4.0, 9.0, 4.0, 9.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-64.9375, -62.828125, -60.71875, -58.609375, -56.5, -54.390625, -52.28125, -50.171875, -48.0625, -45.953125, -43.84375, -41.734375, -39.625, -37.515625, -35.40625, -33.296875, -31.1875, -29.078125, -26.96875, -24.859375, -22.75, -20.640625, -18.53125, -16.421875, -14.3125, -12.203125, -10.09375, -7.984375, -5.875, -3.765625, -1.65625, 0.453125, 2.5625, 4.671875, 6.78125, 8.890625, 11.0, 13.109375, 15.21875, 17.328125, 19.4375, 21.546875, 23.65625, 25.765625, 27.875, 29.984375, 32.09375, 34.203125, 36.3125, 38.421875, 40.53125, 42.640625, 44.75, 46.859375, 48.96875, 51.078125, 53.1875, 55.296875, 57.40625, 59.515625, 61.625, 63.734375, 65.84375, 67.953125, 70.0625]}, "gradients/decoder.transformer.h.13.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 15.0, 31.0, 64.0, 116.0, 185.0, 207.0, 180.0, 104.0, 63.0, 30.0, 10.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-193.2103271484375, -187.75582885742188, -182.30133056640625, -176.84681701660156, -171.39231872558594, -165.9378204345703, -160.48330688476562, -155.02880859375, -149.57431030273438, -144.11981201171875, -138.66531372070312, -133.21080017089844, -127.75630187988281, -122.30180358886719, -116.84729766845703, -111.39279174804688, -105.93829345703125, -100.48379516601562, -95.02928924560547, -89.57478332519531, -84.12028503417969, -78.66578674316406, -73.2112808227539, -67.75677490234375, -62.302276611328125, -56.847774505615234, -51.393272399902344, -45.93877029418945, -40.48426818847656, -35.02976608276367, -29.57526397705078, -24.12076187133789, -18.666275024414062, -13.211772918701172, -7.757270812988281, -2.3027687072753906, 3.1517333984375, 8.60623550415039, 14.060737609863281, 19.515239715576172, 24.969741821289062, 30.424243927001953, 35.878746032714844, 41.333248138427734, 46.787750244140625, 52.242252349853516, 57.696754455566406, 63.1512565612793, 68.60575866699219, 74.06025695800781, 79.51476287841797, 84.96926879882812, 90.42376708984375, 95.87826538085938, 101.33277130126953, 106.78727722167969, 112.24177551269531, 117.69627380371094, 123.1507797241211, 128.60528564453125, 134.05978393554688, 139.5142822265625, 144.96878051757812, 150.4232940673828, 155.87779235839844]}, "gradients/decoder.transformer.h.13.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 3.0, 2.0, 4.0, 5.0, 6.0, 7.0, 12.0, 10.0, 3.0, 14.0, 12.0, 20.0, 14.0, 26.0, 20.0, 34.0, 26.0, 28.0, 36.0, 42.0, 44.0, 47.0, 33.0, 35.0, 35.0, 41.0, 49.0, 36.0, 30.0, 33.0, 33.0, 27.0, 37.0, 37.0, 29.0, 17.0, 20.0, 16.0, 16.0, 18.0, 13.0, 11.0, 11.0, 6.0, 0.0, 4.0, 1.0, 6.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-71.32232666015625, -69.15310668945312, -66.98388671875, -64.81466674804688, -62.64544677734375, -60.476226806640625, -58.307003021240234, -56.13778305053711, -53.968563079833984, -51.79934310913086, -49.630123138427734, -47.46090316772461, -45.29167938232422, -43.122459411621094, -40.95323944091797, -38.784019470214844, -36.61479949951172, -34.445579528808594, -32.27635955810547, -30.10713768005371, -27.937917709350586, -25.76869773864746, -23.599475860595703, -21.430255889892578, -19.261035919189453, -17.091815948486328, -14.922595024108887, -12.753374099731445, -10.58415412902832, -8.414934158325195, -6.245713233947754, -4.0764923095703125, -1.9072723388671875, 0.2619481086730957, 2.431168556213379, 4.600389003753662, 6.769609451293945, 8.93882942199707, 11.108050346374512, 13.277271270751953, 15.446491241455078, 17.615711212158203, 19.784931182861328, 21.954153060913086, 24.12337303161621, 26.292593002319336, 28.461814880371094, 30.63103485107422, 32.800254821777344, 34.96947479248047, 37.138694763183594, 39.30791473388672, 41.477134704589844, 43.64635467529297, 45.81557846069336, 47.984798431396484, 50.15401840209961, 52.323238372802734, 54.49245834350586, 56.661678314208984, 58.830902099609375, 61.0001220703125, 63.169342041015625, 65.33856201171875, 67.50778198242188]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 10.0, 12.0, 10.0, 18.0, 20.0, 14.0, 23.0, 26.0, 29.0, 33.0, 34.0, 44.0, 53.0, 35.0, 37.0, 37.0, 35.0, 30.0, 39.0, 44.0, 39.0, 49.0, 36.0, 26.0, 31.0, 27.0, 32.0, 30.0, 18.0, 13.0, 16.0, 21.0, 17.0, 10.0, 5.0, 9.0, 7.0, 8.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.4453125, -8.1480712890625, -7.850830078125, -7.5535888671875, -7.25634765625, -6.9591064453125, -6.661865234375, -6.3646240234375, -6.0673828125, -5.7701416015625, -5.472900390625, -5.1756591796875, -4.87841796875, -4.5811767578125, -4.283935546875, -3.9866943359375, -3.689453125, -3.3922119140625, -3.094970703125, -2.7977294921875, -2.50048828125, -2.2032470703125, -1.906005859375, -1.6087646484375, -1.3115234375, -1.0142822265625, -0.717041015625, -0.4197998046875, -0.12255859375, 0.1746826171875, 0.471923828125, 0.7691650390625, 1.06640625, 1.3636474609375, 1.660888671875, 1.9581298828125, 2.25537109375, 2.5526123046875, 2.849853515625, 3.1470947265625, 3.4443359375, 3.7415771484375, 4.038818359375, 4.3360595703125, 4.63330078125, 4.9305419921875, 5.227783203125, 5.5250244140625, 5.822265625, 6.1195068359375, 6.416748046875, 6.7139892578125, 7.01123046875, 7.3084716796875, 7.605712890625, 7.9029541015625, 8.2001953125, 8.4974365234375, 8.794677734375, 9.0919189453125, 9.38916015625, 9.6864013671875, 9.983642578125, 10.2808837890625, 10.578125]}, "gradients/decoder.transformer.h.13.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 5.0, 5.0, 8.0, 4.0, 11.0, 16.0, 18.0, 35.0, 64.0, 96.0, 142.0, 253.0, 420.0, 652.0, 1136.0, 1964.0, 3391.0, 5929.0, 10503.0, 18932.0, 34967.0, 63022.0, 113498.0, 189250.0, 229557.0, 164039.0, 93874.0, 51790.0, 28792.0, 15648.0, 8591.0, 5027.0, 2752.0, 1657.0, 971.0, 624.0, 356.0, 211.0, 140.0, 82.0, 43.0, 35.0, 22.0, 14.0, 7.0, 5.0, 5.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.16796875, -1.1329345703125, -1.097900390625, -1.0628662109375, -1.02783203125, -0.9927978515625, -0.957763671875, -0.9227294921875, -0.8876953125, -0.8526611328125, -0.817626953125, -0.7825927734375, -0.74755859375, -0.7125244140625, -0.677490234375, -0.6424560546875, -0.607421875, -0.5723876953125, -0.537353515625, -0.5023193359375, -0.46728515625, -0.4322509765625, -0.397216796875, -0.3621826171875, -0.3271484375, -0.2921142578125, -0.257080078125, -0.2220458984375, -0.18701171875, -0.1519775390625, -0.116943359375, -0.0819091796875, -0.046875, -0.0118408203125, 0.023193359375, 0.0582275390625, 0.09326171875, 0.1282958984375, 0.163330078125, 0.1983642578125, 0.2333984375, 0.2684326171875, 0.303466796875, 0.3385009765625, 0.37353515625, 0.4085693359375, 0.443603515625, 0.4786376953125, 0.513671875, 0.5487060546875, 0.583740234375, 0.6187744140625, 0.65380859375, 0.6888427734375, 0.723876953125, 0.7589111328125, 0.7939453125, 0.8289794921875, 0.864013671875, 0.8990478515625, 0.93408203125, 0.9691162109375, 1.004150390625, 1.0391845703125, 1.07421875]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 6.0, 0.0, 4.0, 1.0, 5.0, 5.0, 11.0, 8.0, 9.0, 15.0, 14.0, 18.0, 23.0, 19.0, 26.0, 25.0, 23.0, 36.0, 31.0, 45.0, 25.0, 42.0, 42.0, 43.0, 1070.0, 42.0, 29.0, 33.0, 53.0, 43.0, 34.0, 27.0, 25.0, 26.0, 32.0, 21.0, 12.0, 16.0, 13.0, 16.0, 17.0, 9.0, 3.0, 6.0, 10.0, 8.0, 5.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.734375, -5.54803466796875, -5.3616943359375, -5.17535400390625, -4.989013671875, -4.80267333984375, -4.6163330078125, -4.42999267578125, -4.24365234375, -4.05731201171875, -3.8709716796875, -3.68463134765625, -3.498291015625, -3.31195068359375, -3.1256103515625, -2.93927001953125, -2.7529296875, -2.56658935546875, -2.3802490234375, -2.19390869140625, -2.007568359375, -1.82122802734375, -1.6348876953125, -1.44854736328125, -1.26220703125, -1.07586669921875, -0.8895263671875, -0.70318603515625, -0.516845703125, -0.33050537109375, -0.1441650390625, 0.04217529296875, 0.228515625, 0.41485595703125, 0.6011962890625, 0.78753662109375, 0.973876953125, 1.16021728515625, 1.3465576171875, 1.53289794921875, 1.71923828125, 1.90557861328125, 2.0919189453125, 2.27825927734375, 2.464599609375, 2.65093994140625, 2.8372802734375, 3.02362060546875, 3.2099609375, 3.39630126953125, 3.5826416015625, 3.76898193359375, 3.955322265625, 4.14166259765625, 4.3280029296875, 4.51434326171875, 4.70068359375, 4.88702392578125, 5.0733642578125, 5.25970458984375, 5.446044921875, 5.63238525390625, 5.8187255859375, 6.00506591796875, 6.19140625]}, "gradients/decoder.transformer.h.13.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 3.0, 3.0, 8.0, 13.0, 21.0, 29.0, 45.0, 55.0, 88.0, 138.0, 178.0, 297.0, 475.0, 674.0, 1118.0, 1674.0, 2638.0, 4137.0, 6425.0, 10188.0, 16468.0, 25674.0, 41313.0, 64570.0, 99300.0, 142540.0, 1218778.0, 152835.0, 109563.0, 72208.0, 46393.0, 29048.0, 18422.0, 11516.0, 7384.0, 4593.0, 2950.0, 1881.0, 1182.0, 823.0, 482.0, 336.0, 231.0, 171.0, 115.0, 58.0, 39.0, 16.0, 19.0, 13.0, 6.0, 2.0, 2.0, 5.0, 3.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.630859375, -0.610260009765625, -0.58966064453125, -0.569061279296875, -0.5484619140625, -0.527862548828125, -0.50726318359375, -0.486663818359375, -0.466064453125, -0.445465087890625, -0.42486572265625, -0.404266357421875, -0.3836669921875, -0.363067626953125, -0.34246826171875, -0.321868896484375, -0.30126953125, -0.280670166015625, -0.26007080078125, -0.239471435546875, -0.2188720703125, -0.198272705078125, -0.17767333984375, -0.157073974609375, -0.136474609375, -0.115875244140625, -0.09527587890625, -0.074676513671875, -0.0540771484375, -0.033477783203125, -0.01287841796875, 0.007720947265625, 0.0283203125, 0.048919677734375, 0.06951904296875, 0.090118408203125, 0.1107177734375, 0.131317138671875, 0.15191650390625, 0.172515869140625, 0.193115234375, 0.213714599609375, 0.23431396484375, 0.254913330078125, 0.2755126953125, 0.296112060546875, 0.31671142578125, 0.337310791015625, 0.35791015625, 0.378509521484375, 0.39910888671875, 0.419708251953125, 0.4403076171875, 0.460906982421875, 0.48150634765625, 0.502105712890625, 0.522705078125, 0.543304443359375, 0.56390380859375, 0.584503173828125, 0.6051025390625, 0.625701904296875, 0.64630126953125, 0.666900634765625, 0.6875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.bias": {"_type": "histogram", "values": [3.0, 1.0, 1.0, 3.0, 0.0, 1.0, 7.0, 0.0, 3.0, 6.0, 7.0, 6.0, 11.0, 12.0, 12.0, 18.0, 15.0, 20.0, 22.0, 29.0, 29.0, 39.0, 39.0, 51.0, 52.0, 54.0, 59.0, 49.0, 57.0, 44.0, 44.0, 40.0, 42.0, 34.0, 38.0, 39.0, 26.0, 12.0, 13.0, 20.0, 17.0, 10.0, 4.0, 5.0, 6.0, 4.0, 5.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005443572998046875, -0.005242288112640381, -0.005041003227233887, -0.004839718341827393, -0.0046384334564208984, -0.004437148571014404, -0.00423586368560791, -0.004034578800201416, -0.003833293914794922, -0.0036320090293884277, -0.0034307241439819336, -0.0032294392585754395, -0.0030281543731689453, -0.002826869487762451, -0.002625584602355957, -0.002424299716949463, -0.0022230148315429688, -0.0020217299461364746, -0.0018204450607299805, -0.0016191601753234863, -0.0014178752899169922, -0.001216590404510498, -0.001015305519104004, -0.0008140206336975098, -0.0006127357482910156, -0.0004114508628845215, -0.00021016597747802734, -8.881092071533203e-06, 0.00019240379333496094, 0.0003936886787414551, 0.0005949735641479492, 0.0007962584495544434, 0.0009975433349609375, 0.0011988282203674316, 0.0014001131057739258, 0.00160139799118042, 0.001802682876586914, 0.002003967761993408, 0.0022052526473999023, 0.0024065375328063965, 0.0026078224182128906, 0.0028091073036193848, 0.003010392189025879, 0.003211677074432373, 0.003412961959838867, 0.0036142468452453613, 0.0038155317306518555, 0.00401681661605835, 0.004218101501464844, 0.004419386386871338, 0.004620671272277832, 0.004821956157684326, 0.00502324104309082, 0.0052245259284973145, 0.005425810813903809, 0.005627095699310303, 0.005828380584716797, 0.006029665470123291, 0.006230950355529785, 0.006432235240936279, 0.0066335201263427734, 0.006834805011749268, 0.007036089897155762, 0.007237374782562256, 0.00743865966796875]}, "gradients/decoder.transformer.h.13.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 5.0, 5.0, 2.0, 4.0, 9.0, 13.0, 19.0, 22.0, 21.0, 32.0, 30.0, 49.0, 55.0, 74.0, 97.0, 209.0, 367.0, 1504.0, 294693.0, 747935.0, 2343.0, 432.0, 202.0, 116.0, 71.0, 50.0, 41.0, 31.0, 26.0, 19.0, 18.0, 12.0, 10.0, 10.0, 5.0, 4.0, 5.0, 3.0, 3.0, 4.0, 4.0, 1.0, 1.0, 3.0, 1.0], "bins": [-0.1866455078125, -0.18174362182617188, -0.17684173583984375, -0.17193984985351562, -0.1670379638671875, -0.16213607788085938, -0.15723419189453125, -0.15233230590820312, -0.147430419921875, -0.14252853393554688, -0.13762664794921875, -0.13272476196289062, -0.1278228759765625, -0.12292098999023438, -0.11801910400390625, -0.11311721801757812, -0.10821533203125, -0.10331344604492188, -0.09841156005859375, -0.09350967407226562, -0.0886077880859375, -0.08370590209960938, -0.07880401611328125, -0.07390213012695312, -0.069000244140625, -0.06409835815429688, -0.05919647216796875, -0.054294586181640625, -0.0493927001953125, -0.044490814208984375, -0.03958892822265625, -0.034687042236328125, -0.02978515625, -0.024883270263671875, -0.01998138427734375, -0.015079498291015625, -0.0101776123046875, -0.005275726318359375, -0.00037384033203125, 0.004528045654296875, 0.009429931640625, 0.014331817626953125, 0.01923370361328125, 0.024135589599609375, 0.0290374755859375, 0.033939361572265625, 0.03884124755859375, 0.043743133544921875, 0.04864501953125, 0.053546905517578125, 0.05844879150390625, 0.06335067749023438, 0.0682525634765625, 0.07315444946289062, 0.07805633544921875, 0.08295822143554688, 0.087860107421875, 0.09276199340820312, 0.09766387939453125, 0.10256576538085938, 0.1074676513671875, 0.11236953735351562, 0.11727142333984375, 0.12217330932617188, 0.1270751953125]}, "gradients/decoder.transformer.h.13.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 4.0, 9.0, 8.0, 19.0, 13.0, 23.0, 32.0, 58.0, 76.0, 87.0, 113.0, 102.0, 94.0, 102.0, 60.0, 62.0, 46.0, 28.0, 23.0, 10.0, 12.0, 7.0, 5.0, 4.0, 2.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006243600510060787, -0.006086657755076885, -0.005929714534431696, -0.005772771779447794, -0.005615829024463892, -0.00545888626947999, -0.005301943048834801, -0.005145000293850899, -0.004988057538866997, -0.004831114783883095, -0.0046741715632379055, -0.0045172288082540035, -0.0043602860532701015, -0.0042033432982862, -0.00404640007764101, -0.0038894573226571083, -0.0037325143348425627, -0.003575571347028017, -0.003418628592044115, -0.0032616856042295694, -0.0031047428492456675, -0.002947799861431122, -0.00279085710644722, -0.0026339141186326742, -0.0024769711308181286, -0.002320028143003583, -0.002163085388019681, -0.0020061424002051353, -0.0018491996452212334, -0.0016922566574066877, -0.001535313786007464, -0.0013783709146082401, -0.0012214283924549818, -0.001064485521055758, -0.0009075426496565342, -0.0007505997200496495, -0.0005936568486504257, -0.00043671397725120187, -0.00027977104764431715, -0.00012282817624509335, 3.411469515413046e-05, 0.0001910575811052695, 0.0003480004670564085, 0.0005049433675594628, 0.0006618862389586866, 0.0008188291103579104, 0.0009757720399647951, 0.001132714911364019, 0.0012896577827632427, 0.0014466006541624665, 0.0016035435255616903, 0.001760486513376236, 0.001917429268360138, 0.0020743722561746836, 0.002231315243989229, 0.002388257998973131, 0.002545200753957033, 0.002702143741771579, 0.0028590864967554808, 0.0030160294845700264, 0.0031729722395539284, 0.003329915227368474, 0.0034868582151830196, 0.0036438009701669216, 0.0038007439579814672]}, "gradients/decoder.transformer.h.13.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 7.0, 6.0, 6.0, 6.0, 14.0, 6.0, 12.0, 21.0, 20.0, 18.0, 31.0, 29.0, 30.0, 33.0, 36.0, 27.0, 40.0, 34.0, 45.0, 39.0, 44.0, 35.0, 43.0, 50.0, 31.0, 41.0, 42.0, 36.0, 25.0, 32.0, 27.0, 25.0, 23.0, 18.0, 5.0, 15.0, 8.0, 9.0, 10.0, 5.0, 5.0, 5.0, 4.0, 1.0, 0.0, 3.0, 2.0, 0.0, 2.0, 3.0], "bins": [-0.004159212112426758, -0.00403998326510191, -0.0039207544177770615, -0.0038015255704522133, -0.003682296723127365, -0.003563067875802517, -0.0034438390284776688, -0.0033246101811528206, -0.0032053813338279724, -0.0030861524865031242, -0.002966923639178276, -0.002847694791853428, -0.0027284659445285797, -0.0026092370972037315, -0.0024900082498788834, -0.002370779402554035, -0.002251550555229187, -0.002132321707904339, -0.0020130928605794907, -0.0018938640132546425, -0.0017746351659297943, -0.0016554063186049461, -0.001536177471280098, -0.0014169486239552498, -0.0012977197766304016, -0.0011784909293055534, -0.0010592620819807053, -0.0009400332346558571, -0.0008208043873310089, -0.0007015755400061607, -0.0005823466926813126, -0.0004631178453564644, -0.0003438889980316162, -0.00022466015070676804, -0.00010543130338191986, 1.3797543942928314e-05, 0.0001330263912677765, 0.00025225523859262466, 0.00037148408591747284, 0.000490712933242321, 0.0006099417805671692, 0.0007291706278920174, 0.0008483994752168655, 0.0009676283225417137, 0.0010868571698665619, 0.00120608601719141, 0.0013253148645162582, 0.0014445437118411064, 0.0015637725591659546, 0.0016830014064908028, 0.001802230253815651, 0.0019214591011404991, 0.0020406879484653473, 0.0021599167957901955, 0.0022791456431150436, 0.002398374490439892, 0.00251760333776474, 0.002636832185089588, 0.0027560610324144363, 0.0028752898797392845, 0.0029945187270641327, 0.003113747574388981, 0.003232976421713829, 0.003352205269038677, 0.0034714341163635254]}, "gradients/decoder.transformer.h.13.attn.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 10.0, 12.0, 10.0, 18.0, 20.0, 14.0, 24.0, 25.0, 29.0, 33.0, 34.0, 44.0, 53.0, 35.0, 37.0, 37.0, 35.0, 30.0, 39.0, 44.0, 39.0, 49.0, 36.0, 26.0, 31.0, 27.0, 32.0, 30.0, 18.0, 13.0, 16.0, 21.0, 17.0, 10.0, 5.0, 9.0, 7.0, 8.0, 1.0, 4.0, 4.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.4453125, -8.1480712890625, -7.850830078125, -7.5535888671875, -7.25634765625, -6.9591064453125, -6.661865234375, -6.3646240234375, -6.0673828125, -5.7701416015625, -5.472900390625, -5.1756591796875, -4.87841796875, -4.5811767578125, -4.283935546875, -3.9866943359375, -3.689453125, -3.3922119140625, -3.094970703125, -2.7977294921875, -2.50048828125, -2.2032470703125, -1.906005859375, -1.6087646484375, -1.3115234375, -1.0142822265625, -0.717041015625, -0.4197998046875, -0.12255859375, 0.1746826171875, 0.471923828125, 0.7691650390625, 1.06640625, 1.3636474609375, 1.660888671875, 1.9581298828125, 2.25537109375, 2.5526123046875, 2.849853515625, 3.1470947265625, 3.4443359375, 3.7415771484375, 4.038818359375, 4.3360595703125, 4.63330078125, 4.9305419921875, 5.227783203125, 5.5250244140625, 5.822265625, 6.1195068359375, 6.416748046875, 6.7139892578125, 7.01123046875, 7.3084716796875, 7.605712890625, 7.9029541015625, 8.2001953125, 8.4974365234375, 8.794677734375, 9.0919189453125, 9.38916015625, 9.6864013671875, 9.983642578125, 10.2808837890625, 10.578125]}, "gradients/decoder.transformer.h.13.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 4.0, 1.0, 2.0, 7.0, 9.0, 9.0, 15.0, 18.0, 37.0, 43.0, 66.0, 82.0, 135.0, 186.0, 325.0, 506.0, 710.0, 1117.0, 1903.0, 3032.0, 5013.0, 8690.0, 16196.0, 32838.0, 77556.0, 210283.0, 384809.0, 175671.0, 65811.0, 28816.0, 14570.0, 7926.0, 4599.0, 2783.0, 1725.0, 1020.0, 703.0, 452.0, 306.0, 208.0, 106.0, 87.0, 58.0, 37.0, 25.0, 22.0, 15.0, 9.0, 5.0, 5.0, 6.0, 3.0, 3.0, 1.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.953125, -5.75738525390625, -5.5616455078125, -5.36590576171875, -5.170166015625, -4.97442626953125, -4.7786865234375, -4.58294677734375, -4.38720703125, -4.19146728515625, -3.9957275390625, -3.79998779296875, -3.604248046875, -3.40850830078125, -3.2127685546875, -3.01702880859375, -2.8212890625, -2.62554931640625, -2.4298095703125, -2.23406982421875, -2.038330078125, -1.84259033203125, -1.6468505859375, -1.45111083984375, -1.25537109375, -1.05963134765625, -0.8638916015625, -0.66815185546875, -0.472412109375, -0.27667236328125, -0.0809326171875, 0.11480712890625, 0.310546875, 0.50628662109375, 0.7020263671875, 0.89776611328125, 1.093505859375, 1.28924560546875, 1.4849853515625, 1.68072509765625, 1.87646484375, 2.07220458984375, 2.2679443359375, 2.46368408203125, 2.659423828125, 2.85516357421875, 3.0509033203125, 3.24664306640625, 3.4423828125, 3.63812255859375, 3.8338623046875, 4.02960205078125, 4.225341796875, 4.42108154296875, 4.6168212890625, 4.81256103515625, 5.00830078125, 5.20404052734375, 5.3997802734375, 5.59552001953125, 5.791259765625, 5.98699951171875, 6.1827392578125, 6.37847900390625, 6.57421875]}, "gradients/decoder.transformer.h.13.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 4.0, 3.0, 3.0, 4.0, 6.0, 6.0, 11.0, 11.0, 13.0, 13.0, 14.0, 18.0, 20.0, 26.0, 28.0, 43.0, 37.0, 31.0, 38.0, 47.0, 68.0, 91.0, 252.0, 1627.0, 138.0, 71.0, 64.0, 43.0, 50.0, 34.0, 42.0, 40.0, 25.0, 26.0, 16.0, 15.0, 20.0, 15.0, 9.0, 4.0, 5.0, 6.0, 6.0, 4.0, 5.0, 0.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-32.96875, -31.94677734375, -30.9248046875, -29.90283203125, -28.880859375, -27.85888671875, -26.8369140625, -25.81494140625, -24.79296875, -23.77099609375, -22.7490234375, -21.72705078125, -20.705078125, -19.68310546875, -18.6611328125, -17.63916015625, -16.6171875, -15.59521484375, -14.5732421875, -13.55126953125, -12.529296875, -11.50732421875, -10.4853515625, -9.46337890625, -8.44140625, -7.41943359375, -6.3974609375, -5.37548828125, -4.353515625, -3.33154296875, -2.3095703125, -1.28759765625, -0.265625, 0.75634765625, 1.7783203125, 2.80029296875, 3.822265625, 4.84423828125, 5.8662109375, 6.88818359375, 7.91015625, 8.93212890625, 9.9541015625, 10.97607421875, 11.998046875, 13.02001953125, 14.0419921875, 15.06396484375, 16.0859375, 17.10791015625, 18.1298828125, 19.15185546875, 20.173828125, 21.19580078125, 22.2177734375, 23.23974609375, 24.26171875, 25.28369140625, 26.3056640625, 27.32763671875, 28.349609375, 29.37158203125, 30.3935546875, 31.41552734375, 32.4375]}, "gradients/decoder.transformer.h.13.attn.c_attn.weight": {"_type": "histogram", "values": [3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 4.0, 10.0, 16.0, 20.0, 19.0, 32.0, 49.0, 60.0, 98.0, 131.0, 184.0, 282.0, 427.0, 1203.0, 76820.0, 3060961.0, 3770.0, 543.0, 299.0, 223.0, 166.0, 104.0, 75.0, 50.0, 44.0, 32.0, 18.0, 19.0, 11.0, 9.0, 3.0, 6.0, 1.0, 2.0, 1.0, 6.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.125, -66.96875, -63.8125, -60.65625, -57.5, -54.34375, -51.1875, -48.03125, -44.875, -41.71875, -38.5625, -35.40625, -32.25, -29.09375, -25.9375, -22.78125, -19.625, -16.46875, -13.3125, -10.15625, -7.0, -3.84375, -0.6875, 2.46875, 5.625, 8.78125, 11.9375, 15.09375, 18.25, 21.40625, 24.5625, 27.71875, 30.875, 34.03125, 37.1875, 40.34375, 43.5, 46.65625, 49.8125, 52.96875, 56.125, 59.28125, 62.4375, 65.59375, 68.75, 71.90625, 75.0625, 78.21875, 81.375, 84.53125, 87.6875, 90.84375, 94.0, 97.15625, 100.3125, 103.46875, 106.625, 109.78125, 112.9375, 116.09375, 119.25, 122.40625, 125.5625, 128.71875, 131.875]}, "gradients/decoder.transformer.h.13.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 40.0, 554.0, 411.0, 15.0, 1.0, 1.0], "bins": [-429.1835021972656, -422.0173034667969, -414.85107421875, -407.68487548828125, -400.5186767578125, -393.3524475097656, -386.1862487792969, -379.0200500488281, -371.85382080078125, -364.6876220703125, -357.5213928222656, -350.3551940917969, -343.1889953613281, -336.02276611328125, -328.8565673828125, -321.69036865234375, -314.524169921875, -307.35797119140625, -300.1917419433594, -293.0255432128906, -285.8593444824219, -278.693115234375, -271.52691650390625, -264.3607177734375, -257.1944885253906, -250.0282745361328, -242.86207580566406, -235.69586181640625, -228.52964782714844, -221.3634490966797, -214.19723510742188, -207.03103637695312, -199.86483764648438, -192.69862365722656, -185.5324249267578, -178.3662109375, -171.1999969482422, -164.03379821777344, -156.86758422851562, -149.70138549804688, -142.53515625, -135.3689422607422, -128.20274353027344, -121.03652954101562, -113.87032318115234, -106.70411682128906, -99.53790283203125, -92.37169647216797, -85.20549011230469, -78.0392837524414, -70.8730697631836, -63.70686340332031, -56.54065704345703, -49.374446868896484, -42.20823669433594, -35.042030334472656, -27.875822067260742, -20.709613800048828, -13.543404579162598, -6.377195358276367, 0.7890129089355469, 7.955221176147461, 15.121431350708008, 22.28763771057129, 29.453847885131836]}, "gradients/decoder.transformer.h.13.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 9.0, 7.0, 9.0, 6.0, 11.0, 11.0, 11.0, 15.0, 13.0, 18.0, 18.0, 27.0, 22.0, 25.0, 30.0, 31.0, 45.0, 30.0, 39.0, 35.0, 40.0, 40.0, 50.0, 33.0, 39.0, 32.0, 36.0, 47.0, 34.0, 28.0, 22.0, 19.0, 20.0, 17.0, 19.0, 19.0, 13.0, 15.0, 13.0, 5.0, 9.0, 8.0, 11.0, 5.0, 4.0, 3.0, 3.0, 7.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-80.92066192626953, -78.45547485351562, -75.99028778076172, -73.52510070800781, -71.0599136352539, -68.5947265625, -66.1295394897461, -63.66435623168945, -61.19916915893555, -58.73398208618164, -56.268795013427734, -53.80360794067383, -51.33842468261719, -48.87323760986328, -46.408050537109375, -43.94286346435547, -41.47767639160156, -39.012489318847656, -36.54730224609375, -34.082115173339844, -31.61693000793457, -29.151742935180664, -26.68655776977539, -24.221370697021484, -21.756183624267578, -19.290996551513672, -16.825809478759766, -14.360624313354492, -11.895437240600586, -9.43025016784668, -6.96506404876709, -4.4998779296875, -2.0346908569335938, 0.4304957389831543, 2.8956823348999023, 5.36086893081665, 7.826055526733398, 10.291242599487305, 12.756428718566895, 15.221614837646484, 17.68680191040039, 20.151988983154297, 22.617176055908203, 25.082361221313477, 27.547548294067383, 30.01273536682129, 32.47792053222656, 34.94310760498047, 37.408294677734375, 39.87348175048828, 42.33866882324219, 44.803855895996094, 47.26904296875, 49.734230041503906, 52.19941329956055, 54.66460037231445, 57.12978744506836, 59.594974517822266, 62.06016159057617, 64.52534484863281, 66.99053192138672, 69.45571899414062, 71.92090606689453, 74.38609313964844, 76.85128021240234]}, "gradients/decoder.transformer.h.12.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 4.0, 4.0, 8.0, 7.0, 6.0, 10.0, 13.0, 19.0, 11.0, 18.0, 23.0, 25.0, 28.0, 28.0, 32.0, 34.0, 47.0, 39.0, 42.0, 48.0, 36.0, 36.0, 38.0, 42.0, 49.0, 33.0, 37.0, 28.0, 36.0, 33.0, 27.0, 29.0, 22.0, 16.0, 19.0, 19.0, 13.0, 9.0, 9.0, 9.0, 7.0, 6.0, 2.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-8.9765625, -8.664306640625, -8.35205078125, -8.039794921875, -7.7275390625, -7.415283203125, -7.10302734375, -6.790771484375, -6.478515625, -6.166259765625, -5.85400390625, -5.541748046875, -5.2294921875, -4.917236328125, -4.60498046875, -4.292724609375, -3.98046875, -3.668212890625, -3.35595703125, -3.043701171875, -2.7314453125, -2.419189453125, -2.10693359375, -1.794677734375, -1.482421875, -1.170166015625, -0.85791015625, -0.545654296875, -0.2333984375, 0.078857421875, 0.39111328125, 0.703369140625, 1.015625, 1.327880859375, 1.64013671875, 1.952392578125, 2.2646484375, 2.576904296875, 2.88916015625, 3.201416015625, 3.513671875, 3.825927734375, 4.13818359375, 4.450439453125, 4.7626953125, 5.074951171875, 5.38720703125, 5.699462890625, 6.01171875, 6.323974609375, 6.63623046875, 6.948486328125, 7.2607421875, 7.572998046875, 7.88525390625, 8.197509765625, 8.509765625, 8.822021484375, 9.13427734375, 9.446533203125, 9.7587890625, 10.071044921875, 10.38330078125, 10.695556640625, 11.0078125]}, "gradients/decoder.transformer.h.12.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 4.0, 4.0, 6.0, 4.0, 7.0, 9.0, 7.0, 19.0, 8.0, 21.0, 23.0, 23.0, 48.0, 48.0, 81.0, 126.0, 277.0, 648.0, 2085.0, 9355.0, 68109.0, 840155.0, 2696558.0, 522397.0, 44947.0, 6701.0, 1485.0, 511.0, 207.0, 119.0, 79.0, 54.0, 46.0, 14.0, 22.0, 14.0, 13.0, 11.0, 13.0, 8.0, 8.0, 6.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.40625, -21.644287109375, -20.88232421875, -20.120361328125, -19.3583984375, -18.596435546875, -17.83447265625, -17.072509765625, -16.310546875, -15.548583984375, -14.78662109375, -14.024658203125, -13.2626953125, -12.500732421875, -11.73876953125, -10.976806640625, -10.21484375, -9.452880859375, -8.69091796875, -7.928955078125, -7.1669921875, -6.405029296875, -5.64306640625, -4.881103515625, -4.119140625, -3.357177734375, -2.59521484375, -1.833251953125, -1.0712890625, -0.309326171875, 0.45263671875, 1.214599609375, 1.9765625, 2.738525390625, 3.50048828125, 4.262451171875, 5.0244140625, 5.786376953125, 6.54833984375, 7.310302734375, 8.072265625, 8.834228515625, 9.59619140625, 10.358154296875, 11.1201171875, 11.882080078125, 12.64404296875, 13.406005859375, 14.16796875, 14.929931640625, 15.69189453125, 16.453857421875, 17.2158203125, 17.977783203125, 18.73974609375, 19.501708984375, 20.263671875, 21.025634765625, 21.78759765625, 22.549560546875, 23.3115234375, 24.073486328125, 24.83544921875, 25.597412109375, 26.359375]}, "gradients/decoder.transformer.h.12.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 2.0, 3.0, 4.0, 1.0, 4.0, 10.0, 9.0, 8.0, 15.0, 17.0, 29.0, 31.0, 47.0, 56.0, 79.0, 96.0, 128.0, 167.0, 266.0, 349.0, 443.0, 512.0, 442.0, 356.0, 274.0, 206.0, 135.0, 106.0, 80.0, 51.0, 40.0, 29.0, 27.0, 18.0, 10.0, 11.0, 7.0, 4.0, 4.0, 4.0, 1.0, 4.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-22.65625, -22.0205078125, -21.384765625, -20.7490234375, -20.11328125, -19.4775390625, -18.841796875, -18.2060546875, -17.5703125, -16.9345703125, -16.298828125, -15.6630859375, -15.02734375, -14.3916015625, -13.755859375, -13.1201171875, -12.484375, -11.8486328125, -11.212890625, -10.5771484375, -9.94140625, -9.3056640625, -8.669921875, -8.0341796875, -7.3984375, -6.7626953125, -6.126953125, -5.4912109375, -4.85546875, -4.2197265625, -3.583984375, -2.9482421875, -2.3125, -1.6767578125, -1.041015625, -0.4052734375, 0.23046875, 0.8662109375, 1.501953125, 2.1376953125, 2.7734375, 3.4091796875, 4.044921875, 4.6806640625, 5.31640625, 5.9521484375, 6.587890625, 7.2236328125, 7.859375, 8.4951171875, 9.130859375, 9.7666015625, 10.40234375, 11.0380859375, 11.673828125, 12.3095703125, 12.9453125, 13.5810546875, 14.216796875, 14.8525390625, 15.48828125, 16.1240234375, 16.759765625, 17.3955078125, 18.03125]}, "gradients/decoder.transformer.h.12.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 5.0, 4.0, 9.0, 6.0, 6.0, 13.0, 11.0, 19.0, 25.0, 20.0, 47.0, 56.0, 66.0, 77.0, 119.0, 166.0, 190.0, 303.0, 558.0, 2521.0, 146843.0, 3946246.0, 93165.0, 2105.0, 497.0, 294.0, 208.0, 175.0, 118.0, 106.0, 80.0, 59.0, 35.0, 39.0, 23.0, 16.0, 15.0, 17.0, 9.0, 6.0, 6.0, 1.0, 3.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-60.84375, -58.45361328125, -56.0634765625, -53.67333984375, -51.283203125, -48.89306640625, -46.5029296875, -44.11279296875, -41.72265625, -39.33251953125, -36.9423828125, -34.55224609375, -32.162109375, -29.77197265625, -27.3818359375, -24.99169921875, -22.6015625, -20.21142578125, -17.8212890625, -15.43115234375, -13.041015625, -10.65087890625, -8.2607421875, -5.87060546875, -3.48046875, -1.09033203125, 1.2998046875, 3.68994140625, 6.080078125, 8.47021484375, 10.8603515625, 13.25048828125, 15.640625, 18.03076171875, 20.4208984375, 22.81103515625, 25.201171875, 27.59130859375, 29.9814453125, 32.37158203125, 34.76171875, 37.15185546875, 39.5419921875, 41.93212890625, 44.322265625, 46.71240234375, 49.1025390625, 51.49267578125, 53.8828125, 56.27294921875, 58.6630859375, 61.05322265625, 63.443359375, 65.83349609375, 68.2236328125, 70.61376953125, 73.00390625, 75.39404296875, 77.7841796875, 80.17431640625, 82.564453125, 84.95458984375, 87.3447265625, 89.73486328125, 92.125]}, "gradients/decoder.transformer.h.12.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 11.0, 16.0, 32.0, 66.0, 97.0, 160.0, 180.0, 166.0, 134.0, 78.0, 39.0, 20.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-144.386962890625, -140.22299194335938, -136.05902099609375, -131.89505004882812, -127.73107147216797, -123.56710052490234, -119.40312194824219, -115.23915100097656, -111.07518005371094, -106.91120910644531, -102.74723815917969, -98.58325958251953, -94.4192886352539, -90.25531768798828, -86.09133911132812, -81.9273681640625, -77.76339721679688, -73.59942626953125, -69.43545532226562, -65.27147674560547, -61.107505798339844, -56.94353485107422, -52.77956008911133, -48.61558532714844, -44.45161437988281, -40.28764343261719, -36.1236686706543, -31.95969581604004, -27.79572296142578, -23.631750106811523, -19.467777252197266, -15.303804397583008, -11.139816284179688, -6.97584342956543, -2.811870574951172, 1.352102279663086, 5.516075134277344, 9.680047988891602, 13.84402084350586, 18.007993698120117, 22.171966552734375, 26.335939407348633, 30.49991226196289, 34.66388702392578, 38.827857971191406, 42.99182891845703, 47.15580368041992, 51.31977844238281, 55.48374938964844, 59.64772033691406, 63.81169509887695, 67.97566986083984, 72.13964080810547, 76.3036117553711, 80.46759033203125, 84.63156127929688, 88.7955322265625, 92.95950317382812, 97.12347412109375, 101.2874526977539, 105.45142364501953, 109.61539459228516, 113.77937316894531, 117.94334411621094, 122.10731506347656]}, "gradients/decoder.transformer.h.12.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 1.0, 7.0, 8.0, 10.0, 12.0, 8.0, 14.0, 22.0, 27.0, 14.0, 32.0, 31.0, 30.0, 44.0, 38.0, 39.0, 39.0, 44.0, 32.0, 41.0, 45.0, 48.0, 34.0, 40.0, 33.0, 36.0, 32.0, 36.0, 25.0, 34.0, 21.0, 26.0, 17.0, 10.0, 14.0, 12.0, 13.0, 10.0, 9.0, 4.0, 6.0, 2.0, 0.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-64.89410400390625, -62.799903869628906, -60.70570373535156, -58.61150360107422, -56.517303466796875, -54.42310333251953, -52.32890701293945, -50.23470687866211, -48.140506744384766, -46.04630661010742, -43.95210647583008, -41.857906341552734, -39.763710021972656, -37.66950988769531, -35.57530975341797, -33.481109619140625, -31.38690948486328, -29.292709350585938, -27.198509216308594, -25.104310989379883, -23.01011085510254, -20.915910720825195, -18.821712493896484, -16.72751235961914, -14.633312225341797, -12.539112091064453, -10.444912910461426, -8.350713729858398, -6.256513595581055, -4.162313461303711, -2.0681142807006836, 0.02608489990234375, 2.1202774047851562, 4.214477062225342, 6.308676719665527, 8.402875900268555, 10.497076034545898, 12.591276168823242, 14.68547534942627, 16.779674530029297, 18.87387466430664, 20.968074798583984, 23.062274932861328, 25.15647315979004, 27.250673294067383, 29.344873428344727, 31.439071655273438, 33.53327178955078, 35.627471923828125, 37.72167205810547, 39.81587219238281, 41.910072326660156, 44.0042724609375, 46.098472595214844, 48.19266891479492, 50.286869049072266, 52.38106918334961, 54.47526931762695, 56.5694694519043, 58.66366958618164, 60.75786590576172, 62.85206604003906, 64.9462661743164, 67.04046630859375, 69.1346664428711]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 9.0, 7.0, 12.0, 13.0, 11.0, 16.0, 20.0, 23.0, 22.0, 26.0, 37.0, 41.0, 35.0, 35.0, 37.0, 45.0, 50.0, 43.0, 35.0, 43.0, 36.0, 38.0, 29.0, 37.0, 39.0, 34.0, 28.0, 24.0, 23.0, 20.0, 31.0, 18.0, 15.0, 14.0, 15.0, 8.0, 3.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.2528076171875, -8.950927734375, -8.6490478515625, -8.34716796875, -8.0452880859375, -7.743408203125, -7.4415283203125, -7.1396484375, -6.8377685546875, -6.535888671875, -6.2340087890625, -5.93212890625, -5.6302490234375, -5.328369140625, -5.0264892578125, -4.724609375, -4.4227294921875, -4.120849609375, -3.8189697265625, -3.51708984375, -3.2152099609375, -2.913330078125, -2.6114501953125, -2.3095703125, -2.0076904296875, -1.705810546875, -1.4039306640625, -1.10205078125, -0.8001708984375, -0.498291015625, -0.1964111328125, 0.10546875, 0.4073486328125, 0.709228515625, 1.0111083984375, 1.31298828125, 1.6148681640625, 1.916748046875, 2.2186279296875, 2.5205078125, 2.8223876953125, 3.124267578125, 3.4261474609375, 3.72802734375, 4.0299072265625, 4.331787109375, 4.6336669921875, 4.935546875, 5.2374267578125, 5.539306640625, 5.8411865234375, 6.14306640625, 6.4449462890625, 6.746826171875, 7.0487060546875, 7.3505859375, 7.6524658203125, 7.954345703125, 8.2562255859375, 8.55810546875, 8.8599853515625, 9.161865234375, 9.4637451171875, 9.765625]}, "gradients/decoder.transformer.h.12.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 2.0, 4.0, 0.0, 3.0, 3.0, 4.0, 8.0, 12.0, 14.0, 23.0, 27.0, 53.0, 88.0, 112.0, 172.0, 251.0, 395.0, 570.0, 942.0, 1540.0, 2333.0, 3672.0, 6208.0, 10079.0, 17286.0, 29915.0, 51632.0, 88926.0, 147179.0, 206991.0, 187122.0, 120599.0, 71579.0, 41194.0, 23848.0, 13961.0, 8287.0, 5059.0, 3092.0, 1918.0, 1234.0, 753.0, 498.0, 355.0, 211.0, 129.0, 90.0, 60.0, 42.0, 17.0, 21.0, 18.0, 11.0, 8.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0], "bins": [-1.0654296875, -1.0329437255859375, -1.000457763671875, -0.9679718017578125, -0.93548583984375, -0.9029998779296875, -0.870513916015625, -0.8380279541015625, -0.8055419921875, -0.7730560302734375, -0.740570068359375, -0.7080841064453125, -0.67559814453125, -0.6431121826171875, -0.610626220703125, -0.5781402587890625, -0.545654296875, -0.5131683349609375, -0.480682373046875, -0.4481964111328125, -0.41571044921875, -0.3832244873046875, -0.350738525390625, -0.3182525634765625, -0.2857666015625, -0.2532806396484375, -0.220794677734375, -0.1883087158203125, -0.15582275390625, -0.1233367919921875, -0.090850830078125, -0.0583648681640625, -0.02587890625, 0.0066070556640625, 0.039093017578125, 0.0715789794921875, 0.10406494140625, 0.1365509033203125, 0.169036865234375, 0.2015228271484375, 0.2340087890625, 0.2664947509765625, 0.298980712890625, 0.3314666748046875, 0.36395263671875, 0.3964385986328125, 0.428924560546875, 0.4614105224609375, 0.493896484375, 0.5263824462890625, 0.558868408203125, 0.5913543701171875, 0.62384033203125, 0.6563262939453125, 0.688812255859375, 0.7212982177734375, 0.7537841796875, 0.7862701416015625, 0.818756103515625, 0.8512420654296875, 0.88372802734375, 0.9162139892578125, 0.948699951171875, 0.9811859130859375, 1.013671875]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 1.0, 2.0, 6.0, 9.0, 4.0, 10.0, 4.0, 10.0, 12.0, 20.0, 14.0, 20.0, 22.0, 15.0, 23.0, 18.0, 38.0, 32.0, 40.0, 41.0, 36.0, 42.0, 43.0, 1071.0, 39.0, 34.0, 47.0, 42.0, 34.0, 44.0, 30.0, 31.0, 20.0, 25.0, 21.0, 21.0, 21.0, 14.0, 11.0, 16.0, 13.0, 4.0, 2.0, 10.0, 3.0, 6.0, 3.0, 6.0, 0.0, 5.0, 1.0, 2.0, 0.0, 2.0], "bins": [-6.37890625, -6.19122314453125, -6.0035400390625, -5.81585693359375, -5.628173828125, -5.44049072265625, -5.2528076171875, -5.06512451171875, -4.87744140625, -4.68975830078125, -4.5020751953125, -4.31439208984375, -4.126708984375, -3.93902587890625, -3.7513427734375, -3.56365966796875, -3.3759765625, -3.18829345703125, -3.0006103515625, -2.81292724609375, -2.625244140625, -2.43756103515625, -2.2498779296875, -2.06219482421875, -1.87451171875, -1.68682861328125, -1.4991455078125, -1.31146240234375, -1.123779296875, -0.93609619140625, -0.7484130859375, -0.56072998046875, -0.373046875, -0.18536376953125, 0.0023193359375, 0.19000244140625, 0.377685546875, 0.56536865234375, 0.7530517578125, 0.94073486328125, 1.12841796875, 1.31610107421875, 1.5037841796875, 1.69146728515625, 1.879150390625, 2.06683349609375, 2.2545166015625, 2.44219970703125, 2.6298828125, 2.81756591796875, 3.0052490234375, 3.19293212890625, 3.380615234375, 3.56829833984375, 3.7559814453125, 3.94366455078125, 4.13134765625, 4.31903076171875, 4.5067138671875, 4.69439697265625, 4.882080078125, 5.06976318359375, 5.2574462890625, 5.44512939453125, 5.6328125]}, "gradients/decoder.transformer.h.12.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 11.0, 6.0, 15.0, 28.0, 41.0, 74.0, 108.0, 187.0, 278.0, 415.0, 661.0, 1070.0, 1634.0, 2623.0, 4078.0, 6631.0, 10832.0, 17757.0, 28481.0, 45684.0, 74160.0, 113751.0, 159769.0, 1223382.0, 143651.0, 98124.0, 62237.0, 38881.0, 23584.0, 14698.0, 9054.0, 5568.0, 3580.0, 2194.0, 1422.0, 932.0, 549.0, 368.0, 216.0, 148.0, 92.0, 63.0, 37.0, 22.0, 17.0, 10.0, 7.0, 6.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.677734375, -0.6553802490234375, -0.633026123046875, -0.6106719970703125, -0.58831787109375, -0.5659637451171875, -0.543609619140625, -0.5212554931640625, -0.4989013671875, -0.4765472412109375, -0.454193115234375, -0.4318389892578125, -0.40948486328125, -0.3871307373046875, -0.364776611328125, -0.3424224853515625, -0.320068359375, -0.2977142333984375, -0.275360107421875, -0.2530059814453125, -0.23065185546875, -0.2082977294921875, -0.185943603515625, -0.1635894775390625, -0.1412353515625, -0.1188812255859375, -0.096527099609375, -0.0741729736328125, -0.05181884765625, -0.0294647216796875, -0.007110595703125, 0.0152435302734375, 0.03759765625, 0.0599517822265625, 0.082305908203125, 0.1046600341796875, 0.12701416015625, 0.1493682861328125, 0.171722412109375, 0.1940765380859375, 0.2164306640625, 0.2387847900390625, 0.261138916015625, 0.2834930419921875, 0.30584716796875, 0.3282012939453125, 0.350555419921875, 0.3729095458984375, 0.395263671875, 0.4176177978515625, 0.439971923828125, 0.4623260498046875, 0.48468017578125, 0.5070343017578125, 0.529388427734375, 0.5517425537109375, 0.5740966796875, 0.5964508056640625, 0.618804931640625, 0.6411590576171875, 0.66351318359375, 0.6858673095703125, 0.708221435546875, 0.7305755615234375, 0.7529296875]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 4.0, 8.0, 5.0, 10.0, 12.0, 14.0, 17.0, 28.0, 25.0, 31.0, 40.0, 54.0, 55.0, 58.0, 77.0, 75.0, 66.0, 66.0, 67.0, 65.0, 54.0, 34.0, 36.0, 18.0, 19.0, 13.0, 5.0, 7.0, 6.0, 6.0, 9.0, 6.0, 0.0, 0.0, 4.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.006961822509765625, -0.006736636161804199, -0.0065114498138427734, -0.006286263465881348, -0.006061077117919922, -0.005835890769958496, -0.00561070442199707, -0.0053855180740356445, -0.005160331726074219, -0.004935145378112793, -0.004709959030151367, -0.004484772682189941, -0.004259586334228516, -0.00403439998626709, -0.003809213638305664, -0.0035840272903442383, -0.0033588409423828125, -0.0031336545944213867, -0.002908468246459961, -0.002683281898498535, -0.0024580955505371094, -0.0022329092025756836, -0.002007722854614258, -0.001782536506652832, -0.0015573501586914062, -0.0013321638107299805, -0.0011069774627685547, -0.0008817911148071289, -0.0006566047668457031, -0.00043141841888427734, -0.00020623207092285156, 1.895427703857422e-05, 0.000244140625, 0.0004693269729614258, 0.0006945133209228516, 0.0009196996688842773, 0.0011448860168457031, 0.001370072364807129, 0.0015952587127685547, 0.0018204450607299805, 0.0020456314086914062, 0.002270817756652832, 0.002496004104614258, 0.0027211904525756836, 0.0029463768005371094, 0.003171563148498535, 0.003396749496459961, 0.0036219358444213867, 0.0038471221923828125, 0.004072308540344238, 0.004297494888305664, 0.00452268123626709, 0.004747867584228516, 0.004973053932189941, 0.005198240280151367, 0.005423426628112793, 0.005648612976074219, 0.0058737993240356445, 0.00609898567199707, 0.006324172019958496, 0.006549358367919922, 0.006774544715881348, 0.0069997310638427734, 0.007224917411804199, 0.007450103759765625]}, "gradients/decoder.transformer.h.12.crossattention.q_attn.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 4.0, 10.0, 7.0, 6.0, 7.0, 14.0, 11.0, 13.0, 16.0, 27.0, 31.0, 55.0, 87.0, 117.0, 193.0, 317.0, 1224.0, 57901.0, 977767.0, 9280.0, 634.0, 265.0, 165.0, 128.0, 67.0, 41.0, 40.0, 26.0, 24.0, 13.0, 11.0, 10.0, 13.0, 4.0, 7.0, 5.0, 4.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.14892578125, -0.144317626953125, -0.13970947265625, -0.135101318359375, -0.1304931640625, -0.125885009765625, -0.12127685546875, -0.116668701171875, -0.112060546875, -0.107452392578125, -0.10284423828125, -0.098236083984375, -0.0936279296875, -0.089019775390625, -0.08441162109375, -0.079803466796875, -0.0751953125, -0.070587158203125, -0.06597900390625, -0.061370849609375, -0.0567626953125, -0.052154541015625, -0.04754638671875, -0.042938232421875, -0.038330078125, -0.033721923828125, -0.02911376953125, -0.024505615234375, -0.0198974609375, -0.015289306640625, -0.01068115234375, -0.006072998046875, -0.00146484375, 0.003143310546875, 0.00775146484375, 0.012359619140625, 0.0169677734375, 0.021575927734375, 0.02618408203125, 0.030792236328125, 0.035400390625, 0.040008544921875, 0.04461669921875, 0.049224853515625, 0.0538330078125, 0.058441162109375, 0.06304931640625, 0.067657470703125, 0.072265625, 0.076873779296875, 0.08148193359375, 0.086090087890625, 0.0906982421875, 0.095306396484375, 0.09991455078125, 0.104522705078125, 0.109130859375, 0.113739013671875, 0.11834716796875, 0.122955322265625, 0.1275634765625, 0.132171630859375, 0.13677978515625, 0.141387939453125, 0.14599609375]}, "gradients/decoder.transformer.h.12.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 0.0, 11.0, 163.0, 705.0, 131.0, 6.0], "bins": [-0.07777281850576401, -0.07650747150182724, -0.07524211704730988, -0.07397677004337311, -0.07271141558885574, -0.07144606858491898, -0.07018071413040161, -0.06891536712646484, -0.06765001267194748, -0.06638466566801071, -0.06511931121349335, -0.06385396420955658, -0.06258860975503922, -0.06132325902581215, -0.06005790829658508, -0.058792561292648315, -0.05752721056342125, -0.05626185983419418, -0.05499650910496712, -0.05373115837574005, -0.052465807646512985, -0.05120045691728592, -0.04993510618805885, -0.04866975545883179, -0.04740440845489502, -0.046139057725667953, -0.04487370699644089, -0.04360835626721382, -0.042343005537986755, -0.04107765480875969, -0.03981230407953262, -0.038546957075595856, -0.03728159889578819, -0.03601624816656113, -0.03475089743733406, -0.033485546708106995, -0.03222019597887993, -0.030954845249652863, -0.029689496383070946, -0.02842414565384388, -0.027158796787261963, -0.025893446058034897, -0.02462809532880783, -0.023362744599580765, -0.0220973938703537, -0.020832043141126633, -0.019566694274544716, -0.01830134354531765, -0.017035992816090584, -0.015770642086863518, -0.014505291357636452, -0.01323994155973196, -0.011974590830504894, -0.010709240101277828, -0.009443890303373337, -0.00817853957414627, -0.006913188379257917, -0.005647838115692139, -0.004382487386465073, -0.0031171368900686502, -0.0018517863936722279, -0.0005864356644451618, 0.0006789145991206169, 0.0019442648626863956, 0.0032096155919134617]}, "gradients/decoder.transformer.h.12.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 4.0, 2.0, 4.0, 6.0, 5.0, 8.0, 3.0, 6.0, 11.0, 13.0, 15.0, 21.0, 13.0, 19.0, 20.0, 31.0, 29.0, 33.0, 29.0, 51.0, 34.0, 49.0, 44.0, 46.0, 49.0, 62.0, 43.0, 46.0, 31.0, 34.0, 38.0, 29.0, 25.0, 26.0, 21.0, 23.0, 15.0, 13.0, 17.0, 14.0, 7.0, 7.0, 6.0, 4.0, 3.0, 0.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0040964484214782715, -0.003973698243498802, -0.003850948065519333, -0.0037281978875398636, -0.0036054477095603943, -0.003482697531580925, -0.0033599473536014557, -0.0032371971756219864, -0.003114446997642517, -0.002991696819663048, -0.0028689466416835785, -0.002746196463704109, -0.00262344628572464, -0.0025006961077451706, -0.0023779459297657013, -0.002255195751786232, -0.0021324455738067627, -0.0020096953958272934, -0.001886945217847824, -0.0017641950398683548, -0.0016414448618888855, -0.0015186946839094162, -0.001395944505929947, -0.0012731943279504776, -0.0011504441499710083, -0.001027693971991539, -0.0009049437940120697, -0.0007821936160326004, -0.0006594434380531311, -0.0005366932600736618, -0.0004139430820941925, -0.0002911929041147232, -0.0001684427261352539, -4.569254815578461e-05, 7.705762982368469e-05, 0.000199807807803154, 0.0003225579857826233, 0.0004453081637620926, 0.0005680583417415619, 0.0006908085197210312, 0.0008135586977005005, 0.0009363088756799698, 0.001059059053659439, 0.0011818092316389084, 0.0013045594096183777, 0.001427309587597847, 0.0015500597655773163, 0.0016728099435567856, 0.0017955601215362549, 0.0019183102995157242, 0.0020410604774951935, 0.0021638106554746628, 0.002286560833454132, 0.0024093110114336014, 0.0025320611894130707, 0.00265481136739254, 0.0027775615453720093, 0.0029003117233514786, 0.003023061901330948, 0.003145812079310417, 0.0032685622572898865, 0.0033913124352693558, 0.003514062613248825, 0.0036368127912282944, 0.0037595629692077637]}, "gradients/decoder.transformer.h.12.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 6.0, 9.0, 7.0, 12.0, 13.0, 11.0, 16.0, 20.0, 23.0, 22.0, 28.0, 36.0, 40.0, 35.0, 35.0, 38.0, 45.0, 50.0, 42.0, 36.0, 43.0, 35.0, 38.0, 29.0, 39.0, 37.0, 37.0, 25.0, 24.0, 23.0, 20.0, 31.0, 18.0, 16.0, 14.0, 14.0, 8.0, 3.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.5546875, -9.252685546875, -8.95068359375, -8.648681640625, -8.3466796875, -8.044677734375, -7.74267578125, -7.440673828125, -7.138671875, -6.836669921875, -6.53466796875, -6.232666015625, -5.9306640625, -5.628662109375, -5.32666015625, -5.024658203125, -4.72265625, -4.420654296875, -4.11865234375, -3.816650390625, -3.5146484375, -3.212646484375, -2.91064453125, -2.608642578125, -2.306640625, -2.004638671875, -1.70263671875, -1.400634765625, -1.0986328125, -0.796630859375, -0.49462890625, -0.192626953125, 0.109375, 0.411376953125, 0.71337890625, 1.015380859375, 1.3173828125, 1.619384765625, 1.92138671875, 2.223388671875, 2.525390625, 2.827392578125, 3.12939453125, 3.431396484375, 3.7333984375, 4.035400390625, 4.33740234375, 4.639404296875, 4.94140625, 5.243408203125, 5.54541015625, 5.847412109375, 6.1494140625, 6.451416015625, 6.75341796875, 7.055419921875, 7.357421875, 7.659423828125, 7.96142578125, 8.263427734375, 8.5654296875, 8.867431640625, 9.16943359375, 9.471435546875, 9.7734375]}, "gradients/decoder.transformer.h.12.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 1.0, 2.0, 2.0, 7.0, 11.0, 11.0, 14.0, 18.0, 20.0, 36.0, 52.0, 79.0, 117.0, 194.0, 331.0, 603.0, 1223.0, 2215.0, 4833.0, 11499.0, 35272.0, 140720.0, 547711.0, 223840.0, 51831.0, 15679.0, 6285.0, 2810.0, 1301.0, 758.0, 410.0, 230.0, 141.0, 75.0, 72.0, 46.0, 27.0, 17.0, 23.0, 11.0, 7.0, 8.0, 7.0, 5.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.171875, -8.882080078125, -8.59228515625, -8.302490234375, -8.0126953125, -7.722900390625, -7.43310546875, -7.143310546875, -6.853515625, -6.563720703125, -6.27392578125, -5.984130859375, -5.6943359375, -5.404541015625, -5.11474609375, -4.824951171875, -4.53515625, -4.245361328125, -3.95556640625, -3.665771484375, -3.3759765625, -3.086181640625, -2.79638671875, -2.506591796875, -2.216796875, -1.927001953125, -1.63720703125, -1.347412109375, -1.0576171875, -0.767822265625, -0.47802734375, -0.188232421875, 0.1015625, 0.391357421875, 0.68115234375, 0.970947265625, 1.2607421875, 1.550537109375, 1.84033203125, 2.130126953125, 2.419921875, 2.709716796875, 2.99951171875, 3.289306640625, 3.5791015625, 3.868896484375, 4.15869140625, 4.448486328125, 4.73828125, 5.028076171875, 5.31787109375, 5.607666015625, 5.8974609375, 6.187255859375, 6.47705078125, 6.766845703125, 7.056640625, 7.346435546875, 7.63623046875, 7.926025390625, 8.2158203125, 8.505615234375, 8.79541015625, 9.085205078125, 9.375]}, "gradients/decoder.transformer.h.12.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 2.0, 6.0, 2.0, 8.0, 8.0, 2.0, 9.0, 4.0, 16.0, 15.0, 25.0, 30.0, 26.0, 28.0, 53.0, 36.0, 51.0, 47.0, 53.0, 112.0, 1811.0, 233.0, 53.0, 60.0, 53.0, 53.0, 37.0, 40.0, 33.0, 26.0, 24.0, 20.0, 22.0, 13.0, 14.0, 6.0, 4.0, 3.0, 5.0, 6.0, 2.0, 7.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-35.34375, -34.1923828125, -33.041015625, -31.8896484375, -30.73828125, -29.5869140625, -28.435546875, -27.2841796875, -26.1328125, -24.9814453125, -23.830078125, -22.6787109375, -21.52734375, -20.3759765625, -19.224609375, -18.0732421875, -16.921875, -15.7705078125, -14.619140625, -13.4677734375, -12.31640625, -11.1650390625, -10.013671875, -8.8623046875, -7.7109375, -6.5595703125, -5.408203125, -4.2568359375, -3.10546875, -1.9541015625, -0.802734375, 0.3486328125, 1.5, 2.6513671875, 3.802734375, 4.9541015625, 6.10546875, 7.2568359375, 8.408203125, 9.5595703125, 10.7109375, 11.8623046875, 13.013671875, 14.1650390625, 15.31640625, 16.4677734375, 17.619140625, 18.7705078125, 19.921875, 21.0732421875, 22.224609375, 23.3759765625, 24.52734375, 25.6787109375, 26.830078125, 27.9814453125, 29.1328125, 30.2841796875, 31.435546875, 32.5869140625, 33.73828125, 34.8896484375, 36.041015625, 37.1923828125, 38.34375]}, "gradients/decoder.transformer.h.12.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 10.0, 8.0, 9.0, 6.0, 10.0, 21.0, 30.0, 43.0, 57.0, 69.0, 115.0, 176.0, 282.0, 495.0, 2258.0, 2961852.0, 177831.0, 1270.0, 413.0, 259.0, 151.0, 104.0, 67.0, 55.0, 27.0, 17.0, 13.0, 11.0, 15.0, 4.0, 10.0, 4.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-113.6875, -110.4296875, -107.171875, -103.9140625, -100.65625, -97.3984375, -94.140625, -90.8828125, -87.625, -84.3671875, -81.109375, -77.8515625, -74.59375, -71.3359375, -68.078125, -64.8203125, -61.5625, -58.3046875, -55.046875, -51.7890625, -48.53125, -45.2734375, -42.015625, -38.7578125, -35.5, -32.2421875, -28.984375, -25.7265625, -22.46875, -19.2109375, -15.953125, -12.6953125, -9.4375, -6.1796875, -2.921875, 0.3359375, 3.59375, 6.8515625, 10.109375, 13.3671875, 16.625, 19.8828125, 23.140625, 26.3984375, 29.65625, 32.9140625, 36.171875, 39.4296875, 42.6875, 45.9453125, 49.203125, 52.4609375, 55.71875, 58.9765625, 62.234375, 65.4921875, 68.75, 72.0078125, 75.265625, 78.5234375, 81.78125, 85.0390625, 88.296875, 91.5546875, 94.8125]}, "gradients/decoder.transformer.h.12.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 332.0, 681.0, 5.0, 0.0, 0.0, 1.0], "bins": [-538.5452880859375, -529.4317016601562, -520.3180541992188, -511.2044677734375, -502.09088134765625, -492.9772644042969, -483.8636779785156, -474.75006103515625, -465.636474609375, -456.5228576660156, -447.4092712402344, -438.295654296875, -429.18206787109375, -420.0684509277344, -410.9548645019531, -401.84124755859375, -392.7276306152344, -383.614013671875, -374.50042724609375, -365.3868103027344, -356.2732238769531, -347.15960693359375, -338.0460205078125, -328.9324035644531, -319.81878662109375, -310.7051696777344, -301.5915832519531, -292.47796630859375, -283.3643798828125, -274.2507629394531, -265.1371765136719, -256.0235595703125, -246.90994262695312, -237.7963409423828, -228.6827392578125, -219.5691375732422, -210.45553588867188, -201.3419189453125, -192.2283172607422, -183.11471557617188, -174.00111389160156, -164.88751220703125, -155.77391052246094, -146.66030883789062, -137.54669189453125, -128.43310546875, -119.31948852539062, -110.20588684082031, -101.09228515625, -91.97868347167969, -82.86508178710938, -73.75147247314453, -64.63787078857422, -55.524269104003906, -46.41066360473633, -37.29705810546875, -28.183460235595703, -19.069856643676758, -9.956253051757812, -0.8426494598388672, 8.270954132080078, 17.38455581665039, 26.49816131591797, 35.61176681518555, 44.72536849975586]}, "gradients/decoder.transformer.h.12.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 6.0, 9.0, 12.0, 15.0, 17.0, 18.0, 22.0, 29.0, 24.0, 30.0, 36.0, 33.0, 43.0, 39.0, 50.0, 39.0, 43.0, 50.0, 49.0, 46.0, 49.0, 40.0, 35.0, 29.0, 36.0, 26.0, 23.0, 27.0, 21.0, 14.0, 13.0, 14.0, 9.0, 13.0, 10.0, 9.0, 5.0, 2.0, 4.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-85.31979370117188, -82.54969024658203, -79.77959442138672, -77.00949096679688, -74.23938751220703, -71.46929168701172, -68.69918823242188, -65.92909240722656, -63.15898895263672, -60.38888931274414, -57.6187858581543, -54.84868621826172, -52.07858657836914, -49.30848693847656, -46.53838348388672, -43.76828384399414, -40.9981803894043, -38.22808074951172, -35.457977294921875, -32.6878776550293, -29.91777801513672, -27.147676467895508, -24.377574920654297, -21.60747528076172, -18.837373733520508, -16.067272186279297, -13.297172546386719, -10.527070999145508, -7.756970405578613, -4.986869812011719, -2.216768264770508, 0.5533313751220703, 3.3234329223632812, 6.093533515930176, 8.86363410949707, 11.633735656738281, 14.403836250305176, 17.17393684387207, 19.94403839111328, 22.71413803100586, 25.48423957824707, 28.25434112548828, 31.02444076538086, 33.79454040527344, 36.56464385986328, 39.33474349975586, 42.10484313964844, 44.87494659423828, 47.64504623413086, 50.41514587402344, 53.18524932861328, 55.95534896850586, 58.72544860839844, 61.49555206298828, 64.26565551757812, 67.03575134277344, 69.80585479736328, 72.57595825195312, 75.34605407714844, 78.11615753173828, 80.88626098632812, 83.65635681152344, 86.42646026611328, 89.19656372070312, 91.96665954589844]}, "gradients/decoder.transformer.h.11.mlp.c_proj.bias": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 2.0, 1.0, 6.0, 2.0, 6.0, 8.0, 8.0, 7.0, 13.0, 16.0, 14.0, 16.0, 25.0, 22.0, 38.0, 33.0, 35.0, 38.0, 37.0, 34.0, 36.0, 43.0, 47.0, 59.0, 37.0, 33.0, 31.0, 33.0, 39.0, 41.0, 28.0, 31.0, 20.0, 24.0, 20.0, 22.0, 23.0, 8.0, 20.0, 10.0, 8.0, 10.0, 7.0, 5.0, 3.0, 8.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.765625, -9.4566650390625, -9.147705078125, -8.8387451171875, -8.52978515625, -8.2208251953125, -7.911865234375, -7.6029052734375, -7.2939453125, -6.9849853515625, -6.676025390625, -6.3670654296875, -6.05810546875, -5.7491455078125, -5.440185546875, -5.1312255859375, -4.822265625, -4.5133056640625, -4.204345703125, -3.8953857421875, -3.58642578125, -3.2774658203125, -2.968505859375, -2.6595458984375, -2.3505859375, -2.0416259765625, -1.732666015625, -1.4237060546875, -1.11474609375, -0.8057861328125, -0.496826171875, -0.1878662109375, 0.12109375, 0.4300537109375, 0.739013671875, 1.0479736328125, 1.35693359375, 1.6658935546875, 1.974853515625, 2.2838134765625, 2.5927734375, 2.9017333984375, 3.210693359375, 3.5196533203125, 3.82861328125, 4.1375732421875, 4.446533203125, 4.7554931640625, 5.064453125, 5.3734130859375, 5.682373046875, 5.9913330078125, 6.30029296875, 6.6092529296875, 6.918212890625, 7.2271728515625, 7.5361328125, 7.8450927734375, 8.154052734375, 8.4630126953125, 8.77197265625, 9.0809326171875, 9.389892578125, 9.6988525390625, 10.0078125]}, "gradients/decoder.transformer.h.11.mlp.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 5.0, 7.0, 4.0, 8.0, 10.0, 8.0, 12.0, 12.0, 14.0, 20.0, 22.0, 28.0, 34.0, 35.0, 61.0, 62.0, 103.0, 144.0, 253.0, 413.0, 882.0, 2376.0, 8546.0, 44151.0, 415328.0, 2309488.0, 1253330.0, 133082.0, 18710.0, 4170.0, 1421.0, 560.0, 285.0, 186.0, 103.0, 85.0, 73.0, 42.0, 39.0, 40.0, 18.0, 26.0, 17.0, 20.0, 8.0, 14.0, 12.0, 6.0, 9.0, 8.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-22.65625, -21.985107421875, -21.31396484375, -20.642822265625, -19.9716796875, -19.300537109375, -18.62939453125, -17.958251953125, -17.287109375, -16.615966796875, -15.94482421875, -15.273681640625, -14.6025390625, -13.931396484375, -13.26025390625, -12.589111328125, -11.91796875, -11.246826171875, -10.57568359375, -9.904541015625, -9.2333984375, -8.562255859375, -7.89111328125, -7.219970703125, -6.548828125, -5.877685546875, -5.20654296875, -4.535400390625, -3.8642578125, -3.193115234375, -2.52197265625, -1.850830078125, -1.1796875, -0.508544921875, 0.16259765625, 0.833740234375, 1.5048828125, 2.176025390625, 2.84716796875, 3.518310546875, 4.189453125, 4.860595703125, 5.53173828125, 6.202880859375, 6.8740234375, 7.545166015625, 8.21630859375, 8.887451171875, 9.55859375, 10.229736328125, 10.90087890625, 11.572021484375, 12.2431640625, 12.914306640625, 13.58544921875, 14.256591796875, 14.927734375, 15.598876953125, 16.27001953125, 16.941162109375, 17.6123046875, 18.283447265625, 18.95458984375, 19.625732421875, 20.296875]}, "gradients/decoder.transformer.h.11.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 6.0, 5.0, 2.0, 9.0, 7.0, 18.0, 24.0, 32.0, 44.0, 68.0, 109.0, 159.0, 204.0, 269.0, 393.0, 511.0, 546.0, 477.0, 342.0, 260.0, 168.0, 132.0, 84.0, 55.0, 50.0, 41.0, 21.0, 11.0, 11.0, 8.0, 2.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-24.84375, -24.1416015625, -23.439453125, -22.7373046875, -22.03515625, -21.3330078125, -20.630859375, -19.9287109375, -19.2265625, -18.5244140625, -17.822265625, -17.1201171875, -16.41796875, -15.7158203125, -15.013671875, -14.3115234375, -13.609375, -12.9072265625, -12.205078125, -11.5029296875, -10.80078125, -10.0986328125, -9.396484375, -8.6943359375, -7.9921875, -7.2900390625, -6.587890625, -5.8857421875, -5.18359375, -4.4814453125, -3.779296875, -3.0771484375, -2.375, -1.6728515625, -0.970703125, -0.2685546875, 0.43359375, 1.1357421875, 1.837890625, 2.5400390625, 3.2421875, 3.9443359375, 4.646484375, 5.3486328125, 6.05078125, 6.7529296875, 7.455078125, 8.1572265625, 8.859375, 9.5615234375, 10.263671875, 10.9658203125, 11.66796875, 12.3701171875, 13.072265625, 13.7744140625, 14.4765625, 15.1787109375, 15.880859375, 16.5830078125, 17.28515625, 17.9873046875, 18.689453125, 19.3916015625, 20.09375]}, "gradients/decoder.transformer.h.11.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 5.0, 0.0, 4.0, 7.0, 7.0, 13.0, 19.0, 34.0, 44.0, 71.0, 92.0, 115.0, 175.0, 270.0, 378.0, 749.0, 10190.0, 3988672.0, 190556.0, 1358.0, 489.0, 315.0, 207.0, 159.0, 119.0, 75.0, 49.0, 46.0, 21.0, 14.0, 7.0, 10.0, 6.0, 4.0, 6.0, 4.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-109.625, -106.2744140625, -102.923828125, -99.5732421875, -96.22265625, -92.8720703125, -89.521484375, -86.1708984375, -82.8203125, -79.4697265625, -76.119140625, -72.7685546875, -69.41796875, -66.0673828125, -62.716796875, -59.3662109375, -56.015625, -52.6650390625, -49.314453125, -45.9638671875, -42.61328125, -39.2626953125, -35.912109375, -32.5615234375, -29.2109375, -25.8603515625, -22.509765625, -19.1591796875, -15.80859375, -12.4580078125, -9.107421875, -5.7568359375, -2.40625, 0.9443359375, 4.294921875, 7.6455078125, 10.99609375, 14.3466796875, 17.697265625, 21.0478515625, 24.3984375, 27.7490234375, 31.099609375, 34.4501953125, 37.80078125, 41.1513671875, 44.501953125, 47.8525390625, 51.203125, 54.5537109375, 57.904296875, 61.2548828125, 64.60546875, 67.9560546875, 71.306640625, 74.6572265625, 78.0078125, 81.3583984375, 84.708984375, 88.0595703125, 91.41015625, 94.7607421875, 98.111328125, 101.4619140625, 104.8125]}, "gradients/decoder.transformer.h.11.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 39.0, 278.0, 518.0, 164.0, 19.0, 1.0, 1.0], "bins": [-743.01708984375, -730.5066528320312, -717.9962158203125, -705.4857788085938, -692.975341796875, -680.4649047851562, -667.9544677734375, -655.4440307617188, -642.93359375, -630.4231567382812, -617.9127197265625, -605.4022827148438, -592.891845703125, -580.3814086914062, -567.8709716796875, -555.3605346679688, -542.8501586914062, -530.3397216796875, -517.8292846679688, -505.31884765625, -492.80841064453125, -480.2979736328125, -467.78753662109375, -455.2771301269531, -442.76666259765625, -430.2562255859375, -417.74578857421875, -405.2353515625, -392.72491455078125, -380.2144775390625, -367.70404052734375, -355.1936340332031, -342.6832275390625, -330.17279052734375, -317.662353515625, -305.15191650390625, -292.6414794921875, -280.13104248046875, -267.62060546875, -255.11019897460938, -242.59974670410156, -230.0893096923828, -217.57887268066406, -205.06845092773438, -192.55801391601562, -180.04757690429688, -167.53713989257812, -155.02670288085938, -142.51626586914062, -130.00582885742188, -117.49539947509766, -104.9849624633789, -92.47453308105469, -79.96409606933594, -67.45365905761719, -54.94322967529297, -42.43280029296875, -29.922367095947266, -17.41193199157715, -4.901496887207031, 7.608936309814453, 20.119369506835938, 32.62980651855469, 45.140235900878906, 57.650672912597656]}, "gradients/decoder.transformer.h.11.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 5.0, 2.0, 4.0, 5.0, 12.0, 4.0, 6.0, 18.0, 7.0, 19.0, 20.0, 16.0, 30.0, 29.0, 31.0, 30.0, 27.0, 37.0, 34.0, 51.0, 41.0, 40.0, 59.0, 52.0, 40.0, 47.0, 39.0, 33.0, 35.0, 30.0, 35.0, 26.0, 17.0, 21.0, 20.0, 21.0, 15.0, 14.0, 8.0, 8.0, 8.0, 9.0, 2.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0], "bins": [-72.4144287109375, -70.39883422851562, -68.38323211669922, -66.36763763427734, -64.35203552246094, -62.33644104003906, -60.32084274291992, -58.30524444580078, -56.28964614868164, -54.2740478515625, -52.25844955444336, -50.24285125732422, -48.227256774902344, -46.21165466308594, -44.19606018066406, -42.18046188354492, -40.16486358642578, -38.14926528930664, -36.1336669921875, -34.11806869506836, -32.10247039794922, -30.08687400817871, -28.071277618408203, -26.055679321289062, -24.040081024169922, -22.02448272705078, -20.00888442993164, -17.993288040161133, -15.977689743041992, -13.962091445922852, -11.946494102478027, -9.930896759033203, -7.9152984619140625, -5.89970064163208, -3.8841028213500977, -1.8685050010681152, 0.1470928192138672, 2.162691116333008, 4.178288459777832, 6.193885803222656, 8.209484100341797, 10.225082397460938, 12.240679740905762, 14.256277084350586, 16.271875381469727, 18.287473678588867, 20.303070068359375, 22.318668365478516, 24.334266662597656, 26.349864959716797, 28.365463256835938, 30.381059646606445, 32.39665985107422, 34.412254333496094, 36.427852630615234, 38.443450927734375, 40.459049224853516, 42.474647521972656, 44.4902458190918, 46.50584411621094, 48.52143859863281, 50.53704071044922, 52.552635192871094, 54.568233489990234, 56.583831787109375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 9.0, 9.0, 5.0, 16.0, 13.0, 13.0, 18.0, 22.0, 23.0, 24.0, 27.0, 30.0, 46.0, 37.0, 35.0, 42.0, 45.0, 44.0, 36.0, 52.0, 38.0, 34.0, 45.0, 42.0, 31.0, 33.0, 20.0, 35.0, 23.0, 28.0, 15.0, 19.0, 12.0, 20.0, 13.0, 12.0, 8.0, 9.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.875, -9.5689697265625, -9.262939453125, -8.9569091796875, -8.65087890625, -8.3448486328125, -8.038818359375, -7.7327880859375, -7.4267578125, -7.1207275390625, -6.814697265625, -6.5086669921875, -6.20263671875, -5.8966064453125, -5.590576171875, -5.2845458984375, -4.978515625, -4.6724853515625, -4.366455078125, -4.0604248046875, -3.75439453125, -3.4483642578125, -3.142333984375, -2.8363037109375, -2.5302734375, -2.2242431640625, -1.918212890625, -1.6121826171875, -1.30615234375, -1.0001220703125, -0.694091796875, -0.3880615234375, -0.08203125, 0.2239990234375, 0.530029296875, 0.8360595703125, 1.14208984375, 1.4481201171875, 1.754150390625, 2.0601806640625, 2.3662109375, 2.6722412109375, 2.978271484375, 3.2843017578125, 3.59033203125, 3.8963623046875, 4.202392578125, 4.5084228515625, 4.814453125, 5.1204833984375, 5.426513671875, 5.7325439453125, 6.03857421875, 6.3446044921875, 6.650634765625, 6.9566650390625, 7.2626953125, 7.5687255859375, 7.874755859375, 8.1807861328125, 8.48681640625, 8.7928466796875, 9.098876953125, 9.4049072265625, 9.7109375]}, "gradients/decoder.transformer.h.11.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 1.0, 1.0, 2.0, 6.0, 8.0, 12.0, 16.0, 24.0, 19.0, 41.0, 54.0, 126.0, 174.0, 282.0, 444.0, 689.0, 1079.0, 1690.0, 2761.0, 4658.0, 7942.0, 13559.0, 23548.0, 41906.0, 73488.0, 127080.0, 201233.0, 212615.0, 142105.0, 82460.0, 46757.0, 26382.0, 15017.0, 8782.0, 5188.0, 3233.0, 1951.0, 1228.0, 731.0, 436.0, 289.0, 207.0, 117.0, 70.0, 42.0, 35.0, 21.0, 17.0, 11.0, 12.0, 7.0, 3.0, 1.0, 1.0, 2.0, 4.0, 0.0, 1.0, 1.0], "bins": [-1.072265625, -1.0388641357421875, -1.005462646484375, -0.9720611572265625, -0.93865966796875, -0.9052581787109375, -0.871856689453125, -0.8384552001953125, -0.8050537109375, -0.7716522216796875, -0.738250732421875, -0.7048492431640625, -0.67144775390625, -0.6380462646484375, -0.604644775390625, -0.5712432861328125, -0.537841796875, -0.5044403076171875, -0.471038818359375, -0.4376373291015625, -0.40423583984375, -0.3708343505859375, -0.337432861328125, -0.3040313720703125, -0.2706298828125, -0.2372283935546875, -0.203826904296875, -0.1704254150390625, -0.13702392578125, -0.1036224365234375, -0.070220947265625, -0.0368194580078125, -0.00341796875, 0.0299835205078125, 0.063385009765625, 0.0967864990234375, 0.13018798828125, 0.1635894775390625, 0.196990966796875, 0.2303924560546875, 0.2637939453125, 0.2971954345703125, 0.330596923828125, 0.3639984130859375, 0.39739990234375, 0.4308013916015625, 0.464202880859375, 0.4976043701171875, 0.531005859375, 0.5644073486328125, 0.597808837890625, 0.6312103271484375, 0.66461181640625, 0.6980133056640625, 0.731414794921875, 0.7648162841796875, 0.7982177734375, 0.8316192626953125, 0.865020751953125, 0.8984222412109375, 0.93182373046875, 0.9652252197265625, 0.998626708984375, 1.0320281982421875, 1.0654296875]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 8.0, 7.0, 6.0, 13.0, 8.0, 16.0, 15.0, 12.0, 21.0, 12.0, 22.0, 35.0, 29.0, 31.0, 26.0, 33.0, 45.0, 34.0, 38.0, 25.0, 33.0, 1060.0, 51.0, 35.0, 22.0, 38.0, 37.0, 33.0, 28.0, 33.0, 26.0, 27.0, 26.0, 27.0, 20.0, 19.0, 15.0, 11.0, 9.0, 11.0, 6.0, 9.0, 2.0, 8.0, 3.0, 2.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-5.91796875, -5.73358154296875, -5.5491943359375, -5.36480712890625, -5.180419921875, -4.99603271484375, -4.8116455078125, -4.62725830078125, -4.44287109375, -4.25848388671875, -4.0740966796875, -3.88970947265625, -3.705322265625, -3.52093505859375, -3.3365478515625, -3.15216064453125, -2.9677734375, -2.78338623046875, -2.5989990234375, -2.41461181640625, -2.230224609375, -2.04583740234375, -1.8614501953125, -1.67706298828125, -1.49267578125, -1.30828857421875, -1.1239013671875, -0.93951416015625, -0.755126953125, -0.57073974609375, -0.3863525390625, -0.20196533203125, -0.017578125, 0.16680908203125, 0.3511962890625, 0.53558349609375, 0.719970703125, 0.90435791015625, 1.0887451171875, 1.27313232421875, 1.45751953125, 1.64190673828125, 1.8262939453125, 2.01068115234375, 2.195068359375, 2.37945556640625, 2.5638427734375, 2.74822998046875, 2.9326171875, 3.11700439453125, 3.3013916015625, 3.48577880859375, 3.670166015625, 3.85455322265625, 4.0389404296875, 4.22332763671875, 4.40771484375, 4.59210205078125, 4.7764892578125, 4.96087646484375, 5.145263671875, 5.32965087890625, 5.5140380859375, 5.69842529296875, 5.8828125]}, "gradients/decoder.transformer.h.11.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 1.0, 5.0, 9.0, 12.0, 13.0, 22.0, 37.0, 56.0, 78.0, 133.0, 166.0, 274.0, 442.0, 757.0, 1196.0, 1880.0, 3091.0, 5088.0, 8118.0, 12685.0, 20401.0, 32354.0, 50949.0, 79351.0, 118048.0, 161481.0, 1207399.0, 133833.0, 93194.0, 61506.0, 39002.0, 24408.0, 15393.0, 9727.0, 6051.0, 3796.0, 2284.0, 1446.0, 933.0, 562.0, 365.0, 204.0, 125.0, 97.0, 51.0, 41.0, 27.0, 14.0, 12.0, 6.0, 11.0, 3.0, 3.0, 2.0, 1.0, 1.0], "bins": [-0.71044921875, -0.6896743774414062, -0.6688995361328125, -0.6481246948242188, -0.627349853515625, -0.6065750122070312, -0.5858001708984375, -0.5650253295898438, -0.54425048828125, -0.5234756469726562, -0.5027008056640625, -0.48192596435546875, -0.461151123046875, -0.44037628173828125, -0.4196014404296875, -0.39882659912109375, -0.3780517578125, -0.35727691650390625, -0.3365020751953125, -0.31572723388671875, -0.294952392578125, -0.27417755126953125, -0.2534027099609375, -0.23262786865234375, -0.21185302734375, -0.19107818603515625, -0.1703033447265625, -0.14952850341796875, -0.128753662109375, -0.10797882080078125, -0.0872039794921875, -0.06642913818359375, -0.045654296875, -0.02487945556640625, -0.0041046142578125, 0.01667022705078125, 0.037445068359375, 0.05821990966796875, 0.0789947509765625, 0.09976959228515625, 0.12054443359375, 0.14131927490234375, 0.1620941162109375, 0.18286895751953125, 0.203643798828125, 0.22441864013671875, 0.2451934814453125, 0.26596832275390625, 0.2867431640625, 0.30751800537109375, 0.3282928466796875, 0.34906768798828125, 0.369842529296875, 0.39061737060546875, 0.4113922119140625, 0.43216705322265625, 0.45294189453125, 0.47371673583984375, 0.4944915771484375, 0.5152664184570312, 0.536041259765625, 0.5568161010742188, 0.5775909423828125, 0.5983657836914062, 0.619140625]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 1.0, 2.0, 1.0, 4.0, 2.0, 4.0, 4.0, 6.0, 10.0, 14.0, 8.0, 9.0, 13.0, 22.0, 20.0, 25.0, 27.0, 24.0, 34.0, 38.0, 39.0, 39.0, 47.0, 47.0, 46.0, 41.0, 49.0, 46.0, 50.0, 33.0, 41.0, 35.0, 28.0, 31.0, 25.0, 26.0, 24.0, 13.0, 13.0, 11.0, 5.0, 9.0, 11.0, 8.0, 8.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0], "bins": [-0.0055389404296875, -0.0053809285163879395, -0.005222916603088379, -0.005064904689788818, -0.004906892776489258, -0.004748880863189697, -0.004590868949890137, -0.004432857036590576, -0.004274845123291016, -0.004116833209991455, -0.0039588212966918945, -0.003800809383392334, -0.0036427974700927734, -0.003484785556793213, -0.0033267736434936523, -0.003168761730194092, -0.0030107498168945312, -0.0028527379035949707, -0.00269472599029541, -0.0025367140769958496, -0.002378702163696289, -0.0022206902503967285, -0.002062678337097168, -0.0019046664237976074, -0.0017466545104980469, -0.0015886425971984863, -0.0014306306838989258, -0.0012726187705993652, -0.0011146068572998047, -0.0009565949440002441, -0.0007985830307006836, -0.000640571117401123, -0.0004825592041015625, -0.00032454729080200195, -0.0001665353775024414, -8.52346420288086e-06, 0.0001494884490966797, 0.00030750036239624023, 0.0004655122756958008, 0.0006235241889953613, 0.0007815361022949219, 0.0009395480155944824, 0.001097559928894043, 0.0012555718421936035, 0.001413583755493164, 0.0015715956687927246, 0.0017296075820922852, 0.0018876194953918457, 0.0020456314086914062, 0.002203643321990967, 0.0023616552352905273, 0.002519667148590088, 0.0026776790618896484, 0.002835690975189209, 0.0029937028884887695, 0.00315171480178833, 0.0033097267150878906, 0.003467738628387451, 0.0036257505416870117, 0.0037837624549865723, 0.003941774368286133, 0.004099786281585693, 0.004257798194885254, 0.0044158101081848145, 0.004573822021484375]}, "gradients/decoder.transformer.h.11.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 4.0, 5.0, 6.0, 7.0, 10.0, 6.0, 6.0, 13.0, 16.0, 13.0, 20.0, 28.0, 21.0, 39.0, 44.0, 54.0, 102.0, 116.0, 219.0, 624.0, 13418.0, 974122.0, 57452.0, 1287.0, 290.0, 138.0, 104.0, 74.0, 76.0, 43.0, 32.0, 36.0, 13.0, 28.0, 16.0, 11.0, 20.0, 3.0, 5.0, 12.0, 3.0, 7.0, 4.0, 3.0, 1.0, 4.0, 1.0, 0.0, 3.0, 3.0, 2.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.116455078125, -0.1126556396484375, -0.108856201171875, -0.1050567626953125, -0.10125732421875, -0.0974578857421875, -0.093658447265625, -0.0898590087890625, -0.0860595703125, -0.0822601318359375, -0.078460693359375, -0.0746612548828125, -0.07086181640625, -0.0670623779296875, -0.063262939453125, -0.0594635009765625, -0.0556640625, -0.0518646240234375, -0.048065185546875, -0.0442657470703125, -0.04046630859375, -0.0366668701171875, -0.032867431640625, -0.0290679931640625, -0.0252685546875, -0.0214691162109375, -0.017669677734375, -0.0138702392578125, -0.01007080078125, -0.0062713623046875, -0.002471923828125, 0.0013275146484375, 0.005126953125, 0.0089263916015625, 0.012725830078125, 0.0165252685546875, 0.02032470703125, 0.0241241455078125, 0.027923583984375, 0.0317230224609375, 0.0355224609375, 0.0393218994140625, 0.043121337890625, 0.0469207763671875, 0.05072021484375, 0.0545196533203125, 0.058319091796875, 0.0621185302734375, 0.06591796875, 0.0697174072265625, 0.073516845703125, 0.0773162841796875, 0.08111572265625, 0.0849151611328125, 0.088714599609375, 0.0925140380859375, 0.0963134765625, 0.1001129150390625, 0.103912353515625, 0.1077117919921875, 0.11151123046875, 0.1153106689453125, 0.119110107421875, 0.1229095458984375, 0.126708984375]}, "gradients/decoder.transformer.h.11.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 7.0, 17.0, 33.0, 83.0, 186.0, 279.0, 228.0, 120.0, 32.0, 18.0, 7.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0032854918390512466, -0.0029052465688437223, -0.0025250010658055544, -0.00214475579559803, -0.001764510408975184, -0.0013842650223523378, -0.0010040197521448135, -0.0006237742491066456, -0.00024352897889912128, 0.00013671637861989439, 0.0005169617361389101, 0.0008972070645540953, 0.0012774524511769414, 0.0016576978377997875, 0.002037943108007312, 0.0024181886110454798, 0.002798433881253004, 0.0031786791514605284, 0.0035589246544986963, 0.003939169924706221, 0.004319415427744389, 0.004699660465121269, 0.005079905968159437, 0.005460151471197605, 0.005840396508574486, 0.006220642011612654, 0.006600887048989534, 0.006981132552027702, 0.00736137805506587, 0.007741623558104038, 0.008121868595480919, 0.008502114564180374, 0.008882359601557255, 0.009262604638934135, 0.00964285060763359, 0.010023095645010471, 0.010403340682387352, 0.010783586651086807, 0.011163831688463688, 0.011544076725840569, 0.011924322694540024, 0.012304567731916904, 0.01268481370061636, 0.01306505873799324, 0.013445303775370121, 0.013825549744069576, 0.014205794781446457, 0.014586040750145912, 0.014966284856200218, 0.015346529893577099, 0.01572677493095398, 0.016107020899653435, 0.01648726686835289, 0.016867510974407196, 0.01724775694310665, 0.017628002911806107, 0.018008248880505562, 0.018388494849205017, 0.018768738955259323, 0.01914898492395878, 0.019529230892658234, 0.01990947499871254, 0.020289720967411995, 0.02066996693611145, 0.021050211042165756]}, "gradients/decoder.transformer.h.11.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 3.0, 4.0, 4.0, 5.0, 5.0, 7.0, 18.0, 11.0, 18.0, 24.0, 14.0, 25.0, 27.0, 24.0, 29.0, 43.0, 32.0, 44.0, 48.0, 44.0, 53.0, 45.0, 32.0, 49.0, 39.0, 48.0, 35.0, 42.0, 24.0, 32.0, 30.0, 28.0, 16.0, 24.0, 16.0, 15.0, 7.0, 11.0, 11.0, 7.0, 6.0, 3.0, 4.0, 2.0, 2.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.003509700298309326, -0.0033970950171351433, -0.0032844897359609604, -0.0031718844547867775, -0.0030592791736125946, -0.0029466738924384117, -0.002834068611264229, -0.002721463330090046, -0.002608858048915863, -0.00249625276774168, -0.0023836474865674973, -0.0022710422053933144, -0.0021584369242191315, -0.0020458316430449486, -0.0019332263618707657, -0.0018206210806965828, -0.0017080157995224, -0.001595410518348217, -0.0014828052371740341, -0.0013701999559998512, -0.0012575946748256683, -0.0011449893936514854, -0.0010323841124773026, -0.0009197788313031197, -0.0008071735501289368, -0.0006945682689547539, -0.000581962987780571, -0.0004693577066063881, -0.0003567524254322052, -0.0002441471442580223, -0.00013154186308383942, -1.8936581909656525e-05, 9.366869926452637e-05, 0.00020627398043870926, 0.00031887926161289215, 0.00043148454278707504, 0.0005440898239612579, 0.0006566951051354408, 0.0007693003863096237, 0.0008819056674838066, 0.0009945109486579895, 0.0011071162298321724, 0.0012197215110063553, 0.0013323267921805382, 0.001444932073354721, 0.001557537354528904, 0.0016701426357030869, 0.0017827479168772697, 0.0018953531980514526, 0.0020079584792256355, 0.0021205637603998184, 0.0022331690415740013, 0.002345774322748184, 0.002458379603922367, 0.00257098488509655, 0.002683590166270733, 0.0027961954474449158, 0.0029088007286190987, 0.0030214060097932816, 0.0031340112909674644, 0.0032466165721416473, 0.0033592218533158302, 0.003471827134490013, 0.003584432415664196, 0.003697037696838379]}, "gradients/decoder.transformer.h.11.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 4.0, 1.0, 3.0, 1.0, 0.0, 9.0, 9.0, 5.0, 16.0, 13.0, 13.0, 18.0, 22.0, 23.0, 24.0, 27.0, 30.0, 46.0, 37.0, 35.0, 42.0, 45.0, 44.0, 36.0, 52.0, 38.0, 34.0, 45.0, 41.0, 32.0, 33.0, 20.0, 35.0, 23.0, 28.0, 15.0, 19.0, 12.0, 20.0, 13.0, 12.0, 8.0, 9.0, 5.0, 5.0, 5.0, 1.0, 5.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-9.875, -9.5689697265625, -9.262939453125, -8.9569091796875, -8.65087890625, -8.3448486328125, -8.038818359375, -7.7327880859375, -7.4267578125, -7.1207275390625, -6.814697265625, -6.5086669921875, -6.20263671875, -5.8966064453125, -5.590576171875, -5.2845458984375, -4.978515625, -4.6724853515625, -4.366455078125, -4.0604248046875, -3.75439453125, -3.4483642578125, -3.142333984375, -2.8363037109375, -2.5302734375, -2.2242431640625, -1.918212890625, -1.6121826171875, -1.30615234375, -1.0001220703125, -0.694091796875, -0.3880615234375, -0.08203125, 0.2239990234375, 0.530029296875, 0.8360595703125, 1.14208984375, 1.4481201171875, 1.754150390625, 2.0601806640625, 2.3662109375, 2.6722412109375, 2.978271484375, 3.2843017578125, 3.59033203125, 3.8963623046875, 4.202392578125, 4.5084228515625, 4.814453125, 5.1204833984375, 5.426513671875, 5.7325439453125, 6.03857421875, 6.3446044921875, 6.650634765625, 6.9566650390625, 7.2626953125, 7.5687255859375, 7.874755859375, 8.1807861328125, 8.48681640625, 8.7928466796875, 9.098876953125, 9.4049072265625, 9.7109375]}, "gradients/decoder.transformer.h.11.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 6.0, 7.0, 8.0, 17.0, 15.0, 19.0, 28.0, 38.0, 71.0, 94.0, 171.0, 358.0, 611.0, 1134.0, 2244.0, 4577.0, 8902.0, 18126.0, 38922.0, 97050.0, 305107.0, 372709.0, 113715.0, 44262.0, 20170.0, 9789.0, 5025.0, 2558.0, 1215.0, 651.0, 362.0, 214.0, 126.0, 72.0, 54.0, 32.0, 22.0, 15.0, 20.0, 15.0, 5.0, 9.0, 6.0, 4.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-6.50390625, -6.29461669921875, -6.0853271484375, -5.87603759765625, -5.666748046875, -5.45745849609375, -5.2481689453125, -5.03887939453125, -4.82958984375, -4.62030029296875, -4.4110107421875, -4.20172119140625, -3.992431640625, -3.78314208984375, -3.5738525390625, -3.36456298828125, -3.1552734375, -2.94598388671875, -2.7366943359375, -2.52740478515625, -2.318115234375, -2.10882568359375, -1.8995361328125, -1.69024658203125, -1.48095703125, -1.27166748046875, -1.0623779296875, -0.85308837890625, -0.643798828125, -0.43450927734375, -0.2252197265625, -0.01593017578125, 0.193359375, 0.40264892578125, 0.6119384765625, 0.82122802734375, 1.030517578125, 1.23980712890625, 1.4490966796875, 1.65838623046875, 1.86767578125, 2.07696533203125, 2.2862548828125, 2.49554443359375, 2.704833984375, 2.91412353515625, 3.1234130859375, 3.33270263671875, 3.5419921875, 3.75128173828125, 3.9605712890625, 4.16986083984375, 4.379150390625, 4.58843994140625, 4.7977294921875, 5.00701904296875, 5.21630859375, 5.42559814453125, 5.6348876953125, 5.84417724609375, 6.053466796875, 6.26275634765625, 6.4720458984375, 6.68133544921875, 6.890625]}, "gradients/decoder.transformer.h.11.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 3.0, 3.0, 8.0, 5.0, 9.0, 11.0, 12.0, 9.0, 14.0, 22.0, 28.0, 23.0, 28.0, 35.0, 39.0, 36.0, 52.0, 54.0, 72.0, 265.0, 1669.0, 166.0, 80.0, 66.0, 46.0, 46.0, 46.0, 41.0, 33.0, 27.0, 21.0, 14.0, 12.0, 12.0, 7.0, 12.0, 5.0, 6.0, 8.0, 2.0, 0.0, 3.0, 2.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-38.8125, -37.61083984375, -36.4091796875, -35.20751953125, -34.005859375, -32.80419921875, -31.6025390625, -30.40087890625, -29.19921875, -27.99755859375, -26.7958984375, -25.59423828125, -24.392578125, -23.19091796875, -21.9892578125, -20.78759765625, -19.5859375, -18.38427734375, -17.1826171875, -15.98095703125, -14.779296875, -13.57763671875, -12.3759765625, -11.17431640625, -9.97265625, -8.77099609375, -7.5693359375, -6.36767578125, -5.166015625, -3.96435546875, -2.7626953125, -1.56103515625, -0.359375, 0.84228515625, 2.0439453125, 3.24560546875, 4.447265625, 5.64892578125, 6.8505859375, 8.05224609375, 9.25390625, 10.45556640625, 11.6572265625, 12.85888671875, 14.060546875, 15.26220703125, 16.4638671875, 17.66552734375, 18.8671875, 20.06884765625, 21.2705078125, 22.47216796875, 23.673828125, 24.87548828125, 26.0771484375, 27.27880859375, 28.48046875, 29.68212890625, 30.8837890625, 32.08544921875, 33.287109375, 34.48876953125, 35.6904296875, 36.89208984375, 38.09375]}, "gradients/decoder.transformer.h.11.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 5.0, 5.0, 16.0, 9.0, 18.0, 18.0, 24.0, 29.0, 50.0, 60.0, 84.0, 119.0, 128.0, 164.0, 280.0, 480.0, 1462.0, 140676.0, 2997112.0, 3323.0, 555.0, 293.0, 199.0, 143.0, 115.0, 70.0, 56.0, 35.0, 45.0, 22.0, 22.0, 17.0, 14.0, 17.0, 8.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-88.375, -85.5390625, -82.703125, -79.8671875, -77.03125, -74.1953125, -71.359375, -68.5234375, -65.6875, -62.8515625, -60.015625, -57.1796875, -54.34375, -51.5078125, -48.671875, -45.8359375, -43.0, -40.1640625, -37.328125, -34.4921875, -31.65625, -28.8203125, -25.984375, -23.1484375, -20.3125, -17.4765625, -14.640625, -11.8046875, -8.96875, -6.1328125, -3.296875, -0.4609375, 2.375, 5.2109375, 8.046875, 10.8828125, 13.71875, 16.5546875, 19.390625, 22.2265625, 25.0625, 27.8984375, 30.734375, 33.5703125, 36.40625, 39.2421875, 42.078125, 44.9140625, 47.75, 50.5859375, 53.421875, 56.2578125, 59.09375, 61.9296875, 64.765625, 67.6015625, 70.4375, 73.2734375, 76.109375, 78.9453125, 81.78125, 84.6171875, 87.453125, 90.2890625, 93.125]}, "gradients/decoder.transformer.h.11.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 7.0, 18.0, 38.0, 58.0, 88.0, 150.0, 167.0, 176.0, 124.0, 82.0, 59.0, 22.0, 10.0, 4.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.597721099853516, -37.487117767333984, -36.37651443481445, -35.26591110229492, -34.15530776977539, -33.044700622558594, -31.934099197387695, -30.823495864868164, -29.712890625, -28.60228729248047, -27.491683959960938, -26.381080627441406, -25.270475387573242, -24.15987205505371, -23.04926872253418, -21.93866539001465, -20.828062057495117, -19.717458724975586, -18.606855392456055, -17.49625015258789, -16.38564682006836, -15.275043487548828, -14.164440155029297, -13.053836822509766, -11.943232536315918, -10.832629203796387, -9.722024917602539, -8.611421585083008, -7.500817775726318, -6.390213966369629, -5.279610633850098, -4.169006824493408, -3.0584030151367188, -1.9477993249893188, -0.837195634841919, 0.2734079360961914, 1.3840117454528809, 2.4946155548095703, 3.6052188873291016, 4.715822696685791, 5.8264265060424805, 6.93703031539917, 8.04763412475586, 9.15823745727539, 10.268840789794922, 11.37944507598877, 12.4900484085083, 13.600652694702148, 14.71125602722168, 15.821859359741211, 16.932462692260742, 18.043067932128906, 19.153671264648438, 20.26427459716797, 21.3748779296875, 22.48548126220703, 23.596084594726562, 24.706687927246094, 25.817291259765625, 26.927894592285156, 28.03849983215332, 29.14910316467285, 30.259706497192383, 31.370309829711914, 32.48091506958008]}, "gradients/decoder.transformer.h.11.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 2.0, 5.0, 2.0, 4.0, 5.0, 6.0, 6.0, 23.0, 18.0, 11.0, 22.0, 18.0, 20.0, 32.0, 29.0, 31.0, 39.0, 35.0, 26.0, 38.0, 44.0, 46.0, 35.0, 44.0, 33.0, 42.0, 49.0, 38.0, 37.0, 32.0, 33.0, 25.0, 27.0, 37.0, 24.0, 14.0, 16.0, 10.0, 9.0, 10.0, 6.0, 7.0, 4.0, 2.0, 1.0, 3.0, 4.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-83.06470489501953, -80.42549133300781, -77.7862777709961, -75.14705657958984, -72.50784301757812, -69.8686294555664, -67.22941589355469, -64.59020233154297, -61.950984954833984, -59.311771392822266, -56.67255401611328, -54.03334045410156, -51.394126892089844, -48.75490951538086, -46.11569595336914, -43.476478576660156, -40.83726501464844, -38.19805145263672, -35.558834075927734, -32.919620513916016, -30.280405044555664, -27.641189575195312, -25.001976013183594, -22.362760543823242, -19.72354507446289, -17.08432960510254, -14.445115089416504, -11.805900573730469, -9.166685104370117, -6.527469635009766, -3.8882551193237305, -1.2490406036376953, 1.3901824951171875, 4.029397487640381, 6.668612480163574, 9.30782699584961, 11.947042465209961, 14.586257934570312, 17.22547149658203, 19.864686965942383, 22.503902435302734, 25.143117904663086, 27.782333374023438, 30.421546936035156, 33.060760498046875, 35.69997787475586, 38.33919143676758, 40.97840881347656, 43.61762237548828, 46.2568359375, 48.896053314208984, 51.5352668762207, 54.17448425292969, 56.813697814941406, 59.452911376953125, 62.092124938964844, 64.73133850097656, 67.37055206298828, 70.009765625, 72.64898681640625, 75.28820037841797, 77.92741394042969, 80.5666275024414, 83.20584106445312, 85.84506225585938]}, "gradients/decoder.transformer.h.10.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 7.0, 3.0, 12.0, 8.0, 11.0, 13.0, 20.0, 21.0, 21.0, 14.0, 26.0, 25.0, 44.0, 35.0, 35.0, 40.0, 48.0, 43.0, 39.0, 43.0, 39.0, 31.0, 38.0, 40.0, 44.0, 34.0, 28.0, 30.0, 32.0, 26.0, 20.0, 18.0, 15.0, 12.0, 18.0, 20.0, 11.0, 6.0, 9.0, 10.0, 2.0, 4.0, 1.0, 3.0, 1.0, 4.0, 2.0, 0.0, 0.0, 2.0, 0.0, 1.0], "bins": [-9.9921875, -9.6815185546875, -9.370849609375, -9.0601806640625, -8.74951171875, -8.4388427734375, -8.128173828125, -7.8175048828125, -7.5068359375, -7.1961669921875, -6.885498046875, -6.5748291015625, -6.26416015625, -5.9534912109375, -5.642822265625, -5.3321533203125, -5.021484375, -4.7108154296875, -4.400146484375, -4.0894775390625, -3.77880859375, -3.4681396484375, -3.157470703125, -2.8468017578125, -2.5361328125, -2.2254638671875, -1.914794921875, -1.6041259765625, -1.29345703125, -0.9827880859375, -0.672119140625, -0.3614501953125, -0.05078125, 0.2598876953125, 0.570556640625, 0.8812255859375, 1.19189453125, 1.5025634765625, 1.813232421875, 2.1239013671875, 2.4345703125, 2.7452392578125, 3.055908203125, 3.3665771484375, 3.67724609375, 3.9879150390625, 4.298583984375, 4.6092529296875, 4.919921875, 5.2305908203125, 5.541259765625, 5.8519287109375, 6.16259765625, 6.4732666015625, 6.783935546875, 7.0946044921875, 7.4052734375, 7.7159423828125, 8.026611328125, 8.3372802734375, 8.64794921875, 8.9586181640625, 9.269287109375, 9.5799560546875, 9.890625]}, "gradients/decoder.transformer.h.10.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 3.0, 2.0, 6.0, 3.0, 4.0, 14.0, 12.0, 9.0, 18.0, 23.0, 17.0, 16.0, 33.0, 37.0, 45.0, 63.0, 179.0, 350.0, 1477.0, 8524.0, 85086.0, 1813026.0, 2167839.0, 105554.0, 9493.0, 1554.0, 403.0, 166.0, 65.0, 39.0, 46.0, 35.0, 23.0, 23.0, 19.0, 16.0, 20.0, 16.0, 9.0, 3.0, 3.0, 5.0, 7.0, 2.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-31.484375, -30.501708984375, -29.51904296875, -28.536376953125, -27.5537109375, -26.571044921875, -25.58837890625, -24.605712890625, -23.623046875, -22.640380859375, -21.65771484375, -20.675048828125, -19.6923828125, -18.709716796875, -17.72705078125, -16.744384765625, -15.76171875, -14.779052734375, -13.79638671875, -12.813720703125, -11.8310546875, -10.848388671875, -9.86572265625, -8.883056640625, -7.900390625, -6.917724609375, -5.93505859375, -4.952392578125, -3.9697265625, -2.987060546875, -2.00439453125, -1.021728515625, -0.0390625, 0.943603515625, 1.92626953125, 2.908935546875, 3.8916015625, 4.874267578125, 5.85693359375, 6.839599609375, 7.822265625, 8.804931640625, 9.78759765625, 10.770263671875, 11.7529296875, 12.735595703125, 13.71826171875, 14.700927734375, 15.68359375, 16.666259765625, 17.64892578125, 18.631591796875, 19.6142578125, 20.596923828125, 21.57958984375, 22.562255859375, 23.544921875, 24.527587890625, 25.51025390625, 26.492919921875, 27.4755859375, 28.458251953125, 29.44091796875, 30.423583984375, 31.40625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 4.0, 2.0, 3.0, 4.0, 7.0, 2.0, 5.0, 9.0, 10.0, 11.0, 29.0, 32.0, 41.0, 49.0, 82.0, 82.0, 131.0, 127.0, 222.0, 264.0, 316.0, 408.0, 415.0, 412.0, 308.0, 262.0, 205.0, 153.0, 96.0, 92.0, 57.0, 54.0, 50.0, 30.0, 15.0, 21.0, 16.0, 11.0, 11.0, 10.0, 4.0, 4.0, 8.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.3203125, -14.8013916015625, -14.282470703125, -13.7635498046875, -13.24462890625, -12.7257080078125, -12.206787109375, -11.6878662109375, -11.1689453125, -10.6500244140625, -10.131103515625, -9.6121826171875, -9.09326171875, -8.5743408203125, -8.055419921875, -7.5364990234375, -7.017578125, -6.4986572265625, -5.979736328125, -5.4608154296875, -4.94189453125, -4.4229736328125, -3.904052734375, -3.3851318359375, -2.8662109375, -2.3472900390625, -1.828369140625, -1.3094482421875, -0.79052734375, -0.2716064453125, 0.247314453125, 0.7662353515625, 1.28515625, 1.8040771484375, 2.322998046875, 2.8419189453125, 3.36083984375, 3.8797607421875, 4.398681640625, 4.9176025390625, 5.4365234375, 5.9554443359375, 6.474365234375, 6.9932861328125, 7.51220703125, 8.0311279296875, 8.550048828125, 9.0689697265625, 9.587890625, 10.1068115234375, 10.625732421875, 11.1446533203125, 11.66357421875, 12.1824951171875, 12.701416015625, 13.2203369140625, 13.7392578125, 14.2581787109375, 14.777099609375, 15.2960205078125, 15.81494140625, 16.3338623046875, 16.852783203125, 17.3717041015625, 17.890625]}, "gradients/decoder.transformer.h.10.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 8.0, 5.0, 10.0, 9.0, 17.0, 17.0, 20.0, 28.0, 36.0, 48.0, 65.0, 87.0, 103.0, 120.0, 174.0, 212.0, 298.0, 509.0, 2326.0, 221669.0, 3934266.0, 31538.0, 1105.0, 433.0, 291.0, 191.0, 173.0, 134.0, 103.0, 67.0, 61.0, 46.0, 30.0, 22.0, 23.0, 12.0, 6.0, 7.0, 5.0, 3.0, 6.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-90.3125, -87.681640625, -85.05078125, -82.419921875, -79.7890625, -77.158203125, -74.52734375, -71.896484375, -69.265625, -66.634765625, -64.00390625, -61.373046875, -58.7421875, -56.111328125, -53.48046875, -50.849609375, -48.21875, -45.587890625, -42.95703125, -40.326171875, -37.6953125, -35.064453125, -32.43359375, -29.802734375, -27.171875, -24.541015625, -21.91015625, -19.279296875, -16.6484375, -14.017578125, -11.38671875, -8.755859375, -6.125, -3.494140625, -0.86328125, 1.767578125, 4.3984375, 7.029296875, 9.66015625, 12.291015625, 14.921875, 17.552734375, 20.18359375, 22.814453125, 25.4453125, 28.076171875, 30.70703125, 33.337890625, 35.96875, 38.599609375, 41.23046875, 43.861328125, 46.4921875, 49.123046875, 51.75390625, 54.384765625, 57.015625, 59.646484375, 62.27734375, 64.908203125, 67.5390625, 70.169921875, 72.80078125, 75.431640625, 78.0625]}, "gradients/decoder.transformer.h.10.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 19.0, 61.0, 169.0, 291.0, 258.0, 152.0, 54.0, 11.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-269.2635803222656, -262.8293762207031, -256.3951721191406, -249.9609832763672, -243.52679443359375, -237.09259033203125, -230.65838623046875, -224.2241973876953, -217.79000854492188, -211.35580444335938, -204.92161560058594, -198.48741149902344, -192.05322265625, -185.6190185546875, -179.184814453125, -172.75062561035156, -166.31642150878906, -159.88221740722656, -153.44802856445312, -147.01382446289062, -140.5796356201172, -134.1454315185547, -127.71123504638672, -121.27703857421875, -114.84284210205078, -108.40864562988281, -101.97444915771484, -95.54025268554688, -89.10604858398438, -82.67185974121094, -76.23765563964844, -69.80345916748047, -63.3692626953125, -56.93506622314453, -50.50086975097656, -44.06666946411133, -37.63247299194336, -31.19827651977539, -24.764076232910156, -18.329879760742188, -11.895683288574219, -5.461485862731934, 0.9727115631103516, 7.406909942626953, 13.841106414794922, 20.27530288696289, 26.709503173828125, 33.143699645996094, 39.57789611816406, 46.01209259033203, 52.4462890625, 58.880489349365234, 65.31468200683594, 71.74888610839844, 78.1830825805664, 84.61727905273438, 91.05147552490234, 97.48567199707031, 103.91986846923828, 110.35406494140625, 116.78826904296875, 123.22245788574219, 129.6566619873047, 136.09085083007812, 142.52505493164062]}, "gradients/decoder.transformer.h.10.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 7.0, 2.0, 1.0, 7.0, 4.0, 7.0, 11.0, 10.0, 8.0, 12.0, 17.0, 17.0, 14.0, 19.0, 25.0, 26.0, 24.0, 35.0, 36.0, 21.0, 42.0, 36.0, 50.0, 42.0, 31.0, 43.0, 35.0, 38.0, 48.0, 36.0, 28.0, 40.0, 39.0, 28.0, 20.0, 21.0, 21.0, 17.0, 24.0, 8.0, 14.0, 11.0, 8.0, 9.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-65.9259033203125, -64.07484436035156, -62.22378158569336, -60.372718811035156, -58.52165985107422, -56.670597076416016, -54.81953430175781, -52.968475341796875, -51.11741256713867, -49.26634979248047, -47.41529083251953, -45.56422805786133, -43.713165283203125, -41.86210632324219, -40.011043548583984, -38.15998077392578, -36.308921813964844, -34.45785903930664, -32.6068000793457, -30.7557373046875, -28.90467643737793, -27.05361557006836, -25.202552795410156, -23.351491928100586, -21.500431060791016, -19.649370193481445, -17.798309326171875, -15.947246551513672, -14.096185684204102, -12.245124816894531, -10.394062995910645, -8.543001174926758, -6.6919403076171875, -4.840878963470459, -2.9898176193237305, -1.138756275177002, 0.7123050689697266, 2.563365936279297, 4.414427757263184, 6.26548957824707, 8.11655044555664, 9.967611312866211, 11.818673133850098, 13.669734954833984, 15.520795822143555, 17.371856689453125, 19.222919464111328, 21.0739803314209, 22.92504119873047, 24.77610206604004, 26.62716293334961, 28.478225708007812, 30.329286575317383, 32.18034744262695, 34.031410217285156, 35.882469177246094, 37.7335319519043, 39.5845947265625, 41.43565368652344, 43.28671646118164, 45.137779235839844, 46.98883819580078, 48.839900970458984, 50.69096374511719, 52.542022705078125]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 1.0, 2.0, 5.0, 2.0, 12.0, 20.0, 11.0, 11.0, 23.0, 19.0, 24.0, 26.0, 23.0, 35.0, 29.0, 33.0, 41.0, 40.0, 39.0, 47.0, 51.0, 47.0, 43.0, 30.0, 38.0, 39.0, 36.0, 29.0, 32.0, 28.0, 28.0, 36.0, 13.0, 20.0, 15.0, 8.0, 12.0, 11.0, 13.0, 7.0, 6.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.59375, -9.287353515625, -8.98095703125, -8.674560546875, -8.3681640625, -8.061767578125, -7.75537109375, -7.448974609375, -7.142578125, -6.836181640625, -6.52978515625, -6.223388671875, -5.9169921875, -5.610595703125, -5.30419921875, -4.997802734375, -4.69140625, -4.385009765625, -4.07861328125, -3.772216796875, -3.4658203125, -3.159423828125, -2.85302734375, -2.546630859375, -2.240234375, -1.933837890625, -1.62744140625, -1.321044921875, -1.0146484375, -0.708251953125, -0.40185546875, -0.095458984375, 0.2109375, 0.517333984375, 0.82373046875, 1.130126953125, 1.4365234375, 1.742919921875, 2.04931640625, 2.355712890625, 2.662109375, 2.968505859375, 3.27490234375, 3.581298828125, 3.8876953125, 4.194091796875, 4.50048828125, 4.806884765625, 5.11328125, 5.419677734375, 5.72607421875, 6.032470703125, 6.3388671875, 6.645263671875, 6.95166015625, 7.258056640625, 7.564453125, 7.870849609375, 8.17724609375, 8.483642578125, 8.7900390625, 9.096435546875, 9.40283203125, 9.709228515625, 10.015625]}, "gradients/decoder.transformer.h.10.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 9.0, 5.0, 4.0, 11.0, 22.0, 27.0, 26.0, 37.0, 63.0, 92.0, 173.0, 289.0, 444.0, 610.0, 915.0, 1467.0, 2351.0, 3712.0, 5765.0, 9369.0, 14953.0, 24527.0, 40062.0, 65818.0, 107544.0, 164162.0, 195680.0, 153577.0, 98895.0, 61154.0, 37009.0, 22448.0, 13802.0, 8753.0, 5473.0, 3283.0, 2106.0, 1402.0, 899.0, 545.0, 371.0, 239.0, 163.0, 97.0, 74.0, 40.0, 39.0, 12.0, 14.0, 9.0, 9.0, 8.0, 3.0, 1.0, 4.0, 3.0], "bins": [-0.98095703125, -0.95245361328125, -0.9239501953125, -0.89544677734375, -0.866943359375, -0.83843994140625, -0.8099365234375, -0.78143310546875, -0.7529296875, -0.72442626953125, -0.6959228515625, -0.66741943359375, -0.638916015625, -0.61041259765625, -0.5819091796875, -0.55340576171875, -0.52490234375, -0.49639892578125, -0.4678955078125, -0.43939208984375, -0.410888671875, -0.38238525390625, -0.3538818359375, -0.32537841796875, -0.296875, -0.26837158203125, -0.2398681640625, -0.21136474609375, -0.182861328125, -0.15435791015625, -0.1258544921875, -0.09735107421875, -0.06884765625, -0.04034423828125, -0.0118408203125, 0.01666259765625, 0.045166015625, 0.07366943359375, 0.1021728515625, 0.13067626953125, 0.1591796875, 0.18768310546875, 0.2161865234375, 0.24468994140625, 0.273193359375, 0.30169677734375, 0.3302001953125, 0.35870361328125, 0.38720703125, 0.41571044921875, 0.4442138671875, 0.47271728515625, 0.501220703125, 0.52972412109375, 0.5582275390625, 0.58673095703125, 0.615234375, 0.64373779296875, 0.6722412109375, 0.70074462890625, 0.729248046875, 0.75775146484375, 0.7862548828125, 0.81475830078125, 0.84326171875]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 5.0, 10.0, 4.0, 10.0, 14.0, 15.0, 8.0, 11.0, 13.0, 17.0, 12.0, 19.0, 31.0, 34.0, 28.0, 45.0, 40.0, 38.0, 42.0, 39.0, 34.0, 35.0, 1059.0, 43.0, 33.0, 38.0, 34.0, 34.0, 34.0, 37.0, 30.0, 23.0, 20.0, 19.0, 20.0, 15.0, 13.0, 16.0, 12.0, 10.0, 12.0, 8.0, 4.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-6.0703125, -5.88861083984375, -5.7069091796875, -5.52520751953125, -5.343505859375, -5.16180419921875, -4.9801025390625, -4.79840087890625, -4.61669921875, -4.43499755859375, -4.2532958984375, -4.07159423828125, -3.889892578125, -3.70819091796875, -3.5264892578125, -3.34478759765625, -3.1630859375, -2.98138427734375, -2.7996826171875, -2.61798095703125, -2.436279296875, -2.25457763671875, -2.0728759765625, -1.89117431640625, -1.70947265625, -1.52777099609375, -1.3460693359375, -1.16436767578125, -0.982666015625, -0.80096435546875, -0.6192626953125, -0.43756103515625, -0.255859375, -0.07415771484375, 0.1075439453125, 0.28924560546875, 0.470947265625, 0.65264892578125, 0.8343505859375, 1.01605224609375, 1.19775390625, 1.37945556640625, 1.5611572265625, 1.74285888671875, 1.924560546875, 2.10626220703125, 2.2879638671875, 2.46966552734375, 2.6513671875, 2.83306884765625, 3.0147705078125, 3.19647216796875, 3.378173828125, 3.55987548828125, 3.7415771484375, 3.92327880859375, 4.10498046875, 4.28668212890625, 4.4683837890625, 4.65008544921875, 4.831787109375, 5.01348876953125, 5.1951904296875, 5.37689208984375, 5.55859375]}, "gradients/decoder.transformer.h.10.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 4.0, 5.0, 2.0, 17.0, 16.0, 20.0, 34.0, 45.0, 73.0, 98.0, 140.0, 243.0, 331.0, 500.0, 767.0, 1175.0, 1846.0, 2632.0, 4227.0, 6625.0, 10201.0, 15843.0, 25089.0, 39552.0, 62081.0, 94810.0, 135367.0, 1206662.0, 159363.0, 114195.0, 77685.0, 49630.0, 31489.0, 19927.0, 12939.0, 8187.0, 5334.0, 3429.0, 2257.0, 1511.0, 977.0, 622.0, 395.0, 239.0, 203.0, 119.0, 83.0, 55.0, 22.0, 31.0, 17.0, 16.0, 3.0, 4.0, 3.0, 3.0, 1.0, 2.0], "bins": [-0.685546875, -0.6652374267578125, -0.644927978515625, -0.6246185302734375, -0.60430908203125, -0.5839996337890625, -0.563690185546875, -0.5433807373046875, -0.5230712890625, -0.5027618408203125, -0.482452392578125, -0.4621429443359375, -0.44183349609375, -0.4215240478515625, -0.401214599609375, -0.3809051513671875, -0.360595703125, -0.3402862548828125, -0.319976806640625, -0.2996673583984375, -0.27935791015625, -0.2590484619140625, -0.238739013671875, -0.2184295654296875, -0.1981201171875, -0.1778106689453125, -0.157501220703125, -0.1371917724609375, -0.11688232421875, -0.0965728759765625, -0.076263427734375, -0.0559539794921875, -0.03564453125, -0.0153350830078125, 0.004974365234375, 0.0252838134765625, 0.04559326171875, 0.0659027099609375, 0.086212158203125, 0.1065216064453125, 0.1268310546875, 0.1471405029296875, 0.167449951171875, 0.1877593994140625, 0.20806884765625, 0.2283782958984375, 0.248687744140625, 0.2689971923828125, 0.289306640625, 0.3096160888671875, 0.329925537109375, 0.3502349853515625, 0.37054443359375, 0.3908538818359375, 0.411163330078125, 0.4314727783203125, 0.4517822265625, 0.4720916748046875, 0.492401123046875, 0.5127105712890625, 0.53302001953125, 0.5533294677734375, 0.573638916015625, 0.5939483642578125, 0.6142578125]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 5.0, 8.0, 3.0, 7.0, 11.0, 15.0, 17.0, 16.0, 25.0, 28.0, 43.0, 38.0, 48.0, 75.0, 72.0, 94.0, 88.0, 69.0, 78.0, 59.0, 50.0, 30.0, 23.0, 23.0, 16.0, 13.0, 10.0, 4.0, 6.0, 6.0, 6.0, 3.0, 4.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00814056396484375, -0.00788867473602295, -0.0076367855072021484, -0.007384896278381348, -0.007133007049560547, -0.006881117820739746, -0.006629228591918945, -0.0063773393630981445, -0.006125450134277344, -0.005873560905456543, -0.005621671676635742, -0.005369782447814941, -0.005117893218994141, -0.00486600399017334, -0.004614114761352539, -0.004362225532531738, -0.0041103363037109375, -0.0038584470748901367, -0.003606557846069336, -0.003354668617248535, -0.0031027793884277344, -0.0028508901596069336, -0.002599000930786133, -0.002347111701965332, -0.0020952224731445312, -0.0018433332443237305, -0.0015914440155029297, -0.001339554786682129, -0.0010876655578613281, -0.0008357763290405273, -0.0005838871002197266, -0.0003319978713989258, -8.0108642578125e-05, 0.00017178058624267578, 0.00042366981506347656, 0.0006755590438842773, 0.0009274482727050781, 0.001179337501525879, 0.0014312267303466797, 0.0016831159591674805, 0.0019350051879882812, 0.002186894416809082, 0.002438783645629883, 0.0026906728744506836, 0.0029425621032714844, 0.003194451332092285, 0.003446340560913086, 0.0036982297897338867, 0.0039501190185546875, 0.004202008247375488, 0.004453897476196289, 0.00470578670501709, 0.004957675933837891, 0.005209565162658691, 0.005461454391479492, 0.005713343620300293, 0.005965232849121094, 0.0062171220779418945, 0.006469011306762695, 0.006720900535583496, 0.006972789764404297, 0.007224678993225098, 0.0074765682220458984, 0.007728457450866699, 0.0079803466796875]}, "gradients/decoder.transformer.h.10.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 4.0, 3.0, 5.0, 5.0, 6.0, 4.0, 8.0, 9.0, 16.0, 25.0, 27.0, 25.0, 40.0, 64.0, 100.0, 164.0, 369.0, 4519.0, 1029888.0, 12130.0, 500.0, 188.0, 116.0, 78.0, 61.0, 48.0, 27.0, 23.0, 22.0, 19.0, 11.0, 14.0, 9.0, 7.0, 4.0, 2.0, 7.0, 2.0, 3.0, 0.0, 3.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.17041015625, -0.16501426696777344, -0.15961837768554688, -0.1542224884033203, -0.14882659912109375, -0.1434307098388672, -0.13803482055664062, -0.13263893127441406, -0.1272430419921875, -0.12184715270996094, -0.11645126342773438, -0.11105537414550781, -0.10565948486328125, -0.10026359558105469, -0.09486770629882812, -0.08947181701660156, -0.084075927734375, -0.07868003845214844, -0.07328414916992188, -0.06788825988769531, -0.06249237060546875, -0.05709648132324219, -0.051700592041015625, -0.04630470275878906, -0.0409088134765625, -0.03551292419433594, -0.030117034912109375, -0.024721145629882812, -0.01932525634765625, -0.013929367065429688, -0.008533477783203125, -0.0031375885009765625, 0.00225830078125, 0.0076541900634765625, 0.013050079345703125, 0.018445968627929688, 0.02384185791015625, 0.029237747192382812, 0.034633636474609375, 0.04002952575683594, 0.0454254150390625, 0.05082130432128906, 0.056217193603515625, 0.06161308288574219, 0.06700897216796875, 0.07240486145019531, 0.07780075073242188, 0.08319664001464844, 0.088592529296875, 0.09398841857910156, 0.09938430786132812, 0.10478019714355469, 0.11017608642578125, 0.11557197570800781, 0.12096786499023438, 0.12636375427246094, 0.1317596435546875, 0.13715553283691406, 0.14255142211914062, 0.1479473114013672, 0.15334320068359375, 0.1587390899658203, 0.16413497924804688, 0.16953086853027344, 0.1749267578125]}, "gradients/decoder.transformer.h.10.ln_cross_attn.weight": {"_type": "histogram", "values": [7.0, 391.0, 608.0, 12.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0034315327648073435, -0.001782377134077251, -0.00013322150334715843, 0.0015159340109676123, 0.0031650897581130266, 0.004814245738089085, 0.006463401019573212, 0.008112557232379913, 0.00976171251386404, 0.011410867795348167, 0.013060024008154869, 0.014709179289638996, 0.016358334571123123, 0.018007490783929825, 0.019656646996736526, 0.021305803209543228, 0.02295495755970478, 0.024604113772511482, 0.026253268122673035, 0.027902424335479736, 0.029551580548286438, 0.03120073676109314, 0.03284989297389984, 0.03449904918670654, 0.036148201674222946, 0.03779735788702965, 0.03944651409983635, 0.04109566658735275, 0.042744822800159454, 0.044393979012966156, 0.04604313522577286, 0.04769229143857956, 0.04934144392609596, 0.050990600138902664, 0.052639756351709366, 0.05428890883922577, 0.05593806505203247, 0.05758722126483917, 0.059236377477645874, 0.060885533690452576, 0.06253468990325928, 0.06418384611606598, 0.06583300232887268, 0.06748215854167938, 0.06913131475448608, 0.07078047096729279, 0.07242962718009949, 0.07407878339290619, 0.0757279321551323, 0.077377088367939, 0.0790262445807457, 0.0806754007935524, 0.0823245570063591, 0.0839737132191658, 0.0856228619813919, 0.08727201819419861, 0.08892118185758591, 0.09057033807039261, 0.09221949428319931, 0.09386865049600601, 0.09551780670881271, 0.09716696292161942, 0.09881611168384552, 0.10046526789665222, 0.10211442410945892]}, "gradients/decoder.transformer.h.10.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 8.0, 9.0, 6.0, 15.0, 11.0, 15.0, 21.0, 22.0, 19.0, 24.0, 21.0, 26.0, 32.0, 40.0, 47.0, 36.0, 41.0, 40.0, 39.0, 46.0, 49.0, 40.0, 45.0, 45.0, 31.0, 33.0, 21.0, 33.0, 32.0, 20.0, 22.0, 22.0, 20.0, 17.0, 11.0, 13.0, 7.0, 4.0, 9.0, 9.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.004518568515777588, -0.004389395006000996, -0.004260221496224403, -0.004131047986447811, -0.004001874476671219, -0.0038727009668946266, -0.0037435274571180344, -0.003614353947341442, -0.00348518043756485, -0.0033560069277882576, -0.0032268334180116653, -0.003097659908235073, -0.002968486398458481, -0.0028393128886818886, -0.0027101393789052963, -0.002580965869128704, -0.002451792359352112, -0.0023226188495755196, -0.0021934453397989273, -0.002064271830022335, -0.0019350983202457428, -0.0018059248104691505, -0.0016767513006925583, -0.001547577790915966, -0.0014184042811393738, -0.0012892307713627815, -0.0011600572615861893, -0.001030883751809597, -0.0009017102420330048, -0.0007725367322564125, -0.0006433632224798203, -0.000514189712703228, -0.00038501620292663574, -0.0002558426931500435, -0.00012666918337345123, 2.5043264031410217e-06, 0.00013167783617973328, 0.00026085134595632553, 0.0003900248557329178, 0.00051919836550951, 0.0006483718752861023, 0.0007775453850626945, 0.0009067188948392868, 0.001035892404615879, 0.0011650659143924713, 0.0012942394241690636, 0.0014234129339456558, 0.001552586443722248, 0.0016817599534988403, 0.0018109334632754326, 0.0019401069730520248, 0.002069280482828617, 0.0021984539926052094, 0.0023276275023818016, 0.002456801012158394, 0.002585974521934986, 0.0027151480317115784, 0.0028443215414881706, 0.002973495051264763, 0.003102668561041355, 0.0032318420708179474, 0.0033610155805945396, 0.003490189090371132, 0.003619362600147724, 0.0037485361099243164]}, "gradients/decoder.transformer.h.10.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 3.0, 3.0, 7.0, 1.0, 2.0, 5.0, 2.0, 12.0, 20.0, 11.0, 11.0, 23.0, 19.0, 24.0, 26.0, 23.0, 35.0, 29.0, 33.0, 41.0, 40.0, 39.0, 47.0, 51.0, 47.0, 42.0, 31.0, 38.0, 39.0, 36.0, 29.0, 32.0, 28.0, 28.0, 36.0, 13.0, 20.0, 15.0, 8.0, 12.0, 11.0, 13.0, 7.0, 6.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-9.59375, -9.287353515625, -8.98095703125, -8.674560546875, -8.3681640625, -8.061767578125, -7.75537109375, -7.448974609375, -7.142578125, -6.836181640625, -6.52978515625, -6.223388671875, -5.9169921875, -5.610595703125, -5.30419921875, -4.997802734375, -4.69140625, -4.385009765625, -4.07861328125, -3.772216796875, -3.4658203125, -3.159423828125, -2.85302734375, -2.546630859375, -2.240234375, -1.933837890625, -1.62744140625, -1.321044921875, -1.0146484375, -0.708251953125, -0.40185546875, -0.095458984375, 0.2109375, 0.517333984375, 0.82373046875, 1.130126953125, 1.4365234375, 1.742919921875, 2.04931640625, 2.355712890625, 2.662109375, 2.968505859375, 3.27490234375, 3.581298828125, 3.8876953125, 4.194091796875, 4.50048828125, 4.806884765625, 5.11328125, 5.419677734375, 5.72607421875, 6.032470703125, 6.3388671875, 6.645263671875, 6.95166015625, 7.258056640625, 7.564453125, 7.870849609375, 8.17724609375, 8.483642578125, 8.7900390625, 9.096435546875, 9.40283203125, 9.709228515625, 10.015625]}, "gradients/decoder.transformer.h.10.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 5.0, 5.0, 4.0, 7.0, 8.0, 13.0, 15.0, 25.0, 32.0, 46.0, 51.0, 73.0, 136.0, 150.0, 240.0, 375.0, 670.0, 1417.0, 3204.0, 8004.0, 20953.0, 58814.0, 192869.0, 507883.0, 168509.0, 52836.0, 18757.0, 7298.0, 2982.0, 1361.0, 676.0, 387.0, 233.0, 132.0, 101.0, 65.0, 61.0, 39.0, 33.0, 19.0, 22.0, 16.0, 7.0, 5.0, 8.0, 5.0, 3.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.265625, -9.939208984375, -9.61279296875, -9.286376953125, -8.9599609375, -8.633544921875, -8.30712890625, -7.980712890625, -7.654296875, -7.327880859375, -7.00146484375, -6.675048828125, -6.3486328125, -6.022216796875, -5.69580078125, -5.369384765625, -5.04296875, -4.716552734375, -4.39013671875, -4.063720703125, -3.7373046875, -3.410888671875, -3.08447265625, -2.758056640625, -2.431640625, -2.105224609375, -1.77880859375, -1.452392578125, -1.1259765625, -0.799560546875, -0.47314453125, -0.146728515625, 0.1796875, 0.506103515625, 0.83251953125, 1.158935546875, 1.4853515625, 1.811767578125, 2.13818359375, 2.464599609375, 2.791015625, 3.117431640625, 3.44384765625, 3.770263671875, 4.0966796875, 4.423095703125, 4.74951171875, 5.075927734375, 5.40234375, 5.728759765625, 6.05517578125, 6.381591796875, 6.7080078125, 7.034423828125, 7.36083984375, 7.687255859375, 8.013671875, 8.340087890625, 8.66650390625, 8.992919921875, 9.3193359375, 9.645751953125, 9.97216796875, 10.298583984375, 10.625]}, "gradients/decoder.transformer.h.10.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 6.0, 1.0, 2.0, 3.0, 8.0, 4.0, 2.0, 7.0, 8.0, 8.0, 11.0, 9.0, 14.0, 16.0, 16.0, 32.0, 25.0, 28.0, 50.0, 39.0, 56.0, 50.0, 54.0, 90.0, 308.0, 1585.0, 162.0, 58.0, 57.0, 46.0, 43.0, 41.0, 31.0, 25.0, 21.0, 23.0, 24.0, 25.0, 16.0, 11.0, 10.0, 7.0, 6.0, 4.0, 8.0, 4.0, 3.0, 4.0, 3.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.703125, -26.754150390625, -25.80517578125, -24.856201171875, -23.9072265625, -22.958251953125, -22.00927734375, -21.060302734375, -20.111328125, -19.162353515625, -18.21337890625, -17.264404296875, -16.3154296875, -15.366455078125, -14.41748046875, -13.468505859375, -12.51953125, -11.570556640625, -10.62158203125, -9.672607421875, -8.7236328125, -7.774658203125, -6.82568359375, -5.876708984375, -4.927734375, -3.978759765625, -3.02978515625, -2.080810546875, -1.1318359375, -0.182861328125, 0.76611328125, 1.715087890625, 2.6640625, 3.613037109375, 4.56201171875, 5.510986328125, 6.4599609375, 7.408935546875, 8.35791015625, 9.306884765625, 10.255859375, 11.204833984375, 12.15380859375, 13.102783203125, 14.0517578125, 15.000732421875, 15.94970703125, 16.898681640625, 17.84765625, 18.796630859375, 19.74560546875, 20.694580078125, 21.6435546875, 22.592529296875, 23.54150390625, 24.490478515625, 25.439453125, 26.388427734375, 27.33740234375, 28.286376953125, 29.2353515625, 30.184326171875, 31.13330078125, 32.082275390625, 33.03125]}, "gradients/decoder.transformer.h.10.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 5.0, 16.0, 15.0, 14.0, 20.0, 35.0, 46.0, 63.0, 87.0, 104.0, 174.0, 261.0, 504.0, 1367.0, 40567.0, 3092917.0, 7553.0, 828.0, 382.0, 232.0, 152.0, 112.0, 63.0, 52.0, 30.0, 29.0, 22.0, 9.0, 15.0, 8.0, 4.0, 4.0, 4.0, 3.0, 3.0, 0.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-105.75, -102.8388671875, -99.927734375, -97.0166015625, -94.10546875, -91.1943359375, -88.283203125, -85.3720703125, -82.4609375, -79.5498046875, -76.638671875, -73.7275390625, -70.81640625, -67.9052734375, -64.994140625, -62.0830078125, -59.171875, -56.2607421875, -53.349609375, -50.4384765625, -47.52734375, -44.6162109375, -41.705078125, -38.7939453125, -35.8828125, -32.9716796875, -30.060546875, -27.1494140625, -24.23828125, -21.3271484375, -18.416015625, -15.5048828125, -12.59375, -9.6826171875, -6.771484375, -3.8603515625, -0.94921875, 1.9619140625, 4.873046875, 7.7841796875, 10.6953125, 13.6064453125, 16.517578125, 19.4287109375, 22.33984375, 25.2509765625, 28.162109375, 31.0732421875, 33.984375, 36.8955078125, 39.806640625, 42.7177734375, 45.62890625, 48.5400390625, 51.451171875, 54.3623046875, 57.2734375, 60.1845703125, 63.095703125, 66.0068359375, 68.91796875, 71.8291015625, 74.740234375, 77.6513671875, 80.5625]}, "gradients/decoder.transformer.h.10.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 19.0, 115.0, 299.0, 356.0, 182.0, 35.0, 9.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-136.70484924316406, -133.67849731445312, -130.6521453857422, -127.62578582763672, -124.59943389892578, -121.57308197021484, -118.5467300415039, -115.52037048339844, -112.4940185546875, -109.46766662597656, -106.44131469726562, -103.41495513916016, -100.38860321044922, -97.36225128173828, -94.33589935302734, -91.30953979492188, -88.28318786621094, -85.2568359375, -82.23048400878906, -79.2041244506836, -76.17777252197266, -73.15142059326172, -70.12506866455078, -67.09870910644531, -64.0723648071289, -61.04601287841797, -58.019657135009766, -54.99330520629883, -51.966949462890625, -48.94059753417969, -45.91424560546875, -42.88788986206055, -39.86153030395508, -36.83517837524414, -33.80882263183594, -30.782470703125, -27.756114959716797, -24.72976303100586, -21.70340919494629, -18.67705535888672, -15.650701522827148, -12.624347686767578, -9.597993850708008, -6.571640968322754, -3.5452871322631836, -0.5189332962036133, 2.5074195861816406, 5.533773422241211, 8.560127258300781, 11.586481094360352, 14.612834930419922, 17.63918685913086, 20.665542602539062, 23.69189453125, 26.71824836730957, 29.74460220336914, 32.770957946777344, 35.79730987548828, 38.823665618896484, 41.85001754760742, 44.876373291015625, 47.90272521972656, 50.9290771484375, 53.9554328918457, 56.98178482055664]}, "gradients/decoder.transformer.h.10.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 2.0, 3.0, 4.0, 9.0, 9.0, 9.0, 14.0, 5.0, 9.0, 17.0, 27.0, 13.0, 24.0, 36.0, 46.0, 29.0, 24.0, 35.0, 30.0, 35.0, 46.0, 50.0, 46.0, 36.0, 40.0, 36.0, 42.0, 37.0, 29.0, 32.0, 37.0, 30.0, 26.0, 21.0, 26.0, 18.0, 8.0, 9.0, 16.0, 7.0, 5.0, 7.0, 3.0, 5.0, 4.0, 3.0, 1.0, 4.0, 0.0, 1.0, 4.0, 3.0], "bins": [-80.87769317626953, -78.50401306152344, -76.13034057617188, -73.75666809082031, -71.38298797607422, -69.00930786132812, -66.63563537597656, -64.261962890625, -61.888282775878906, -59.51460647583008, -57.14093017578125, -54.76725387573242, -52.393577575683594, -50.019901275634766, -47.64622497558594, -45.27254867553711, -42.89887237548828, -40.52519607543945, -38.151519775390625, -35.7778434753418, -33.40416717529297, -31.03049087524414, -28.656814575195312, -26.283138275146484, -23.909461975097656, -21.535785675048828, -19.162109375, -16.788433074951172, -14.414756774902344, -12.041080474853516, -9.667404174804688, -7.293727874755859, -4.9200592041015625, -2.5463829040527344, -0.17270660400390625, 2.200969696044922, 4.57464599609375, 6.948322296142578, 9.321998596191406, 11.695674896240234, 14.069351196289062, 16.44302749633789, 18.81670379638672, 21.190380096435547, 23.564056396484375, 25.937732696533203, 28.31140899658203, 30.68508529663086, 33.05876159667969, 35.432437896728516, 37.806114196777344, 40.17979049682617, 42.553466796875, 44.92714309692383, 47.300819396972656, 49.674495697021484, 52.04817199707031, 54.42184829711914, 56.79552459716797, 59.1692008972168, 61.542877197265625, 63.91655349731445, 66.29022979736328, 68.66390991210938, 71.03758239746094]}, "gradients/decoder.transformer.h.9.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 5.0, 6.0, 3.0, 2.0, 1.0, 11.0, 13.0, 13.0, 13.0, 19.0, 17.0, 29.0, 18.0, 26.0, 28.0, 35.0, 32.0, 39.0, 40.0, 34.0, 43.0, 55.0, 51.0, 39.0, 38.0, 39.0, 39.0, 33.0, 35.0, 32.0, 21.0, 34.0, 33.0, 25.0, 18.0, 14.0, 17.0, 7.0, 11.0, 9.0, 11.0, 4.0, 6.0, 5.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-10.3046875, -9.9801025390625, -9.655517578125, -9.3309326171875, -9.00634765625, -8.6817626953125, -8.357177734375, -8.0325927734375, -7.7080078125, -7.3834228515625, -7.058837890625, -6.7342529296875, -6.40966796875, -6.0850830078125, -5.760498046875, -5.4359130859375, -5.111328125, -4.7867431640625, -4.462158203125, -4.1375732421875, -3.81298828125, -3.4884033203125, -3.163818359375, -2.8392333984375, -2.5146484375, -2.1900634765625, -1.865478515625, -1.5408935546875, -1.21630859375, -0.8917236328125, -0.567138671875, -0.2425537109375, 0.08203125, 0.4066162109375, 0.731201171875, 1.0557861328125, 1.38037109375, 1.7049560546875, 2.029541015625, 2.3541259765625, 2.6787109375, 3.0032958984375, 3.327880859375, 3.6524658203125, 3.97705078125, 4.3016357421875, 4.626220703125, 4.9508056640625, 5.275390625, 5.5999755859375, 5.924560546875, 6.2491455078125, 6.57373046875, 6.8983154296875, 7.222900390625, 7.5474853515625, 7.8720703125, 8.1966552734375, 8.521240234375, 8.8458251953125, 9.17041015625, 9.4949951171875, 9.819580078125, 10.1441650390625, 10.46875]}, "gradients/decoder.transformer.h.9.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 9.0, 12.0, 9.0, 11.0, 19.0, 19.0, 26.0, 28.0, 23.0, 47.0, 63.0, 99.0, 196.0, 367.0, 970.0, 4355.0, 32710.0, 662498.0, 3198662.0, 272339.0, 17579.0, 2633.0, 769.0, 305.0, 165.0, 93.0, 69.0, 43.0, 37.0, 22.0, 17.0, 18.0, 18.0, 8.0, 9.0, 6.0, 6.0, 8.0, 4.0, 4.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-32.59375, -31.5869140625, -30.580078125, -29.5732421875, -28.56640625, -27.5595703125, -26.552734375, -25.5458984375, -24.5390625, -23.5322265625, -22.525390625, -21.5185546875, -20.51171875, -19.5048828125, -18.498046875, -17.4912109375, -16.484375, -15.4775390625, -14.470703125, -13.4638671875, -12.45703125, -11.4501953125, -10.443359375, -9.4365234375, -8.4296875, -7.4228515625, -6.416015625, -5.4091796875, -4.40234375, -3.3955078125, -2.388671875, -1.3818359375, -0.375, 0.6318359375, 1.638671875, 2.6455078125, 3.65234375, 4.6591796875, 5.666015625, 6.6728515625, 7.6796875, 8.6865234375, 9.693359375, 10.7001953125, 11.70703125, 12.7138671875, 13.720703125, 14.7275390625, 15.734375, 16.7412109375, 17.748046875, 18.7548828125, 19.76171875, 20.7685546875, 21.775390625, 22.7822265625, 23.7890625, 24.7958984375, 25.802734375, 26.8095703125, 27.81640625, 28.8232421875, 29.830078125, 30.8369140625, 31.84375]}, "gradients/decoder.transformer.h.9.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 4.0, 1.0, 4.0, 5.0, 6.0, 7.0, 19.0, 19.0, 37.0, 44.0, 79.0, 120.0, 145.0, 238.0, 430.0, 569.0, 668.0, 594.0, 413.0, 239.0, 141.0, 97.0, 64.0, 48.0, 34.0, 20.0, 7.0, 11.0, 7.0, 6.0, 3.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.640625, -20.853271484375, -20.06591796875, -19.278564453125, -18.4912109375, -17.703857421875, -16.91650390625, -16.129150390625, -15.341796875, -14.554443359375, -13.76708984375, -12.979736328125, -12.1923828125, -11.405029296875, -10.61767578125, -9.830322265625, -9.04296875, -8.255615234375, -7.46826171875, -6.680908203125, -5.8935546875, -5.106201171875, -4.31884765625, -3.531494140625, -2.744140625, -1.956787109375, -1.16943359375, -0.382080078125, 0.4052734375, 1.192626953125, 1.97998046875, 2.767333984375, 3.5546875, 4.342041015625, 5.12939453125, 5.916748046875, 6.7041015625, 7.491455078125, 8.27880859375, 9.066162109375, 9.853515625, 10.640869140625, 11.42822265625, 12.215576171875, 13.0029296875, 13.790283203125, 14.57763671875, 15.364990234375, 16.15234375, 16.939697265625, 17.72705078125, 18.514404296875, 19.3017578125, 20.089111328125, 20.87646484375, 21.663818359375, 22.451171875, 23.238525390625, 24.02587890625, 24.813232421875, 25.6005859375, 26.387939453125, 27.17529296875, 27.962646484375, 28.75]}, "gradients/decoder.transformer.h.9.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 8.0, 9.0, 14.0, 26.0, 29.0, 43.0, 93.0, 121.0, 174.0, 307.0, 444.0, 1433.0, 795435.0, 3392565.0, 2108.0, 557.0, 269.0, 235.0, 154.0, 86.0, 58.0, 48.0, 30.0, 12.0, 7.0, 8.0, 1.0, 3.0, 3.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-163.75, -159.2109375, -154.671875, -150.1328125, -145.59375, -141.0546875, -136.515625, -131.9765625, -127.4375, -122.8984375, -118.359375, -113.8203125, -109.28125, -104.7421875, -100.203125, -95.6640625, -91.125, -86.5859375, -82.046875, -77.5078125, -72.96875, -68.4296875, -63.890625, -59.3515625, -54.8125, -50.2734375, -45.734375, -41.1953125, -36.65625, -32.1171875, -27.578125, -23.0390625, -18.5, -13.9609375, -9.421875, -4.8828125, -0.34375, 4.1953125, 8.734375, 13.2734375, 17.8125, 22.3515625, 26.890625, 31.4296875, 35.96875, 40.5078125, 45.046875, 49.5859375, 54.125, 58.6640625, 63.203125, 67.7421875, 72.28125, 76.8203125, 81.359375, 85.8984375, 90.4375, 94.9765625, 99.515625, 104.0546875, 108.59375, 113.1328125, 117.671875, 122.2109375, 126.75]}, "gradients/decoder.transformer.h.9.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 4.0, 12.0, 27.0, 44.0, 85.0, 133.0, 182.0, 175.0, 143.0, 99.0, 57.0, 29.0, 17.0, 7.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-95.95034790039062, -92.30764770507812, -88.66495513916016, -85.02226257324219, -81.37956237792969, -77.73686218261719, -74.09416961669922, -70.45147705078125, -66.80877685546875, -63.166080474853516, -59.52338409423828, -55.88068771362305, -52.23799133300781, -48.59529495239258, -44.952598571777344, -41.30990219116211, -37.667205810546875, -34.02450942993164, -30.381813049316406, -26.739116668701172, -23.096420288085938, -19.453723907470703, -15.811027526855469, -12.168331146240234, -8.525634765625, -4.882938385009766, -1.2402420043945312, 2.402454376220703, 6.0451507568359375, 9.687847137451172, 13.330543518066406, 16.97323989868164, 20.615936279296875, 24.25863265991211, 27.901329040527344, 31.544025421142578, 35.18672180175781, 38.82941818237305, 42.47211456298828, 46.114810943603516, 49.75750732421875, 53.400203704833984, 57.04290008544922, 60.68559646606445, 64.32829284667969, 67.97099304199219, 71.61368560791016, 75.25637817382812, 78.89907836914062, 82.54177856445312, 86.1844711303711, 89.82716369628906, 93.46986389160156, 97.11256408691406, 100.75525665283203, 104.39794921875, 108.0406494140625, 111.683349609375, 115.32604217529297, 118.96873474121094, 122.61143493652344, 126.25413513183594, 129.89682006835938, 133.53952026367188, 137.18222045898438]}, "gradients/decoder.transformer.h.9.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 5.0, 6.0, 14.0, 8.0, 19.0, 16.0, 10.0, 13.0, 23.0, 21.0, 23.0, 38.0, 27.0, 43.0, 46.0, 36.0, 40.0, 43.0, 33.0, 51.0, 29.0, 45.0, 39.0, 47.0, 32.0, 35.0, 37.0, 36.0, 27.0, 33.0, 30.0, 18.0, 14.0, 13.0, 9.0, 9.0, 7.0, 11.0, 8.0, 2.0, 3.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 1.0], "bins": [-61.39698791503906, -59.54039001464844, -57.68379211425781, -55.82719802856445, -53.97060012817383, -52.1140022277832, -50.257408142089844, -48.40081024169922, -46.544212341308594, -44.68761444091797, -42.831016540527344, -40.974422454833984, -39.11782455444336, -37.261226654052734, -35.404632568359375, -33.54803466796875, -31.691436767578125, -29.8348388671875, -27.978242874145508, -26.121646881103516, -24.26504898071289, -22.408451080322266, -20.551855087280273, -18.69525909423828, -16.838661193847656, -14.982064247131348, -13.125467300415039, -11.26887035369873, -9.412273406982422, -7.555676460266113, -5.699079513549805, -3.842482566833496, -1.9858856201171875, -0.1292886734008789, 1.7273082733154297, 3.5839052200317383, 5.440502166748047, 7.2970991134643555, 9.153696060180664, 11.010293006896973, 12.866889953613281, 14.72348690032959, 16.5800838470459, 18.43667984008789, 20.293277740478516, 22.14987564086914, 24.006471633911133, 25.863067626953125, 27.71966552734375, 29.576263427734375, 31.432859420776367, 33.28945541381836, 35.146053314208984, 37.00265121459961, 38.85924530029297, 40.715843200683594, 42.57244110107422, 44.429039001464844, 46.28563690185547, 48.14223098754883, 49.99882888793945, 51.85542678833008, 53.71202087402344, 55.56861877441406, 57.42521667480469]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 7.0, 8.0, 9.0, 10.0, 18.0, 18.0, 22.0, 36.0, 30.0, 30.0, 33.0, 35.0, 30.0, 48.0, 55.0, 44.0, 53.0, 48.0, 37.0, 41.0, 47.0, 44.0, 32.0, 28.0, 42.0, 23.0, 27.0, 28.0, 16.0, 18.0, 16.0, 13.0, 12.0, 10.0, 6.0, 9.0, 3.0, 4.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1953125, -9.8502197265625, -9.505126953125, -9.1600341796875, -8.81494140625, -8.4698486328125, -8.124755859375, -7.7796630859375, -7.4345703125, -7.0894775390625, -6.744384765625, -6.3992919921875, -6.05419921875, -5.7091064453125, -5.364013671875, -5.0189208984375, -4.673828125, -4.3287353515625, -3.983642578125, -3.6385498046875, -3.29345703125, -2.9483642578125, -2.603271484375, -2.2581787109375, -1.9130859375, -1.5679931640625, -1.222900390625, -0.8778076171875, -0.53271484375, -0.1876220703125, 0.157470703125, 0.5025634765625, 0.84765625, 1.1927490234375, 1.537841796875, 1.8829345703125, 2.22802734375, 2.5731201171875, 2.918212890625, 3.2633056640625, 3.6083984375, 3.9534912109375, 4.298583984375, 4.6436767578125, 4.98876953125, 5.3338623046875, 5.678955078125, 6.0240478515625, 6.369140625, 6.7142333984375, 7.059326171875, 7.4044189453125, 7.74951171875, 8.0946044921875, 8.439697265625, 8.7847900390625, 9.1298828125, 9.4749755859375, 9.820068359375, 10.1651611328125, 10.51025390625, 10.8553466796875, 11.200439453125, 11.5455322265625, 11.890625]}, "gradients/decoder.transformer.h.9.crossattention.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 3.0, 2.0, 1.0, 4.0, 5.0, 11.0, 4.0, 13.0, 22.0, 29.0, 62.0, 68.0, 101.0, 159.0, 253.0, 428.0, 567.0, 935.0, 1365.0, 2185.0, 3394.0, 5331.0, 8496.0, 14018.0, 22837.0, 37391.0, 62160.0, 102072.0, 162014.0, 203365.0, 161362.0, 101644.0, 61097.0, 37276.0, 22773.0, 13786.0, 8455.0, 5430.0, 3358.0, 2132.0, 1375.0, 873.0, 573.0, 388.0, 272.0, 165.0, 120.0, 72.0, 49.0, 21.0, 22.0, 5.0, 11.0, 6.0, 5.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.033203125, -1.00140380859375, -0.9696044921875, -0.93780517578125, -0.906005859375, -0.87420654296875, -0.8424072265625, -0.81060791015625, -0.77880859375, -0.74700927734375, -0.7152099609375, -0.68341064453125, -0.651611328125, -0.61981201171875, -0.5880126953125, -0.55621337890625, -0.5244140625, -0.49261474609375, -0.4608154296875, -0.42901611328125, -0.397216796875, -0.36541748046875, -0.3336181640625, -0.30181884765625, -0.27001953125, -0.23822021484375, -0.2064208984375, -0.17462158203125, -0.142822265625, -0.11102294921875, -0.0792236328125, -0.04742431640625, -0.015625, 0.01617431640625, 0.0479736328125, 0.07977294921875, 0.111572265625, 0.14337158203125, 0.1751708984375, 0.20697021484375, 0.23876953125, 0.27056884765625, 0.3023681640625, 0.33416748046875, 0.365966796875, 0.39776611328125, 0.4295654296875, 0.46136474609375, 0.4931640625, 0.52496337890625, 0.5567626953125, 0.58856201171875, 0.620361328125, 0.65216064453125, 0.6839599609375, 0.71575927734375, 0.74755859375, 0.77935791015625, 0.8111572265625, 0.84295654296875, 0.874755859375, 0.90655517578125, 0.9383544921875, 0.97015380859375, 1.001953125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.bias": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 1.0, 4.0, 2.0, 5.0, 4.0, 4.0, 11.0, 5.0, 12.0, 19.0, 12.0, 16.0, 19.0, 24.0, 22.0, 37.0, 25.0, 29.0, 30.0, 26.0, 47.0, 45.0, 53.0, 39.0, 1062.0, 42.0, 35.0, 42.0, 37.0, 42.0, 41.0, 35.0, 27.0, 24.0, 29.0, 22.0, 15.0, 13.0, 12.0, 14.0, 6.0, 15.0, 7.0, 10.0, 3.0, 3.0, 2.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-5.76171875, -5.55523681640625, -5.3487548828125, -5.14227294921875, -4.935791015625, -4.72930908203125, -4.5228271484375, -4.31634521484375, -4.10986328125, -3.90338134765625, -3.6968994140625, -3.49041748046875, -3.283935546875, -3.07745361328125, -2.8709716796875, -2.66448974609375, -2.4580078125, -2.25152587890625, -2.0450439453125, -1.83856201171875, -1.632080078125, -1.42559814453125, -1.2191162109375, -1.01263427734375, -0.80615234375, -0.59967041015625, -0.3931884765625, -0.18670654296875, 0.019775390625, 0.22625732421875, 0.4327392578125, 0.63922119140625, 0.845703125, 1.05218505859375, 1.2586669921875, 1.46514892578125, 1.671630859375, 1.87811279296875, 2.0845947265625, 2.29107666015625, 2.49755859375, 2.70404052734375, 2.9105224609375, 3.11700439453125, 3.323486328125, 3.52996826171875, 3.7364501953125, 3.94293212890625, 4.1494140625, 4.35589599609375, 4.5623779296875, 4.76885986328125, 4.975341796875, 5.18182373046875, 5.3883056640625, 5.59478759765625, 5.80126953125, 6.00775146484375, 6.2142333984375, 6.42071533203125, 6.627197265625, 6.83367919921875, 7.0401611328125, 7.24664306640625, 7.453125]}, "gradients/decoder.transformer.h.9.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 5.0, 6.0, 20.0, 14.0, 32.0, 31.0, 80.0, 95.0, 143.0, 225.0, 343.0, 512.0, 794.0, 1158.0, 1690.0, 2622.0, 4117.0, 6346.0, 9638.0, 15229.0, 23375.0, 35632.0, 55180.0, 83900.0, 121278.0, 340511.0, 1020260.0, 124786.0, 86563.0, 57284.0, 36765.0, 23924.0, 15565.0, 10084.0, 6352.0, 4274.0, 2846.0, 1819.0, 1228.0, 824.0, 558.0, 316.0, 240.0, 160.0, 105.0, 74.0, 39.0, 30.0, 24.0, 16.0, 9.0, 5.0, 5.0, 3.0, 4.0, 0.0, 1.0], "bins": [-0.6884765625, -0.6676406860351562, -0.6468048095703125, -0.6259689331054688, -0.605133056640625, -0.5842971801757812, -0.5634613037109375, -0.5426254272460938, -0.52178955078125, -0.5009536743164062, -0.4801177978515625, -0.45928192138671875, -0.438446044921875, -0.41761016845703125, -0.3967742919921875, -0.37593841552734375, -0.3551025390625, -0.33426666259765625, -0.3134307861328125, -0.29259490966796875, -0.271759033203125, -0.25092315673828125, -0.2300872802734375, -0.20925140380859375, -0.18841552734375, -0.16757965087890625, -0.1467437744140625, -0.12590789794921875, -0.105072021484375, -0.08423614501953125, -0.0634002685546875, -0.04256439208984375, -0.021728515625, -0.00089263916015625, 0.0199432373046875, 0.04077911376953125, 0.061614990234375, 0.08245086669921875, 0.1032867431640625, 0.12412261962890625, 0.14495849609375, 0.16579437255859375, 0.1866302490234375, 0.20746612548828125, 0.228302001953125, 0.24913787841796875, 0.2699737548828125, 0.29080963134765625, 0.3116455078125, 0.33248138427734375, 0.3533172607421875, 0.37415313720703125, 0.394989013671875, 0.41582489013671875, 0.4366607666015625, 0.45749664306640625, 0.47833251953125, 0.49916839599609375, 0.5200042724609375, 0.5408401489257812, 0.561676025390625, 0.5825119018554688, 0.6033477783203125, 0.6241836547851562, 0.64501953125]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 5.0, 2.0, 2.0, 2.0, 4.0, 5.0, 6.0, 4.0, 5.0, 6.0, 8.0, 11.0, 18.0, 9.0, 15.0, 26.0, 16.0, 22.0, 44.0, 64.0, 64.0, 68.0, 68.0, 81.0, 73.0, 64.0, 56.0, 51.0, 37.0, 40.0, 19.0, 18.0, 16.0, 16.0, 7.0, 10.0, 8.0, 6.0, 13.0, 8.0, 4.0, 1.0, 6.0, 1.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.006893157958984375, -0.0066803693771362305, -0.006467580795288086, -0.006254792213439941, -0.006042003631591797, -0.005829215049743652, -0.005616426467895508, -0.005403637886047363, -0.005190849304199219, -0.004978060722351074, -0.00476527214050293, -0.004552483558654785, -0.004339694976806641, -0.004126906394958496, -0.0039141178131103516, -0.003701329231262207, -0.0034885406494140625, -0.003275752067565918, -0.0030629634857177734, -0.002850174903869629, -0.0026373863220214844, -0.00242459774017334, -0.0022118091583251953, -0.0019990205764770508, -0.0017862319946289062, -0.0015734434127807617, -0.0013606548309326172, -0.0011478662490844727, -0.0009350776672363281, -0.0007222890853881836, -0.0005095005035400391, -0.00029671192169189453, -8.392333984375e-05, 0.00012886524200439453, 0.00034165382385253906, 0.0005544424057006836, 0.0007672309875488281, 0.0009800195693969727, 0.0011928081512451172, 0.0014055967330932617, 0.0016183853149414062, 0.0018311738967895508, 0.0020439624786376953, 0.00225675106048584, 0.0024695396423339844, 0.002682328224182129, 0.0028951168060302734, 0.003107905387878418, 0.0033206939697265625, 0.003533482551574707, 0.0037462711334228516, 0.003959059715270996, 0.004171848297119141, 0.004384636878967285, 0.00459742546081543, 0.004810214042663574, 0.005023002624511719, 0.005235791206359863, 0.005448579788208008, 0.005661368370056152, 0.005874156951904297, 0.006086945533752441, 0.006299734115600586, 0.0065125226974487305, 0.006725311279296875]}, "gradients/decoder.transformer.h.9.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 1.0, 2.0, 1.0, 7.0, 8.0, 9.0, 15.0, 14.0, 25.0, 20.0, 28.0, 46.0, 39.0, 62.0, 81.0, 160.0, 327.0, 951.0, 66375.0, 972372.0, 6838.0, 499.0, 229.0, 129.0, 86.0, 53.0, 35.0, 23.0, 20.0, 20.0, 21.0, 19.0, 10.0, 9.0, 5.0, 7.0, 4.0, 3.0, 4.0, 1.0, 0.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1715087890625, -0.16635704040527344, -0.16120529174804688, -0.1560535430908203, -0.15090179443359375, -0.1457500457763672, -0.14059829711914062, -0.13544654846191406, -0.1302947998046875, -0.12514305114746094, -0.11999130249023438, -0.11483955383300781, -0.10968780517578125, -0.10453605651855469, -0.09938430786132812, -0.09423255920410156, -0.089080810546875, -0.08392906188964844, -0.07877731323242188, -0.07362556457519531, -0.06847381591796875, -0.06332206726074219, -0.058170318603515625, -0.05301856994628906, -0.0478668212890625, -0.04271507263183594, -0.037563323974609375, -0.03241157531738281, -0.02725982666015625, -0.022108078002929688, -0.016956329345703125, -0.011804580688476562, -0.00665283203125, -0.0015010833740234375, 0.003650665283203125, 0.008802413940429688, 0.01395416259765625, 0.019105911254882812, 0.024257659912109375, 0.029409408569335938, 0.0345611572265625, 0.03971290588378906, 0.044864654541015625, 0.05001640319824219, 0.05516815185546875, 0.06031990051269531, 0.06547164916992188, 0.07062339782714844, 0.075775146484375, 0.08092689514160156, 0.08607864379882812, 0.09123039245605469, 0.09638214111328125, 0.10153388977050781, 0.10668563842773438, 0.11183738708496094, 0.1169891357421875, 0.12214088439941406, 0.12729263305664062, 0.1324443817138672, 0.13759613037109375, 0.1427478790283203, 0.14789962768554688, 0.15305137634277344, 0.158203125]}, "gradients/decoder.transformer.h.9.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 2.0, 25.0, 57.0, 177.0, 388.0, 240.0, 90.0, 24.0, 9.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.03152065351605415, -0.030872805044054985, -0.030224956572055817, -0.029577108100056648, -0.02892925962805748, -0.02828141115605831, -0.027633562684059143, -0.026985714212059975, -0.026337865740060806, -0.025690017268061638, -0.02504216879606247, -0.0243943203240633, -0.023746471852064133, -0.023098623380064964, -0.022450774908065796, -0.021802926436066628, -0.02115507796406746, -0.02050722949206829, -0.019859381020069122, -0.019211532548069954, -0.018563684076070786, -0.017915835604071617, -0.01726798713207245, -0.01662013866007328, -0.015972288325428963, -0.015324439853429794, -0.014676591381430626, -0.014028742909431458, -0.013380894437432289, -0.01273304596543312, -0.012085197493433952, -0.011437349021434784, -0.010789499618113041, -0.010141651146113873, -0.009493802674114704, -0.008845954202115536, -0.008198105730116367, -0.007550257258117199, -0.006902408320456743, -0.006254559848457575, -0.0056067113764584064, -0.004958862904459238, -0.00431101443246007, -0.0036631657276302576, -0.003015317255631089, -0.002367468783631921, -0.0017196200788021088, -0.0010717716068029404, -0.00042392313480377197, 0.00022392539540305734, 0.0008717739256098866, 0.0015196225140243769, 0.0021674709860235453, 0.0028153194580227137, 0.0034631681628525257, 0.004111016634851694, 0.0047588651068508625, 0.005406713578850031, 0.006054562050849199, 0.006702410988509655, 0.007350259460508823, 0.007998107932507992, 0.00864595640450716, 0.009293804876506329, 0.009941653348505497]}, "gradients/decoder.transformer.h.9.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 3.0, 6.0, 6.0, 8.0, 7.0, 6.0, 5.0, 8.0, 9.0, 11.0, 17.0, 23.0, 21.0, 24.0, 21.0, 29.0, 32.0, 36.0, 39.0, 48.0, 32.0, 45.0, 29.0, 50.0, 45.0, 42.0, 41.0, 32.0, 37.0, 27.0, 43.0, 35.0, 35.0, 21.0, 22.0, 19.0, 16.0, 17.0, 24.0, 13.0, 3.0, 1.0, 5.0, 7.0, 5.0, 3.0, 3.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.003565967082977295, -0.0034563280642032623, -0.0033466890454292297, -0.003237050026655197, -0.0031274110078811646, -0.003017771989107132, -0.0029081329703330994, -0.0027984939515590668, -0.002688854932785034, -0.0025792159140110016, -0.002469576895236969, -0.0023599378764629364, -0.002250298857688904, -0.002140659838914871, -0.0020310208201408386, -0.001921381801366806, -0.0018117427825927734, -0.0017021037638187408, -0.0015924647450447083, -0.0014828257262706757, -0.001373186707496643, -0.0012635476887226105, -0.0011539086699485779, -0.0010442696511745453, -0.0009346306324005127, -0.0008249916136264801, -0.0007153525948524475, -0.0006057135760784149, -0.0004960745573043823, -0.00038643553853034973, -0.00027679651975631714, -0.00016715750098228455, -5.751848220825195e-05, 5.212053656578064e-05, 0.00016175955533981323, 0.0002713985741138458, 0.0003810375928878784, 0.000490676611661911, 0.0006003156304359436, 0.0007099546492099762, 0.0008195936679840088, 0.0009292326867580414, 0.001038871705532074, 0.0011485107243061066, 0.0012581497430801392, 0.0013677887618541718, 0.0014774277806282043, 0.001587066799402237, 0.0016967058181762695, 0.0018063448369503021, 0.0019159838557243347, 0.0020256228744983673, 0.0021352618932724, 0.0022449009120464325, 0.002354539930820465, 0.0024641789495944977, 0.0025738179683685303, 0.002683456987142563, 0.0027930960059165955, 0.002902735024690628, 0.0030123740434646606, 0.0031220130622386932, 0.003231652081012726, 0.0033412910997867584, 0.003450930118560791]}, "gradients/decoder.transformer.h.9.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 3.0, 7.0, 8.0, 9.0, 10.0, 18.0, 18.0, 22.0, 36.0, 30.0, 30.0, 33.0, 35.0, 30.0, 48.0, 55.0, 44.0, 53.0, 48.0, 37.0, 41.0, 47.0, 44.0, 32.0, 28.0, 42.0, 23.0, 28.0, 27.0, 16.0, 18.0, 16.0, 13.0, 12.0, 10.0, 6.0, 9.0, 3.0, 4.0, 8.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.1953125, -9.8502197265625, -9.505126953125, -9.1600341796875, -8.81494140625, -8.4698486328125, -8.124755859375, -7.7796630859375, -7.4345703125, -7.0894775390625, -6.744384765625, -6.3992919921875, -6.05419921875, -5.7091064453125, -5.364013671875, -5.0189208984375, -4.673828125, -4.3287353515625, -3.983642578125, -3.6385498046875, -3.29345703125, -2.9483642578125, -2.603271484375, -2.2581787109375, -1.9130859375, -1.5679931640625, -1.222900390625, -0.8778076171875, -0.53271484375, -0.1876220703125, 0.157470703125, 0.5025634765625, 0.84765625, 1.1927490234375, 1.537841796875, 1.8829345703125, 2.22802734375, 2.5731201171875, 2.918212890625, 3.2633056640625, 3.6083984375, 3.9534912109375, 4.298583984375, 4.6436767578125, 4.98876953125, 5.3338623046875, 5.678955078125, 6.0240478515625, 6.369140625, 6.7142333984375, 7.059326171875, 7.4044189453125, 7.74951171875, 8.0946044921875, 8.439697265625, 8.7847900390625, 9.1298828125, 9.4749755859375, 9.820068359375, 10.1651611328125, 10.51025390625, 10.8553466796875, 11.200439453125, 11.5455322265625, 11.890625]}, "gradients/decoder.transformer.h.9.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 8.0, 7.0, 12.0, 17.0, 32.0, 36.0, 42.0, 69.0, 98.0, 118.0, 191.0, 263.0, 460.0, 929.0, 2792.0, 12846.0, 88210.0, 777322.0, 140417.0, 18357.0, 3696.0, 1159.0, 538.0, 289.0, 190.0, 105.0, 86.0, 58.0, 44.0, 39.0, 28.0, 21.0, 21.0, 10.0, 8.0, 10.0, 5.0, 3.0, 6.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.59375, -17.965576171875, -17.33740234375, -16.709228515625, -16.0810546875, -15.452880859375, -14.82470703125, -14.196533203125, -13.568359375, -12.940185546875, -12.31201171875, -11.683837890625, -11.0556640625, -10.427490234375, -9.79931640625, -9.171142578125, -8.54296875, -7.914794921875, -7.28662109375, -6.658447265625, -6.0302734375, -5.402099609375, -4.77392578125, -4.145751953125, -3.517578125, -2.889404296875, -2.26123046875, -1.633056640625, -1.0048828125, -0.376708984375, 0.25146484375, 0.879638671875, 1.5078125, 2.135986328125, 2.76416015625, 3.392333984375, 4.0205078125, 4.648681640625, 5.27685546875, 5.905029296875, 6.533203125, 7.161376953125, 7.78955078125, 8.417724609375, 9.0458984375, 9.674072265625, 10.30224609375, 10.930419921875, 11.55859375, 12.186767578125, 12.81494140625, 13.443115234375, 14.0712890625, 14.699462890625, 15.32763671875, 15.955810546875, 16.583984375, 17.212158203125, 17.84033203125, 18.468505859375, 19.0966796875, 19.724853515625, 20.35302734375, 20.981201171875, 21.609375]}, "gradients/decoder.transformer.h.9.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 5.0, 2.0, 1.0, 3.0, 1.0, 5.0, 0.0, 3.0, 6.0, 3.0, 5.0, 11.0, 9.0, 6.0, 25.0, 17.0, 27.0, 26.0, 38.0, 28.0, 38.0, 47.0, 49.0, 51.0, 93.0, 214.0, 1764.0, 138.0, 76.0, 53.0, 44.0, 40.0, 41.0, 36.0, 30.0, 26.0, 15.0, 18.0, 8.0, 12.0, 15.0, 8.0, 13.0, 6.0, 0.0, 0.0, 4.0, 2.0, 1.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.65625, -37.5322265625, -36.408203125, -35.2841796875, -34.16015625, -33.0361328125, -31.912109375, -30.7880859375, -29.6640625, -28.5400390625, -27.416015625, -26.2919921875, -25.16796875, -24.0439453125, -22.919921875, -21.7958984375, -20.671875, -19.5478515625, -18.423828125, -17.2998046875, -16.17578125, -15.0517578125, -13.927734375, -12.8037109375, -11.6796875, -10.5556640625, -9.431640625, -8.3076171875, -7.18359375, -6.0595703125, -4.935546875, -3.8115234375, -2.6875, -1.5634765625, -0.439453125, 0.6845703125, 1.80859375, 2.9326171875, 4.056640625, 5.1806640625, 6.3046875, 7.4287109375, 8.552734375, 9.6767578125, 10.80078125, 11.9248046875, 13.048828125, 14.1728515625, 15.296875, 16.4208984375, 17.544921875, 18.6689453125, 19.79296875, 20.9169921875, 22.041015625, 23.1650390625, 24.2890625, 25.4130859375, 26.537109375, 27.6611328125, 28.78515625, 29.9091796875, 31.033203125, 32.1572265625, 33.28125]}, "gradients/decoder.transformer.h.9.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 5.0, 1.0, 1.0, 3.0, 2.0, 0.0, 5.0, 11.0, 9.0, 13.0, 11.0, 14.0, 14.0, 21.0, 28.0, 41.0, 53.0, 53.0, 99.0, 129.0, 244.0, 545.0, 4878.0, 3124970.0, 12981.0, 704.0, 297.0, 170.0, 97.0, 67.0, 53.0, 55.0, 20.0, 29.0, 25.0, 18.0, 5.0, 12.0, 9.0, 4.0, 4.0, 5.0, 3.0, 1.0, 3.0, 2.0, 2.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-99.625, -96.2587890625, -92.892578125, -89.5263671875, -86.16015625, -82.7939453125, -79.427734375, -76.0615234375, -72.6953125, -69.3291015625, -65.962890625, -62.5966796875, -59.23046875, -55.8642578125, -52.498046875, -49.1318359375, -45.765625, -42.3994140625, -39.033203125, -35.6669921875, -32.30078125, -28.9345703125, -25.568359375, -22.2021484375, -18.8359375, -15.4697265625, -12.103515625, -8.7373046875, -5.37109375, -2.0048828125, 1.361328125, 4.7275390625, 8.09375, 11.4599609375, 14.826171875, 18.1923828125, 21.55859375, 24.9248046875, 28.291015625, 31.6572265625, 35.0234375, 38.3896484375, 41.755859375, 45.1220703125, 48.48828125, 51.8544921875, 55.220703125, 58.5869140625, 61.953125, 65.3193359375, 68.685546875, 72.0517578125, 75.41796875, 78.7841796875, 82.150390625, 85.5166015625, 88.8828125, 92.2490234375, 95.615234375, 98.9814453125, 102.34765625, 105.7138671875, 109.080078125, 112.4462890625, 115.8125]}, "gradients/decoder.transformer.h.9.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 7.0, 6.0, 12.0, 26.0, 41.0, 56.0, 88.0, 109.0, 126.0, 126.0, 89.0, 115.0, 85.0, 52.0, 34.0, 20.0, 13.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.07749938964844, -33.27366256713867, -32.46982192993164, -31.665983200073242, -30.862144470214844, -30.058307647705078, -29.25446891784668, -28.45063018798828, -27.646791458129883, -26.842952728271484, -26.039113998413086, -25.235275268554688, -24.431438446044922, -23.62759780883789, -22.823760986328125, -22.019922256469727, -21.216083526611328, -20.41224479675293, -19.60840606689453, -18.804567337036133, -18.000728607177734, -17.19689178466797, -16.39305305480957, -15.589214324951172, -14.785375595092773, -13.981536865234375, -13.177698135375977, -12.373860359191895, -11.570021629333496, -10.766182899475098, -9.962345123291016, -9.158506393432617, -8.354665756225586, -7.5508270263671875, -6.746988773345947, -5.943150520324707, -5.139311790466309, -4.33547306060791, -3.53163480758667, -2.7277965545654297, -1.9239578247070312, -1.120119333267212, -0.3162808418273926, 0.48755764961242676, 1.291396141052246, 2.0952348709106445, 2.8990731239318848, 3.702911376953125, 4.506750106811523, 5.310588836669922, 6.114427089691162, 6.918265342712402, 7.722104072570801, 8.5259428024292, 9.329780578613281, 10.13361930847168, 10.937458038330078, 11.741296768188477, 12.545135498046875, 13.348973274230957, 14.152812004089355, 14.956650733947754, 15.760488510131836, 16.564327239990234, 17.368165969848633]}, "gradients/decoder.transformer.h.9.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 3.0, 5.0, 9.0, 9.0, 12.0, 6.0, 13.0, 11.0, 12.0, 18.0, 15.0, 12.0, 20.0, 25.0, 29.0, 29.0, 26.0, 30.0, 30.0, 34.0, 38.0, 42.0, 37.0, 33.0, 36.0, 41.0, 47.0, 39.0, 29.0, 26.0, 35.0, 23.0, 31.0, 18.0, 16.0, 24.0, 18.0, 23.0, 15.0, 18.0, 15.0, 11.0, 10.0, 11.0, 8.0, 5.0, 8.0, 1.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0], "bins": [-82.13314819335938, -79.55266571044922, -76.97217559814453, -74.39169311523438, -71.81120300292969, -69.23072052001953, -66.65023803710938, -64.06974792480469, -61.48926544189453, -58.90877914428711, -56.32829284667969, -53.74781036376953, -51.16732406616211, -48.58683776855469, -46.00635528564453, -43.42586898803711, -40.84538269042969, -38.264896392822266, -35.684410095214844, -33.10392761230469, -30.523441314697266, -27.942955017089844, -25.362470626831055, -22.781986236572266, -20.201499938964844, -17.621013641357422, -15.040529251098633, -12.460043907165527, -9.879558563232422, -7.299073219299316, -4.718587875366211, -2.138103485107422, 0.44237518310546875, 3.022860527038574, 5.60334587097168, 8.183831214904785, 10.76431655883789, 13.344801902770996, 15.925287246704102, 18.50577163696289, 21.086257934570312, 23.666744232177734, 26.247228622436523, 28.827713012695312, 31.408199310302734, 33.988685607910156, 36.56916809082031, 39.149654388427734, 41.730140686035156, 44.31062698364258, 46.89111328125, 49.471595764160156, 52.05208206176758, 54.632568359375, 57.213050842285156, 59.79353713989258, 62.3740234375, 64.95450592041016, 67.53499603271484, 70.115478515625, 72.69596862792969, 75.27645111083984, 77.85693359375, 80.43742370605469, 83.01790618896484]}, "gradients/decoder.transformer.h.8.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 4.0, 5.0, 8.0, 10.0, 6.0, 14.0, 17.0, 21.0, 22.0, 32.0, 37.0, 28.0, 39.0, 32.0, 39.0, 49.0, 44.0, 43.0, 53.0, 46.0, 47.0, 47.0, 35.0, 37.0, 42.0, 29.0, 20.0, 37.0, 26.0, 16.0, 18.0, 22.0, 17.0, 13.0, 4.0, 11.0, 10.0, 10.0, 6.0, 3.0, 2.0, 6.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.7890625, -10.432373046875, -10.07568359375, -9.718994140625, -9.3623046875, -9.005615234375, -8.64892578125, -8.292236328125, -7.935546875, -7.578857421875, -7.22216796875, -6.865478515625, -6.5087890625, -6.152099609375, -5.79541015625, -5.438720703125, -5.08203125, -4.725341796875, -4.36865234375, -4.011962890625, -3.6552734375, -3.298583984375, -2.94189453125, -2.585205078125, -2.228515625, -1.871826171875, -1.51513671875, -1.158447265625, -0.8017578125, -0.445068359375, -0.08837890625, 0.268310546875, 0.625, 0.981689453125, 1.33837890625, 1.695068359375, 2.0517578125, 2.408447265625, 2.76513671875, 3.121826171875, 3.478515625, 3.835205078125, 4.19189453125, 4.548583984375, 4.9052734375, 5.261962890625, 5.61865234375, 5.975341796875, 6.33203125, 6.688720703125, 7.04541015625, 7.402099609375, 7.7587890625, 8.115478515625, 8.47216796875, 8.828857421875, 9.185546875, 9.542236328125, 9.89892578125, 10.255615234375, 10.6123046875, 10.968994140625, 11.32568359375, 11.682373046875, 12.0390625]}, "gradients/decoder.transformer.h.8.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 1.0, 4.0, 7.0, 10.0, 10.0, 16.0, 41.0, 34.0, 56.0, 83.0, 126.0, 180.0, 263.0, 454.0, 735.0, 1293.0, 2320.0, 4349.0, 9096.0, 20396.0, 50759.0, 144051.0, 420610.0, 971971.0, 1310910.0, 796083.0, 294379.0, 99122.0, 37028.0, 15059.0, 6960.0, 3395.0, 1745.0, 1007.0, 579.0, 371.0, 260.0, 160.0, 111.0, 78.0, 37.0, 49.0, 24.0, 20.0, 7.0, 14.0, 5.0, 5.0, 5.0, 4.0, 3.0, 1.0, 4.0, 2.0], "bins": [-11.4140625, -11.0816650390625, -10.749267578125, -10.4168701171875, -10.08447265625, -9.7520751953125, -9.419677734375, -9.0872802734375, -8.7548828125, -8.4224853515625, -8.090087890625, -7.7576904296875, -7.42529296875, -7.0928955078125, -6.760498046875, -6.4281005859375, -6.095703125, -5.7633056640625, -5.430908203125, -5.0985107421875, -4.76611328125, -4.4337158203125, -4.101318359375, -3.7689208984375, -3.4365234375, -3.1041259765625, -2.771728515625, -2.4393310546875, -2.10693359375, -1.7745361328125, -1.442138671875, -1.1097412109375, -0.77734375, -0.4449462890625, -0.112548828125, 0.2198486328125, 0.55224609375, 0.8846435546875, 1.217041015625, 1.5494384765625, 1.8818359375, 2.2142333984375, 2.546630859375, 2.8790283203125, 3.21142578125, 3.5438232421875, 3.876220703125, 4.2086181640625, 4.541015625, 4.8734130859375, 5.205810546875, 5.5382080078125, 5.87060546875, 6.2030029296875, 6.535400390625, 6.8677978515625, 7.2001953125, 7.5325927734375, 7.864990234375, 8.1973876953125, 8.52978515625, 8.8621826171875, 9.194580078125, 9.5269775390625, 9.859375]}, "gradients/decoder.transformer.h.8.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 3.0, 4.0, 1.0, 3.0, 6.0, 17.0, 11.0, 23.0, 40.0, 54.0, 69.0, 107.0, 123.0, 191.0, 244.0, 358.0, 440.0, 520.0, 448.0, 386.0, 275.0, 202.0, 150.0, 135.0, 84.0, 54.0, 44.0, 29.0, 24.0, 16.0, 4.0, 5.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.5625, -24.88525390625, -24.2080078125, -23.53076171875, -22.853515625, -22.17626953125, -21.4990234375, -20.82177734375, -20.14453125, -19.46728515625, -18.7900390625, -18.11279296875, -17.435546875, -16.75830078125, -16.0810546875, -15.40380859375, -14.7265625, -14.04931640625, -13.3720703125, -12.69482421875, -12.017578125, -11.34033203125, -10.6630859375, -9.98583984375, -9.30859375, -8.63134765625, -7.9541015625, -7.27685546875, -6.599609375, -5.92236328125, -5.2451171875, -4.56787109375, -3.890625, -3.21337890625, -2.5361328125, -1.85888671875, -1.181640625, -0.50439453125, 0.1728515625, 0.85009765625, 1.52734375, 2.20458984375, 2.8818359375, 3.55908203125, 4.236328125, 4.91357421875, 5.5908203125, 6.26806640625, 6.9453125, 7.62255859375, 8.2998046875, 8.97705078125, 9.654296875, 10.33154296875, 11.0087890625, 11.68603515625, 12.36328125, 13.04052734375, 13.7177734375, 14.39501953125, 15.072265625, 15.74951171875, 16.4267578125, 17.10400390625, 17.78125]}, "gradients/decoder.transformer.h.8.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 3.0, 6.0, 8.0, 14.0, 21.0, 16.0, 38.0, 68.0, 80.0, 127.0, 138.0, 187.0, 248.0, 325.0, 706.0, 2594.0, 170583.0, 3981655.0, 34053.0, 1577.0, 556.0, 374.0, 221.0, 180.0, 147.0, 111.0, 77.0, 40.0, 36.0, 37.0, 14.0, 16.0, 12.0, 2.0, 8.0, 6.0, 2.0, 3.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-81.5, -78.8154296875, -76.130859375, -73.4462890625, -70.76171875, -68.0771484375, -65.392578125, -62.7080078125, -60.0234375, -57.3388671875, -54.654296875, -51.9697265625, -49.28515625, -46.6005859375, -43.916015625, -41.2314453125, -38.546875, -35.8623046875, -33.177734375, -30.4931640625, -27.80859375, -25.1240234375, -22.439453125, -19.7548828125, -17.0703125, -14.3857421875, -11.701171875, -9.0166015625, -6.33203125, -3.6474609375, -0.962890625, 1.7216796875, 4.40625, 7.0908203125, 9.775390625, 12.4599609375, 15.14453125, 17.8291015625, 20.513671875, 23.1982421875, 25.8828125, 28.5673828125, 31.251953125, 33.9365234375, 36.62109375, 39.3056640625, 41.990234375, 44.6748046875, 47.359375, 50.0439453125, 52.728515625, 55.4130859375, 58.09765625, 60.7822265625, 63.466796875, 66.1513671875, 68.8359375, 71.5205078125, 74.205078125, 76.8896484375, 79.57421875, 82.2587890625, 84.943359375, 87.6279296875, 90.3125]}, "gradients/decoder.transformer.h.8.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 29.0, 241.0, 529.0, 199.0, 19.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-596.387451171875, -585.2305908203125, -574.07373046875, -562.9168701171875, -551.7600708007812, -540.6032104492188, -529.4463500976562, -518.2894897460938, -507.13262939453125, -495.97576904296875, -484.8189392089844, -473.6620788574219, -462.5052185058594, -451.348388671875, -440.1915283203125, -429.03466796875, -417.8778381347656, -406.7209777832031, -395.56414794921875, -384.40728759765625, -373.25042724609375, -362.09356689453125, -350.9367370605469, -339.7798767089844, -328.623046875, -317.4661865234375, -306.3093566894531, -295.1524963378906, -283.9956359863281, -272.83880615234375, -261.68194580078125, -250.52508544921875, -239.36819458007812, -228.2113494873047, -217.0544891357422, -205.89764404296875, -194.74078369140625, -183.5839385986328, -172.42709350585938, -161.27023315429688, -150.1134033203125, -138.95655822753906, -127.79969787597656, -116.64285278320312, -105.48600006103516, -94.32914733886719, -83.17230224609375, -72.01544952392578, -60.85858917236328, -49.70173645019531, -38.54488754272461, -27.388038635253906, -16.231185913085938, -5.074333190917969, 6.082511901855469, 17.239364624023438, 28.396217346191406, 39.553070068359375, 50.70991897583008, 61.86676788330078, 73.02362060546875, 84.18047332763672, 95.33731842041016, 106.49417114257812, 117.6510238647461]}, "gradients/decoder.transformer.h.8.ln_2.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 3.0, 1.0, 2.0, 6.0, 5.0, 5.0, 13.0, 13.0, 12.0, 18.0, 19.0, 18.0, 29.0, 12.0, 22.0, 28.0, 40.0, 33.0, 34.0, 32.0, 44.0, 37.0, 38.0, 38.0, 48.0, 49.0, 31.0, 38.0, 37.0, 34.0, 39.0, 30.0, 33.0, 36.0, 26.0, 17.0, 10.0, 19.0, 7.0, 17.0, 11.0, 7.0, 8.0, 7.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-70.13406372070312, -68.04097747802734, -65.94789123535156, -63.854801177978516, -61.761714935302734, -59.66862487792969, -57.575538635253906, -55.482452392578125, -53.389366149902344, -51.29627990722656, -49.203189849853516, -47.110103607177734, -45.01701736450195, -42.923927307128906, -40.830841064453125, -38.737754821777344, -36.6446647644043, -34.551578521728516, -32.45848846435547, -30.365402221679688, -28.272315979003906, -26.179227828979492, -24.086139678955078, -21.993053436279297, -19.899965286254883, -17.80687713623047, -15.713790893554688, -13.620702743530273, -11.527615547180176, -9.434528350830078, -7.341440200805664, -5.248353004455566, -3.1552658081054688, -1.062178373336792, 1.0309090614318848, 3.1239967346191406, 5.217083930969238, 7.310171127319336, 9.40325927734375, 11.496346473693848, 13.589433670043945, 15.682520866394043, 17.77560806274414, 19.868696212768555, 21.96178436279297, 24.05487060546875, 26.147958755493164, 28.241046905517578, 30.33413314819336, 32.42721939086914, 34.52030944824219, 36.61339569091797, 38.70648193359375, 40.79956817626953, 42.89265823364258, 44.98574447631836, 47.078834533691406, 49.17192077636719, 51.265010833740234, 53.358097076416016, 55.4511833190918, 57.544273376464844, 59.637359619140625, 61.730445861816406, 63.82353210449219]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 7.0, 12.0, 16.0, 22.0, 15.0, 26.0, 22.0, 36.0, 24.0, 32.0, 39.0, 33.0, 47.0, 44.0, 51.0, 42.0, 45.0, 51.0, 41.0, 56.0, 34.0, 42.0, 38.0, 33.0, 31.0, 20.0, 21.0, 14.0, 17.0, 7.0, 24.0, 12.0, 11.0, 6.0, 9.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3828125, -10.028564453125, -9.67431640625, -9.320068359375, -8.9658203125, -8.611572265625, -8.25732421875, -7.903076171875, -7.548828125, -7.194580078125, -6.84033203125, -6.486083984375, -6.1318359375, -5.777587890625, -5.42333984375, -5.069091796875, -4.71484375, -4.360595703125, -4.00634765625, -3.652099609375, -3.2978515625, -2.943603515625, -2.58935546875, -2.235107421875, -1.880859375, -1.526611328125, -1.17236328125, -0.818115234375, -0.4638671875, -0.109619140625, 0.24462890625, 0.598876953125, 0.953125, 1.307373046875, 1.66162109375, 2.015869140625, 2.3701171875, 2.724365234375, 3.07861328125, 3.432861328125, 3.787109375, 4.141357421875, 4.49560546875, 4.849853515625, 5.2041015625, 5.558349609375, 5.91259765625, 6.266845703125, 6.62109375, 6.975341796875, 7.32958984375, 7.683837890625, 8.0380859375, 8.392333984375, 8.74658203125, 9.100830078125, 9.455078125, 9.809326171875, 10.16357421875, 10.517822265625, 10.8720703125, 11.226318359375, 11.58056640625, 11.934814453125, 12.2890625]}, "gradients/decoder.transformer.h.8.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 4.0, 4.0, 6.0, 10.0, 11.0, 28.0, 35.0, 41.0, 60.0, 113.0, 136.0, 232.0, 323.0, 483.0, 736.0, 1160.0, 1719.0, 2601.0, 3908.0, 6001.0, 8915.0, 14006.0, 21739.0, 34029.0, 53211.0, 83041.0, 127094.0, 172639.0, 169631.0, 122752.0, 80216.0, 51193.0, 32910.0, 20671.0, 13412.0, 8743.0, 5702.0, 3714.0, 2388.0, 1605.0, 1101.0, 718.0, 535.0, 327.0, 201.0, 176.0, 93.0, 70.0, 40.0, 28.0, 20.0, 11.0, 8.0, 4.0, 6.0, 3.0, 4.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.853515625, -0.8259429931640625, -0.798370361328125, -0.7707977294921875, -0.74322509765625, -0.7156524658203125, -0.688079833984375, -0.6605072021484375, -0.6329345703125, -0.6053619384765625, -0.577789306640625, -0.5502166748046875, -0.52264404296875, -0.4950714111328125, -0.467498779296875, -0.4399261474609375, -0.412353515625, -0.3847808837890625, -0.357208251953125, -0.3296356201171875, -0.30206298828125, -0.2744903564453125, -0.246917724609375, -0.2193450927734375, -0.1917724609375, -0.1641998291015625, -0.136627197265625, -0.1090545654296875, -0.08148193359375, -0.0539093017578125, -0.026336669921875, 0.0012359619140625, 0.02880859375, 0.0563812255859375, 0.083953857421875, 0.1115264892578125, 0.13909912109375, 0.1666717529296875, 0.194244384765625, 0.2218170166015625, 0.2493896484375, 0.2769622802734375, 0.304534912109375, 0.3321075439453125, 0.35968017578125, 0.3872528076171875, 0.414825439453125, 0.4423980712890625, 0.469970703125, 0.4975433349609375, 0.525115966796875, 0.5526885986328125, 0.58026123046875, 0.6078338623046875, 0.635406494140625, 0.6629791259765625, 0.6905517578125, 0.7181243896484375, 0.745697021484375, 0.7732696533203125, 0.80084228515625, 0.8284149169921875, 0.855987548828125, 0.8835601806640625, 0.9111328125]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 7.0, 9.0, 4.0, 4.0, 13.0, 15.0, 17.0, 14.0, 19.0, 14.0, 24.0, 26.0, 35.0, 21.0, 26.0, 44.0, 34.0, 36.0, 43.0, 31.0, 37.0, 42.0, 1063.0, 39.0, 45.0, 29.0, 34.0, 29.0, 26.0, 34.0, 25.0, 28.0, 30.0, 32.0, 15.0, 23.0, 11.0, 13.0, 12.0, 3.0, 8.0, 3.0, 4.0, 4.0, 5.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.19140625, -5.98565673828125, -5.7799072265625, -5.57415771484375, -5.368408203125, -5.16265869140625, -4.9569091796875, -4.75115966796875, -4.54541015625, -4.33966064453125, -4.1339111328125, -3.92816162109375, -3.722412109375, -3.51666259765625, -3.3109130859375, -3.10516357421875, -2.8994140625, -2.69366455078125, -2.4879150390625, -2.28216552734375, -2.076416015625, -1.87066650390625, -1.6649169921875, -1.45916748046875, -1.25341796875, -1.04766845703125, -0.8419189453125, -0.63616943359375, -0.430419921875, -0.22467041015625, -0.0189208984375, 0.18682861328125, 0.392578125, 0.59832763671875, 0.8040771484375, 1.00982666015625, 1.215576171875, 1.42132568359375, 1.6270751953125, 1.83282470703125, 2.03857421875, 2.24432373046875, 2.4500732421875, 2.65582275390625, 2.861572265625, 3.06732177734375, 3.2730712890625, 3.47882080078125, 3.6845703125, 3.89031982421875, 4.0960693359375, 4.30181884765625, 4.507568359375, 4.71331787109375, 4.9190673828125, 5.12481689453125, 5.33056640625, 5.53631591796875, 5.7420654296875, 5.94781494140625, 6.153564453125, 6.35931396484375, 6.5650634765625, 6.77081298828125, 6.9765625]}, "gradients/decoder.transformer.h.8.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 3.0, 6.0, 5.0, 6.0, 18.0, 26.0, 36.0, 41.0, 57.0, 102.0, 130.0, 208.0, 315.0, 435.0, 605.0, 911.0, 1413.0, 2055.0, 3040.0, 4672.0, 6751.0, 10236.0, 15731.0, 23237.0, 34790.0, 51641.0, 75302.0, 105388.0, 136438.0, 1194006.0, 127662.0, 95447.0, 66967.0, 45876.0, 31172.0, 20810.0, 13822.0, 9325.0, 6070.0, 4073.0, 2637.0, 1893.0, 1231.0, 856.0, 550.0, 401.0, 255.0, 157.0, 100.0, 83.0, 59.0, 27.0, 23.0, 21.0, 8.0, 5.0, 6.0, 2.0, 3.0, 1.0, 3.0], "bins": [-0.6279296875, -0.6085205078125, -0.589111328125, -0.5697021484375, -0.55029296875, -0.5308837890625, -0.511474609375, -0.4920654296875, -0.47265625, -0.4532470703125, -0.433837890625, -0.4144287109375, -0.39501953125, -0.3756103515625, -0.356201171875, -0.3367919921875, -0.3173828125, -0.2979736328125, -0.278564453125, -0.2591552734375, -0.23974609375, -0.2203369140625, -0.200927734375, -0.1815185546875, -0.162109375, -0.1427001953125, -0.123291015625, -0.1038818359375, -0.08447265625, -0.0650634765625, -0.045654296875, -0.0262451171875, -0.0068359375, 0.0125732421875, 0.031982421875, 0.0513916015625, 0.07080078125, 0.0902099609375, 0.109619140625, 0.1290283203125, 0.1484375, 0.1678466796875, 0.187255859375, 0.2066650390625, 0.22607421875, 0.2454833984375, 0.264892578125, 0.2843017578125, 0.3037109375, 0.3231201171875, 0.342529296875, 0.3619384765625, 0.38134765625, 0.4007568359375, 0.420166015625, 0.4395751953125, 0.458984375, 0.4783935546875, 0.497802734375, 0.5172119140625, 0.53662109375, 0.5560302734375, 0.575439453125, 0.5948486328125, 0.6142578125]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 3.0, 1.0, 1.0, 4.0, 6.0, 11.0, 6.0, 12.0, 14.0, 7.0, 15.0, 15.0, 25.0, 31.0, 29.0, 45.0, 47.0, 41.0, 63.0, 57.0, 52.0, 59.0, 50.0, 63.0, 55.0, 46.0, 38.0, 38.0, 44.0, 31.0, 18.0, 18.0, 12.0, 12.0, 7.0, 8.0, 5.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.005855560302734375, -0.005664348602294922, -0.005473136901855469, -0.005281925201416016, -0.0050907135009765625, -0.004899501800537109, -0.004708290100097656, -0.004517078399658203, -0.00432586669921875, -0.004134654998779297, -0.003943443298339844, -0.0037522315979003906, -0.0035610198974609375, -0.0033698081970214844, -0.0031785964965820312, -0.002987384796142578, -0.002796173095703125, -0.002604961395263672, -0.0024137496948242188, -0.0022225379943847656, -0.0020313262939453125, -0.0018401145935058594, -0.0016489028930664062, -0.0014576911926269531, -0.0012664794921875, -0.0010752677917480469, -0.0008840560913085938, -0.0006928443908691406, -0.0005016326904296875, -0.0003104209899902344, -0.00011920928955078125, 7.200241088867188e-05, 0.000263214111328125, 0.0004544258117675781, 0.0006456375122070312, 0.0008368492126464844, 0.0010280609130859375, 0.0012192726135253906, 0.0014104843139648438, 0.0016016960144042969, 0.00179290771484375, 0.001984119415283203, 0.0021753311157226562, 0.0023665428161621094, 0.0025577545166015625, 0.0027489662170410156, 0.0029401779174804688, 0.003131389617919922, 0.003322601318359375, 0.003513813018798828, 0.0037050247192382812, 0.0038962364196777344, 0.0040874481201171875, 0.004278659820556641, 0.004469871520996094, 0.004661083221435547, 0.004852294921875, 0.005043506622314453, 0.005234718322753906, 0.005425930023193359, 0.0056171417236328125, 0.005808353424072266, 0.005999565124511719, 0.006190776824951172, 0.006381988525390625]}, "gradients/decoder.transformer.h.8.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0, 4.0, 9.0, 3.0, 4.0, 10.0, 7.0, 14.0, 22.0, 17.0, 21.0, 36.0, 41.0, 75.0, 82.0, 101.0, 164.0, 285.0, 740.0, 19583.0, 1015007.0, 10688.0, 730.0, 280.0, 152.0, 83.0, 105.0, 67.0, 49.0, 38.0, 25.0, 28.0, 10.0, 17.0, 15.0, 8.0, 9.0, 10.0, 3.0, 6.0, 2.0, 1.0, 4.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.132080078125, -0.12788009643554688, -0.12368011474609375, -0.11948013305664062, -0.1152801513671875, -0.11108016967773438, -0.10688018798828125, -0.10268020629882812, -0.098480224609375, -0.09428024291992188, -0.09008026123046875, -0.08588027954101562, -0.0816802978515625, -0.07748031616210938, -0.07328033447265625, -0.06908035278320312, -0.06488037109375, -0.060680389404296875, -0.05648040771484375, -0.052280426025390625, -0.0480804443359375, -0.043880462646484375, -0.03968048095703125, -0.035480499267578125, -0.031280517578125, -0.027080535888671875, -0.02288055419921875, -0.018680572509765625, -0.0144805908203125, -0.010280609130859375, -0.00608062744140625, -0.001880645751953125, 0.0023193359375, 0.006519317626953125, 0.01071929931640625, 0.014919281005859375, 0.0191192626953125, 0.023319244384765625, 0.02751922607421875, 0.031719207763671875, 0.035919189453125, 0.040119171142578125, 0.04431915283203125, 0.048519134521484375, 0.0527191162109375, 0.056919097900390625, 0.06111907958984375, 0.06531906127929688, 0.06951904296875, 0.07371902465820312, 0.07791900634765625, 0.08211898803710938, 0.0863189697265625, 0.09051895141601562, 0.09471893310546875, 0.09891891479492188, 0.103118896484375, 0.10731887817382812, 0.11151885986328125, 0.11571884155273438, 0.1199188232421875, 0.12411880493164062, 0.12831878662109375, 0.13251876831054688, 0.13671875]}, "gradients/decoder.transformer.h.8.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 10.0, 417.0, 563.0, 24.0, 1.0, 1.0], "bins": [-0.07816892117261887, -0.0768674984574318, -0.07556608319282532, -0.07426466047763824, -0.07296324521303177, -0.0716618224978447, -0.07036040723323822, -0.06905898451805115, -0.06775756925344467, -0.0664561465382576, -0.06515473127365112, -0.06385330855846405, -0.06255189329385757, -0.0612504743039608, -0.059949055314064026, -0.05864763259887695, -0.05734621360898018, -0.056044794619083405, -0.05474337562918663, -0.053441956639289856, -0.05214053764939308, -0.05083911865949631, -0.04953769966959953, -0.04823628067970276, -0.046934857964515686, -0.04563343897461891, -0.04433201998472214, -0.04303060099482536, -0.04172918200492859, -0.040427763015031815, -0.03912634402513504, -0.03782492130994797, -0.03652350604534149, -0.03522208705544472, -0.03392066806554794, -0.03261924907565117, -0.031317830085754395, -0.03001641109585762, -0.028714990243315697, -0.027413571253418922, -0.026112154126167297, -0.024810735136270523, -0.02350931614637375, -0.022207897156476974, -0.0209064781665802, -0.019605059176683426, -0.018303638324141502, -0.017002219334244728, -0.015700798481702805, -0.01439937949180603, -0.013097960501909256, -0.011796540580689907, -0.010495121590793133, -0.009193702600896358, -0.00789228267967701, -0.006590863689780235, -0.005289445631206036, -0.003988026641309261, -0.0026866071857511997, -0.0013851879630237818, -8.376874029636383e-05, 0.0012176502496004105, 0.002519069705158472, 0.0038204891607165337, 0.005121908150613308]}, "gradients/decoder.transformer.h.8.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 2.0, 2.0, 4.0, 10.0, 7.0, 13.0, 9.0, 8.0, 10.0, 16.0, 17.0, 18.0, 30.0, 18.0, 26.0, 35.0, 41.0, 37.0, 45.0, 48.0, 49.0, 40.0, 54.0, 45.0, 52.0, 48.0, 40.0, 41.0, 38.0, 36.0, 30.0, 30.0, 28.0, 12.0, 7.0, 16.0, 16.0, 4.0, 10.0, 6.0, 5.0, 5.0, 0.0, 2.0, 2.0, 2.0, 2.0], "bins": [-0.004800736904144287, -0.004676404409110546, -0.004552071914076805, -0.004427739419043064, -0.004303406924009323, -0.004179074428975582, -0.004054741933941841, -0.0039304094389081, -0.003806076943874359, -0.003681744448840618, -0.003557411953806877, -0.003433079458773136, -0.003308746963739395, -0.003184414468705654, -0.003060081973671913, -0.002935749478638172, -0.002811416983604431, -0.00268708448857069, -0.002562751993536949, -0.002438419498503208, -0.002314087003469467, -0.002189754508435726, -0.002065422013401985, -0.0019410895183682442, -0.0018167570233345032, -0.0016924245283007622, -0.0015680920332670212, -0.0014437595382332802, -0.0013194270431995392, -0.0011950945481657982, -0.0010707620531320572, -0.0009464295580983162, -0.0008220970630645752, -0.0006977645680308342, -0.0005734320729970932, -0.0004490995779633522, -0.0003247670829296112, -0.0002004345878958702, -7.610209286212921e-05, 4.8230402171611786e-05, 0.00017256289720535278, 0.0002968953922390938, 0.0004212278872728348, 0.0005455603823065758, 0.0006698928773403168, 0.0007942253723740578, 0.0009185578674077988, 0.0010428903624415398, 0.0011672228574752808, 0.0012915553525090218, 0.0014158878475427628, 0.0015402203425765038, 0.0016645528376102448, 0.0017888853326439857, 0.0019132178276777267, 0.0020375503227114677, 0.0021618828177452087, 0.0022862153127789497, 0.0024105478078126907, 0.0025348803028464317, 0.0026592127978801727, 0.0027835452929139137, 0.0029078777879476547, 0.0030322102829813957, 0.0031565427780151367]}, "gradients/decoder.transformer.h.8.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 9.0, 7.0, 12.0, 16.0, 22.0, 15.0, 26.0, 22.0, 36.0, 24.0, 32.0, 39.0, 33.0, 47.0, 44.0, 51.0, 42.0, 46.0, 50.0, 41.0, 56.0, 34.0, 42.0, 38.0, 33.0, 31.0, 20.0, 21.0, 14.0, 17.0, 7.0, 24.0, 12.0, 11.0, 6.0, 9.0, 6.0, 1.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3828125, -10.028564453125, -9.67431640625, -9.320068359375, -8.9658203125, -8.611572265625, -8.25732421875, -7.903076171875, -7.548828125, -7.194580078125, -6.84033203125, -6.486083984375, -6.1318359375, -5.777587890625, -5.42333984375, -5.069091796875, -4.71484375, -4.360595703125, -4.00634765625, -3.652099609375, -3.2978515625, -2.943603515625, -2.58935546875, -2.235107421875, -1.880859375, -1.526611328125, -1.17236328125, -0.818115234375, -0.4638671875, -0.109619140625, 0.24462890625, 0.598876953125, 0.953125, 1.307373046875, 1.66162109375, 2.015869140625, 2.3701171875, 2.724365234375, 3.07861328125, 3.432861328125, 3.787109375, 4.141357421875, 4.49560546875, 4.849853515625, 5.2041015625, 5.558349609375, 5.91259765625, 6.266845703125, 6.62109375, 6.975341796875, 7.32958984375, 7.683837890625, 8.0380859375, 8.392333984375, 8.74658203125, 9.100830078125, 9.455078125, 9.809326171875, 10.16357421875, 10.517822265625, 10.8720703125, 11.226318359375, 11.58056640625, 11.934814453125, 12.2890625]}, "gradients/decoder.transformer.h.8.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 0.0, 1.0, 1.0, 6.0, 8.0, 15.0, 15.0, 14.0, 31.0, 40.0, 60.0, 106.0, 175.0, 367.0, 758.0, 1691.0, 4033.0, 9280.0, 21973.0, 55841.0, 167651.0, 454943.0, 217418.0, 68221.0, 26479.0, 10820.0, 4715.0, 2077.0, 875.0, 428.0, 190.0, 109.0, 66.0, 38.0, 34.0, 30.0, 13.0, 7.0, 11.0, 9.0, 8.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.3125, -9.964111328125, -9.61572265625, -9.267333984375, -8.9189453125, -8.570556640625, -8.22216796875, -7.873779296875, -7.525390625, -7.177001953125, -6.82861328125, -6.480224609375, -6.1318359375, -5.783447265625, -5.43505859375, -5.086669921875, -4.73828125, -4.389892578125, -4.04150390625, -3.693115234375, -3.3447265625, -2.996337890625, -2.64794921875, -2.299560546875, -1.951171875, -1.602783203125, -1.25439453125, -0.906005859375, -0.5576171875, -0.209228515625, 0.13916015625, 0.487548828125, 0.8359375, 1.184326171875, 1.53271484375, 1.881103515625, 2.2294921875, 2.577880859375, 2.92626953125, 3.274658203125, 3.623046875, 3.971435546875, 4.31982421875, 4.668212890625, 5.0166015625, 5.364990234375, 5.71337890625, 6.061767578125, 6.41015625, 6.758544921875, 7.10693359375, 7.455322265625, 7.8037109375, 8.152099609375, 8.50048828125, 8.848876953125, 9.197265625, 9.545654296875, 9.89404296875, 10.242431640625, 10.5908203125, 10.939208984375, 11.28759765625, 11.635986328125, 11.984375]}, "gradients/decoder.transformer.h.8.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 1.0, 7.0, 10.0, 10.0, 7.0, 10.0, 12.0, 23.0, 23.0, 22.0, 18.0, 21.0, 30.0, 45.0, 46.0, 49.0, 53.0, 67.0, 153.0, 1583.0, 318.0, 110.0, 60.0, 39.0, 34.0, 54.0, 31.0, 37.0, 24.0, 30.0, 20.0, 22.0, 9.0, 13.0, 14.0, 10.0, 13.0, 6.0, 3.0, 3.0, 4.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0], "bins": [-35.8125, -34.783203125, -33.75390625, -32.724609375, -31.6953125, -30.666015625, -29.63671875, -28.607421875, -27.578125, -26.548828125, -25.51953125, -24.490234375, -23.4609375, -22.431640625, -21.40234375, -20.373046875, -19.34375, -18.314453125, -17.28515625, -16.255859375, -15.2265625, -14.197265625, -13.16796875, -12.138671875, -11.109375, -10.080078125, -9.05078125, -8.021484375, -6.9921875, -5.962890625, -4.93359375, -3.904296875, -2.875, -1.845703125, -0.81640625, 0.212890625, 1.2421875, 2.271484375, 3.30078125, 4.330078125, 5.359375, 6.388671875, 7.41796875, 8.447265625, 9.4765625, 10.505859375, 11.53515625, 12.564453125, 13.59375, 14.623046875, 15.65234375, 16.681640625, 17.7109375, 18.740234375, 19.76953125, 20.798828125, 21.828125, 22.857421875, 23.88671875, 24.916015625, 25.9453125, 26.974609375, 28.00390625, 29.033203125, 30.0625]}, "gradients/decoder.transformer.h.8.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 3.0, 7.0, 3.0, 8.0, 13.0, 15.0, 12.0, 19.0, 20.0, 26.0, 31.0, 51.0, 82.0, 101.0, 108.0, 164.0, 218.0, 322.0, 656.0, 4472.0, 313013.0, 2809294.0, 14724.0, 1013.0, 385.0, 262.0, 162.0, 119.0, 81.0, 73.0, 55.0, 50.0, 35.0, 18.0, 18.0, 15.0, 13.0, 16.0, 6.0, 6.0, 6.0, 6.0, 3.0, 4.0, 4.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.65625, -52.90283203125, -51.1494140625, -49.39599609375, -47.642578125, -45.88916015625, -44.1357421875, -42.38232421875, -40.62890625, -38.87548828125, -37.1220703125, -35.36865234375, -33.615234375, -31.86181640625, -30.1083984375, -28.35498046875, -26.6015625, -24.84814453125, -23.0947265625, -21.34130859375, -19.587890625, -17.83447265625, -16.0810546875, -14.32763671875, -12.57421875, -10.82080078125, -9.0673828125, -7.31396484375, -5.560546875, -3.80712890625, -2.0537109375, -0.30029296875, 1.453125, 3.20654296875, 4.9599609375, 6.71337890625, 8.466796875, 10.22021484375, 11.9736328125, 13.72705078125, 15.48046875, 17.23388671875, 18.9873046875, 20.74072265625, 22.494140625, 24.24755859375, 26.0009765625, 27.75439453125, 29.5078125, 31.26123046875, 33.0146484375, 34.76806640625, 36.521484375, 38.27490234375, 40.0283203125, 41.78173828125, 43.53515625, 45.28857421875, 47.0419921875, 48.79541015625, 50.548828125, 52.30224609375, 54.0556640625, 55.80908203125, 57.5625]}, "gradients/decoder.transformer.h.8.ln_1.weight": {"_type": "histogram", "values": [11.0, 207.0, 612.0, 180.0, 9.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.5772066116333, -8.724058151245117, -2.8709096908569336, 2.9822378158569336, 8.835387229919434, 14.688536643981934, 20.541683197021484, 26.394832611083984, 32.247982025146484, 38.101131439208984, 43.95427703857422, 49.80742645263672, 55.66057586669922, 61.51372528076172, 67.36686706542969, 73.22001647949219, 79.07316589355469, 84.92631530761719, 90.77946472167969, 96.63261413574219, 102.48576354980469, 108.33891296386719, 114.19205474853516, 120.04520416259766, 125.89835357666016, 131.75149536132812, 137.60464477539062, 143.45779418945312, 149.31094360351562, 155.16409301757812, 161.01724243164062, 166.87039184570312, 172.72354125976562, 178.57669067382812, 184.42984008789062, 190.28298950195312, 196.13613891601562, 201.98928833007812, 207.84243774414062, 213.69558715820312, 219.54873657226562, 225.40188598632812, 231.25503540039062, 237.10818481445312, 242.96133422851562, 248.81448364257812, 254.66763305664062, 260.5207824707031, 266.3739013671875, 272.22705078125, 278.0802001953125, 283.933349609375, 289.7864990234375, 295.6396484375, 301.4927978515625, 307.345947265625, 313.1990966796875, 319.05224609375, 324.9053955078125, 330.758544921875, 336.6116943359375, 342.46484375, 348.3179931640625, 354.171142578125, 360.0242919921875]}, "gradients/decoder.transformer.h.8.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 0.0, 6.0, 4.0, 7.0, 10.0, 7.0, 12.0, 16.0, 15.0, 24.0, 14.0, 20.0, 24.0, 33.0, 33.0, 30.0, 36.0, 40.0, 34.0, 45.0, 37.0, 46.0, 45.0, 38.0, 56.0, 53.0, 23.0, 35.0, 29.0, 26.0, 23.0, 27.0, 26.0, 18.0, 26.0, 13.0, 12.0, 11.0, 9.0, 12.0, 12.0, 1.0, 8.0, 3.0, 5.0, 3.0, 4.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-80.3714599609375, -77.92533874511719, -75.4792251586914, -73.0331039428711, -70.58698272705078, -68.140869140625, -65.69474792480469, -63.248626708984375, -60.80250930786133, -58.35639190673828, -55.91027069091797, -53.46415328979492, -51.018035888671875, -48.57191467285156, -46.125797271728516, -43.67967987060547, -41.233558654785156, -38.78744125366211, -36.3413200378418, -33.89520263671875, -31.44908332824707, -29.00296401977539, -26.556846618652344, -24.110727310180664, -21.664608001708984, -19.218488693237305, -16.772369384765625, -14.326251983642578, -11.880132675170898, -9.434013366699219, -6.9878950119018555, -4.541776657104492, -2.0956497192382812, 0.35046911239624023, 2.7965879440307617, 5.242706775665283, 7.688825607299805, 10.134944915771484, 12.581063270568848, 15.027181625366211, 17.47330093383789, 19.91942024230957, 22.36553955078125, 24.811656951904297, 27.257776260375977, 29.703895568847656, 32.1500129699707, 34.59613037109375, 37.04225158691406, 39.48836898803711, 41.93449020385742, 44.38060760498047, 46.82672882080078, 49.27284622192383, 51.718963623046875, 54.16508483886719, 56.611202239990234, 59.05731964111328, 61.503440856933594, 63.94955825805664, 66.39567565917969, 68.841796875, 71.28791809082031, 73.7340316772461, 76.1801528930664]}, "gradients/decoder.transformer.h.7.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 2.0, 5.0, 5.0, 2.0, 5.0, 13.0, 15.0, 20.0, 19.0, 21.0, 31.0, 24.0, 33.0, 25.0, 34.0, 41.0, 36.0, 51.0, 38.0, 49.0, 51.0, 41.0, 50.0, 50.0, 45.0, 37.0, 39.0, 37.0, 29.0, 19.0, 24.0, 20.0, 14.0, 16.0, 17.0, 11.0, 11.0, 7.0, 8.0, 8.0, 4.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.515625, -10.1484375, -9.78125, -9.4140625, -9.046875, -8.6796875, -8.3125, -7.9453125, -7.578125, -7.2109375, -6.84375, -6.4765625, -6.109375, -5.7421875, -5.375, -5.0078125, -4.640625, -4.2734375, -3.90625, -3.5390625, -3.171875, -2.8046875, -2.4375, -2.0703125, -1.703125, -1.3359375, -0.96875, -0.6015625, -0.234375, 0.1328125, 0.5, 0.8671875, 1.234375, 1.6015625, 1.96875, 2.3359375, 2.703125, 3.0703125, 3.4375, 3.8046875, 4.171875, 4.5390625, 4.90625, 5.2734375, 5.640625, 6.0078125, 6.375, 6.7421875, 7.109375, 7.4765625, 7.84375, 8.2109375, 8.578125, 8.9453125, 9.3125, 9.6796875, 10.046875, 10.4140625, 10.78125, 11.1484375, 11.515625, 11.8828125, 12.25, 12.6171875, 12.984375]}, "gradients/decoder.transformer.h.7.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 3.0, 4.0, 4.0, 6.0, 5.0, 9.0, 15.0, 15.0, 19.0, 24.0, 22.0, 25.0, 37.0, 38.0, 55.0, 73.0, 89.0, 161.0, 406.0, 1489.0, 9157.0, 86087.0, 1482364.0, 2428205.0, 167567.0, 14926.0, 2284.0, 521.0, 230.0, 96.0, 52.0, 55.0, 50.0, 38.0, 37.0, 19.0, 18.0, 12.0, 13.0, 11.0, 16.0, 8.0, 7.0, 7.0, 4.0, 5.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-25.875, -24.986572265625, -24.09814453125, -23.209716796875, -22.3212890625, -21.432861328125, -20.54443359375, -19.656005859375, -18.767578125, -17.879150390625, -16.99072265625, -16.102294921875, -15.2138671875, -14.325439453125, -13.43701171875, -12.548583984375, -11.66015625, -10.771728515625, -9.88330078125, -8.994873046875, -8.1064453125, -7.218017578125, -6.32958984375, -5.441162109375, -4.552734375, -3.664306640625, -2.77587890625, -1.887451171875, -0.9990234375, -0.110595703125, 0.77783203125, 1.666259765625, 2.5546875, 3.443115234375, 4.33154296875, 5.219970703125, 6.1083984375, 6.996826171875, 7.88525390625, 8.773681640625, 9.662109375, 10.550537109375, 11.43896484375, 12.327392578125, 13.2158203125, 14.104248046875, 14.99267578125, 15.881103515625, 16.76953125, 17.657958984375, 18.54638671875, 19.434814453125, 20.3232421875, 21.211669921875, 22.10009765625, 22.988525390625, 23.876953125, 24.765380859375, 25.65380859375, 26.542236328125, 27.4306640625, 28.319091796875, 29.20751953125, 30.095947265625, 30.984375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 2.0, 0.0, 3.0, 8.0, 2.0, 9.0, 11.0, 15.0, 8.0, 27.0, 27.0, 50.0, 59.0, 71.0, 96.0, 148.0, 158.0, 234.0, 335.0, 443.0, 440.0, 431.0, 392.0, 280.0, 219.0, 146.0, 118.0, 103.0, 60.0, 38.0, 30.0, 29.0, 23.0, 15.0, 14.0, 7.0, 4.0, 10.0, 7.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 4.0], "bins": [-21.8125, -21.2506103515625, -20.688720703125, -20.1268310546875, -19.56494140625, -19.0030517578125, -18.441162109375, -17.8792724609375, -17.3173828125, -16.7554931640625, -16.193603515625, -15.6317138671875, -15.06982421875, -14.5079345703125, -13.946044921875, -13.3841552734375, -12.822265625, -12.2603759765625, -11.698486328125, -11.1365966796875, -10.57470703125, -10.0128173828125, -9.450927734375, -8.8890380859375, -8.3271484375, -7.7652587890625, -7.203369140625, -6.6414794921875, -6.07958984375, -5.5177001953125, -4.955810546875, -4.3939208984375, -3.83203125, -3.2701416015625, -2.708251953125, -2.1463623046875, -1.58447265625, -1.0225830078125, -0.460693359375, 0.1011962890625, 0.6630859375, 1.2249755859375, 1.786865234375, 2.3487548828125, 2.91064453125, 3.4725341796875, 4.034423828125, 4.5963134765625, 5.158203125, 5.7200927734375, 6.281982421875, 6.8438720703125, 7.40576171875, 7.9676513671875, 8.529541015625, 9.0914306640625, 9.6533203125, 10.2152099609375, 10.777099609375, 11.3389892578125, 11.90087890625, 12.4627685546875, 13.024658203125, 13.5865478515625, 14.1484375]}, "gradients/decoder.transformer.h.7.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 4.0, 1.0, 1.0, 5.0, 3.0, 4.0, 10.0, 11.0, 21.0, 22.0, 14.0, 33.0, 38.0, 62.0, 78.0, 114.0, 167.0, 203.0, 303.0, 626.0, 2854.0, 235784.0, 3931361.0, 20020.0, 1137.0, 414.0, 247.0, 191.0, 136.0, 121.0, 88.0, 60.0, 48.0, 23.0, 22.0, 17.0, 13.0, 9.0, 8.0, 7.0, 3.0, 2.0, 4.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-91.375, -88.4541015625, -85.533203125, -82.6123046875, -79.69140625, -76.7705078125, -73.849609375, -70.9287109375, -68.0078125, -65.0869140625, -62.166015625, -59.2451171875, -56.32421875, -53.4033203125, -50.482421875, -47.5615234375, -44.640625, -41.7197265625, -38.798828125, -35.8779296875, -32.95703125, -30.0361328125, -27.115234375, -24.1943359375, -21.2734375, -18.3525390625, -15.431640625, -12.5107421875, -9.58984375, -6.6689453125, -3.748046875, -0.8271484375, 2.09375, 5.0146484375, 7.935546875, 10.8564453125, 13.77734375, 16.6982421875, 19.619140625, 22.5400390625, 25.4609375, 28.3818359375, 31.302734375, 34.2236328125, 37.14453125, 40.0654296875, 42.986328125, 45.9072265625, 48.828125, 51.7490234375, 54.669921875, 57.5908203125, 60.51171875, 63.4326171875, 66.353515625, 69.2744140625, 72.1953125, 75.1162109375, 78.037109375, 80.9580078125, 83.87890625, 86.7998046875, 89.720703125, 92.6416015625, 95.5625]}, "gradients/decoder.transformer.h.7.ln_2.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 6.0, 23.0, 80.0, 142.0, 225.0, 215.0, 173.0, 97.0, 36.0, 12.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-192.38648986816406, -188.0321044921875, -183.67770385742188, -179.32330322265625, -174.9689178466797, -170.61453247070312, -166.2601318359375, -161.90573120117188, -157.5513458251953, -153.19696044921875, -148.84255981445312, -144.4881591796875, -140.13377380371094, -135.77938842773438, -131.42498779296875, -127.07059478759766, -122.71620178222656, -118.36180877685547, -114.00741577148438, -109.65302276611328, -105.29862976074219, -100.9442367553711, -96.58984375, -92.2354507446289, -87.88105773925781, -83.52666473388672, -79.17227172851562, -74.81787872314453, -70.46348571777344, -66.10909271240234, -61.75469970703125, -57.400306701660156, -53.045921325683594, -48.6915283203125, -44.337135314941406, -39.98274230957031, -35.62834930419922, -31.273956298828125, -26.91956329345703, -22.565170288085938, -18.210777282714844, -13.85638427734375, -9.501991271972656, -5.1475982666015625, -0.7932052612304688, 3.561187744140625, 7.915580749511719, 12.269973754882812, 16.624366760253906, 20.978759765625, 25.333152770996094, 29.687545776367188, 34.04193878173828, 38.396331787109375, 42.75072479248047, 47.10511779785156, 51.459510803222656, 55.81390380859375, 60.168296813964844, 64.52268981933594, 68.87708282470703, 73.23147583007812, 77.58586883544922, 81.94026184082031, 86.2946548461914]}, "gradients/decoder.transformer.h.7.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 3.0, 5.0, 4.0, 6.0, 9.0, 10.0, 13.0, 26.0, 16.0, 20.0, 25.0, 27.0, 25.0, 37.0, 51.0, 37.0, 30.0, 53.0, 43.0, 46.0, 54.0, 46.0, 44.0, 40.0, 47.0, 48.0, 26.0, 31.0, 34.0, 27.0, 22.0, 30.0, 11.0, 20.0, 11.0, 6.0, 7.0, 6.0, 3.0, 3.0, 2.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-65.0369873046875, -62.9004020690918, -60.763816833496094, -58.62723159790039, -56.49064636230469, -54.35406494140625, -52.21747970581055, -50.080894470214844, -47.94430923461914, -45.80772399902344, -43.671138763427734, -41.53455352783203, -39.397972106933594, -37.261383056640625, -35.12480163574219, -32.988216400146484, -30.85163116455078, -28.715045928955078, -26.578460693359375, -24.441877365112305, -22.3052921295166, -20.1687068939209, -18.032123565673828, -15.895538330078125, -13.758953094482422, -11.622367858886719, -9.485783576965332, -7.349198818206787, -5.212614059448242, -3.076028823852539, -0.9394445419311523, 1.1971397399902344, 3.3337249755859375, 5.470309734344482, 7.606894493103027, 9.743478775024414, 11.880064010620117, 14.01664924621582, 16.15323257446289, 18.289817810058594, 20.426403045654297, 22.56298828125, 24.699573516845703, 26.836156845092773, 28.972742080688477, 31.10932731628418, 33.24591064453125, 35.38249588012695, 37.519081115722656, 39.65566635131836, 41.79225158691406, 43.928836822509766, 46.06542205810547, 48.202003479003906, 50.33858871459961, 52.47517395019531, 54.611759185791016, 56.74834442138672, 58.88492965698242, 61.021514892578125, 63.15809631347656, 65.29468536376953, 67.43126678466797, 69.56785583496094, 71.70443725585938]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 3.0, 10.0, 10.0, 10.0, 15.0, 17.0, 21.0, 14.0, 28.0, 17.0, 20.0, 34.0, 34.0, 31.0, 40.0, 45.0, 44.0, 41.0, 44.0, 50.0, 54.0, 49.0, 37.0, 40.0, 37.0, 30.0, 29.0, 25.0, 19.0, 26.0, 20.0, 16.0, 19.0, 12.0, 11.0, 12.0, 16.0, 6.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.796875, -10.450927734375, -10.10498046875, -9.759033203125, -9.4130859375, -9.067138671875, -8.72119140625, -8.375244140625, -8.029296875, -7.683349609375, -7.33740234375, -6.991455078125, -6.6455078125, -6.299560546875, -5.95361328125, -5.607666015625, -5.26171875, -4.915771484375, -4.56982421875, -4.223876953125, -3.8779296875, -3.531982421875, -3.18603515625, -2.840087890625, -2.494140625, -2.148193359375, -1.80224609375, -1.456298828125, -1.1103515625, -0.764404296875, -0.41845703125, -0.072509765625, 0.2734375, 0.619384765625, 0.96533203125, 1.311279296875, 1.6572265625, 2.003173828125, 2.34912109375, 2.695068359375, 3.041015625, 3.386962890625, 3.73291015625, 4.078857421875, 4.4248046875, 4.770751953125, 5.11669921875, 5.462646484375, 5.80859375, 6.154541015625, 6.50048828125, 6.846435546875, 7.1923828125, 7.538330078125, 7.88427734375, 8.230224609375, 8.576171875, 8.922119140625, 9.26806640625, 9.614013671875, 9.9599609375, 10.305908203125, 10.65185546875, 10.997802734375, 11.34375]}, "gradients/decoder.transformer.h.7.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 7.0, 10.0, 8.0, 11.0, 22.0, 30.0, 47.0, 79.0, 112.0, 186.0, 283.0, 462.0, 794.0, 1344.0, 2089.0, 3665.0, 6129.0, 10575.0, 18362.0, 31950.0, 56574.0, 98994.0, 169599.0, 226509.0, 176898.0, 104859.0, 59091.0, 33882.0, 18948.0, 11087.0, 6489.0, 3813.0, 2197.0, 1357.0, 767.0, 455.0, 309.0, 223.0, 118.0, 94.0, 54.0, 28.0, 22.0, 12.0, 8.0, 3.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.11328125, -1.0779876708984375, -1.042694091796875, -1.0074005126953125, -0.97210693359375, -0.9368133544921875, -0.901519775390625, -0.8662261962890625, -0.8309326171875, -0.7956390380859375, -0.760345458984375, -0.7250518798828125, -0.68975830078125, -0.6544647216796875, -0.619171142578125, -0.5838775634765625, -0.548583984375, -0.5132904052734375, -0.477996826171875, -0.4427032470703125, -0.40740966796875, -0.3721160888671875, -0.336822509765625, -0.3015289306640625, -0.2662353515625, -0.2309417724609375, -0.195648193359375, -0.1603546142578125, -0.12506103515625, -0.0897674560546875, -0.054473876953125, -0.0191802978515625, 0.01611328125, 0.0514068603515625, 0.086700439453125, 0.1219940185546875, 0.15728759765625, 0.1925811767578125, 0.227874755859375, 0.2631683349609375, 0.2984619140625, 0.3337554931640625, 0.369049072265625, 0.4043426513671875, 0.43963623046875, 0.4749298095703125, 0.510223388671875, 0.5455169677734375, 0.580810546875, 0.6161041259765625, 0.651397705078125, 0.6866912841796875, 0.72198486328125, 0.7572784423828125, 0.792572021484375, 0.8278656005859375, 0.8631591796875, 0.8984527587890625, 0.933746337890625, 0.9690399169921875, 1.00433349609375, 1.0396270751953125, 1.074920654296875, 1.1102142333984375, 1.1455078125]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 4.0, 5.0, 3.0, 7.0, 9.0, 4.0, 7.0, 19.0, 10.0, 20.0, 21.0, 28.0, 22.0, 20.0, 33.0, 27.0, 37.0, 25.0, 41.0, 34.0, 31.0, 48.0, 1070.0, 43.0, 35.0, 50.0, 41.0, 38.0, 34.0, 30.0, 29.0, 27.0, 18.0, 23.0, 25.0, 22.0, 21.0, 14.0, 12.0, 12.0, 7.0, 6.0, 8.0, 4.0, 4.0, 1.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0], "bins": [-7.14453125, -6.938720703125, -6.73291015625, -6.527099609375, -6.3212890625, -6.115478515625, -5.90966796875, -5.703857421875, -5.498046875, -5.292236328125, -5.08642578125, -4.880615234375, -4.6748046875, -4.468994140625, -4.26318359375, -4.057373046875, -3.8515625, -3.645751953125, -3.43994140625, -3.234130859375, -3.0283203125, -2.822509765625, -2.61669921875, -2.410888671875, -2.205078125, -1.999267578125, -1.79345703125, -1.587646484375, -1.3818359375, -1.176025390625, -0.97021484375, -0.764404296875, -0.55859375, -0.352783203125, -0.14697265625, 0.058837890625, 0.2646484375, 0.470458984375, 0.67626953125, 0.882080078125, 1.087890625, 1.293701171875, 1.49951171875, 1.705322265625, 1.9111328125, 2.116943359375, 2.32275390625, 2.528564453125, 2.734375, 2.940185546875, 3.14599609375, 3.351806640625, 3.5576171875, 3.763427734375, 3.96923828125, 4.175048828125, 4.380859375, 4.586669921875, 4.79248046875, 4.998291015625, 5.2041015625, 5.409912109375, 5.61572265625, 5.821533203125, 6.02734375]}, "gradients/decoder.transformer.h.7.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 2.0, 1.0, 16.0, 6.0, 19.0, 13.0, 34.0, 57.0, 70.0, 128.0, 158.0, 233.0, 346.0, 501.0, 757.0, 1063.0, 1543.0, 2353.0, 3249.0, 5076.0, 7676.0, 10895.0, 16509.0, 24298.0, 36315.0, 53210.0, 77534.0, 107146.0, 138627.0, 1188907.0, 124182.0, 93256.0, 64958.0, 44599.0, 30450.0, 20434.0, 13821.0, 9322.0, 6309.0, 4279.0, 2820.0, 1943.0, 1264.0, 888.0, 590.0, 428.0, 287.0, 166.0, 137.0, 78.0, 60.0, 39.0, 31.0, 30.0, 14.0, 5.0, 6.0, 3.0, 1.0, 3.0, 3.0], "bins": [-0.60986328125, -0.5909652709960938, -0.5720672607421875, -0.5531692504882812, -0.534271240234375, -0.5153732299804688, -0.4964752197265625, -0.47757720947265625, -0.45867919921875, -0.43978118896484375, -0.4208831787109375, -0.40198516845703125, -0.383087158203125, -0.36418914794921875, -0.3452911376953125, -0.32639312744140625, -0.3074951171875, -0.28859710693359375, -0.2696990966796875, -0.25080108642578125, -0.231903076171875, -0.21300506591796875, -0.1941070556640625, -0.17520904541015625, -0.15631103515625, -0.13741302490234375, -0.1185150146484375, -0.09961700439453125, -0.080718994140625, -0.06182098388671875, -0.0429229736328125, -0.02402496337890625, -0.005126953125, 0.01377105712890625, 0.0326690673828125, 0.05156707763671875, 0.070465087890625, 0.08936309814453125, 0.1082611083984375, 0.12715911865234375, 0.14605712890625, 0.16495513916015625, 0.1838531494140625, 0.20275115966796875, 0.221649169921875, 0.24054718017578125, 0.2594451904296875, 0.27834320068359375, 0.2972412109375, 0.31613922119140625, 0.3350372314453125, 0.35393524169921875, 0.372833251953125, 0.39173126220703125, 0.4106292724609375, 0.42952728271484375, 0.44842529296875, 0.46732330322265625, 0.4862213134765625, 0.5051193237304688, 0.524017333984375, 0.5429153442382812, 0.5618133544921875, 0.5807113647460938, 0.599609375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 1.0, 2.0, 8.0, 12.0, 10.0, 10.0, 11.0, 22.0, 14.0, 22.0, 30.0, 50.0, 45.0, 55.0, 58.0, 72.0, 75.0, 62.0, 71.0, 66.0, 49.0, 44.0, 44.0, 32.0, 22.0, 20.0, 16.0, 18.0, 18.0, 12.0, 6.0, 5.0, 2.0, 9.0, 4.0, 4.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00661468505859375, -0.006408393383026123, -0.006202101707458496, -0.005995810031890869, -0.005789518356323242, -0.005583226680755615, -0.005376935005187988, -0.005170643329620361, -0.004964351654052734, -0.004758059978485107, -0.0045517683029174805, -0.0043454766273498535, -0.0041391849517822266, -0.0039328932762146, -0.0037266016006469727, -0.0035203099250793457, -0.0033140182495117188, -0.003107726573944092, -0.002901434898376465, -0.002695143222808838, -0.002488851547241211, -0.002282559871673584, -0.002076268196105957, -0.00186997652053833, -0.0016636848449707031, -0.0014573931694030762, -0.0012511014938354492, -0.0010448098182678223, -0.0008385181427001953, -0.0006322264671325684, -0.0004259347915649414, -0.00021964311599731445, -1.33514404296875e-05, 0.00019294023513793945, 0.0003992319107055664, 0.0006055235862731934, 0.0008118152618408203, 0.0010181069374084473, 0.0012243986129760742, 0.0014306902885437012, 0.0016369819641113281, 0.001843273639678955, 0.002049565315246582, 0.002255856990814209, 0.002462148666381836, 0.002668440341949463, 0.00287473201751709, 0.003081023693084717, 0.0032873153686523438, 0.0034936070442199707, 0.0036998987197875977, 0.0039061903953552246, 0.0041124820709228516, 0.0043187737464904785, 0.0045250654220581055, 0.004731357097625732, 0.004937648773193359, 0.005143940448760986, 0.005350232124328613, 0.00555652379989624, 0.005762815475463867, 0.005969107151031494, 0.006175398826599121, 0.006381690502166748, 0.006587982177734375]}, "gradients/decoder.transformer.h.7.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 4.0, 10.0, 5.0, 5.0, 4.0, 10.0, 9.0, 11.0, 17.0, 21.0, 22.0, 25.0, 38.0, 42.0, 55.0, 77.0, 113.0, 165.0, 325.0, 881.0, 53041.0, 987222.0, 5113.0, 527.0, 249.0, 147.0, 105.0, 58.0, 58.0, 36.0, 26.0, 28.0, 27.0, 17.0, 13.0, 9.0, 7.0, 3.0, 10.0, 8.0, 4.0, 1.0, 2.0, 3.0, 3.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1240234375, -0.11993026733398438, -0.11583709716796875, -0.11174392700195312, -0.1076507568359375, -0.10355758666992188, -0.09946441650390625, -0.09537124633789062, -0.091278076171875, -0.08718490600585938, -0.08309173583984375, -0.07899856567382812, -0.0749053955078125, -0.07081222534179688, -0.06671905517578125, -0.06262588500976562, -0.05853271484375, -0.054439544677734375, -0.05034637451171875, -0.046253204345703125, -0.0421600341796875, -0.038066864013671875, -0.03397369384765625, -0.029880523681640625, -0.025787353515625, -0.021694183349609375, -0.01760101318359375, -0.013507843017578125, -0.0094146728515625, -0.005321502685546875, -0.00122833251953125, 0.002864837646484375, 0.0069580078125, 0.011051177978515625, 0.01514434814453125, 0.019237518310546875, 0.0233306884765625, 0.027423858642578125, 0.03151702880859375, 0.035610198974609375, 0.039703369140625, 0.043796539306640625, 0.04788970947265625, 0.051982879638671875, 0.0560760498046875, 0.060169219970703125, 0.06426239013671875, 0.06835556030273438, 0.07244873046875, 0.07654190063476562, 0.08063507080078125, 0.08472824096679688, 0.0888214111328125, 0.09291458129882812, 0.09700775146484375, 0.10110092163085938, 0.105194091796875, 0.10928726196289062, 0.11338043212890625, 0.11747360229492188, 0.1215667724609375, 0.12565994262695312, 0.12975311279296875, 0.13384628295898438, 0.137939453125]}, "gradients/decoder.transformer.h.7.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 88.0, 680.0, 233.0, 9.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.035988617688417435, -0.03498046472668648, -0.03397230803966522, -0.032964155077934265, -0.03195600211620331, -0.030947847291827202, -0.029939692467451096, -0.02893153950572014, -0.027923384681344032, -0.026915229856967926, -0.02590707689523697, -0.024898922070860863, -0.023890767246484756, -0.0228826142847538, -0.021874459460377693, -0.020866304636001587, -0.01985815167427063, -0.018849996849894524, -0.017841843888163567, -0.01683368906378746, -0.015825536102056503, -0.014817381277680397, -0.01380922645330429, -0.012801072560250759, -0.011792918667197227, -0.010784764774143696, -0.009776610881090164, -0.008768456056714058, -0.007760302163660526, -0.006752148270606995, -0.005743993911892176, -0.004735839553177357, -0.003727683797478676, -0.0027195296715945005, -0.0017113755457103252, -0.0007032214198261499, 0.00030493270605802536, 0.001313086599111557, 0.002321240957826376, 0.003329395316541195, 0.0043375492095947266, 0.005345703102648258, 0.006353857461363077, 0.007362011820077896, 0.008370165713131428, 0.00937831960618496, 0.010386474430561066, 0.011394628323614597, 0.012402782216668129, 0.01341093610972166, 0.014419090002775192, 0.015427244827151299, 0.016435399651527405, 0.017443552613258362, 0.018451707437634468, 0.019459862262010574, 0.02046801522374153, 0.021476170048117638, 0.022484323009848595, 0.0234924778342247, 0.024500630795955658, 0.025508785620331764, 0.02651694044470787, 0.027525093406438828, 0.028533248230814934]}, "gradients/decoder.transformer.h.7.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 0.0, 4.0, 4.0, 2.0, 6.0, 7.0, 10.0, 6.0, 11.0, 12.0, 11.0, 23.0, 13.0, 25.0, 20.0, 26.0, 18.0, 27.0, 29.0, 26.0, 39.0, 37.0, 23.0, 38.0, 36.0, 47.0, 35.0, 29.0, 44.0, 27.0, 27.0, 22.0, 47.0, 32.0, 25.0, 22.0, 25.0, 15.0, 18.0, 22.0, 22.0, 28.0, 14.0, 10.0, 6.0, 6.0, 8.0, 8.0, 6.0, 4.0, 2.0, 2.0, 5.0, 1.0, 1.0, 1.0], "bins": [-0.0030020475387573242, -0.0029143188148736954, -0.0028265900909900665, -0.0027388613671064377, -0.002651132643222809, -0.00256340391933918, -0.002475675195455551, -0.0023879464715719223, -0.0023002177476882935, -0.0022124890238046646, -0.0021247602999210358, -0.002037031576037407, -0.001949302852153778, -0.0018615741282701492, -0.0017738454043865204, -0.0016861166805028915, -0.0015983879566192627, -0.0015106592327356339, -0.001422930508852005, -0.0013352017849683762, -0.0012474730610847473, -0.0011597443372011185, -0.0010720156133174896, -0.0009842868894338608, -0.0008965581655502319, -0.0008088294416666031, -0.0007211007177829742, -0.0006333719938993454, -0.0005456432700157166, -0.0004579145461320877, -0.00037018582224845886, -0.00028245709836483, -0.00019472837448120117, -0.00010699965059757233, -1.927092671394348e-05, 6.845779716968536e-05, 0.0001561865210533142, 0.00024391524493694305, 0.0003316439688205719, 0.00041937269270420074, 0.0005071014165878296, 0.0005948301404714584, 0.0006825588643550873, 0.0007702875882387161, 0.000858016312122345, 0.0009457450360059738, 0.0010334737598896027, 0.0011212024837732315, 0.0012089312076568604, 0.0012966599315404892, 0.001384388655424118, 0.0014721173793077469, 0.0015598461031913757, 0.0016475748270750046, 0.0017353035509586334, 0.0018230322748422623, 0.0019107609987258911, 0.00199848972260952, 0.002086218446493149, 0.0021739471703767776, 0.0022616758942604065, 0.0023494046181440353, 0.002437133342027664, 0.002524862065911293, 0.002612590789794922]}, "gradients/decoder.transformer.h.7.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 2.0, 5.0, 5.0, 3.0, 10.0, 10.0, 10.0, 15.0, 17.0, 21.0, 14.0, 28.0, 17.0, 21.0, 33.0, 34.0, 31.0, 40.0, 45.0, 44.0, 41.0, 44.0, 50.0, 54.0, 49.0, 37.0, 40.0, 37.0, 30.0, 29.0, 25.0, 19.0, 26.0, 20.0, 16.0, 19.0, 12.0, 11.0, 12.0, 16.0, 6.0, 7.0, 3.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-10.796875, -10.450927734375, -10.10498046875, -9.759033203125, -9.4130859375, -9.067138671875, -8.72119140625, -8.375244140625, -8.029296875, -7.683349609375, -7.33740234375, -6.991455078125, -6.6455078125, -6.299560546875, -5.95361328125, -5.607666015625, -5.26171875, -4.915771484375, -4.56982421875, -4.223876953125, -3.8779296875, -3.531982421875, -3.18603515625, -2.840087890625, -2.494140625, -2.148193359375, -1.80224609375, -1.456298828125, -1.1103515625, -0.764404296875, -0.41845703125, -0.072509765625, 0.2734375, 0.619384765625, 0.96533203125, 1.311279296875, 1.6572265625, 2.003173828125, 2.34912109375, 2.695068359375, 3.041015625, 3.386962890625, 3.73291015625, 4.078857421875, 4.4248046875, 4.770751953125, 5.11669921875, 5.462646484375, 5.80859375, 6.154541015625, 6.50048828125, 6.846435546875, 7.1923828125, 7.538330078125, 7.88427734375, 8.230224609375, 8.576171875, 8.922119140625, 9.26806640625, 9.614013671875, 9.9599609375, 10.305908203125, 10.65185546875, 10.997802734375, 11.34375]}, "gradients/decoder.transformer.h.7.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 3.0, 6.0, 5.0, 6.0, 7.0, 12.0, 14.0, 17.0, 25.0, 33.0, 39.0, 51.0, 53.0, 74.0, 120.0, 204.0, 268.0, 535.0, 1431.0, 5978.0, 31393.0, 274150.0, 655872.0, 63441.0, 10709.0, 2332.0, 683.0, 367.0, 205.0, 145.0, 90.0, 61.0, 55.0, 38.0, 28.0, 28.0, 18.0, 13.0, 18.0, 15.0, 7.0, 7.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-21.546875, -20.85595703125, -20.1650390625, -19.47412109375, -18.783203125, -18.09228515625, -17.4013671875, -16.71044921875, -16.01953125, -15.32861328125, -14.6376953125, -13.94677734375, -13.255859375, -12.56494140625, -11.8740234375, -11.18310546875, -10.4921875, -9.80126953125, -9.1103515625, -8.41943359375, -7.728515625, -7.03759765625, -6.3466796875, -5.65576171875, -4.96484375, -4.27392578125, -3.5830078125, -2.89208984375, -2.201171875, -1.51025390625, -0.8193359375, -0.12841796875, 0.5625, 1.25341796875, 1.9443359375, 2.63525390625, 3.326171875, 4.01708984375, 4.7080078125, 5.39892578125, 6.08984375, 6.78076171875, 7.4716796875, 8.16259765625, 8.853515625, 9.54443359375, 10.2353515625, 10.92626953125, 11.6171875, 12.30810546875, 12.9990234375, 13.68994140625, 14.380859375, 15.07177734375, 15.7626953125, 16.45361328125, 17.14453125, 17.83544921875, 18.5263671875, 19.21728515625, 19.908203125, 20.59912109375, 21.2900390625, 21.98095703125, 22.671875]}, "gradients/decoder.transformer.h.7.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 0.0, 3.0, 2.0, 6.0, 5.0, 5.0, 5.0, 7.0, 7.0, 10.0, 11.0, 12.0, 13.0, 16.0, 25.0, 29.0, 30.0, 39.0, 26.0, 43.0, 49.0, 65.0, 70.0, 137.0, 1608.0, 315.0, 100.0, 50.0, 52.0, 40.0, 36.0, 37.0, 31.0, 32.0, 19.0, 21.0, 15.0, 18.0, 20.0, 8.0, 5.0, 11.0, 11.0, 3.0, 2.0, 0.0, 0.0, 5.0, 3.0, 1.0, 0.0, 1.0, 3.0, 2.0], "bins": [-36.78125, -35.723388671875, -34.66552734375, -33.607666015625, -32.5498046875, -31.491943359375, -30.43408203125, -29.376220703125, -28.318359375, -27.260498046875, -26.20263671875, -25.144775390625, -24.0869140625, -23.029052734375, -21.97119140625, -20.913330078125, -19.85546875, -18.797607421875, -17.73974609375, -16.681884765625, -15.6240234375, -14.566162109375, -13.50830078125, -12.450439453125, -11.392578125, -10.334716796875, -9.27685546875, -8.218994140625, -7.1611328125, -6.103271484375, -5.04541015625, -3.987548828125, -2.9296875, -1.871826171875, -0.81396484375, 0.243896484375, 1.3017578125, 2.359619140625, 3.41748046875, 4.475341796875, 5.533203125, 6.591064453125, 7.64892578125, 8.706787109375, 9.7646484375, 10.822509765625, 11.88037109375, 12.938232421875, 13.99609375, 15.053955078125, 16.11181640625, 17.169677734375, 18.2275390625, 19.285400390625, 20.34326171875, 21.401123046875, 22.458984375, 23.516845703125, 24.57470703125, 25.632568359375, 26.6904296875, 27.748291015625, 28.80615234375, 29.864013671875, 30.921875]}, "gradients/decoder.transformer.h.7.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 2.0, 5.0, 4.0, 1.0, 0.0, 1.0, 3.0, 11.0, 9.0, 12.0, 5.0, 16.0, 23.0, 18.0, 25.0, 33.0, 49.0, 49.0, 83.0, 113.0, 162.0, 268.0, 653.0, 3575.0, 1280845.0, 1854245.0, 3944.0, 661.0, 304.0, 148.0, 93.0, 75.0, 70.0, 40.0, 28.0, 31.0, 19.0, 16.0, 12.0, 10.0, 12.0, 11.0, 4.0, 7.0, 7.0, 3.0, 5.0, 1.0, 2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-71.0, -68.552734375, -66.10546875, -63.658203125, -61.2109375, -58.763671875, -56.31640625, -53.869140625, -51.421875, -48.974609375, -46.52734375, -44.080078125, -41.6328125, -39.185546875, -36.73828125, -34.291015625, -31.84375, -29.396484375, -26.94921875, -24.501953125, -22.0546875, -19.607421875, -17.16015625, -14.712890625, -12.265625, -9.818359375, -7.37109375, -4.923828125, -2.4765625, -0.029296875, 2.41796875, 4.865234375, 7.3125, 9.759765625, 12.20703125, 14.654296875, 17.1015625, 19.548828125, 21.99609375, 24.443359375, 26.890625, 29.337890625, 31.78515625, 34.232421875, 36.6796875, 39.126953125, 41.57421875, 44.021484375, 46.46875, 48.916015625, 51.36328125, 53.810546875, 56.2578125, 58.705078125, 61.15234375, 63.599609375, 66.046875, 68.494140625, 70.94140625, 73.388671875, 75.8359375, 78.283203125, 80.73046875, 83.177734375, 85.625]}, "gradients/decoder.transformer.h.7.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 4.0, 45.0, 299.0, 465.0, 178.0, 23.0], "bins": [-242.27796936035156, -238.32241821289062, -234.36688232421875, -230.4113311767578, -226.45578002929688, -222.50022888183594, -218.54469299316406, -214.58914184570312, -210.6335906982422, -206.67803955078125, -202.72250366210938, -198.76695251464844, -194.8114013671875, -190.85585021972656, -186.9003143310547, -182.94476318359375, -178.98922729492188, -175.03367614746094, -171.07814025878906, -167.12258911132812, -163.1670379638672, -159.21148681640625, -155.25595092773438, -151.30039978027344, -147.3448486328125, -143.38929748535156, -139.4337615966797, -135.47821044921875, -131.5226593017578, -127.5671157836914, -123.611572265625, -119.65602111816406, -115.70047760009766, -111.74493408203125, -107.78938293457031, -103.8338394165039, -99.87828826904297, -95.92274475097656, -91.96719360351562, -88.01165008544922, -84.05610656738281, -80.1005630493164, -76.14501190185547, -72.18946838378906, -68.23391723632812, -64.27837371826172, -60.32282638549805, -56.367279052734375, -52.41172790527344, -48.456180572509766, -44.500633239746094, -40.54508972167969, -36.58953857421875, -32.633995056152344, -28.678447723388672, -24.722900390625, -20.767353057861328, -16.811805725097656, -12.8562593460083, -8.900712966918945, -4.945165634155273, -0.9896183013916016, 2.9659271240234375, 6.921474456787109, 10.877021789550781]}, "gradients/decoder.transformer.h.7.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 5.0, 3.0, 6.0, 5.0, 5.0, 10.0, 12.0, 12.0, 8.0, 15.0, 18.0, 23.0, 23.0, 21.0, 29.0, 28.0, 29.0, 32.0, 35.0, 32.0, 35.0, 38.0, 39.0, 46.0, 47.0, 37.0, 37.0, 42.0, 44.0, 30.0, 36.0, 29.0, 24.0, 28.0, 17.0, 22.0, 21.0, 17.0, 19.0, 11.0, 7.0, 2.0, 6.0, 7.0, 5.0, 8.0, 4.0, 3.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-75.22042083740234, -72.49496459960938, -69.76951599121094, -67.04405975341797, -64.318603515625, -61.5931510925293, -58.867698669433594, -56.142242431640625, -53.41679000854492, -50.69133758544922, -47.96588134765625, -45.24042892456055, -42.514976501464844, -39.789520263671875, -37.06406784057617, -34.33861541748047, -31.6131591796875, -28.887704849243164, -26.162250518798828, -23.436798095703125, -20.71134376525879, -17.985889434814453, -15.26043701171875, -12.534982681274414, -9.809528350830078, -7.0840744972229, -4.358620643615723, -1.6331672668457031, 1.0922870635986328, 3.8177413940429688, 6.543193817138672, 9.268648147583008, 11.994094848632812, 14.719549179077148, 17.445003509521484, 20.170455932617188, 22.895910263061523, 25.62136459350586, 28.346817016601562, 31.0722713470459, 33.797725677490234, 36.52317810058594, 39.248634338378906, 41.97408676147461, 44.69953918457031, 47.42499542236328, 50.150447845458984, 52.87590026855469, 55.601356506347656, 58.32680892944336, 61.05226516723633, 63.77771759033203, 66.503173828125, 69.22862243652344, 71.9540786743164, 74.67953491210938, 77.40498352050781, 80.13043975830078, 82.85588836669922, 85.58134460449219, 88.30680084228516, 91.03225708007812, 93.75770568847656, 96.48316192626953, 99.2086181640625]}, "gradients/decoder.transformer.h.6.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 2.0, 7.0, 3.0, 4.0, 11.0, 6.0, 7.0, 11.0, 16.0, 22.0, 10.0, 21.0, 21.0, 19.0, 31.0, 31.0, 23.0, 27.0, 37.0, 32.0, 53.0, 39.0, 50.0, 39.0, 50.0, 40.0, 41.0, 41.0, 40.0, 30.0, 27.0, 25.0, 23.0, 28.0, 16.0, 18.0, 16.0, 14.0, 18.0, 15.0, 9.0, 15.0, 8.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-10.84375, -10.5103759765625, -10.177001953125, -9.8436279296875, -9.51025390625, -9.1768798828125, -8.843505859375, -8.5101318359375, -8.1767578125, -7.8433837890625, -7.510009765625, -7.1766357421875, -6.84326171875, -6.5098876953125, -6.176513671875, -5.8431396484375, -5.509765625, -5.1763916015625, -4.843017578125, -4.5096435546875, -4.17626953125, -3.8428955078125, -3.509521484375, -3.1761474609375, -2.8427734375, -2.5093994140625, -2.176025390625, -1.8426513671875, -1.50927734375, -1.1759033203125, -0.842529296875, -0.5091552734375, -0.17578125, 0.1575927734375, 0.490966796875, 0.8243408203125, 1.15771484375, 1.4910888671875, 1.824462890625, 2.1578369140625, 2.4912109375, 2.8245849609375, 3.157958984375, 3.4913330078125, 3.82470703125, 4.1580810546875, 4.491455078125, 4.8248291015625, 5.158203125, 5.4915771484375, 5.824951171875, 6.1583251953125, 6.49169921875, 6.8250732421875, 7.158447265625, 7.4918212890625, 7.8251953125, 8.1585693359375, 8.491943359375, 8.8253173828125, 9.15869140625, 9.4920654296875, 9.825439453125, 10.1588134765625, 10.4921875]}, "gradients/decoder.transformer.h.6.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 4.0, 2.0, 2.0, 3.0, 6.0, 3.0, 9.0, 11.0, 8.0, 11.0, 10.0, 10.0, 15.0, 12.0, 12.0, 31.0, 31.0, 36.0, 46.0, 57.0, 96.0, 171.0, 362.0, 830.0, 2822.0, 12230.0, 80965.0, 965423.0, 2655609.0, 424389.0, 40802.0, 7178.0, 1744.0, 578.0, 258.0, 161.0, 78.0, 61.0, 46.0, 27.0, 8.0, 17.0, 15.0, 18.0, 14.0, 13.0, 10.0, 11.0, 11.0, 10.0, 4.0, 7.0, 5.0, 4.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-22.359375, -21.59716796875, -20.8349609375, -20.07275390625, -19.310546875, -18.54833984375, -17.7861328125, -17.02392578125, -16.26171875, -15.49951171875, -14.7373046875, -13.97509765625, -13.212890625, -12.45068359375, -11.6884765625, -10.92626953125, -10.1640625, -9.40185546875, -8.6396484375, -7.87744140625, -7.115234375, -6.35302734375, -5.5908203125, -4.82861328125, -4.06640625, -3.30419921875, -2.5419921875, -1.77978515625, -1.017578125, -0.25537109375, 0.5068359375, 1.26904296875, 2.03125, 2.79345703125, 3.5556640625, 4.31787109375, 5.080078125, 5.84228515625, 6.6044921875, 7.36669921875, 8.12890625, 8.89111328125, 9.6533203125, 10.41552734375, 11.177734375, 11.93994140625, 12.7021484375, 13.46435546875, 14.2265625, 14.98876953125, 15.7509765625, 16.51318359375, 17.275390625, 18.03759765625, 18.7998046875, 19.56201171875, 20.32421875, 21.08642578125, 21.8486328125, 22.61083984375, 23.373046875, 24.13525390625, 24.8974609375, 25.65966796875, 26.421875]}, "gradients/decoder.transformer.h.6.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 5.0, 8.0, 6.0, 8.0, 10.0, 10.0, 14.0, 24.0, 24.0, 30.0, 73.0, 59.0, 80.0, 98.0, 136.0, 140.0, 209.0, 277.0, 376.0, 386.0, 421.0, 379.0, 316.0, 250.0, 183.0, 145.0, 106.0, 64.0, 68.0, 37.0, 33.0, 29.0, 16.0, 14.0, 8.0, 15.0, 9.0, 7.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-17.984375, -17.486328125, -16.98828125, -16.490234375, -15.9921875, -15.494140625, -14.99609375, -14.498046875, -14.0, -13.501953125, -13.00390625, -12.505859375, -12.0078125, -11.509765625, -11.01171875, -10.513671875, -10.015625, -9.517578125, -9.01953125, -8.521484375, -8.0234375, -7.525390625, -7.02734375, -6.529296875, -6.03125, -5.533203125, -5.03515625, -4.537109375, -4.0390625, -3.541015625, -3.04296875, -2.544921875, -2.046875, -1.548828125, -1.05078125, -0.552734375, -0.0546875, 0.443359375, 0.94140625, 1.439453125, 1.9375, 2.435546875, 2.93359375, 3.431640625, 3.9296875, 4.427734375, 4.92578125, 5.423828125, 5.921875, 6.419921875, 6.91796875, 7.416015625, 7.9140625, 8.412109375, 8.91015625, 9.408203125, 9.90625, 10.404296875, 10.90234375, 11.400390625, 11.8984375, 12.396484375, 12.89453125, 13.392578125, 13.890625]}, "gradients/decoder.transformer.h.6.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 5.0, 7.0, 8.0, 12.0, 15.0, 24.0, 28.0, 44.0, 51.0, 56.0, 84.0, 136.0, 140.0, 261.0, 465.0, 1225.0, 11345.0, 1659784.0, 2503227.0, 14684.0, 1240.0, 462.0, 259.0, 187.0, 136.0, 97.0, 68.0, 54.0, 44.0, 26.0, 29.0, 22.0, 12.0, 15.0, 9.0, 5.0, 4.0, 5.0, 7.0, 3.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-70.4375, -68.16796875, -65.8984375, -63.62890625, -61.359375, -59.08984375, -56.8203125, -54.55078125, -52.28125, -50.01171875, -47.7421875, -45.47265625, -43.203125, -40.93359375, -38.6640625, -36.39453125, -34.125, -31.85546875, -29.5859375, -27.31640625, -25.046875, -22.77734375, -20.5078125, -18.23828125, -15.96875, -13.69921875, -11.4296875, -9.16015625, -6.890625, -4.62109375, -2.3515625, -0.08203125, 2.1875, 4.45703125, 6.7265625, 8.99609375, 11.265625, 13.53515625, 15.8046875, 18.07421875, 20.34375, 22.61328125, 24.8828125, 27.15234375, 29.421875, 31.69140625, 33.9609375, 36.23046875, 38.5, 40.76953125, 43.0390625, 45.30859375, 47.578125, 49.84765625, 52.1171875, 54.38671875, 56.65625, 58.92578125, 61.1953125, 63.46484375, 65.734375, 68.00390625, 70.2734375, 72.54296875, 74.8125]}, "gradients/decoder.transformer.h.6.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 56.0, 414.0, 454.0, 87.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-488.49615478515625, -477.9068603515625, -467.31756591796875, -456.728271484375, -446.13897705078125, -435.5496826171875, -424.96038818359375, -414.3711242675781, -403.7818298339844, -393.1925354003906, -382.6032409667969, -372.0139465332031, -361.4246520996094, -350.83538818359375, -340.24609375, -329.65679931640625, -319.0675048828125, -308.47821044921875, -297.888916015625, -287.29962158203125, -276.7103271484375, -266.12103271484375, -255.53175354003906, -244.94247436523438, -234.3531494140625, -223.76385498046875, -213.174560546875, -202.58526611328125, -191.99598693847656, -181.4066925048828, -170.81739807128906, -160.22811889648438, -149.63880920410156, -139.0495147705078, -128.46022033691406, -117.87093353271484, -107.28164672851562, -96.69235229492188, -86.10305786132812, -75.5137710571289, -64.92447662353516, -54.33518600463867, -43.74589538574219, -33.15660095214844, -22.567310333251953, -11.978019714355469, -1.3887252807617188, 9.2005615234375, 19.78985595703125, 30.379146575927734, 40.96843719482422, 51.55773162841797, 62.14702224731445, 72.73631286621094, 83.32560729980469, 93.9148941040039, 104.50418853759766, 115.0934829711914, 125.68276977539062, 136.27206420898438, 146.86135864257812, 157.45065307617188, 168.03994750976562, 178.6292266845703, 189.21852111816406]}, "gradients/decoder.transformer.h.6.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 2.0, 1.0, 5.0, 5.0, 5.0, 5.0, 6.0, 9.0, 12.0, 9.0, 18.0, 11.0, 14.0, 20.0, 23.0, 24.0, 26.0, 26.0, 27.0, 31.0, 27.0, 39.0, 42.0, 35.0, 37.0, 43.0, 36.0, 32.0, 30.0, 32.0, 36.0, 43.0, 29.0, 31.0, 27.0, 25.0, 23.0, 24.0, 22.0, 22.0, 14.0, 13.0, 19.0, 12.0, 9.0, 9.0, 5.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0], "bins": [-56.32893753051758, -54.6518440246582, -52.97475051879883, -51.29765319824219, -49.62055969238281, -47.94346618652344, -46.26637268066406, -44.58927917480469, -42.91218566894531, -41.23509216308594, -39.55799865722656, -37.88090515136719, -36.20380783081055, -34.52671432495117, -32.8496208190918, -31.172527313232422, -29.49542999267578, -27.818336486816406, -26.1412410736084, -24.464147567749023, -22.787052154541016, -21.10995864868164, -19.432865142822266, -17.75577163696289, -16.078676223754883, -14.401581764221191, -12.7244873046875, -11.047393798828125, -9.370299339294434, -7.693204879760742, -6.016111373901367, -4.339016914367676, -2.6619186401367188, -0.9848244190216064, 0.6922698020935059, 2.369363784790039, 4.0464582443237305, 5.723552703857422, 7.400646209716797, 9.077740669250488, 10.75483512878418, 12.431929588317871, 14.109024047851562, 15.786117553710938, 17.463211059570312, 19.14030647277832, 20.817399978637695, 22.494495391845703, 24.171588897705078, 25.848682403564453, 27.52577781677246, 29.202871322631836, 30.879966735839844, 32.55706024169922, 34.234153747558594, 35.91124725341797, 37.588340759277344, 39.26543426513672, 40.942527770996094, 42.61962127685547, 44.29671859741211, 45.973812103271484, 47.65090560913086, 49.327999114990234, 51.005096435546875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 5.0, 3.0, 5.0, 8.0, 16.0, 6.0, 20.0, 17.0, 31.0, 14.0, 28.0, 40.0, 28.0, 31.0, 41.0, 33.0, 54.0, 50.0, 55.0, 54.0, 46.0, 35.0, 41.0, 58.0, 29.0, 40.0, 30.0, 21.0, 26.0, 20.0, 18.0, 28.0, 10.0, 15.0, 10.0, 8.0, 8.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2734375, -11.892333984375, -11.51123046875, -11.130126953125, -10.7490234375, -10.367919921875, -9.98681640625, -9.605712890625, -9.224609375, -8.843505859375, -8.46240234375, -8.081298828125, -7.7001953125, -7.319091796875, -6.93798828125, -6.556884765625, -6.17578125, -5.794677734375, -5.41357421875, -5.032470703125, -4.6513671875, -4.270263671875, -3.88916015625, -3.508056640625, -3.126953125, -2.745849609375, -2.36474609375, -1.983642578125, -1.6025390625, -1.221435546875, -0.84033203125, -0.459228515625, -0.078125, 0.302978515625, 0.68408203125, 1.065185546875, 1.4462890625, 1.827392578125, 2.20849609375, 2.589599609375, 2.970703125, 3.351806640625, 3.73291015625, 4.114013671875, 4.4951171875, 4.876220703125, 5.25732421875, 5.638427734375, 6.01953125, 6.400634765625, 6.78173828125, 7.162841796875, 7.5439453125, 7.925048828125, 8.30615234375, 8.687255859375, 9.068359375, 9.449462890625, 9.83056640625, 10.211669921875, 10.5927734375, 10.973876953125, 11.35498046875, 11.736083984375, 12.1171875]}, "gradients/decoder.transformer.h.6.crossattention.c_proj.weight": {"_type": "histogram", "values": [3.0, 3.0, 1.0, 4.0, 4.0, 2.0, 5.0, 8.0, 21.0, 8.0, 33.0, 27.0, 53.0, 85.0, 141.0, 167.0, 306.0, 437.0, 617.0, 1029.0, 1480.0, 2315.0, 3522.0, 5573.0, 8629.0, 13435.0, 21766.0, 33993.0, 54627.0, 86496.0, 135225.0, 180931.0, 171300.0, 119684.0, 75993.0, 48224.0, 29891.0, 18909.0, 11861.0, 7726.0, 4960.0, 3164.0, 2039.0, 1227.0, 879.0, 592.0, 386.0, 249.0, 194.0, 116.0, 70.0, 46.0, 42.0, 21.0, 15.0, 14.0, 8.0, 6.0, 7.0, 0.0, 4.0, 1.0, 0.0, 2.0], "bins": [-0.947265625, -0.9175338745117188, -0.8878021240234375, -0.8580703735351562, -0.828338623046875, -0.7986068725585938, -0.7688751220703125, -0.7391433715820312, -0.70941162109375, -0.6796798706054688, -0.6499481201171875, -0.6202163696289062, -0.590484619140625, -0.5607528686523438, -0.5310211181640625, -0.5012893676757812, -0.4715576171875, -0.44182586669921875, -0.4120941162109375, -0.38236236572265625, -0.352630615234375, -0.32289886474609375, -0.2931671142578125, -0.26343536376953125, -0.23370361328125, -0.20397186279296875, -0.1742401123046875, -0.14450836181640625, -0.114776611328125, -0.08504486083984375, -0.0553131103515625, -0.02558135986328125, 0.004150390625, 0.03388214111328125, 0.0636138916015625, 0.09334564208984375, 0.123077392578125, 0.15280914306640625, 0.1825408935546875, 0.21227264404296875, 0.24200439453125, 0.27173614501953125, 0.3014678955078125, 0.33119964599609375, 0.360931396484375, 0.39066314697265625, 0.4203948974609375, 0.45012664794921875, 0.4798583984375, 0.5095901489257812, 0.5393218994140625, 0.5690536499023438, 0.598785400390625, 0.6285171508789062, 0.6582489013671875, 0.6879806518554688, 0.71771240234375, 0.7474441528320312, 0.7771759033203125, 0.8069076538085938, 0.836639404296875, 0.8663711547851562, 0.8961029052734375, 0.9258346557617188, 0.95556640625]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 7.0, 3.0, 5.0, 6.0, 7.0, 10.0, 13.0, 13.0, 18.0, 13.0, 25.0, 23.0, 32.0, 29.0, 37.0, 38.0, 34.0, 39.0, 32.0, 43.0, 48.0, 32.0, 1073.0, 36.0, 43.0, 42.0, 38.0, 27.0, 37.0, 36.0, 23.0, 35.0, 19.0, 17.0, 25.0, 12.0, 8.0, 9.0, 7.0, 6.0, 13.0, 2.0, 6.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-7.44921875, -7.23040771484375, -7.0115966796875, -6.79278564453125, -6.573974609375, -6.35516357421875, -6.1363525390625, -5.91754150390625, -5.69873046875, -5.47991943359375, -5.2611083984375, -5.04229736328125, -4.823486328125, -4.60467529296875, -4.3858642578125, -4.16705322265625, -3.9482421875, -3.72943115234375, -3.5106201171875, -3.29180908203125, -3.072998046875, -2.85418701171875, -2.6353759765625, -2.41656494140625, -2.19775390625, -1.97894287109375, -1.7601318359375, -1.54132080078125, -1.322509765625, -1.10369873046875, -0.8848876953125, -0.66607666015625, -0.447265625, -0.22845458984375, -0.0096435546875, 0.20916748046875, 0.427978515625, 0.64678955078125, 0.8656005859375, 1.08441162109375, 1.30322265625, 1.52203369140625, 1.7408447265625, 1.95965576171875, 2.178466796875, 2.39727783203125, 2.6160888671875, 2.83489990234375, 3.0537109375, 3.27252197265625, 3.4913330078125, 3.71014404296875, 3.928955078125, 4.14776611328125, 4.3665771484375, 4.58538818359375, 4.80419921875, 5.02301025390625, 5.2418212890625, 5.46063232421875, 5.679443359375, 5.89825439453125, 6.1170654296875, 6.33587646484375, 6.5546875]}, "gradients/decoder.transformer.h.6.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 4.0, 1.0, 6.0, 10.0, 21.0, 20.0, 22.0, 44.0, 80.0, 93.0, 138.0, 197.0, 283.0, 398.0, 581.0, 780.0, 1123.0, 1558.0, 2283.0, 3335.0, 4802.0, 7112.0, 10095.0, 14793.0, 20892.0, 30620.0, 44083.0, 63104.0, 86949.0, 114467.0, 1123347.0, 188005.0, 107773.0, 81074.0, 57693.0, 40185.0, 27968.0, 19606.0, 13320.0, 9396.0, 6321.0, 4409.0, 3016.0, 2120.0, 1477.0, 1113.0, 743.0, 490.0, 362.0, 255.0, 170.0, 139.0, 89.0, 60.0, 36.0, 30.0, 20.0, 12.0, 7.0, 11.0, 3.0, 3.0, 3.0], "bins": [-0.58203125, -0.5637741088867188, -0.5455169677734375, -0.5272598266601562, -0.509002685546875, -0.49074554443359375, -0.4724884033203125, -0.45423126220703125, -0.43597412109375, -0.41771697998046875, -0.3994598388671875, -0.38120269775390625, -0.362945556640625, -0.34468841552734375, -0.3264312744140625, -0.30817413330078125, -0.2899169921875, -0.27165985107421875, -0.2534027099609375, -0.23514556884765625, -0.216888427734375, -0.19863128662109375, -0.1803741455078125, -0.16211700439453125, -0.14385986328125, -0.12560272216796875, -0.1073455810546875, -0.08908843994140625, -0.070831298828125, -0.05257415771484375, -0.0343170166015625, -0.01605987548828125, 0.002197265625, 0.02045440673828125, 0.0387115478515625, 0.05696868896484375, 0.075225830078125, 0.09348297119140625, 0.1117401123046875, 0.12999725341796875, 0.14825439453125, 0.16651153564453125, 0.1847686767578125, 0.20302581787109375, 0.221282958984375, 0.23954010009765625, 0.2577972412109375, 0.27605438232421875, 0.2943115234375, 0.31256866455078125, 0.3308258056640625, 0.34908294677734375, 0.367340087890625, 0.38559722900390625, 0.4038543701171875, 0.42211151123046875, 0.44036865234375, 0.45862579345703125, 0.4768829345703125, 0.49514007568359375, 0.513397216796875, 0.5316543579101562, 0.5499114990234375, 0.5681686401367188, 0.58642578125]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 5.0, 10.0, 5.0, 5.0, 6.0, 11.0, 13.0, 4.0, 8.0, 17.0, 20.0, 17.0, 26.0, 28.0, 34.0, 50.0, 45.0, 56.0, 82.0, 83.0, 73.0, 64.0, 72.0, 43.0, 28.0, 36.0, 20.0, 25.0, 20.0, 13.0, 16.0, 17.0, 9.0, 7.0, 9.0, 1.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.007778167724609375, -0.007513225078582764, -0.007248282432556152, -0.006983339786529541, -0.00671839714050293, -0.006453454494476318, -0.006188511848449707, -0.005923569202423096, -0.005658626556396484, -0.005393683910369873, -0.005128741264343262, -0.00486379861831665, -0.004598855972290039, -0.004333913326263428, -0.004068970680236816, -0.003804028034210205, -0.0035390853881835938, -0.0032741427421569824, -0.003009200096130371, -0.0027442574501037598, -0.0024793148040771484, -0.002214372158050537, -0.0019494295120239258, -0.0016844868659973145, -0.0014195442199707031, -0.0011546015739440918, -0.0008896589279174805, -0.0006247162818908691, -0.0003597736358642578, -9.483098983764648e-05, 0.00017011165618896484, 0.00043505430221557617, 0.0006999969482421875, 0.0009649395942687988, 0.0012298822402954102, 0.0014948248863220215, 0.0017597675323486328, 0.002024710178375244, 0.0022896528244018555, 0.002554595470428467, 0.002819538116455078, 0.0030844807624816895, 0.0033494234085083008, 0.003614366054534912, 0.0038793087005615234, 0.004144251346588135, 0.004409193992614746, 0.004674136638641357, 0.004939079284667969, 0.00520402193069458, 0.005468964576721191, 0.005733907222747803, 0.005998849868774414, 0.006263792514801025, 0.006528735160827637, 0.006793677806854248, 0.007058620452880859, 0.007323563098907471, 0.007588505744934082, 0.007853448390960693, 0.008118391036987305, 0.008383333683013916, 0.008648276329040527, 0.008913218975067139, 0.00917816162109375]}, "gradients/decoder.transformer.h.6.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 0.0, 3.0, 3.0, 2.0, 4.0, 3.0, 7.0, 7.0, 8.0, 9.0, 13.0, 24.0, 28.0, 27.0, 42.0, 44.0, 61.0, 98.0, 131.0, 247.0, 551.0, 15081.0, 1025457.0, 5515.0, 500.0, 240.0, 106.0, 69.0, 50.0, 49.0, 40.0, 29.0, 18.0, 22.0, 8.0, 11.0, 4.0, 14.0, 9.0, 6.0, 8.0, 3.0, 1.0, 2.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.229248046875, -0.2227764129638672, -0.21630477905273438, -0.20983314514160156, -0.20336151123046875, -0.19688987731933594, -0.19041824340820312, -0.1839466094970703, -0.1774749755859375, -0.1710033416748047, -0.16453170776367188, -0.15806007385253906, -0.15158843994140625, -0.14511680603027344, -0.13864517211914062, -0.1321735382080078, -0.125701904296875, -0.11923027038574219, -0.11275863647460938, -0.10628700256347656, -0.09981536865234375, -0.09334373474121094, -0.08687210083007812, -0.08040046691894531, -0.0739288330078125, -0.06745719909667969, -0.060985565185546875, -0.05451393127441406, -0.04804229736328125, -0.04157066345214844, -0.035099029541015625, -0.028627395629882812, -0.02215576171875, -0.015684127807617188, -0.009212493896484375, -0.0027408599853515625, 0.00373077392578125, 0.010202407836914062, 0.016674041748046875, 0.023145675659179688, 0.0296173095703125, 0.03608894348144531, 0.042560577392578125, 0.04903221130371094, 0.05550384521484375, 0.06197547912597656, 0.06844711303710938, 0.07491874694824219, 0.081390380859375, 0.08786201477050781, 0.09433364868164062, 0.10080528259277344, 0.10727691650390625, 0.11374855041503906, 0.12022018432617188, 0.1266918182373047, 0.1331634521484375, 0.1396350860595703, 0.14610671997070312, 0.15257835388183594, 0.15904998779296875, 0.16552162170410156, 0.17199325561523438, 0.1784648895263672, 0.1849365234375]}, "gradients/decoder.transformer.h.6.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 24.0, 929.0, 63.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0065441676415503025, -0.00398502591997385, -0.001425884198397398, 0.0011332575231790543, 0.0036923992447555065, 0.006251541431993246, 0.008810682222247124, 0.011369824409484863, 0.013928966596722603, 0.016488108783960342, 0.019047249108552933, 0.021606391295790672, 0.024165533483028412, 0.02672467567026615, 0.02928381785750389, 0.03184295818209648, 0.03440209850668907, 0.03696123883128166, 0.03952038288116455, 0.04207952320575714, 0.04463866353034973, 0.04719780758023262, 0.04975694790482521, 0.0523160919547081, 0.05487523227930069, 0.05743437260389328, 0.05999351665377617, 0.06255266070365906, 0.06511180102825165, 0.06767094135284424, 0.07023008167743683, 0.07278922200202942, 0.07534836232662201, 0.0779075026512146, 0.08046664297580719, 0.08302579075098038, 0.08558493107557297, 0.08814407140016556, 0.09070321172475815, 0.09326235204935074, 0.09582149982452393, 0.09838064014911652, 0.1009397804737091, 0.1034989282488823, 0.10605806857347488, 0.10861720889806747, 0.11117634922266006, 0.11373548954725266, 0.11629462987184525, 0.11885377019643784, 0.12141291052103043, 0.12397205829620361, 0.1265311986207962, 0.1290903389453888, 0.13164947926998138, 0.13420861959457397, 0.13676775991916656, 0.13932690024375916, 0.14188604056835175, 0.14444518089294434, 0.14700432121753693, 0.14956346154212952, 0.1521226167678833, 0.1546817570924759, 0.15724089741706848]}, "gradients/decoder.transformer.h.6.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 6.0, 1.0, 0.0, 4.0, 5.0, 4.0, 5.0, 6.0, 9.0, 9.0, 14.0, 22.0, 22.0, 26.0, 34.0, 36.0, 40.0, 45.0, 43.0, 30.0, 46.0, 51.0, 46.0, 47.0, 58.0, 47.0, 45.0, 45.0, 40.0, 39.0, 28.0, 31.0, 26.0, 17.0, 17.0, 9.0, 15.0, 11.0, 9.0, 11.0, 3.0, 5.0, 0.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.006034553050994873, -0.005863676778972149, -0.005692800506949425, -0.005521924234926701, -0.0053510479629039764, -0.005180171690881252, -0.005009295418858528, -0.004838419146835804, -0.00466754287481308, -0.004496666602790356, -0.0043257903307676315, -0.004154914058744907, -0.003984037786722183, -0.003813161514699459, -0.003642285242676735, -0.0034714089706540108, -0.0033005326986312866, -0.0031296564266085625, -0.0029587801545858383, -0.002787903882563114, -0.00261702761054039, -0.002446151338517666, -0.0022752750664949417, -0.0021043987944722176, -0.0019335225224494934, -0.0017626462504267693, -0.001591769978404045, -0.001420893706381321, -0.0012500174343585968, -0.0010791411623358727, -0.0009082648903131485, -0.0007373886182904243, -0.0005665123462677002, -0.00039563607424497604, -0.0002247598022222519, -5.388353019952774e-05, 0.00011699274182319641, 0.00028786901384592056, 0.0004587452858686447, 0.0006296215578913689, 0.000800497829914093, 0.0009713741019368172, 0.0011422503739595413, 0.0013131266459822655, 0.0014840029180049896, 0.0016548791900277138, 0.001825755462050438, 0.001996631734073162, 0.0021675080060958862, 0.0023383842781186104, 0.0025092605501413345, 0.0026801368221640587, 0.002851013094186783, 0.003021889366209507, 0.003192765638232231, 0.0033636419102549553, 0.0035345181822776794, 0.0037053944543004036, 0.0038762707263231277, 0.004047146998345852, 0.004218023270368576, 0.0043888995423913, 0.004559775814414024, 0.0047306520864367485, 0.004901528358459473]}, "gradients/decoder.transformer.h.6.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 3.0, 4.0, 8.0, 5.0, 3.0, 5.0, 8.0, 16.0, 7.0, 19.0, 17.0, 31.0, 14.0, 28.0, 42.0, 26.0, 32.0, 40.0, 33.0, 54.0, 52.0, 53.0, 55.0, 46.0, 34.0, 42.0, 57.0, 31.0, 38.0, 30.0, 21.0, 26.0, 20.0, 18.0, 28.0, 10.0, 15.0, 10.0, 8.0, 8.0, 6.0, 3.0, 3.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.265625, -11.8846435546875, -11.503662109375, -11.1226806640625, -10.74169921875, -10.3607177734375, -9.979736328125, -9.5987548828125, -9.2177734375, -8.8367919921875, -8.455810546875, -8.0748291015625, -7.69384765625, -7.3128662109375, -6.931884765625, -6.5509033203125, -6.169921875, -5.7889404296875, -5.407958984375, -5.0269775390625, -4.64599609375, -4.2650146484375, -3.884033203125, -3.5030517578125, -3.1220703125, -2.7410888671875, -2.360107421875, -1.9791259765625, -1.59814453125, -1.2171630859375, -0.836181640625, -0.4552001953125, -0.07421875, 0.3067626953125, 0.687744140625, 1.0687255859375, 1.44970703125, 1.8306884765625, 2.211669921875, 2.5926513671875, 2.9736328125, 3.3546142578125, 3.735595703125, 4.1165771484375, 4.49755859375, 4.8785400390625, 5.259521484375, 5.6405029296875, 6.021484375, 6.4024658203125, 6.783447265625, 7.1644287109375, 7.54541015625, 7.9263916015625, 8.307373046875, 8.6883544921875, 9.0693359375, 9.4503173828125, 9.831298828125, 10.2122802734375, 10.59326171875, 10.9742431640625, 11.355224609375, 11.7362060546875, 12.1171875]}, "gradients/decoder.transformer.h.6.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 8.0, 10.0, 8.0, 10.0, 13.0, 18.0, 29.0, 26.0, 41.0, 54.0, 91.0, 109.0, 154.0, 222.0, 275.0, 433.0, 635.0, 1251.0, 4265.0, 20442.0, 217911.0, 749670.0, 41191.0, 7237.0, 1890.0, 849.0, 528.0, 321.0, 246.0, 143.0, 127.0, 91.0, 59.0, 54.0, 30.0, 37.0, 21.0, 18.0, 12.0, 8.0, 7.0, 7.0, 4.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-30.90625, -29.946044921875, -28.98583984375, -28.025634765625, -27.0654296875, -26.105224609375, -25.14501953125, -24.184814453125, -23.224609375, -22.264404296875, -21.30419921875, -20.343994140625, -19.3837890625, -18.423583984375, -17.46337890625, -16.503173828125, -15.54296875, -14.582763671875, -13.62255859375, -12.662353515625, -11.7021484375, -10.741943359375, -9.78173828125, -8.821533203125, -7.861328125, -6.901123046875, -5.94091796875, -4.980712890625, -4.0205078125, -3.060302734375, -2.10009765625, -1.139892578125, -0.1796875, 0.780517578125, 1.74072265625, 2.700927734375, 3.6611328125, 4.621337890625, 5.58154296875, 6.541748046875, 7.501953125, 8.462158203125, 9.42236328125, 10.382568359375, 11.3427734375, 12.302978515625, 13.26318359375, 14.223388671875, 15.18359375, 16.143798828125, 17.10400390625, 18.064208984375, 19.0244140625, 19.984619140625, 20.94482421875, 21.905029296875, 22.865234375, 23.825439453125, 24.78564453125, 25.745849609375, 26.7060546875, 27.666259765625, 28.62646484375, 29.586669921875, 30.546875]}, "gradients/decoder.transformer.h.6.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 5.0, 6.0, 3.0, 6.0, 7.0, 12.0, 12.0, 9.0, 11.0, 25.0, 20.0, 18.0, 19.0, 22.0, 23.0, 40.0, 31.0, 34.0, 37.0, 28.0, 62.0, 82.0, 223.0, 1682.0, 157.0, 64.0, 47.0, 45.0, 37.0, 41.0, 30.0, 46.0, 32.0, 18.0, 13.0, 10.0, 14.0, 15.0, 16.0, 15.0, 9.0, 9.0, 9.0, 3.0, 1.0, 5.0, 0.0, 3.0, 1.0, 2.0, 2.0, 0.0, 1.0], "bins": [-30.390625, -29.50634765625, -28.6220703125, -27.73779296875, -26.853515625, -25.96923828125, -25.0849609375, -24.20068359375, -23.31640625, -22.43212890625, -21.5478515625, -20.66357421875, -19.779296875, -18.89501953125, -18.0107421875, -17.12646484375, -16.2421875, -15.35791015625, -14.4736328125, -13.58935546875, -12.705078125, -11.82080078125, -10.9365234375, -10.05224609375, -9.16796875, -8.28369140625, -7.3994140625, -6.51513671875, -5.630859375, -4.74658203125, -3.8623046875, -2.97802734375, -2.09375, -1.20947265625, -0.3251953125, 0.55908203125, 1.443359375, 2.32763671875, 3.2119140625, 4.09619140625, 4.98046875, 5.86474609375, 6.7490234375, 7.63330078125, 8.517578125, 9.40185546875, 10.2861328125, 11.17041015625, 12.0546875, 12.93896484375, 13.8232421875, 14.70751953125, 15.591796875, 16.47607421875, 17.3603515625, 18.24462890625, 19.12890625, 20.01318359375, 20.8974609375, 21.78173828125, 22.666015625, 23.55029296875, 24.4345703125, 25.31884765625, 26.203125]}, "gradients/decoder.transformer.h.6.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 9.0, 9.0, 12.0, 12.0, 20.0, 11.0, 17.0, 15.0, 18.0, 18.0, 28.0, 59.0, 38.0, 65.0, 109.0, 163.0, 285.0, 755.0, 8693.0, 3033000.0, 99291.0, 1853.0, 467.0, 201.0, 129.0, 83.0, 56.0, 49.0, 41.0, 26.0, 26.0, 27.0, 23.0, 18.0, 17.0, 10.0, 9.0, 10.0, 7.0, 7.0, 4.0, 7.0, 5.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-73.125, -70.66796875, -68.2109375, -65.75390625, -63.296875, -60.83984375, -58.3828125, -55.92578125, -53.46875, -51.01171875, -48.5546875, -46.09765625, -43.640625, -41.18359375, -38.7265625, -36.26953125, -33.8125, -31.35546875, -28.8984375, -26.44140625, -23.984375, -21.52734375, -19.0703125, -16.61328125, -14.15625, -11.69921875, -9.2421875, -6.78515625, -4.328125, -1.87109375, 0.5859375, 3.04296875, 5.5, 7.95703125, 10.4140625, 12.87109375, 15.328125, 17.78515625, 20.2421875, 22.69921875, 25.15625, 27.61328125, 30.0703125, 32.52734375, 34.984375, 37.44140625, 39.8984375, 42.35546875, 44.8125, 47.26953125, 49.7265625, 52.18359375, 54.640625, 57.09765625, 59.5546875, 62.01171875, 64.46875, 66.92578125, 69.3828125, 71.83984375, 74.296875, 76.75390625, 79.2109375, 81.66796875, 84.125]}, "gradients/decoder.transformer.h.6.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 4.0, 11.0, 40.0, 136.0, 247.0, 310.0, 176.0, 68.0, 18.0, 4.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.41730499267578, -40.21316146850586, -38.0090217590332, -35.80487823486328, -33.600738525390625, -31.396595001220703, -29.19245147705078, -26.988309860229492, -24.784168243408203, -22.580026626586914, -20.375885009765625, -18.171741485595703, -15.967599868774414, -13.763458251953125, -11.55931568145752, -9.355173110961914, -7.151031494140625, -4.946889400482178, -2.7427473068237305, -0.5386052131652832, 1.665536880493164, 3.869678497314453, 6.073821067810059, 8.277963638305664, 10.482105255126953, 12.686246871948242, 14.890389442443848, 17.094532012939453, 19.298673629760742, 21.50281524658203, 23.706958770751953, 25.911100387573242, 28.11524200439453, 30.31938362121582, 32.52352523803711, 34.72766876220703, 36.93180847167969, 39.13595199584961, 41.34009552001953, 43.54423522949219, 45.74837875366211, 47.95252227783203, 50.15666198730469, 52.36080551147461, 54.56494903564453, 56.76908874511719, 58.97323226928711, 61.17737579345703, 63.38151550292969, 65.58565521240234, 67.78980255126953, 69.99394226074219, 72.19808197021484, 74.4022216796875, 76.60636901855469, 78.81050872802734, 81.0146484375, 83.21878814697266, 85.42293548583984, 87.6270751953125, 89.83121490478516, 92.03535461425781, 94.239501953125, 96.44364166259766, 98.64778900146484]}, "gradients/decoder.transformer.h.6.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 5.0, 3.0, 6.0, 12.0, 10.0, 15.0, 16.0, 16.0, 25.0, 18.0, 13.0, 28.0, 29.0, 34.0, 27.0, 31.0, 31.0, 37.0, 43.0, 29.0, 35.0, 40.0, 42.0, 33.0, 34.0, 30.0, 29.0, 44.0, 34.0, 33.0, 29.0, 24.0, 24.0, 18.0, 15.0, 14.0, 14.0, 17.0, 13.0, 12.0, 8.0, 7.0, 6.0, 5.0, 7.0, 3.0, 4.0, 3.0, 3.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-67.84556579589844, -65.63578796386719, -63.426002502441406, -61.21622085571289, -59.006439208984375, -56.796661376953125, -54.58687973022461, -52.377098083496094, -50.16731643676758, -47.95753479003906, -45.74775314331055, -43.53797149658203, -41.32819366455078, -39.118408203125, -36.90863037109375, -34.698848724365234, -32.48906707763672, -30.279285430908203, -28.069503784179688, -25.859724044799805, -23.64994239807129, -21.440160751342773, -19.23038101196289, -17.020599365234375, -14.81081771850586, -12.601036071777344, -10.391255378723145, -8.181474685668945, -5.97169303894043, -3.761911392211914, -1.5521306991577148, 0.6576499938964844, 2.867431640625, 5.077212810516357, 7.286993980407715, 9.496774673461914, 11.70655632019043, 13.916337966918945, 16.126117706298828, 18.335899353027344, 20.54568099975586, 22.755462646484375, 24.96524429321289, 27.175024032592773, 29.38480567932129, 31.594587326049805, 33.80436706542969, 36.0141487121582, 38.22393035888672, 40.433712005615234, 42.64349365234375, 44.853275299072266, 47.06305694580078, 49.27283477783203, 51.48261642456055, 53.69239807128906, 55.90217971801758, 58.111961364746094, 60.32174301147461, 62.531524658203125, 64.74130249023438, 66.95108795166016, 69.1608657836914, 71.37065124511719, 73.58042907714844]}, "gradients/decoder.transformer.h.5.mlp.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 7.0, 3.0, 5.0, 4.0, 6.0, 5.0, 9.0, 17.0, 19.0, 22.0, 15.0, 15.0, 24.0, 33.0, 22.0, 32.0, 26.0, 35.0, 39.0, 42.0, 50.0, 62.0, 48.0, 51.0, 36.0, 51.0, 35.0, 35.0, 37.0, 33.0, 23.0, 22.0, 17.0, 26.0, 17.0, 20.0, 16.0, 10.0, 6.0, 13.0, 10.0, 4.0, 6.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-12.3359375, -11.9666748046875, -11.597412109375, -11.2281494140625, -10.85888671875, -10.4896240234375, -10.120361328125, -9.7510986328125, -9.3818359375, -9.0125732421875, -8.643310546875, -8.2740478515625, -7.90478515625, -7.5355224609375, -7.166259765625, -6.7969970703125, -6.427734375, -6.0584716796875, -5.689208984375, -5.3199462890625, -4.95068359375, -4.5814208984375, -4.212158203125, -3.8428955078125, -3.4736328125, -3.1043701171875, -2.735107421875, -2.3658447265625, -1.99658203125, -1.6273193359375, -1.258056640625, -0.8887939453125, -0.51953125, -0.1502685546875, 0.218994140625, 0.5882568359375, 0.95751953125, 1.3267822265625, 1.696044921875, 2.0653076171875, 2.4345703125, 2.8038330078125, 3.173095703125, 3.5423583984375, 3.91162109375, 4.2808837890625, 4.650146484375, 5.0194091796875, 5.388671875, 5.7579345703125, 6.127197265625, 6.4964599609375, 6.86572265625, 7.2349853515625, 7.604248046875, 7.9735107421875, 8.3427734375, 8.7120361328125, 9.081298828125, 9.4505615234375, 9.81982421875, 10.1890869140625, 10.558349609375, 10.9276123046875, 11.296875]}, "gradients/decoder.transformer.h.5.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 1.0, 3.0, 4.0, 2.0, 5.0, 10.0, 11.0, 9.0, 14.0, 14.0, 23.0, 28.0, 27.0, 38.0, 53.0, 55.0, 67.0, 89.0, 121.0, 195.0, 246.0, 367.0, 702.0, 1317.0, 3302.0, 10351.0, 42068.0, 272196.0, 1619817.0, 1836395.0, 336930.0, 50749.0, 11710.0, 3725.0, 1448.0, 742.0, 425.0, 258.0, 165.0, 114.0, 104.0, 87.0, 63.0, 50.0, 29.0, 29.0, 35.0, 25.0, 13.0, 14.0, 9.0, 8.0, 9.0, 6.0, 7.0, 6.0, 5.0, 0.0, 1.0, 1.0, 3.0], "bins": [-18.625, -18.0439453125, -17.462890625, -16.8818359375, -16.30078125, -15.7197265625, -15.138671875, -14.5576171875, -13.9765625, -13.3955078125, -12.814453125, -12.2333984375, -11.65234375, -11.0712890625, -10.490234375, -9.9091796875, -9.328125, -8.7470703125, -8.166015625, -7.5849609375, -7.00390625, -6.4228515625, -5.841796875, -5.2607421875, -4.6796875, -4.0986328125, -3.517578125, -2.9365234375, -2.35546875, -1.7744140625, -1.193359375, -0.6123046875, -0.03125, 0.5498046875, 1.130859375, 1.7119140625, 2.29296875, 2.8740234375, 3.455078125, 4.0361328125, 4.6171875, 5.1982421875, 5.779296875, 6.3603515625, 6.94140625, 7.5224609375, 8.103515625, 8.6845703125, 9.265625, 9.8466796875, 10.427734375, 11.0087890625, 11.58984375, 12.1708984375, 12.751953125, 13.3330078125, 13.9140625, 14.4951171875, 15.076171875, 15.6572265625, 16.23828125, 16.8193359375, 17.400390625, 17.9814453125, 18.5625]}, "gradients/decoder.transformer.h.5.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 4.0, 8.0, 7.0, 7.0, 27.0, 35.0, 63.0, 94.0, 157.0, 262.0, 414.0, 706.0, 782.0, 606.0, 377.0, 220.0, 126.0, 79.0, 40.0, 36.0, 14.0, 5.0, 6.0, 6.0, 1.0, 3.0, 2.0, 1.0, 1.0], "bins": [-43.5625, -42.6402587890625, -41.718017578125, -40.7957763671875, -39.87353515625, -38.9512939453125, -38.029052734375, -37.1068115234375, -36.1845703125, -35.2623291015625, -34.340087890625, -33.4178466796875, -32.49560546875, -31.5733642578125, -30.651123046875, -29.7288818359375, -28.806640625, -27.8843994140625, -26.962158203125, -26.0399169921875, -25.11767578125, -24.1954345703125, -23.273193359375, -22.3509521484375, -21.4287109375, -20.5064697265625, -19.584228515625, -18.6619873046875, -17.73974609375, -16.8175048828125, -15.895263671875, -14.9730224609375, -14.05078125, -13.1285400390625, -12.206298828125, -11.2840576171875, -10.36181640625, -9.4395751953125, -8.517333984375, -7.5950927734375, -6.6728515625, -5.7506103515625, -4.828369140625, -3.9061279296875, -2.98388671875, -2.0616455078125, -1.139404296875, -0.2171630859375, 0.705078125, 1.6273193359375, 2.549560546875, 3.4718017578125, 4.39404296875, 5.3162841796875, 6.238525390625, 7.1607666015625, 8.0830078125, 9.0052490234375, 9.927490234375, 10.8497314453125, 11.77197265625, 12.6942138671875, 13.616455078125, 14.5386962890625, 15.4609375]}, "gradients/decoder.transformer.h.5.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 7.0, 7.0, 2.0, 10.0, 13.0, 27.0, 28.0, 43.0, 85.0, 123.0, 238.0, 450.0, 1267.0, 10367.0, 3799627.0, 377348.0, 3083.0, 731.0, 326.0, 183.0, 107.0, 78.0, 45.0, 29.0, 24.0, 12.0, 10.0, 8.0, 6.0, 1.0, 4.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-88.1875, -85.1259765625, -82.064453125, -79.0029296875, -75.94140625, -72.8798828125, -69.818359375, -66.7568359375, -63.6953125, -60.6337890625, -57.572265625, -54.5107421875, -51.44921875, -48.3876953125, -45.326171875, -42.2646484375, -39.203125, -36.1416015625, -33.080078125, -30.0185546875, -26.95703125, -23.8955078125, -20.833984375, -17.7724609375, -14.7109375, -11.6494140625, -8.587890625, -5.5263671875, -2.46484375, 0.5966796875, 3.658203125, 6.7197265625, 9.78125, 12.8427734375, 15.904296875, 18.9658203125, 22.02734375, 25.0888671875, 28.150390625, 31.2119140625, 34.2734375, 37.3349609375, 40.396484375, 43.4580078125, 46.51953125, 49.5810546875, 52.642578125, 55.7041015625, 58.765625, 61.8271484375, 64.888671875, 67.9501953125, 71.01171875, 74.0732421875, 77.134765625, 80.1962890625, 83.2578125, 86.3193359375, 89.380859375, 92.4423828125, 95.50390625, 98.5654296875, 101.626953125, 104.6884765625, 107.75]}, "gradients/decoder.transformer.h.5.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 32.0, 642.0, 333.0, 8.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-897.5950927734375, -881.2247314453125, -864.8543701171875, -848.4840698242188, -832.1137084960938, -815.7433471679688, -799.3729858398438, -783.0026245117188, -766.63232421875, -750.261962890625, -733.8916015625, -717.5213012695312, -701.1509399414062, -684.7805786132812, -668.4102172851562, -652.0398559570312, -635.6694946289062, -619.2991333007812, -602.9287719726562, -586.5584716796875, -570.1881103515625, -553.8177490234375, -537.4473876953125, -521.0770263671875, -504.7066955566406, -488.3363342285156, -471.96600341796875, -455.59564208984375, -439.22528076171875, -422.8549499511719, -406.4845886230469, -390.1142578125, -373.74395751953125, -357.37359619140625, -341.0032653808594, -324.6329040527344, -308.2625732421875, -291.8922119140625, -275.5218505859375, -259.1514892578125, -242.78115844726562, -226.4108123779297, -210.04046630859375, -193.67010498046875, -177.2997589111328, -160.92941284179688, -144.55905151367188, -128.18870544433594, -111.818359375, -95.44801330566406, -79.0776596069336, -62.70730972290039, -46.33695983886719, -29.96661376953125, -13.596260070800781, 2.7740936279296875, 19.144439697265625, 35.51478958129883, 51.88513946533203, 68.2554931640625, 84.62583923339844, 100.99618530273438, 117.36653900146484, 133.7368927001953, 150.10723876953125]}, "gradients/decoder.transformer.h.5.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 0.0, 4.0, 3.0, 4.0, 5.0, 4.0, 7.0, 1.0, 6.0, 9.0, 13.0, 15.0, 18.0, 22.0, 23.0, 17.0, 28.0, 22.0, 40.0, 29.0, 39.0, 33.0, 42.0, 47.0, 45.0, 44.0, 38.0, 32.0, 36.0, 43.0, 38.0, 36.0, 23.0, 30.0, 28.0, 25.0, 20.0, 24.0, 25.0, 16.0, 14.0, 8.0, 10.0, 7.0, 9.0, 9.0, 5.0, 4.0, 5.0, 2.0, 2.0, 0.0, 4.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-59.84124755859375, -58.01295852661133, -56.18466567993164, -54.35637664794922, -52.5280876159668, -50.699798583984375, -48.87150573730469, -47.043216705322266, -45.214927673339844, -43.38663864135742, -41.558345794677734, -39.73005676269531, -37.90176773071289, -36.07347869873047, -34.24518585205078, -32.41689682006836, -30.588603973388672, -28.760313034057617, -26.932024002075195, -25.10373306274414, -23.27544403076172, -21.447153091430664, -19.61886215209961, -17.790573120117188, -15.962282180786133, -14.133992195129395, -12.305702209472656, -10.477411270141602, -8.649121284484863, -6.820831298828125, -4.99254035949707, -3.164250373840332, -1.3359603881835938, 0.49232983589172363, 2.320620059967041, 4.1489105224609375, 5.977200508117676, 7.805490493774414, 9.633781433105469, 11.462071418762207, 13.290361404418945, 15.118651390075684, 16.946941375732422, 18.775232315063477, 20.60352325439453, 22.431812286376953, 24.260103225708008, 26.088394165039062, 27.916683197021484, 29.74497413635254, 31.57326316833496, 33.401554107666016, 35.22984313964844, 37.058135986328125, 38.88642501831055, 40.71471405029297, 42.543006896972656, 44.37129592895508, 46.199588775634766, 48.02787780761719, 49.85616683959961, 51.68445587158203, 53.51274871826172, 55.34103775024414, 57.16932678222656]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 5.0, 9.0, 8.0, 9.0, 12.0, 27.0, 11.0, 23.0, 23.0, 35.0, 32.0, 33.0, 21.0, 45.0, 52.0, 34.0, 46.0, 54.0, 46.0, 56.0, 48.0, 40.0, 33.0, 40.0, 34.0, 40.0, 32.0, 28.0, 29.0, 19.0, 15.0, 15.0, 17.0, 5.0, 13.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.5234375, -13.104248046875, -12.68505859375, -12.265869140625, -11.8466796875, -11.427490234375, -11.00830078125, -10.589111328125, -10.169921875, -9.750732421875, -9.33154296875, -8.912353515625, -8.4931640625, -8.073974609375, -7.65478515625, -7.235595703125, -6.81640625, -6.397216796875, -5.97802734375, -5.558837890625, -5.1396484375, -4.720458984375, -4.30126953125, -3.882080078125, -3.462890625, -3.043701171875, -2.62451171875, -2.205322265625, -1.7861328125, -1.366943359375, -0.94775390625, -0.528564453125, -0.109375, 0.309814453125, 0.72900390625, 1.148193359375, 1.5673828125, 1.986572265625, 2.40576171875, 2.824951171875, 3.244140625, 3.663330078125, 4.08251953125, 4.501708984375, 4.9208984375, 5.340087890625, 5.75927734375, 6.178466796875, 6.59765625, 7.016845703125, 7.43603515625, 7.855224609375, 8.2744140625, 8.693603515625, 9.11279296875, 9.531982421875, 9.951171875, 10.370361328125, 10.78955078125, 11.208740234375, 11.6279296875, 12.047119140625, 12.46630859375, 12.885498046875, 13.3046875]}, "gradients/decoder.transformer.h.5.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 17.0, 14.0, 25.0, 29.0, 39.0, 60.0, 79.0, 146.0, 205.0, 295.0, 445.0, 716.0, 1100.0, 1679.0, 2610.0, 4039.0, 6393.0, 9896.0, 15728.0, 25045.0, 41029.0, 67894.0, 109913.0, 164154.0, 190090.0, 150555.0, 98232.0, 60058.0, 36321.0, 22886.0, 14243.0, 8827.0, 5691.0, 3589.0, 2230.0, 1435.0, 963.0, 615.0, 419.0, 262.0, 198.0, 132.0, 89.0, 45.0, 41.0, 33.0, 14.0, 14.0, 8.0, 5.0, 5.0, 4.0, 2.0, 4.0, 2.0], "bins": [-1.0224609375, -0.9918289184570312, -0.9611968994140625, -0.9305648803710938, -0.899932861328125, -0.8693008422851562, -0.8386688232421875, -0.8080368041992188, -0.77740478515625, -0.7467727661132812, -0.7161407470703125, -0.6855087280273438, -0.654876708984375, -0.6242446899414062, -0.5936126708984375, -0.5629806518554688, -0.5323486328125, -0.5017166137695312, -0.4710845947265625, -0.44045257568359375, -0.409820556640625, -0.37918853759765625, -0.3485565185546875, -0.31792449951171875, -0.28729248046875, -0.25666046142578125, -0.2260284423828125, -0.19539642333984375, -0.164764404296875, -0.13413238525390625, -0.1035003662109375, -0.07286834716796875, -0.042236328125, -0.01160430908203125, 0.0190277099609375, 0.04965972900390625, 0.080291748046875, 0.11092376708984375, 0.1415557861328125, 0.17218780517578125, 0.20281982421875, 0.23345184326171875, 0.2640838623046875, 0.29471588134765625, 0.325347900390625, 0.35597991943359375, 0.3866119384765625, 0.41724395751953125, 0.4478759765625, 0.47850799560546875, 0.5091400146484375, 0.5397720336914062, 0.570404052734375, 0.6010360717773438, 0.6316680908203125, 0.6623001098632812, 0.69293212890625, 0.7235641479492188, 0.7541961669921875, 0.7848281860351562, 0.815460205078125, 0.8460922241210938, 0.8767242431640625, 0.9073562622070312, 0.93798828125]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 2.0, 1.0, 1.0, 4.0, 5.0, 6.0, 6.0, 6.0, 14.0, 20.0, 14.0, 16.0, 22.0, 24.0, 18.0, 29.0, 39.0, 47.0, 35.0, 41.0, 44.0, 44.0, 36.0, 1075.0, 35.0, 44.0, 39.0, 34.0, 42.0, 30.0, 35.0, 34.0, 21.0, 29.0, 19.0, 25.0, 11.0, 20.0, 17.0, 17.0, 8.0, 5.0, 5.0, 4.0, 2.0, 4.0, 2.0, 2.0, 4.0], "bins": [-9.8046875, -9.552490234375, -9.30029296875, -9.048095703125, -8.7958984375, -8.543701171875, -8.29150390625, -8.039306640625, -7.787109375, -7.534912109375, -7.28271484375, -7.030517578125, -6.7783203125, -6.526123046875, -6.27392578125, -6.021728515625, -5.76953125, -5.517333984375, -5.26513671875, -5.012939453125, -4.7607421875, -4.508544921875, -4.25634765625, -4.004150390625, -3.751953125, -3.499755859375, -3.24755859375, -2.995361328125, -2.7431640625, -2.490966796875, -2.23876953125, -1.986572265625, -1.734375, -1.482177734375, -1.22998046875, -0.977783203125, -0.7255859375, -0.473388671875, -0.22119140625, 0.031005859375, 0.283203125, 0.535400390625, 0.78759765625, 1.039794921875, 1.2919921875, 1.544189453125, 1.79638671875, 2.048583984375, 2.30078125, 2.552978515625, 2.80517578125, 3.057373046875, 3.3095703125, 3.561767578125, 3.81396484375, 4.066162109375, 4.318359375, 4.570556640625, 4.82275390625, 5.074951171875, 5.3271484375, 5.579345703125, 5.83154296875, 6.083740234375, 6.3359375]}, "gradients/decoder.transformer.h.5.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 6.0, 3.0, 4.0, 12.0, 16.0, 24.0, 29.0, 49.0, 88.0, 124.0, 161.0, 252.0, 419.0, 653.0, 951.0, 1445.0, 2319.0, 3548.0, 5283.0, 8372.0, 13009.0, 20205.0, 31142.0, 47933.0, 72285.0, 108020.0, 147499.0, 1207613.0, 138059.0, 98401.0, 66332.0, 43174.0, 28339.0, 18243.0, 11888.0, 7398.0, 4888.0, 3226.0, 2005.0, 1300.0, 824.0, 566.0, 354.0, 254.0, 148.0, 93.0, 71.0, 35.0, 27.0, 23.0, 11.0, 7.0, 6.0, 2.0, 6.0, 1.0, 2.0, 1.0], "bins": [-0.759765625, -0.7370071411132812, -0.7142486572265625, -0.6914901733398438, -0.668731689453125, -0.6459732055664062, -0.6232147216796875, -0.6004562377929688, -0.57769775390625, -0.5549392700195312, -0.5321807861328125, -0.5094223022460938, -0.486663818359375, -0.46390533447265625, -0.4411468505859375, -0.41838836669921875, -0.3956298828125, -0.37287139892578125, -0.3501129150390625, -0.32735443115234375, -0.304595947265625, -0.28183746337890625, -0.2590789794921875, -0.23632049560546875, -0.21356201171875, -0.19080352783203125, -0.1680450439453125, -0.14528656005859375, -0.122528076171875, -0.09976959228515625, -0.0770111083984375, -0.05425262451171875, -0.031494140625, -0.00873565673828125, 0.0140228271484375, 0.03678131103515625, 0.059539794921875, 0.08229827880859375, 0.1050567626953125, 0.12781524658203125, 0.15057373046875, 0.17333221435546875, 0.1960906982421875, 0.21884918212890625, 0.241607666015625, 0.26436614990234375, 0.2871246337890625, 0.30988311767578125, 0.3326416015625, 0.35540008544921875, 0.3781585693359375, 0.40091705322265625, 0.423675537109375, 0.44643402099609375, 0.4691925048828125, 0.49195098876953125, 0.51470947265625, 0.5374679565429688, 0.5602264404296875, 0.5829849243164062, 0.605743408203125, 0.6285018920898438, 0.6512603759765625, 0.6740188598632812, 0.69677734375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 6.0, 1.0, 6.0, 6.0, 9.0, 7.0, 8.0, 12.0, 26.0, 30.0, 35.0, 36.0, 66.0, 51.0, 87.0, 64.0, 77.0, 74.0, 77.0, 51.0, 56.0, 51.0, 40.0, 23.0, 21.0, 20.0, 12.0, 15.0, 12.0, 5.0, 7.0, 3.0, 0.0, 4.0, 2.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0106964111328125, -0.010326743125915527, -0.009957075119018555, -0.009587407112121582, -0.00921773910522461, -0.008848071098327637, -0.008478403091430664, -0.008108735084533691, -0.007739067077636719, -0.007369399070739746, -0.0069997310638427734, -0.006630063056945801, -0.006260395050048828, -0.0058907270431518555, -0.005521059036254883, -0.00515139102935791, -0.0047817230224609375, -0.004412055015563965, -0.004042387008666992, -0.0036727190017700195, -0.003303050994873047, -0.0029333829879760742, -0.0025637149810791016, -0.002194046974182129, -0.0018243789672851562, -0.0014547109603881836, -0.001085042953491211, -0.0007153749465942383, -0.0003457069396972656, 2.396106719970703e-05, 0.0003936290740966797, 0.0007632970809936523, 0.001132965087890625, 0.0015026330947875977, 0.0018723011016845703, 0.002241969108581543, 0.0026116371154785156, 0.0029813051223754883, 0.003350973129272461, 0.0037206411361694336, 0.004090309143066406, 0.004459977149963379, 0.0048296451568603516, 0.005199313163757324, 0.005568981170654297, 0.0059386491775512695, 0.006308317184448242, 0.006677985191345215, 0.0070476531982421875, 0.00741732120513916, 0.007786989212036133, 0.008156657218933105, 0.008526325225830078, 0.00889599323272705, 0.009265661239624023, 0.009635329246520996, 0.010004997253417969, 0.010374665260314941, 0.010744333267211914, 0.011114001274108887, 0.01148366928100586, 0.011853337287902832, 0.012223005294799805, 0.012592673301696777, 0.01296234130859375]}, "gradients/decoder.transformer.h.5.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 1.0, 5.0, 4.0, 5.0, 8.0, 11.0, 13.0, 23.0, 26.0, 26.0, 44.0, 52.0, 99.0, 118.0, 254.0, 478.0, 2973.0, 1038591.0, 4511.0, 532.0, 257.0, 175.0, 106.0, 65.0, 51.0, 31.0, 19.0, 20.0, 12.0, 11.0, 9.0, 12.0, 6.0, 0.0, 3.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.29443359375, -0.2861480712890625, -0.277862548828125, -0.2695770263671875, -0.26129150390625, -0.2530059814453125, -0.244720458984375, -0.2364349365234375, -0.2281494140625, -0.2198638916015625, -0.211578369140625, -0.2032928466796875, -0.19500732421875, -0.1867218017578125, -0.178436279296875, -0.1701507568359375, -0.161865234375, -0.1535797119140625, -0.145294189453125, -0.1370086669921875, -0.12872314453125, -0.1204376220703125, -0.112152099609375, -0.1038665771484375, -0.0955810546875, -0.0872955322265625, -0.079010009765625, -0.0707244873046875, -0.06243896484375, -0.0541534423828125, -0.045867919921875, -0.0375823974609375, -0.029296875, -0.0210113525390625, -0.012725830078125, -0.0044403076171875, 0.00384521484375, 0.0121307373046875, 0.020416259765625, 0.0287017822265625, 0.0369873046875, 0.0452728271484375, 0.053558349609375, 0.0618438720703125, 0.07012939453125, 0.0784149169921875, 0.086700439453125, 0.0949859619140625, 0.103271484375, 0.1115570068359375, 0.119842529296875, 0.1281280517578125, 0.13641357421875, 0.1446990966796875, 0.152984619140625, 0.1612701416015625, 0.1695556640625, 0.1778411865234375, 0.186126708984375, 0.1944122314453125, 0.20269775390625, 0.2109832763671875, 0.219268798828125, 0.2275543212890625, 0.23583984375]}, "gradients/decoder.transformer.h.5.ln_cross_attn.weight": {"_type": "histogram", "values": [3.0, 7.0, 417.0, 573.0, 20.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00501313665881753, -0.003385726362466812, -0.0017583160661160946, -0.00013090576976537704, 0.0014965045265853405, 0.0031239143572747707, 0.004751325119286776, 0.0063787358812987804, 0.008006146177649498, 0.009633556008338928, 0.011260966770350933, 0.012888377532362938, 0.014515787363052368, 0.0161431971937418, 0.01777060702443123, 0.019398018717765808, 0.02102542854845524, 0.02265283837914467, 0.024280250072479248, 0.02590765990316868, 0.02753506973385811, 0.02916247956454754, 0.03078988939523697, 0.03241730108857155, 0.03404470905661583, 0.03567212074995041, 0.03729952871799469, 0.03892694041132927, 0.04055435210466385, 0.04218176007270813, 0.04380917176604271, 0.04543658345937729, 0.04706399142742157, 0.04869140312075615, 0.05031881108880043, 0.05194622278213501, 0.05357363075017929, 0.05520104244351387, 0.05682845413684845, 0.05845586210489273, 0.06008327379822731, 0.06171068549156189, 0.06333809345960617, 0.06496550142765045, 0.06659291684627533, 0.06822032481431961, 0.06984773278236389, 0.07147514820098877, 0.07310255616903305, 0.07472996413707733, 0.07635737955570221, 0.07798478752374649, 0.07961219549179077, 0.08123961091041565, 0.08286701887845993, 0.08449442684650421, 0.08612184226512909, 0.08774925023317337, 0.08937666565179825, 0.09100407361984253, 0.09263148158788681, 0.09425888955593109, 0.09588630497455597, 0.09751371294260025, 0.09914112091064453]}, "gradients/decoder.transformer.h.5.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 3.0, 3.0, 5.0, 7.0, 5.0, 11.0, 11.0, 9.0, 10.0, 6.0, 14.0, 17.0, 18.0, 18.0, 24.0, 22.0, 27.0, 21.0, 25.0, 20.0, 39.0, 30.0, 47.0, 43.0, 30.0, 36.0, 35.0, 33.0, 35.0, 30.0, 31.0, 29.0, 42.0, 36.0, 36.0, 23.0, 26.0, 17.0, 26.0, 17.0, 16.0, 15.0, 14.0, 6.0, 11.0, 9.0, 7.0, 1.0, 2.0, 4.0, 3.0, 3.0, 4.0, 0.0, 2.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.0043978095054626465, -0.004244734533131123, -0.004091659560799599, -0.003938584588468075, -0.003785509616136551, -0.003632434643805027, -0.003479359671473503, -0.0033262846991419792, -0.0031732097268104553, -0.0030201347544789314, -0.0028670597821474075, -0.0027139848098158836, -0.0025609098374843597, -0.002407834865152836, -0.002254759892821312, -0.002101684920489788, -0.0019486099481582642, -0.0017955349758267403, -0.0016424600034952164, -0.0014893850311636925, -0.0013363100588321686, -0.0011832350865006447, -0.0010301601141691208, -0.0008770851418375969, -0.000724010169506073, -0.0005709351971745491, -0.0004178602248430252, -0.0002647852525115013, -0.00011171028017997742, 4.136469215154648e-05, 0.00019443966448307037, 0.00034751463681459427, 0.0005005896091461182, 0.0006536645814776421, 0.000806739553809166, 0.0009598145261406898, 0.0011128894984722137, 0.0012659644708037376, 0.0014190394431352615, 0.0015721144154667854, 0.0017251893877983093, 0.0018782643601298332, 0.002031339332461357, 0.002184414304792881, 0.002337489277124405, 0.002490564249455929, 0.0026436392217874527, 0.0027967141941189766, 0.0029497891664505005, 0.0031028641387820244, 0.0032559391111135483, 0.003409014083445072, 0.003562089055776596, 0.00371516402810812, 0.003868239000439644, 0.004021313972771168, 0.004174388945102692, 0.0043274639174342155, 0.0044805388897657394, 0.004633613862097263, 0.004786688834428787, 0.004939763806760311, 0.005092838779091835, 0.005245913751423359, 0.005398988723754883]}, "gradients/decoder.transformer.h.5.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 4.0, 3.0, 6.0, 5.0, 9.0, 8.0, 9.0, 12.0, 27.0, 11.0, 23.0, 23.0, 34.0, 33.0, 33.0, 21.0, 45.0, 52.0, 34.0, 46.0, 54.0, 46.0, 56.0, 48.0, 40.0, 33.0, 40.0, 34.0, 40.0, 32.0, 28.0, 29.0, 19.0, 15.0, 15.0, 17.0, 5.0, 13.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.5234375, -13.104248046875, -12.68505859375, -12.265869140625, -11.8466796875, -11.427490234375, -11.00830078125, -10.589111328125, -10.169921875, -9.750732421875, -9.33154296875, -8.912353515625, -8.4931640625, -8.073974609375, -7.65478515625, -7.235595703125, -6.81640625, -6.397216796875, -5.97802734375, -5.558837890625, -5.1396484375, -4.720458984375, -4.30126953125, -3.882080078125, -3.462890625, -3.043701171875, -2.62451171875, -2.205322265625, -1.7861328125, -1.366943359375, -0.94775390625, -0.528564453125, -0.109375, 0.309814453125, 0.72900390625, 1.148193359375, 1.5673828125, 1.986572265625, 2.40576171875, 2.824951171875, 3.244140625, 3.663330078125, 4.08251953125, 4.501708984375, 4.9208984375, 5.340087890625, 5.75927734375, 6.178466796875, 6.59765625, 7.016845703125, 7.43603515625, 7.855224609375, 8.2744140625, 8.693603515625, 9.11279296875, 9.531982421875, 9.951171875, 10.370361328125, 10.78955078125, 11.208740234375, 11.6279296875, 12.047119140625, 12.46630859375, 12.885498046875, 13.3046875]}, "gradients/decoder.transformer.h.5.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 5.0, 8.0, 11.0, 17.0, 15.0, 30.0, 39.0, 55.0, 45.0, 89.0, 112.0, 204.0, 295.0, 550.0, 1162.0, 2815.0, 7676.0, 24215.0, 89056.0, 340440.0, 424559.0, 111456.0, 30306.0, 9159.0, 3237.0, 1381.0, 597.0, 367.0, 201.0, 128.0, 92.0, 75.0, 44.0, 36.0, 32.0, 13.0, 15.0, 8.0, 9.0, 0.0, 4.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.65625, -17.10595703125, -16.5556640625, -16.00537109375, -15.455078125, -14.90478515625, -14.3544921875, -13.80419921875, -13.25390625, -12.70361328125, -12.1533203125, -11.60302734375, -11.052734375, -10.50244140625, -9.9521484375, -9.40185546875, -8.8515625, -8.30126953125, -7.7509765625, -7.20068359375, -6.650390625, -6.10009765625, -5.5498046875, -4.99951171875, -4.44921875, -3.89892578125, -3.3486328125, -2.79833984375, -2.248046875, -1.69775390625, -1.1474609375, -0.59716796875, -0.046875, 0.50341796875, 1.0537109375, 1.60400390625, 2.154296875, 2.70458984375, 3.2548828125, 3.80517578125, 4.35546875, 4.90576171875, 5.4560546875, 6.00634765625, 6.556640625, 7.10693359375, 7.6572265625, 8.20751953125, 8.7578125, 9.30810546875, 9.8583984375, 10.40869140625, 10.958984375, 11.50927734375, 12.0595703125, 12.60986328125, 13.16015625, 13.71044921875, 14.2607421875, 14.81103515625, 15.361328125, 15.91162109375, 16.4619140625, 17.01220703125, 17.5625]}, "gradients/decoder.transformer.h.5.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 4.0, 1.0, 5.0, 6.0, 9.0, 7.0, 10.0, 13.0, 7.0, 15.0, 11.0, 22.0, 28.0, 26.0, 27.0, 31.0, 40.0, 34.0, 45.0, 55.0, 69.0, 96.0, 186.0, 1464.0, 229.0, 104.0, 95.0, 52.0, 38.0, 45.0, 37.0, 42.0, 31.0, 15.0, 32.0, 24.0, 18.0, 19.0, 13.0, 12.0, 8.0, 8.0, 3.0, 4.0, 2.0, 5.0, 5.0, 0.0, 2.0, 3.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.859375, -24.888427734375, -23.91748046875, -22.946533203125, -21.9755859375, -21.004638671875, -20.03369140625, -19.062744140625, -18.091796875, -17.120849609375, -16.14990234375, -15.178955078125, -14.2080078125, -13.237060546875, -12.26611328125, -11.295166015625, -10.32421875, -9.353271484375, -8.38232421875, -7.411376953125, -6.4404296875, -5.469482421875, -4.49853515625, -3.527587890625, -2.556640625, -1.585693359375, -0.61474609375, 0.356201171875, 1.3271484375, 2.298095703125, 3.26904296875, 4.239990234375, 5.2109375, 6.181884765625, 7.15283203125, 8.123779296875, 9.0947265625, 10.065673828125, 11.03662109375, 12.007568359375, 12.978515625, 13.949462890625, 14.92041015625, 15.891357421875, 16.8623046875, 17.833251953125, 18.80419921875, 19.775146484375, 20.74609375, 21.717041015625, 22.68798828125, 23.658935546875, 24.6298828125, 25.600830078125, 26.57177734375, 27.542724609375, 28.513671875, 29.484619140625, 30.45556640625, 31.426513671875, 32.3974609375, 33.368408203125, 34.33935546875, 35.310302734375, 36.28125]}, "gradients/decoder.transformer.h.5.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 5.0, 6.0, 4.0, 10.0, 16.0, 21.0, 21.0, 30.0, 39.0, 62.0, 114.0, 165.0, 229.0, 421.0, 1062.0, 13566.0, 2620681.0, 502356.0, 5254.0, 727.0, 306.0, 204.0, 128.0, 87.0, 67.0, 46.0, 28.0, 20.0, 15.0, 11.0, 8.0, 2.0, 2.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-42.875, -40.8203125, -38.765625, -36.7109375, -34.65625, -32.6015625, -30.546875, -28.4921875, -26.4375, -24.3828125, -22.328125, -20.2734375, -18.21875, -16.1640625, -14.109375, -12.0546875, -10.0, -7.9453125, -5.890625, -3.8359375, -1.78125, 0.2734375, 2.328125, 4.3828125, 6.4375, 8.4921875, 10.546875, 12.6015625, 14.65625, 16.7109375, 18.765625, 20.8203125, 22.875, 24.9296875, 26.984375, 29.0390625, 31.09375, 33.1484375, 35.203125, 37.2578125, 39.3125, 41.3671875, 43.421875, 45.4765625, 47.53125, 49.5859375, 51.640625, 53.6953125, 55.75, 57.8046875, 59.859375, 61.9140625, 63.96875, 66.0234375, 68.078125, 70.1328125, 72.1875, 74.2421875, 76.296875, 78.3515625, 80.40625, 82.4609375, 84.515625, 86.5703125, 88.625]}, "gradients/decoder.transformer.h.5.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 31.0, 409.0, 526.0, 46.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0], "bins": [-452.2023010253906, -444.0010986328125, -435.79986572265625, -427.5986633300781, -419.3974304199219, -411.19622802734375, -402.9949951171875, -394.7937927246094, -386.59259033203125, -378.3913879394531, -370.1901550292969, -361.98895263671875, -353.7877197265625, -345.5865173339844, -337.3852844238281, -329.18408203125, -320.98284912109375, -312.7816467285156, -304.5804138183594, -296.37921142578125, -288.177978515625, -279.9767761230469, -271.7755432128906, -263.5743408203125, -255.3731231689453, -247.17190551757812, -238.97068786621094, -230.76947021484375, -222.56826782226562, -214.36703491210938, -206.16583251953125, -197.96461486816406, -189.76341247558594, -181.56219482421875, -173.36097717285156, -165.15975952148438, -156.95855712890625, -148.75732421875, -140.55612182617188, -132.3549041748047, -124.1536865234375, -115.95246887207031, -107.75125122070312, -99.55004119873047, -91.34882354736328, -83.1476058959961, -74.94639587402344, -66.74517822265625, -58.54396057128906, -50.342742919921875, -42.14152908325195, -33.94031524658203, -25.739097595214844, -17.537879943847656, -9.336666107177734, -1.1354522705078125, 7.065765380859375, 15.26698112487793, 23.468196868896484, 31.66941261291504, 39.870628356933594, 48.07184600830078, 56.2730598449707, 64.47427368164062, 72.67549133300781]}, "gradients/decoder.transformer.h.5.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 3.0, 2.0, 4.0, 1.0, 8.0, 8.0, 2.0, 11.0, 8.0, 13.0, 17.0, 9.0, 15.0, 16.0, 21.0, 22.0, 23.0, 25.0, 41.0, 33.0, 35.0, 20.0, 39.0, 41.0, 32.0, 39.0, 35.0, 28.0, 30.0, 53.0, 34.0, 43.0, 34.0, 29.0, 23.0, 30.0, 25.0, 24.0, 20.0, 17.0, 16.0, 22.0, 11.0, 11.0, 4.0, 10.0, 5.0, 5.0, 4.0, 1.0, 3.0, 2.0, 4.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-78.55891418457031, -76.28256225585938, -74.00621032714844, -71.7298583984375, -69.4535140991211, -67.17716217041016, -64.90081024169922, -62.62445831298828, -60.348106384277344, -58.071754455566406, -55.795406341552734, -53.5190544128418, -51.24270248413086, -48.96635437011719, -46.69000244140625, -44.41365051269531, -42.13730239868164, -39.8609504699707, -37.58460235595703, -35.308250427246094, -33.031898498535156, -30.75554847717285, -28.479198455810547, -26.20284652709961, -23.926496505737305, -21.650146484375, -19.373794555664062, -17.097444534301758, -14.821093559265137, -12.544742584228516, -10.268392562866211, -7.99204158782959, -5.715690612792969, -3.4393398761749268, -1.1629891395568848, 1.1133613586425781, 3.389712333679199, 5.66606330871582, 7.942413330078125, 10.218764305114746, 12.495115280151367, 14.771466255187988, 17.04781723022461, 19.324167251586914, 21.60051727294922, 23.876869201660156, 26.15321922302246, 28.429569244384766, 30.705921173095703, 32.98227310180664, 35.25862121582031, 37.53497314453125, 39.81132507324219, 42.087677001953125, 44.3640251159668, 46.640377044677734, 48.916725158691406, 51.193077087402344, 53.469425201416016, 55.74577713012695, 58.02212905883789, 60.29847717285156, 62.5748291015625, 64.85118103027344, 67.12753295898438]}, "gradients/decoder.transformer.h.4.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 1.0, 0.0, 4.0, 6.0, 6.0, 6.0, 8.0, 7.0, 13.0, 19.0, 22.0, 11.0, 22.0, 28.0, 30.0, 34.0, 25.0, 41.0, 33.0, 47.0, 48.0, 46.0, 58.0, 36.0, 47.0, 39.0, 54.0, 40.0, 45.0, 24.0, 35.0, 28.0, 30.0, 26.0, 16.0, 15.0, 11.0, 14.0, 13.0, 7.0, 4.0, 8.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-13.0703125, -12.6605224609375, -12.250732421875, -11.8409423828125, -11.43115234375, -11.0213623046875, -10.611572265625, -10.2017822265625, -9.7919921875, -9.3822021484375, -8.972412109375, -8.5626220703125, -8.15283203125, -7.7430419921875, -7.333251953125, -6.9234619140625, -6.513671875, -6.1038818359375, -5.694091796875, -5.2843017578125, -4.87451171875, -4.4647216796875, -4.054931640625, -3.6451416015625, -3.2353515625, -2.8255615234375, -2.415771484375, -2.0059814453125, -1.59619140625, -1.1864013671875, -0.776611328125, -0.3668212890625, 0.04296875, 0.4527587890625, 0.862548828125, 1.2723388671875, 1.68212890625, 2.0919189453125, 2.501708984375, 2.9114990234375, 3.3212890625, 3.7310791015625, 4.140869140625, 4.5506591796875, 4.96044921875, 5.3702392578125, 5.780029296875, 6.1898193359375, 6.599609375, 7.0093994140625, 7.419189453125, 7.8289794921875, 8.23876953125, 8.6485595703125, 9.058349609375, 9.4681396484375, 9.8779296875, 10.2877197265625, 10.697509765625, 11.1072998046875, 11.51708984375, 11.9268798828125, 12.336669921875, 12.7464599609375, 13.15625]}, "gradients/decoder.transformer.h.4.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 5.0, 4.0, 5.0, 6.0, 9.0, 13.0, 7.0, 11.0, 20.0, 16.0, 22.0, 24.0, 23.0, 35.0, 49.0, 86.0, 167.0, 391.0, 1136.0, 4761.0, 31457.0, 534015.0, 3112368.0, 475189.0, 28271.0, 4304.0, 1052.0, 364.0, 154.0, 79.0, 55.0, 27.0, 26.0, 18.0, 22.0, 20.0, 16.0, 12.0, 9.0, 4.0, 14.0, 5.0, 3.0, 5.0, 3.0, 2.0, 2.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-29.296875, -28.335693359375, -27.37451171875, -26.413330078125, -25.4521484375, -24.490966796875, -23.52978515625, -22.568603515625, -21.607421875, -20.646240234375, -19.68505859375, -18.723876953125, -17.7626953125, -16.801513671875, -15.84033203125, -14.879150390625, -13.91796875, -12.956787109375, -11.99560546875, -11.034423828125, -10.0732421875, -9.112060546875, -8.15087890625, -7.189697265625, -6.228515625, -5.267333984375, -4.30615234375, -3.344970703125, -2.3837890625, -1.422607421875, -0.46142578125, 0.499755859375, 1.4609375, 2.422119140625, 3.38330078125, 4.344482421875, 5.3056640625, 6.266845703125, 7.22802734375, 8.189208984375, 9.150390625, 10.111572265625, 11.07275390625, 12.033935546875, 12.9951171875, 13.956298828125, 14.91748046875, 15.878662109375, 16.83984375, 17.801025390625, 18.76220703125, 19.723388671875, 20.6845703125, 21.645751953125, 22.60693359375, 23.568115234375, 24.529296875, 25.490478515625, 26.45166015625, 27.412841796875, 28.3740234375, 29.335205078125, 30.29638671875, 31.257568359375, 32.21875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 7.0, 5.0, 7.0, 11.0, 23.0, 34.0, 31.0, 44.0, 64.0, 89.0, 124.0, 195.0, 308.0, 417.0, 500.0, 532.0, 472.0, 328.0, 258.0, 150.0, 129.0, 77.0, 65.0, 49.0, 44.0, 28.0, 21.0, 10.0, 7.0, 10.0, 8.0, 10.0, 4.0, 2.0, 3.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-15.9765625, -15.4476318359375, -14.918701171875, -14.3897705078125, -13.86083984375, -13.3319091796875, -12.802978515625, -12.2740478515625, -11.7451171875, -11.2161865234375, -10.687255859375, -10.1583251953125, -9.62939453125, -9.1004638671875, -8.571533203125, -8.0426025390625, -7.513671875, -6.9847412109375, -6.455810546875, -5.9268798828125, -5.39794921875, -4.8690185546875, -4.340087890625, -3.8111572265625, -3.2822265625, -2.7532958984375, -2.224365234375, -1.6954345703125, -1.16650390625, -0.6375732421875, -0.108642578125, 0.4202880859375, 0.94921875, 1.4781494140625, 2.007080078125, 2.5360107421875, 3.06494140625, 3.5938720703125, 4.122802734375, 4.6517333984375, 5.1806640625, 5.7095947265625, 6.238525390625, 6.7674560546875, 7.29638671875, 7.8253173828125, 8.354248046875, 8.8831787109375, 9.412109375, 9.9410400390625, 10.469970703125, 10.9989013671875, 11.52783203125, 12.0567626953125, 12.585693359375, 13.1146240234375, 13.6435546875, 14.1724853515625, 14.701416015625, 15.2303466796875, 15.75927734375, 16.2882080078125, 16.817138671875, 17.3460693359375, 17.875]}, "gradients/decoder.transformer.h.4.mlp.c_fc.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 1.0, 2.0, 2.0, 8.0, 12.0, 13.0, 15.0, 17.0, 17.0, 29.0, 39.0, 55.0, 75.0, 134.0, 225.0, 462.0, 1266.0, 4553.0, 27844.0, 311414.0, 3406971.0, 399107.0, 34147.0, 5408.0, 1374.0, 488.0, 215.0, 126.0, 70.0, 49.0, 46.0, 26.0, 18.0, 8.0, 9.0, 10.0, 7.0, 7.0, 5.0, 3.0, 7.0, 0.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-32.34375, -31.21044921875, -30.0771484375, -28.94384765625, -27.810546875, -26.67724609375, -25.5439453125, -24.41064453125, -23.27734375, -22.14404296875, -21.0107421875, -19.87744140625, -18.744140625, -17.61083984375, -16.4775390625, -15.34423828125, -14.2109375, -13.07763671875, -11.9443359375, -10.81103515625, -9.677734375, -8.54443359375, -7.4111328125, -6.27783203125, -5.14453125, -4.01123046875, -2.8779296875, -1.74462890625, -0.611328125, 0.52197265625, 1.6552734375, 2.78857421875, 3.921875, 5.05517578125, 6.1884765625, 7.32177734375, 8.455078125, 9.58837890625, 10.7216796875, 11.85498046875, 12.98828125, 14.12158203125, 15.2548828125, 16.38818359375, 17.521484375, 18.65478515625, 19.7880859375, 20.92138671875, 22.0546875, 23.18798828125, 24.3212890625, 25.45458984375, 26.587890625, 27.72119140625, 28.8544921875, 29.98779296875, 31.12109375, 32.25439453125, 33.3876953125, 34.52099609375, 35.654296875, 36.78759765625, 37.9208984375, 39.05419921875, 40.1875]}, "gradients/decoder.transformer.h.4.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 6.0, 290.0, 695.0, 29.0], "bins": [-1067.7012939453125, -1050.521728515625, -1033.342041015625, -1016.1624755859375, -998.9828491210938, -981.8032836914062, -964.6236572265625, -947.4440307617188, -930.2644653320312, -913.0848388671875, -895.9052734375, -878.7256469726562, -861.5460205078125, -844.366455078125, -827.1868286132812, -810.0072021484375, -792.82763671875, -775.6480102539062, -758.4684448242188, -741.288818359375, -724.1091918945312, -706.9296264648438, -689.75, -672.5703735351562, -655.3907470703125, -638.2111206054688, -621.0315551757812, -603.8519287109375, -586.6723022460938, -569.4927368164062, -552.3131103515625, -535.1334838867188, -517.953857421875, -500.7742614746094, -483.5946350097656, -466.4150390625, -449.2354431152344, -432.05584716796875, -414.876220703125, -397.6966247558594, -380.51702880859375, -363.3374328613281, -346.1578063964844, -328.97821044921875, -311.7986145019531, -294.6190185546875, -277.43939208984375, -260.2597961425781, -243.08016967773438, -225.9005584716797, -208.72096252441406, -191.54135131835938, -174.36175537109375, -157.18214416503906, -140.00253295898438, -122.82292938232422, -105.6433334350586, -88.46372985839844, -71.28411865234375, -54.104515075683594, -36.92491149902344, -19.74530792236328, -2.5656967163085938, 14.613906860351562, 31.79351043701172]}, "gradients/decoder.transformer.h.4.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 4.0, 1.0, 6.0, 10.0, 4.0, 9.0, 13.0, 6.0, 12.0, 21.0, 20.0, 21.0, 24.0, 31.0, 23.0, 36.0, 38.0, 19.0, 35.0, 38.0, 41.0, 42.0, 48.0, 42.0, 44.0, 41.0, 33.0, 38.0, 38.0, 32.0, 32.0, 26.0, 25.0, 23.0, 22.0, 20.0, 13.0, 14.0, 12.0, 12.0, 9.0, 7.0, 7.0, 7.0, 1.0, 2.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-59.52099609375, -57.7048225402832, -55.888648986816406, -54.07247543334961, -52.25630187988281, -50.440128326416016, -48.62395477294922, -46.807777404785156, -44.991607666015625, -43.17543411254883, -41.35926055908203, -39.543087005615234, -37.72691345214844, -35.91073989868164, -34.094566345214844, -32.27838897705078, -30.462215423583984, -28.646041870117188, -26.82986831665039, -25.013694763183594, -23.197521209716797, -21.38134765625, -19.56517219543457, -17.748998641967773, -15.932825088500977, -14.11665153503418, -12.300477981567383, -10.48430347442627, -8.668129920959473, -6.851956367492676, -5.0357818603515625, -3.2196083068847656, -1.4034347534179688, 0.4127390384674072, 2.228912830352783, 4.045086860656738, 5.861260414123535, 7.677433967590332, 9.493608474731445, 11.309782028198242, 13.125955581665039, 14.942129135131836, 16.758302688598633, 18.574478149414062, 20.39065170288086, 22.206825256347656, 24.022998809814453, 25.83917236328125, 27.655345916748047, 29.471519470214844, 31.28769302368164, 33.10386657714844, 34.920040130615234, 36.73621368408203, 38.552391052246094, 40.368560791015625, 42.18473815917969, 44.000911712646484, 45.81708526611328, 47.63325881958008, 49.449432373046875, 51.26560592651367, 53.08177947998047, 54.89795684814453, 56.71412658691406]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 4.0, 10.0, 13.0, 9.0, 16.0, 15.0, 16.0, 24.0, 24.0, 24.0, 45.0, 30.0, 35.0, 42.0, 38.0, 38.0, 42.0, 39.0, 50.0, 43.0, 45.0, 44.0, 38.0, 40.0, 32.0, 40.0, 27.0, 26.0, 21.0, 23.0, 20.0, 26.0, 13.0, 13.0, 15.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.140625, -11.7418212890625, -11.343017578125, -10.9442138671875, -10.54541015625, -10.1466064453125, -9.747802734375, -9.3489990234375, -8.9501953125, -8.5513916015625, -8.152587890625, -7.7537841796875, -7.35498046875, -6.9561767578125, -6.557373046875, -6.1585693359375, -5.759765625, -5.3609619140625, -4.962158203125, -4.5633544921875, -4.16455078125, -3.7657470703125, -3.366943359375, -2.9681396484375, -2.5693359375, -2.1705322265625, -1.771728515625, -1.3729248046875, -0.97412109375, -0.5753173828125, -0.176513671875, 0.2222900390625, 0.62109375, 1.0198974609375, 1.418701171875, 1.8175048828125, 2.21630859375, 2.6151123046875, 3.013916015625, 3.4127197265625, 3.8115234375, 4.2103271484375, 4.609130859375, 5.0079345703125, 5.40673828125, 5.8055419921875, 6.204345703125, 6.6031494140625, 7.001953125, 7.4007568359375, 7.799560546875, 8.1983642578125, 8.59716796875, 8.9959716796875, 9.394775390625, 9.7935791015625, 10.1923828125, 10.5911865234375, 10.989990234375, 11.3887939453125, 11.78759765625, 12.1864013671875, 12.585205078125, 12.9840087890625, 13.3828125]}, "gradients/decoder.transformer.h.4.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 14.0, 15.0, 25.0, 36.0, 70.0, 92.0, 134.0, 179.0, 318.0, 419.0, 651.0, 1065.0, 1551.0, 2408.0, 3892.0, 6055.0, 9371.0, 15368.0, 24339.0, 39034.0, 63615.0, 104891.0, 161428.0, 195916.0, 156025.0, 100037.0, 61008.0, 37372.0, 23185.0, 14615.0, 9423.0, 5738.0, 3576.0, 2358.0, 1516.0, 988.0, 606.0, 411.0, 266.0, 188.0, 118.0, 80.0, 54.0, 37.0, 24.0, 17.0, 5.0, 8.0, 7.0, 5.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.0400390625, -1.0069732666015625, -0.973907470703125, -0.9408416748046875, -0.90777587890625, -0.8747100830078125, -0.841644287109375, -0.8085784912109375, -0.7755126953125, -0.7424468994140625, -0.709381103515625, -0.6763153076171875, -0.64324951171875, -0.6101837158203125, -0.577117919921875, -0.5440521240234375, -0.510986328125, -0.4779205322265625, -0.444854736328125, -0.4117889404296875, -0.37872314453125, -0.3456573486328125, -0.312591552734375, -0.2795257568359375, -0.2464599609375, -0.2133941650390625, -0.180328369140625, -0.1472625732421875, -0.11419677734375, -0.0811309814453125, -0.048065185546875, -0.0149993896484375, 0.01806640625, 0.0511322021484375, 0.084197998046875, 0.1172637939453125, 0.15032958984375, 0.1833953857421875, 0.216461181640625, 0.2495269775390625, 0.2825927734375, 0.3156585693359375, 0.348724365234375, 0.3817901611328125, 0.41485595703125, 0.4479217529296875, 0.480987548828125, 0.5140533447265625, 0.547119140625, 0.5801849365234375, 0.613250732421875, 0.6463165283203125, 0.67938232421875, 0.7124481201171875, 0.745513916015625, 0.7785797119140625, 0.8116455078125, 0.8447113037109375, 0.877777099609375, 0.9108428955078125, 0.94390869140625, 0.9769744873046875, 1.010040283203125, 1.0431060791015625, 1.076171875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 0.0, 2.0, 4.0, 2.0, 3.0, 6.0, 6.0, 8.0, 11.0, 18.0, 15.0, 17.0, 11.0, 12.0, 22.0, 25.0, 21.0, 34.0, 27.0, 29.0, 37.0, 44.0, 48.0, 40.0, 44.0, 37.0, 1064.0, 39.0, 37.0, 42.0, 39.0, 27.0, 31.0, 28.0, 19.0, 30.0, 20.0, 23.0, 17.0, 17.0, 19.0, 12.0, 15.0, 6.0, 8.0, 5.0, 5.0, 0.0, 4.0, 4.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0], "bins": [-7.86328125, -7.63232421875, -7.4013671875, -7.17041015625, -6.939453125, -6.70849609375, -6.4775390625, -6.24658203125, -6.015625, -5.78466796875, -5.5537109375, -5.32275390625, -5.091796875, -4.86083984375, -4.6298828125, -4.39892578125, -4.16796875, -3.93701171875, -3.7060546875, -3.47509765625, -3.244140625, -3.01318359375, -2.7822265625, -2.55126953125, -2.3203125, -2.08935546875, -1.8583984375, -1.62744140625, -1.396484375, -1.16552734375, -0.9345703125, -0.70361328125, -0.47265625, -0.24169921875, -0.0107421875, 0.22021484375, 0.451171875, 0.68212890625, 0.9130859375, 1.14404296875, 1.375, 1.60595703125, 1.8369140625, 2.06787109375, 2.298828125, 2.52978515625, 2.7607421875, 2.99169921875, 3.22265625, 3.45361328125, 3.6845703125, 3.91552734375, 4.146484375, 4.37744140625, 4.6083984375, 4.83935546875, 5.0703125, 5.30126953125, 5.5322265625, 5.76318359375, 5.994140625, 6.22509765625, 6.4560546875, 6.68701171875, 6.91796875]}, "gradients/decoder.transformer.h.4.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 1.0, 2.0, 8.0, 15.0, 14.0, 25.0, 25.0, 41.0, 78.0, 104.0, 165.0, 238.0, 325.0, 483.0, 841.0, 1258.0, 1855.0, 2712.0, 4128.0, 6449.0, 9906.0, 15792.0, 24065.0, 37856.0, 58073.0, 88034.0, 126928.0, 1139284.0, 222834.0, 120002.0, 82876.0, 54205.0, 35125.0, 22138.0, 14503.0, 9368.0, 6023.0, 3895.0, 2559.0, 1630.0, 1101.0, 701.0, 520.0, 302.0, 213.0, 150.0, 96.0, 70.0, 44.0, 29.0, 21.0, 9.0, 8.0, 5.0, 7.0, 5.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.75048828125, -0.7269744873046875, -0.703460693359375, -0.6799468994140625, -0.65643310546875, -0.6329193115234375, -0.609405517578125, -0.5858917236328125, -0.5623779296875, -0.5388641357421875, -0.515350341796875, -0.4918365478515625, -0.46832275390625, -0.4448089599609375, -0.421295166015625, -0.3977813720703125, -0.374267578125, -0.3507537841796875, -0.327239990234375, -0.3037261962890625, -0.28021240234375, -0.2566986083984375, -0.233184814453125, -0.2096710205078125, -0.1861572265625, -0.1626434326171875, -0.139129638671875, -0.1156158447265625, -0.09210205078125, -0.0685882568359375, -0.045074462890625, -0.0215606689453125, 0.001953125, 0.0254669189453125, 0.048980712890625, 0.0724945068359375, 0.09600830078125, 0.1195220947265625, 0.143035888671875, 0.1665496826171875, 0.1900634765625, 0.2135772705078125, 0.237091064453125, 0.2606048583984375, 0.28411865234375, 0.3076324462890625, 0.331146240234375, 0.3546600341796875, 0.378173828125, 0.4016876220703125, 0.425201416015625, 0.4487152099609375, 0.47222900390625, 0.4957427978515625, 0.519256591796875, 0.5427703857421875, 0.5662841796875, 0.5897979736328125, 0.613311767578125, 0.6368255615234375, 0.66033935546875, 0.6838531494140625, 0.707366943359375, 0.7308807373046875, 0.75439453125]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 4.0, 2.0, 6.0, 4.0, 4.0, 6.0, 6.0, 8.0, 7.0, 4.0, 14.0, 12.0, 15.0, 18.0, 16.0, 25.0, 25.0, 23.0, 49.0, 48.0, 36.0, 54.0, 57.0, 56.0, 43.0, 78.0, 44.0, 42.0, 35.0, 35.0, 30.0, 27.0, 25.0, 28.0, 19.0, 9.0, 10.0, 10.0, 17.0, 10.0, 6.0, 5.0, 4.0, 8.0, 7.0, 3.0, 2.0, 6.0, 2.0, 2.0, 2.0, 2.0, 1.0, 0.0, 1.0], "bins": [-0.00629425048828125, -0.006106317043304443, -0.005918383598327637, -0.00573045015335083, -0.0055425167083740234, -0.005354583263397217, -0.00516664981842041, -0.0049787163734436035, -0.004790782928466797, -0.00460284948348999, -0.004414916038513184, -0.004226982593536377, -0.00403904914855957, -0.0038511157035827637, -0.003663182258605957, -0.0034752488136291504, -0.0032873153686523438, -0.003099381923675537, -0.0029114484786987305, -0.002723515033721924, -0.002535581588745117, -0.0023476481437683105, -0.002159714698791504, -0.0019717812538146973, -0.0017838478088378906, -0.001595914363861084, -0.0014079809188842773, -0.0012200474739074707, -0.001032114028930664, -0.0008441805839538574, -0.0006562471389770508, -0.00046831369400024414, -0.0002803802490234375, -9.244680404663086e-05, 9.548664093017578e-05, 0.0002834200859069824, 0.00047135353088378906, 0.0006592869758605957, 0.0008472204208374023, 0.001035153865814209, 0.0012230873107910156, 0.0014110207557678223, 0.001598954200744629, 0.0017868876457214355, 0.001974821090698242, 0.002162754535675049, 0.0023506879806518555, 0.002538621425628662, 0.0027265548706054688, 0.0029144883155822754, 0.003102421760559082, 0.0032903552055358887, 0.0034782886505126953, 0.003666222095489502, 0.0038541555404663086, 0.004042088985443115, 0.004230022430419922, 0.0044179558753967285, 0.004605889320373535, 0.004793822765350342, 0.0049817562103271484, 0.005169689655303955, 0.005357623100280762, 0.005545556545257568, 0.005733489990234375]}, "gradients/decoder.transformer.h.4.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 5.0, 3.0, 2.0, 3.0, 10.0, 5.0, 5.0, 3.0, 11.0, 6.0, 10.0, 15.0, 16.0, 25.0, 20.0, 17.0, 25.0, 36.0, 45.0, 55.0, 77.0, 95.0, 147.0, 174.0, 291.0, 567.0, 3407.0, 421630.0, 615802.0, 4182.0, 660.0, 315.0, 189.0, 151.0, 122.0, 97.0, 77.0, 47.0, 27.0, 36.0, 15.0, 18.0, 18.0, 15.0, 16.0, 9.0, 8.0, 10.0, 13.0, 9.0, 3.0, 2.0, 5.0, 6.0, 3.0, 3.0, 2.0, 4.0, 2.0, 0.0, 2.0], "bins": [-0.11529541015625, -0.11158084869384766, -0.10786628723144531, -0.10415172576904297, -0.10043716430664062, -0.09672260284423828, -0.09300804138183594, -0.0892934799194336, -0.08557891845703125, -0.0818643569946289, -0.07814979553222656, -0.07443523406982422, -0.07072067260742188, -0.06700611114501953, -0.06329154968261719, -0.059576988220214844, -0.0558624267578125, -0.052147865295410156, -0.04843330383300781, -0.04471874237060547, -0.041004180908203125, -0.03728961944580078, -0.03357505798339844, -0.029860496520996094, -0.02614593505859375, -0.022431373596191406, -0.018716812133789062, -0.015002250671386719, -0.011287689208984375, -0.007573127746582031, -0.0038585662841796875, -0.00014400482177734375, 0.003570556640625, 0.007285118103027344, 0.010999679565429688, 0.014714241027832031, 0.018428802490234375, 0.02214336395263672, 0.025857925415039062, 0.029572486877441406, 0.03328704833984375, 0.037001609802246094, 0.04071617126464844, 0.04443073272705078, 0.048145294189453125, 0.05185985565185547, 0.05557441711425781, 0.059288978576660156, 0.0630035400390625, 0.06671810150146484, 0.07043266296386719, 0.07414722442626953, 0.07786178588867188, 0.08157634735107422, 0.08529090881347656, 0.0890054702758789, 0.09272003173828125, 0.0964345932006836, 0.10014915466308594, 0.10386371612548828, 0.10757827758789062, 0.11129283905029297, 0.11500740051269531, 0.11872196197509766, 0.1224365234375]}, "gradients/decoder.transformer.h.4.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 4.0, 134.0, 769.0, 109.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.008730384521186352, -0.007379175629466772, -0.006027966737747192, -0.004676757380366325, -0.0033255484886467457, -0.001974339596927166, -0.000623130239546299, 0.0007280781865119934, 0.0020792875438928604, 0.00343049643561244, 0.00478170532733202, 0.006132914684712887, 0.0074841235764324665, 0.008835332468152046, 0.010186541825532913, 0.011537750251591206, 0.012888959608972073, 0.01424016896635294, 0.015591377392411232, 0.0169425867497921, 0.018293796107172966, 0.019645005464553833, 0.02099621295928955, 0.022347422316670418, 0.023698631674051285, 0.025049841031432152, 0.02640105038881302, 0.027752257883548737, 0.029103467240929604, 0.03045467659831047, 0.03180588781833649, 0.033157095313072205, 0.03450830653309822, 0.03585951402783394, 0.037210725247859955, 0.03856193274259567, 0.03991314396262169, 0.04126435145735741, 0.04261556267738342, 0.04396677017211914, 0.04531797766685486, 0.046669185161590576, 0.04802039638161659, 0.04937160387635231, 0.050722815096378326, 0.052074022591114044, 0.05342523008584976, 0.05477644130587578, 0.056127652525901794, 0.05747886002063751, 0.05883007124066353, 0.060181278735399246, 0.06153248995542526, 0.06288369745016098, 0.0642349049448967, 0.06558611243963242, 0.06693731993436813, 0.06828852742910385, 0.06963973492383957, 0.07099094986915588, 0.0723421573638916, 0.07369336485862732, 0.07504457235336304, 0.07639577984809875, 0.07774699479341507]}, "gradients/decoder.transformer.h.4.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 7.0, 2.0, 3.0, 5.0, 3.0, 9.0, 15.0, 9.0, 13.0, 7.0, 17.0, 26.0, 31.0, 22.0, 31.0, 36.0, 30.0, 50.0, 43.0, 50.0, 41.0, 54.0, 47.0, 43.0, 50.0, 34.0, 41.0, 33.0, 31.0, 32.0, 29.0, 28.0, 26.0, 27.0, 11.0, 16.0, 11.0, 10.0, 12.0, 7.0, 6.0, 4.0, 3.0, 1.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.004168152809143066, -0.004037458449602127, -0.003906764090061188, -0.0037760697305202484, -0.003645375370979309, -0.0035146810114383698, -0.0033839866518974304, -0.003253292292356491, -0.0031225979328155518, -0.0029919035732746124, -0.002861209213733673, -0.0027305148541927338, -0.0025998204946517944, -0.002469126135110855, -0.0023384317755699158, -0.0022077374160289764, -0.002077043056488037, -0.0019463486969470978, -0.0018156543374061584, -0.0016849599778652191, -0.0015542656183242798, -0.0014235712587833405, -0.0012928768992424011, -0.0011621825397014618, -0.0010314881801605225, -0.0009007938206195831, -0.0007700994610786438, -0.0006394051015377045, -0.0005087107419967651, -0.0003780163824558258, -0.0002473220229148865, -0.00011662766337394714, 1.4066696166992188e-05, 0.00014476105570793152, 0.00027545541524887085, 0.0004061497747898102, 0.0005368441343307495, 0.0006675384938716888, 0.0007982328534126282, 0.0009289272129535675, 0.0010596215724945068, 0.0011903159320354462, 0.0013210102915763855, 0.0014517046511173248, 0.0015823990106582642, 0.0017130933701992035, 0.0018437877297401428, 0.001974482089281082, 0.0021051764488220215, 0.002235870808362961, 0.0023665651679039, 0.0024972595274448395, 0.002627953886985779, 0.002758648246526718, 0.0028893426060676575, 0.003020036965608597, 0.003150731325149536, 0.0032814256846904755, 0.003412120044231415, 0.003542814403772354, 0.0036735087633132935, 0.003804203122854233, 0.003934897482395172, 0.0040655918419361115, 0.004196286201477051]}, "gradients/decoder.transformer.h.4.attn.c_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 3.0, 1.0, 3.0, 4.0, 4.0, 10.0, 13.0, 10.0, 15.0, 15.0, 16.0, 24.0, 25.0, 23.0, 45.0, 31.0, 34.0, 43.0, 38.0, 40.0, 39.0, 39.0, 50.0, 45.0, 43.0, 44.0, 38.0, 40.0, 32.0, 40.0, 27.0, 26.0, 21.0, 23.0, 21.0, 25.0, 13.0, 13.0, 15.0, 5.0, 4.0, 1.0, 3.0, 2.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1328125, -11.734130859375, -11.33544921875, -10.936767578125, -10.5380859375, -10.139404296875, -9.74072265625, -9.342041015625, -8.943359375, -8.544677734375, -8.14599609375, -7.747314453125, -7.3486328125, -6.949951171875, -6.55126953125, -6.152587890625, -5.75390625, -5.355224609375, -4.95654296875, -4.557861328125, -4.1591796875, -3.760498046875, -3.36181640625, -2.963134765625, -2.564453125, -2.165771484375, -1.76708984375, -1.368408203125, -0.9697265625, -0.571044921875, -0.17236328125, 0.226318359375, 0.625, 1.023681640625, 1.42236328125, 1.821044921875, 2.2197265625, 2.618408203125, 3.01708984375, 3.415771484375, 3.814453125, 4.213134765625, 4.61181640625, 5.010498046875, 5.4091796875, 5.807861328125, 6.20654296875, 6.605224609375, 7.00390625, 7.402587890625, 7.80126953125, 8.199951171875, 8.5986328125, 8.997314453125, 9.39599609375, 9.794677734375, 10.193359375, 10.592041015625, 10.99072265625, 11.389404296875, 11.7880859375, 12.186767578125, 12.58544921875, 12.984130859375, 13.3828125]}, "gradients/decoder.transformer.h.4.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 1.0, 4.0, 6.0, 8.0, 7.0, 12.0, 21.0, 26.0, 43.0, 55.0, 88.0, 115.0, 165.0, 264.0, 435.0, 694.0, 1328.0, 2876.0, 7261.0, 20653.0, 62881.0, 202199.0, 447746.0, 203385.0, 63816.0, 20914.0, 7230.0, 3021.0, 1391.0, 690.0, 398.0, 255.0, 175.0, 125.0, 99.0, 46.0, 37.0, 25.0, 18.0, 15.0, 6.0, 14.0, 4.0, 6.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-17.140625, -16.6290283203125, -16.117431640625, -15.6058349609375, -15.09423828125, -14.5826416015625, -14.071044921875, -13.5594482421875, -13.0478515625, -12.5362548828125, -12.024658203125, -11.5130615234375, -11.00146484375, -10.4898681640625, -9.978271484375, -9.4666748046875, -8.955078125, -8.4434814453125, -7.931884765625, -7.4202880859375, -6.90869140625, -6.3970947265625, -5.885498046875, -5.3739013671875, -4.8623046875, -4.3507080078125, -3.839111328125, -3.3275146484375, -2.81591796875, -2.3043212890625, -1.792724609375, -1.2811279296875, -0.76953125, -0.2579345703125, 0.253662109375, 0.7652587890625, 1.27685546875, 1.7884521484375, 2.300048828125, 2.8116455078125, 3.3232421875, 3.8348388671875, 4.346435546875, 4.8580322265625, 5.36962890625, 5.8812255859375, 6.392822265625, 6.9044189453125, 7.416015625, 7.9276123046875, 8.439208984375, 8.9508056640625, 9.46240234375, 9.9739990234375, 10.485595703125, 10.9971923828125, 11.5087890625, 12.0203857421875, 12.531982421875, 13.0435791015625, 13.55517578125, 14.0667724609375, 14.578369140625, 15.0899658203125, 15.6015625]}, "gradients/decoder.transformer.h.4.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 4.0, 2.0, 6.0, 3.0, 8.0, 7.0, 8.0, 14.0, 18.0, 13.0, 20.0, 20.0, 29.0, 47.0, 28.0, 39.0, 46.0, 61.0, 63.0, 84.0, 166.0, 1450.0, 294.0, 168.0, 87.0, 60.0, 43.0, 51.0, 30.0, 31.0, 30.0, 19.0, 19.0, 13.0, 25.0, 13.0, 8.0, 4.0, 6.0, 8.0, 2.0, 2.0, 4.0, 2.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0], "bins": [-36.03125, -34.99853515625, -33.9658203125, -32.93310546875, -31.900390625, -30.86767578125, -29.8349609375, -28.80224609375, -27.76953125, -26.73681640625, -25.7041015625, -24.67138671875, -23.638671875, -22.60595703125, -21.5732421875, -20.54052734375, -19.5078125, -18.47509765625, -17.4423828125, -16.40966796875, -15.376953125, -14.34423828125, -13.3115234375, -12.27880859375, -11.24609375, -10.21337890625, -9.1806640625, -8.14794921875, -7.115234375, -6.08251953125, -5.0498046875, -4.01708984375, -2.984375, -1.95166015625, -0.9189453125, 0.11376953125, 1.146484375, 2.17919921875, 3.2119140625, 4.24462890625, 5.27734375, 6.31005859375, 7.3427734375, 8.37548828125, 9.408203125, 10.44091796875, 11.4736328125, 12.50634765625, 13.5390625, 14.57177734375, 15.6044921875, 16.63720703125, 17.669921875, 18.70263671875, 19.7353515625, 20.76806640625, 21.80078125, 22.83349609375, 23.8662109375, 24.89892578125, 25.931640625, 26.96435546875, 27.9970703125, 29.02978515625, 30.0625]}, "gradients/decoder.transformer.h.4.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 0.0, 4.0, 2.0, 7.0, 6.0, 5.0, 8.0, 11.0, 16.0, 18.0, 38.0, 36.0, 38.0, 68.0, 69.0, 90.0, 133.0, 174.0, 264.0, 489.0, 1159.0, 13021.0, 796338.0, 2307239.0, 23168.0, 1649.0, 519.0, 319.0, 207.0, 129.0, 121.0, 72.0, 67.0, 44.0, 43.0, 31.0, 28.0, 17.0, 13.0, 10.0, 11.0, 4.0, 9.0, 9.0, 2.0, 0.0, 4.0, 1.0, 2.0, 1.0, 0.0, 4.0, 0.0, 0.0, 2.0], "bins": [-49.75, -48.19970703125, -46.6494140625, -45.09912109375, -43.548828125, -41.99853515625, -40.4482421875, -38.89794921875, -37.34765625, -35.79736328125, -34.2470703125, -32.69677734375, -31.146484375, -29.59619140625, -28.0458984375, -26.49560546875, -24.9453125, -23.39501953125, -21.8447265625, -20.29443359375, -18.744140625, -17.19384765625, -15.6435546875, -14.09326171875, -12.54296875, -10.99267578125, -9.4423828125, -7.89208984375, -6.341796875, -4.79150390625, -3.2412109375, -1.69091796875, -0.140625, 1.40966796875, 2.9599609375, 4.51025390625, 6.060546875, 7.61083984375, 9.1611328125, 10.71142578125, 12.26171875, 13.81201171875, 15.3623046875, 16.91259765625, 18.462890625, 20.01318359375, 21.5634765625, 23.11376953125, 24.6640625, 26.21435546875, 27.7646484375, 29.31494140625, 30.865234375, 32.41552734375, 33.9658203125, 35.51611328125, 37.06640625, 38.61669921875, 40.1669921875, 41.71728515625, 43.267578125, 44.81787109375, 46.3681640625, 47.91845703125, 49.46875]}, "gradients/decoder.transformer.h.4.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 5.0, 415.0, 594.0, 6.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-146.52137756347656, -133.27561950683594, -120.02987670898438, -106.78411865234375, -93.53836822509766, -80.29261779785156, -67.04685974121094, -53.801109313964844, -40.55535888671875, -27.309606552124023, -14.063854217529297, -0.8180999755859375, 12.427650451660156, 25.67340087890625, 38.919158935546875, 52.16490936279297, 65.41065979003906, 78.65641021728516, 91.90216064453125, 105.14791870117188, 118.39366912841797, 131.63941955566406, 144.8851776123047, 158.13092041015625, 171.37667846679688, 184.6224365234375, 197.86817932128906, 211.1139373779297, 224.35968017578125, 237.60543823242188, 250.8511962890625, 264.0969543457031, 277.34271240234375, 290.5884704589844, 303.834228515625, 317.0799560546875, 330.3257141113281, 343.57147216796875, 356.8172302246094, 370.06298828125, 383.3087158203125, 396.5544738769531, 409.80023193359375, 423.04595947265625, 436.2917175292969, 449.5374755859375, 462.7832336425781, 476.02899169921875, 489.2747497558594, 502.5205078125, 515.7662353515625, 529.0120239257812, 542.2577514648438, 555.5035400390625, 568.749267578125, 581.9949951171875, 595.2407836914062, 608.4865112304688, 621.7322998046875, 634.97802734375, 648.2238159179688, 661.4695434570312, 674.71533203125, 687.9610595703125, 701.206787109375]}, "gradients/decoder.transformer.h.4.ln_1.bias": {"_type": "histogram", "values": [2.0, 3.0, 1.0, 3.0, 3.0, 1.0, 4.0, 2.0, 10.0, 6.0, 8.0, 3.0, 20.0, 12.0, 17.0, 20.0, 25.0, 16.0, 27.0, 25.0, 25.0, 32.0, 31.0, 45.0, 29.0, 58.0, 29.0, 52.0, 29.0, 31.0, 45.0, 46.0, 47.0, 28.0, 24.0, 28.0, 28.0, 30.0, 28.0, 24.0, 15.0, 15.0, 11.0, 20.0, 12.0, 11.0, 7.0, 7.0, 4.0, 8.0, 0.0, 6.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-58.77857971191406, -56.7213134765625, -54.66404724121094, -52.606781005859375, -50.54951477050781, -48.49224853515625, -46.43497848510742, -44.37771224975586, -42.3204460144043, -40.263179779052734, -38.20591354370117, -36.14864730834961, -34.09137725830078, -32.03411102294922, -29.976844787597656, -27.919578552246094, -25.86231231689453, -23.80504608154297, -21.747779846191406, -19.69051170349121, -17.63324546813965, -15.575979232788086, -13.518712043762207, -11.461444854736328, -9.404178619384766, -7.346911907196045, -5.289645195007324, -3.2323784828186035, -1.1751117706298828, 0.8821544647216797, 2.9394216537475586, 4.9966888427734375, 7.053962707519531, 9.111228942871094, 11.168496131896973, 13.225763320922852, 15.283029556274414, 17.340295791625977, 19.397563934326172, 21.454830169677734, 23.512096405029297, 25.56936264038086, 27.626628875732422, 29.683897018432617, 31.74116325378418, 33.798431396484375, 35.85569763183594, 37.9129638671875, 39.97023010253906, 42.027496337890625, 44.08476257324219, 46.14202880859375, 48.19929504394531, 50.256561279296875, 52.3138313293457, 54.371097564697266, 56.42836380004883, 58.48563003540039, 60.54289627075195, 62.600162506103516, 64.65743255615234, 66.7146987915039, 68.77196502685547, 70.82923126220703, 72.8864974975586]}, "gradients/decoder.transformer.h.3.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 6.0, 3.0, 5.0, 10.0, 8.0, 10.0, 10.0, 12.0, 12.0, 20.0, 24.0, 27.0, 19.0, 36.0, 31.0, 37.0, 42.0, 30.0, 46.0, 53.0, 35.0, 44.0, 37.0, 49.0, 39.0, 31.0, 40.0, 44.0, 26.0, 28.0, 29.0, 21.0, 29.0, 19.0, 22.0, 23.0, 11.0, 8.0, 8.0, 9.0, 3.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-12.71875, -12.3292236328125, -11.939697265625, -11.5501708984375, -11.16064453125, -10.7711181640625, -10.381591796875, -9.9920654296875, -9.6025390625, -9.2130126953125, -8.823486328125, -8.4339599609375, -8.04443359375, -7.6549072265625, -7.265380859375, -6.8758544921875, -6.486328125, -6.0968017578125, -5.707275390625, -5.3177490234375, -4.92822265625, -4.5386962890625, -4.149169921875, -3.7596435546875, -3.3701171875, -2.9805908203125, -2.591064453125, -2.2015380859375, -1.81201171875, -1.4224853515625, -1.032958984375, -0.6434326171875, -0.25390625, 0.1356201171875, 0.525146484375, 0.9146728515625, 1.30419921875, 1.6937255859375, 2.083251953125, 2.4727783203125, 2.8623046875, 3.2518310546875, 3.641357421875, 4.0308837890625, 4.42041015625, 4.8099365234375, 5.199462890625, 5.5889892578125, 5.978515625, 6.3680419921875, 6.757568359375, 7.1470947265625, 7.53662109375, 7.9261474609375, 8.315673828125, 8.7052001953125, 9.0947265625, 9.4842529296875, 9.873779296875, 10.2633056640625, 10.65283203125, 11.0423583984375, 11.431884765625, 11.8214111328125, 12.2109375]}, "gradients/decoder.transformer.h.3.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 5.0, 6.0, 5.0, 11.0, 12.0, 10.0, 14.0, 19.0, 23.0, 33.0, 32.0, 46.0, 54.0, 67.0, 104.0, 148.0, 206.0, 264.0, 329.0, 435.0, 1376.0, 4185589.0, 3527.0, 534.0, 343.0, 273.0, 218.0, 134.0, 113.0, 82.0, 55.0, 38.0, 41.0, 23.0, 25.0, 23.0, 15.0, 12.0, 7.0, 9.0, 8.0, 5.0, 3.0, 6.0, 1.0, 0.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-246.375, -238.322265625, -230.26953125, -222.216796875, -214.1640625, -206.111328125, -198.05859375, -190.005859375, -181.953125, -173.900390625, -165.84765625, -157.794921875, -149.7421875, -141.689453125, -133.63671875, -125.583984375, -117.53125, -109.478515625, -101.42578125, -93.373046875, -85.3203125, -77.267578125, -69.21484375, -61.162109375, -53.109375, -45.056640625, -37.00390625, -28.951171875, -20.8984375, -12.845703125, -4.79296875, 3.259765625, 11.3125, 19.365234375, 27.41796875, 35.470703125, 43.5234375, 51.576171875, 59.62890625, 67.681640625, 75.734375, 83.787109375, 91.83984375, 99.892578125, 107.9453125, 115.998046875, 124.05078125, 132.103515625, 140.15625, 148.208984375, 156.26171875, 164.314453125, 172.3671875, 180.419921875, 188.47265625, 196.525390625, 204.578125, 212.630859375, 220.68359375, 228.736328125, 236.7890625, 244.841796875, 252.89453125, 260.947265625, 269.0]}, "gradients/decoder.transformer.h.3.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 6.0, 9.0, 9.0, 10.0, 17.0, 8.0, 22.0, 17.0, 41.0, 50.0, 65.0, 85.0, 116.0, 174.0, 287.0, 412.0, 575.0, 649.0, 466.0, 310.0, 234.0, 143.0, 89.0, 76.0, 54.0, 34.0, 32.0, 15.0, 17.0, 19.0, 7.0, 4.0, 3.0, 7.0, 2.0, 5.0, 2.0, 4.0, 1.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-20.609375, -20.00634765625, -19.4033203125, -18.80029296875, -18.197265625, -17.59423828125, -16.9912109375, -16.38818359375, -15.78515625, -15.18212890625, -14.5791015625, -13.97607421875, -13.373046875, -12.77001953125, -12.1669921875, -11.56396484375, -10.9609375, -10.35791015625, -9.7548828125, -9.15185546875, -8.548828125, -7.94580078125, -7.3427734375, -6.73974609375, -6.13671875, -5.53369140625, -4.9306640625, -4.32763671875, -3.724609375, -3.12158203125, -2.5185546875, -1.91552734375, -1.3125, -0.70947265625, -0.1064453125, 0.49658203125, 1.099609375, 1.70263671875, 2.3056640625, 2.90869140625, 3.51171875, 4.11474609375, 4.7177734375, 5.32080078125, 5.923828125, 6.52685546875, 7.1298828125, 7.73291015625, 8.3359375, 8.93896484375, 9.5419921875, 10.14501953125, 10.748046875, 11.35107421875, 11.9541015625, 12.55712890625, 13.16015625, 13.76318359375, 14.3662109375, 14.96923828125, 15.572265625, 16.17529296875, 16.7783203125, 17.38134765625, 17.984375]}, "gradients/decoder.transformer.h.3.mlp.c_fc.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 3.0, 2.0, 3.0, 8.0, 6.0, 5.0, 6.0, 5.0, 11.0, 8.0, 18.0, 14.0, 30.0, 29.0, 31.0, 47.0, 53.0, 65.0, 106.0, 282.0, 3018.0, 3820361.0, 368362.0, 1228.0, 178.0, 88.0, 53.0, 62.0, 38.0, 25.0, 27.0, 22.0, 25.0, 17.0, 18.0, 10.0, 8.0, 7.0, 1.0, 5.0, 3.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-109.875, -105.626953125, -101.37890625, -97.130859375, -92.8828125, -88.634765625, -84.38671875, -80.138671875, -75.890625, -71.642578125, -67.39453125, -63.146484375, -58.8984375, -54.650390625, -50.40234375, -46.154296875, -41.90625, -37.658203125, -33.41015625, -29.162109375, -24.9140625, -20.666015625, -16.41796875, -12.169921875, -7.921875, -3.673828125, 0.57421875, 4.822265625, 9.0703125, 13.318359375, 17.56640625, 21.814453125, 26.0625, 30.310546875, 34.55859375, 38.806640625, 43.0546875, 47.302734375, 51.55078125, 55.798828125, 60.046875, 64.294921875, 68.54296875, 72.791015625, 77.0390625, 81.287109375, 85.53515625, 89.783203125, 94.03125, 98.279296875, 102.52734375, 106.775390625, 111.0234375, 115.271484375, 119.51953125, 123.767578125, 128.015625, 132.263671875, 136.51171875, 140.759765625, 145.0078125, 149.255859375, 153.50390625, 157.751953125, 162.0]}, "gradients/decoder.transformer.h.3.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 10.0, 213.0, 599.0, 182.0, 10.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-612.478515625, -601.6349487304688, -590.7913818359375, -579.94775390625, -569.1041870117188, -558.2606201171875, -547.4170532226562, -536.573486328125, -525.7299194335938, -514.8863525390625, -504.0427551269531, -493.1991882324219, -482.3556213378906, -471.51202392578125, -460.66845703125, -449.82489013671875, -438.98126220703125, -428.1376953125, -417.2940979003906, -406.4505310058594, -395.6069641113281, -384.76336669921875, -373.9197998046875, -363.07623291015625, -352.232666015625, -341.38909912109375, -330.5455017089844, -319.7019348144531, -308.8583679199219, -298.0147705078125, -287.17120361328125, -276.32763671875, -265.4840393066406, -254.6404571533203, -243.79689025878906, -232.95330810546875, -222.10972595214844, -211.26614379882812, -200.42257690429688, -189.57899475097656, -178.73541259765625, -167.89183044433594, -157.0482635498047, -146.20468139648438, -135.36109924316406, -124.51752471923828, -113.6739501953125, -102.83036804199219, -91.98680114746094, -81.14322662353516, -70.29964447021484, -59.45606994628906, -48.612491607666016, -37.76891326904297, -26.925338745117188, -16.081756591796875, -5.238182067871094, 5.605395317077637, 16.448972702026367, 27.29254913330078, 38.13612747192383, 48.979705810546875, 59.823280334472656, 70.66686248779297, 81.51043701171875]}, "gradients/decoder.transformer.h.3.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 3.0, 3.0, 0.0, 3.0, 8.0, 6.0, 11.0, 13.0, 9.0, 15.0, 14.0, 19.0, 22.0, 24.0, 34.0, 37.0, 37.0, 48.0, 44.0, 56.0, 45.0, 37.0, 51.0, 47.0, 52.0, 49.0, 42.0, 35.0, 44.0, 28.0, 26.0, 20.0, 32.0, 20.0, 13.0, 14.0, 11.0, 10.0, 9.0, 7.0, 2.0, 4.0, 2.0, 6.0, 0.0, 1.0, 1.0, 0.0, 2.0], "bins": [-79.68128967285156, -77.56857299804688, -75.45584869384766, -73.34313201904297, -71.23041534423828, -69.11769104003906, -67.00497436523438, -64.89225769042969, -62.779537200927734, -60.66681671142578, -58.554100036621094, -56.44137954711914, -54.32865905761719, -52.2159423828125, -50.10322189331055, -47.990501403808594, -45.877784729003906, -43.76506423950195, -41.652347564697266, -39.53962707519531, -37.426910400390625, -35.31418991088867, -33.20146942138672, -31.0887508392334, -28.976032257080078, -26.863313674926758, -24.750595092773438, -22.637874603271484, -20.525156021118164, -18.412437438964844, -16.29971694946289, -14.18699836730957, -12.074287414550781, -9.961568832397461, -7.848849296569824, -5.736130237579346, -3.623411178588867, -1.5106925964355469, 0.6020269393920898, 2.7147464752197266, 4.827465057373047, 6.940184116363525, 9.052903175354004, 11.16562271118164, 13.278341293334961, 15.391059875488281, 17.503780364990234, 19.616498947143555, 21.729217529296875, 23.841936111450195, 25.954654693603516, 28.06737518310547, 30.18009376525879, 32.29281234741211, 34.40553283691406, 36.51824951171875, 38.6309700012207, 40.743690490722656, 42.856407165527344, 44.9691276550293, 47.08184814453125, 49.19456481933594, 51.30728530883789, 53.420005798339844, 55.53272247314453]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 9.0, 10.0, 12.0, 9.0, 14.0, 16.0, 24.0, 25.0, 31.0, 29.0, 34.0, 39.0, 37.0, 53.0, 36.0, 49.0, 54.0, 53.0, 57.0, 42.0, 53.0, 38.0, 42.0, 39.0, 44.0, 27.0, 25.0, 26.0, 13.0, 15.0, 13.0, 8.0, 12.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.59375, -13.1527099609375, -12.711669921875, -12.2706298828125, -11.82958984375, -11.3885498046875, -10.947509765625, -10.5064697265625, -10.0654296875, -9.6243896484375, -9.183349609375, -8.7423095703125, -8.30126953125, -7.8602294921875, -7.419189453125, -6.9781494140625, -6.537109375, -6.0960693359375, -5.655029296875, -5.2139892578125, -4.77294921875, -4.3319091796875, -3.890869140625, -3.4498291015625, -3.0087890625, -2.5677490234375, -2.126708984375, -1.6856689453125, -1.24462890625, -0.8035888671875, -0.362548828125, 0.0784912109375, 0.51953125, 0.9605712890625, 1.401611328125, 1.8426513671875, 2.28369140625, 2.7247314453125, 3.165771484375, 3.6068115234375, 4.0478515625, 4.4888916015625, 4.929931640625, 5.3709716796875, 5.81201171875, 6.2530517578125, 6.694091796875, 7.1351318359375, 7.576171875, 8.0172119140625, 8.458251953125, 8.8992919921875, 9.34033203125, 9.7813720703125, 10.222412109375, 10.6634521484375, 11.1044921875, 11.5455322265625, 11.986572265625, 12.4276123046875, 12.86865234375, 13.3096923828125, 13.750732421875, 14.1917724609375, 14.6328125]}, "gradients/decoder.transformer.h.3.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 10.0, 12.0, 21.0, 21.0, 44.0, 70.0, 87.0, 141.0, 206.0, 282.0, 494.0, 688.0, 1107.0, 1741.0, 2589.0, 4266.0, 6786.0, 11113.0, 17982.0, 28984.0, 47693.0, 77746.0, 124618.0, 179735.0, 186361.0, 135128.0, 84533.0, 51816.0, 31800.0, 19738.0, 12248.0, 7561.0, 4835.0, 2920.0, 1850.0, 1164.0, 728.0, 508.0, 318.0, 212.0, 146.0, 66.0, 57.0, 36.0, 35.0, 21.0, 19.0, 11.0, 4.0, 2.0, 6.0, 2.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.021484375, -0.989654541015625, -0.95782470703125, -0.925994873046875, -0.8941650390625, -0.862335205078125, -0.83050537109375, -0.798675537109375, -0.766845703125, -0.735015869140625, -0.70318603515625, -0.671356201171875, -0.6395263671875, -0.607696533203125, -0.57586669921875, -0.544036865234375, -0.51220703125, -0.480377197265625, -0.44854736328125, -0.416717529296875, -0.3848876953125, -0.353057861328125, -0.32122802734375, -0.289398193359375, -0.257568359375, -0.225738525390625, -0.19390869140625, -0.162078857421875, -0.1302490234375, -0.098419189453125, -0.06658935546875, -0.034759521484375, -0.0029296875, 0.028900146484375, 0.06072998046875, 0.092559814453125, 0.1243896484375, 0.156219482421875, 0.18804931640625, 0.219879150390625, 0.251708984375, 0.283538818359375, 0.31536865234375, 0.347198486328125, 0.3790283203125, 0.410858154296875, 0.44268798828125, 0.474517822265625, 0.50634765625, 0.538177490234375, 0.57000732421875, 0.601837158203125, 0.6336669921875, 0.665496826171875, 0.69732666015625, 0.729156494140625, 0.760986328125, 0.792816162109375, 0.82464599609375, 0.856475830078125, 0.8883056640625, 0.920135498046875, 0.95196533203125, 0.983795166015625, 1.015625]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 2.0, 3.0, 8.0, 3.0, 9.0, 7.0, 11.0, 4.0, 12.0, 10.0, 15.0, 28.0, 22.0, 18.0, 36.0, 35.0, 41.0, 31.0, 37.0, 39.0, 44.0, 42.0, 1074.0, 62.0, 45.0, 44.0, 40.0, 38.0, 57.0, 34.0, 22.0, 28.0, 29.0, 21.0, 22.0, 23.0, 8.0, 9.0, 6.0, 8.0, 3.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-9.140625, -8.8814697265625, -8.622314453125, -8.3631591796875, -8.10400390625, -7.8448486328125, -7.585693359375, -7.3265380859375, -7.0673828125, -6.8082275390625, -6.549072265625, -6.2899169921875, -6.03076171875, -5.7716064453125, -5.512451171875, -5.2532958984375, -4.994140625, -4.7349853515625, -4.475830078125, -4.2166748046875, -3.95751953125, -3.6983642578125, -3.439208984375, -3.1800537109375, -2.9208984375, -2.6617431640625, -2.402587890625, -2.1434326171875, -1.88427734375, -1.6251220703125, -1.365966796875, -1.1068115234375, -0.84765625, -0.5885009765625, -0.329345703125, -0.0701904296875, 0.18896484375, 0.4481201171875, 0.707275390625, 0.9664306640625, 1.2255859375, 1.4847412109375, 1.743896484375, 2.0030517578125, 2.26220703125, 2.5213623046875, 2.780517578125, 3.0396728515625, 3.298828125, 3.5579833984375, 3.817138671875, 4.0762939453125, 4.33544921875, 4.5946044921875, 4.853759765625, 5.1129150390625, 5.3720703125, 5.6312255859375, 5.890380859375, 6.1495361328125, 6.40869140625, 6.6678466796875, 6.927001953125, 7.1861572265625, 7.4453125]}, "gradients/decoder.transformer.h.3.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 4.0, 7.0, 13.0, 4.0, 14.0, 23.0, 46.0, 69.0, 80.0, 104.0, 159.0, 262.0, 370.0, 565.0, 747.0, 1242.0, 1851.0, 2713.0, 4020.0, 5951.0, 8844.0, 13570.0, 20573.0, 30955.0, 46949.0, 69709.0, 102507.0, 138915.0, 1201987.0, 137387.0, 101262.0, 69305.0, 46360.0, 30656.0, 20088.0, 13224.0, 8840.0, 5764.0, 3951.0, 2662.0, 1739.0, 1228.0, 783.0, 543.0, 387.0, 240.0, 151.0, 113.0, 68.0, 53.0, 26.0, 19.0, 15.0, 8.0, 15.0, 3.0, 2.0, 1.0, 2.0, 0.0, 2.0], "bins": [-0.68017578125, -0.6585693359375, -0.636962890625, -0.6153564453125, -0.59375, -0.5721435546875, -0.550537109375, -0.5289306640625, -0.50732421875, -0.4857177734375, -0.464111328125, -0.4425048828125, -0.4208984375, -0.3992919921875, -0.377685546875, -0.3560791015625, -0.33447265625, -0.3128662109375, -0.291259765625, -0.2696533203125, -0.248046875, -0.2264404296875, -0.204833984375, -0.1832275390625, -0.16162109375, -0.1400146484375, -0.118408203125, -0.0968017578125, -0.0751953125, -0.0535888671875, -0.031982421875, -0.0103759765625, 0.01123046875, 0.0328369140625, 0.054443359375, 0.0760498046875, 0.09765625, 0.1192626953125, 0.140869140625, 0.1624755859375, 0.18408203125, 0.2056884765625, 0.227294921875, 0.2489013671875, 0.2705078125, 0.2921142578125, 0.313720703125, 0.3353271484375, 0.35693359375, 0.3785400390625, 0.400146484375, 0.4217529296875, 0.443359375, 0.4649658203125, 0.486572265625, 0.5081787109375, 0.52978515625, 0.5513916015625, 0.572998046875, 0.5946044921875, 0.6162109375, 0.6378173828125, 0.659423828125, 0.6810302734375, 0.70263671875]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 2.0, 2.0, 5.0, 4.0, 5.0, 10.0, 18.0, 20.0, 31.0, 33.0, 52.0, 71.0, 75.0, 96.0, 111.0, 94.0, 92.0, 75.0, 40.0, 36.0, 31.0, 24.0, 27.0, 12.0, 16.0, 7.0, 3.0, 4.0, 5.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.01358795166015625, -0.013218998908996582, -0.012850046157836914, -0.012481093406677246, -0.012112140655517578, -0.01174318790435791, -0.011374235153198242, -0.011005282402038574, -0.010636329650878906, -0.010267376899719238, -0.00989842414855957, -0.009529471397399902, -0.009160518646240234, -0.008791565895080566, -0.008422613143920898, -0.00805366039276123, -0.0076847076416015625, -0.0073157548904418945, -0.0069468021392822266, -0.006577849388122559, -0.006208896636962891, -0.005839943885803223, -0.005470991134643555, -0.005102038383483887, -0.004733085632324219, -0.004364132881164551, -0.003995180130004883, -0.003626227378845215, -0.003257274627685547, -0.002888321876525879, -0.002519369125366211, -0.002150416374206543, -0.001781463623046875, -0.001412510871887207, -0.001043558120727539, -0.0006746053695678711, -0.0003056526184082031, 6.330013275146484e-05, 0.0004322528839111328, 0.0008012056350708008, 0.0011701583862304688, 0.0015391111373901367, 0.0019080638885498047, 0.0022770166397094727, 0.0026459693908691406, 0.0030149221420288086, 0.0033838748931884766, 0.0037528276443481445, 0.0041217803955078125, 0.0044907331466674805, 0.0048596858978271484, 0.005228638648986816, 0.005597591400146484, 0.005966544151306152, 0.00633549690246582, 0.006704449653625488, 0.007073402404785156, 0.007442355155944824, 0.007811307907104492, 0.00818026065826416, 0.008549213409423828, 0.008918166160583496, 0.009287118911743164, 0.009656071662902832, 0.0100250244140625]}, "gradients/decoder.transformer.h.3.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 6.0, 7.0, 5.0, 2.0, 8.0, 6.0, 9.0, 12.0, 19.0, 33.0, 40.0, 48.0, 81.0, 92.0, 170.0, 336.0, 692.0, 9027.0, 1034693.0, 1995.0, 559.0, 281.0, 138.0, 95.0, 61.0, 44.0, 34.0, 31.0, 13.0, 9.0, 3.0, 6.0, 2.0, 0.0, 4.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1964111328125, -0.18922996520996094, -0.18204879760742188, -0.1748676300048828, -0.16768646240234375, -0.1605052947998047, -0.15332412719726562, -0.14614295959472656, -0.1389617919921875, -0.13178062438964844, -0.12459945678710938, -0.11741828918457031, -0.11023712158203125, -0.10305595397949219, -0.09587478637695312, -0.08869361877441406, -0.081512451171875, -0.07433128356933594, -0.06715011596679688, -0.05996894836425781, -0.05278778076171875, -0.04560661315917969, -0.038425445556640625, -0.031244277954101562, -0.0240631103515625, -0.016881942749023438, -0.009700775146484375, -0.0025196075439453125, 0.00466156005859375, 0.011842727661132812, 0.019023895263671875, 0.026205062866210938, 0.03338623046875, 0.04056739807128906, 0.047748565673828125, 0.05492973327636719, 0.06211090087890625, 0.06929206848144531, 0.07647323608398438, 0.08365440368652344, 0.0908355712890625, 0.09801673889160156, 0.10519790649414062, 0.11237907409667969, 0.11956024169921875, 0.1267414093017578, 0.13392257690429688, 0.14110374450683594, 0.148284912109375, 0.15546607971191406, 0.16264724731445312, 0.1698284149169922, 0.17700958251953125, 0.1841907501220703, 0.19137191772460938, 0.19855308532714844, 0.2057342529296875, 0.21291542053222656, 0.22009658813476562, 0.2272777557373047, 0.23445892333984375, 0.2416400909423828, 0.24882125854492188, 0.25600242614746094, 0.26318359375]}, "gradients/decoder.transformer.h.3.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 6.0, 384.0, 613.0, 12.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.08323973417282104, -0.08180711418390274, -0.08037449419498444, -0.07894188165664673, -0.07750926166772842, -0.07607664167881012, -0.07464402914047241, -0.07321140915155411, -0.0717787891626358, -0.0703461691737175, -0.0689135491847992, -0.06748093664646149, -0.06604831665754318, -0.06461569666862488, -0.06318308413028717, -0.061750464141368866, -0.06031784415245056, -0.05888522416353226, -0.05745260789990425, -0.056019991636276245, -0.05458737164735794, -0.053154751658439636, -0.05172213539481163, -0.050289519131183624, -0.04885689914226532, -0.047424279153347015, -0.04599166288971901, -0.044559046626091, -0.0431264266371727, -0.041693806648254395, -0.04026119038462639, -0.03882857412099838, -0.03739595040678978, -0.035963334143161774, -0.03453071415424347, -0.033098094165325165, -0.03166547790169716, -0.030232859775424004, -0.02880024164915085, -0.027367623522877693, -0.025935005396604538, -0.024502387270331383, -0.023069769144058228, -0.021637151017785072, -0.020204532891511917, -0.018771914765238762, -0.017339296638965607, -0.01590667851269245, -0.014474061317741871, -0.013041443191468716, -0.01160882506519556, -0.010176206938922405, -0.00874358881264925, -0.007310970686376095, -0.00587835256010294, -0.004445734433829784, -0.003013116307556629, -0.001580498181283474, -0.00014788005501031876, 0.0012847380712628365, 0.0027173561975359917, 0.004149974323809147, 0.005582592450082302, 0.007015210576355457, 0.008447828702628613]}, "gradients/decoder.transformer.h.3.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 9.0, 3.0, 7.0, 19.0, 16.0, 12.0, 14.0, 24.0, 21.0, 34.0, 25.0, 32.0, 41.0, 44.0, 38.0, 38.0, 46.0, 46.0, 46.0, 49.0, 49.0, 49.0, 42.0, 43.0, 38.0, 49.0, 24.0, 38.0, 20.0, 19.0, 15.0, 18.0, 11.0, 2.0, 10.0, 4.0, 2.0, 1.0, 3.0, 3.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0], "bins": [-0.005097866058349609, -0.004945721477270126, -0.004793576896190643, -0.00464143231511116, -0.004489287734031677, -0.004337143152952194, -0.004184998571872711, -0.004032853990793228, -0.003880709409713745, -0.003728564828634262, -0.003576420247554779, -0.003424275666475296, -0.003272131085395813, -0.00311998650431633, -0.002967841923236847, -0.002815697342157364, -0.002663552761077881, -0.002511408179998398, -0.002359263598918915, -0.0022071190178394318, -0.0020549744367599487, -0.0019028298556804657, -0.0017506852746009827, -0.0015985406935214996, -0.0014463961124420166, -0.0012942515313625336, -0.0011421069502830505, -0.0009899623692035675, -0.0008378177881240845, -0.0006856732070446014, -0.0005335286259651184, -0.0003813840448856354, -0.00022923946380615234, -7.709488272666931e-05, 7.504969835281372e-05, 0.00022719427943229675, 0.0003793388605117798, 0.0005314834415912628, 0.0006836280226707458, 0.0008357726037502289, 0.000987917184829712, 0.001140061765909195, 0.001292206346988678, 0.001444350928068161, 0.001596495509147644, 0.001748640090227127, 0.00190078467130661, 0.002052929252386093, 0.002205073833465576, 0.002357218414545059, 0.0025093629956245422, 0.0026615075767040253, 0.0028136521577835083, 0.0029657967388629913, 0.0031179413199424744, 0.0032700859010219574, 0.0034222304821014404, 0.0035743750631809235, 0.0037265196442604065, 0.0038786642253398895, 0.0040308088064193726, 0.004182953387498856, 0.004335097968578339, 0.004487242549657822, 0.004639387130737305]}, "gradients/decoder.transformer.h.3.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 9.0, 9.0, 10.0, 12.0, 9.0, 14.0, 16.0, 24.0, 25.0, 31.0, 29.0, 34.0, 39.0, 37.0, 53.0, 36.0, 49.0, 54.0, 53.0, 57.0, 42.0, 53.0, 38.0, 42.0, 39.0, 44.0, 27.0, 25.0, 26.0, 13.0, 15.0, 13.0, 8.0, 12.0, 3.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.59375, -13.1527099609375, -12.711669921875, -12.2706298828125, -11.82958984375, -11.3885498046875, -10.947509765625, -10.5064697265625, -10.0654296875, -9.6243896484375, -9.183349609375, -8.7423095703125, -8.30126953125, -7.8602294921875, -7.419189453125, -6.9781494140625, -6.537109375, -6.0960693359375, -5.655029296875, -5.2139892578125, -4.77294921875, -4.3319091796875, -3.890869140625, -3.4498291015625, -3.0087890625, -2.5677490234375, -2.126708984375, -1.6856689453125, -1.24462890625, -0.8035888671875, -0.362548828125, 0.0784912109375, 0.51953125, 0.9605712890625, 1.401611328125, 1.8426513671875, 2.28369140625, 2.7247314453125, 3.165771484375, 3.6068115234375, 4.0478515625, 4.4888916015625, 4.929931640625, 5.3709716796875, 5.81201171875, 6.2530517578125, 6.694091796875, 7.1351318359375, 7.576171875, 8.0172119140625, 8.458251953125, 8.8992919921875, 9.34033203125, 9.7813720703125, 10.222412109375, 10.6634521484375, 11.1044921875, 11.5455322265625, 11.986572265625, 12.4276123046875, 12.86865234375, 13.3096923828125, 13.750732421875, 14.1917724609375, 14.6328125]}, "gradients/decoder.transformer.h.3.attn.c_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 3.0, 5.0, 4.0, 2.0, 11.0, 10.0, 24.0, 38.0, 54.0, 98.0, 91.0, 141.0, 220.0, 285.0, 393.0, 614.0, 759.0, 1130.0, 1867.0, 3931.0, 15534.0, 95580.0, 510215.0, 344520.0, 55311.0, 9668.0, 2977.0, 1532.0, 1021.0, 721.0, 501.0, 386.0, 294.0, 180.0, 151.0, 108.0, 66.0, 40.0, 24.0, 22.0, 14.0, 5.0, 5.0, 3.0, 0.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.859375, -21.15087890625, -20.4423828125, -19.73388671875, -19.025390625, -18.31689453125, -17.6083984375, -16.89990234375, -16.19140625, -15.48291015625, -14.7744140625, -14.06591796875, -13.357421875, -12.64892578125, -11.9404296875, -11.23193359375, -10.5234375, -9.81494140625, -9.1064453125, -8.39794921875, -7.689453125, -6.98095703125, -6.2724609375, -5.56396484375, -4.85546875, -4.14697265625, -3.4384765625, -2.72998046875, -2.021484375, -1.31298828125, -0.6044921875, 0.10400390625, 0.8125, 1.52099609375, 2.2294921875, 2.93798828125, 3.646484375, 4.35498046875, 5.0634765625, 5.77197265625, 6.48046875, 7.18896484375, 7.8974609375, 8.60595703125, 9.314453125, 10.02294921875, 10.7314453125, 11.43994140625, 12.1484375, 12.85693359375, 13.5654296875, 14.27392578125, 14.982421875, 15.69091796875, 16.3994140625, 17.10791015625, 17.81640625, 18.52490234375, 19.2333984375, 19.94189453125, 20.650390625, 21.35888671875, 22.0673828125, 22.77587890625, 23.484375]}, "gradients/decoder.transformer.h.3.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 5.0, 6.0, 5.0, 13.0, 15.0, 13.0, 17.0, 24.0, 30.0, 26.0, 29.0, 34.0, 52.0, 58.0, 88.0, 109.0, 299.0, 1594.0, 197.0, 90.0, 63.0, 43.0, 49.0, 23.0, 27.0, 33.0, 32.0, 20.0, 18.0, 13.0, 6.0, 6.0, 4.0, 5.0, 3.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-38.84375, -37.71240234375, -36.5810546875, -35.44970703125, -34.318359375, -33.18701171875, -32.0556640625, -30.92431640625, -29.79296875, -28.66162109375, -27.5302734375, -26.39892578125, -25.267578125, -24.13623046875, -23.0048828125, -21.87353515625, -20.7421875, -19.61083984375, -18.4794921875, -17.34814453125, -16.216796875, -15.08544921875, -13.9541015625, -12.82275390625, -11.69140625, -10.56005859375, -9.4287109375, -8.29736328125, -7.166015625, -6.03466796875, -4.9033203125, -3.77197265625, -2.640625, -1.50927734375, -0.3779296875, 0.75341796875, 1.884765625, 3.01611328125, 4.1474609375, 5.27880859375, 6.41015625, 7.54150390625, 8.6728515625, 9.80419921875, 10.935546875, 12.06689453125, 13.1982421875, 14.32958984375, 15.4609375, 16.59228515625, 17.7236328125, 18.85498046875, 19.986328125, 21.11767578125, 22.2490234375, 23.38037109375, 24.51171875, 25.64306640625, 26.7744140625, 27.90576171875, 29.037109375, 30.16845703125, 31.2998046875, 32.43115234375, 33.5625]}, "gradients/decoder.transformer.h.3.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 4.0, 4.0, 0.0, 5.0, 3.0, 2.0, 8.0, 13.0, 8.0, 14.0, 12.0, 15.0, 15.0, 25.0, 18.0, 40.0, 66.0, 92.0, 162.0, 242.0, 461.0, 1078.0, 11104.0, 3124332.0, 5816.0, 978.0, 431.0, 229.0, 156.0, 97.0, 77.0, 47.0, 42.0, 22.0, 28.0, 16.0, 12.0, 9.0, 11.0, 6.0, 11.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-92.9375, -89.669921875, -86.40234375, -83.134765625, -79.8671875, -76.599609375, -73.33203125, -70.064453125, -66.796875, -63.529296875, -60.26171875, -56.994140625, -53.7265625, -50.458984375, -47.19140625, -43.923828125, -40.65625, -37.388671875, -34.12109375, -30.853515625, -27.5859375, -24.318359375, -21.05078125, -17.783203125, -14.515625, -11.248046875, -7.98046875, -4.712890625, -1.4453125, 1.822265625, 5.08984375, 8.357421875, 11.625, 14.892578125, 18.16015625, 21.427734375, 24.6953125, 27.962890625, 31.23046875, 34.498046875, 37.765625, 41.033203125, 44.30078125, 47.568359375, 50.8359375, 54.103515625, 57.37109375, 60.638671875, 63.90625, 67.173828125, 70.44140625, 73.708984375, 76.9765625, 80.244140625, 83.51171875, 86.779296875, 90.046875, 93.314453125, 96.58203125, 99.849609375, 103.1171875, 106.384765625, 109.65234375, 112.919921875, 116.1875]}, "gradients/decoder.transformer.h.3.ln_1.weight": {"_type": "histogram", "values": [3.0, 1.0, 0.0, 1.0, 9.0, 212.0, 598.0, 182.0, 13.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-50.307533264160156, -42.56134796142578, -34.81515884399414, -27.068973541259766, -19.322786331176758, -11.57659912109375, -3.830413818359375, 3.9157752990722656, 11.66196060180664, 19.40814781188965, 27.154335021972656, 34.90052032470703, 42.646705627441406, 50.39289474487305, 58.13908004760742, 65.88526916503906, 73.63145446777344, 81.37763977050781, 89.12382507324219, 96.87001037597656, 104.61620330810547, 112.36238861083984, 120.10857391357422, 127.85476684570312, 135.6009521484375, 143.34713745117188, 151.09332275390625, 158.83950805664062, 166.585693359375, 174.33187866210938, 182.07806396484375, 189.8242645263672, 197.57044982910156, 205.31663513183594, 213.0628204345703, 220.8090057373047, 228.55519104003906, 236.3013916015625, 244.04757690429688, 251.79376220703125, 259.5399475097656, 267.2861328125, 275.0323181152344, 282.77850341796875, 290.5246887207031, 298.2708740234375, 306.0170593261719, 313.76324462890625, 321.5094299316406, 329.255615234375, 337.0018005371094, 344.74798583984375, 352.4941711425781, 360.2403564453125, 367.9865417480469, 375.73272705078125, 383.47894287109375, 391.2251281738281, 398.9713134765625, 406.7174987792969, 414.46368408203125, 422.2098693847656, 429.9560546875, 437.7022399902344, 445.44842529296875]}, "gradients/decoder.transformer.h.3.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 2.0, 2.0, 2.0, 8.0, 9.0, 10.0, 11.0, 11.0, 10.0, 12.0, 15.0, 14.0, 22.0, 14.0, 25.0, 24.0, 36.0, 31.0, 30.0, 38.0, 41.0, 32.0, 52.0, 32.0, 44.0, 37.0, 41.0, 32.0, 38.0, 28.0, 26.0, 43.0, 26.0, 29.0, 27.0, 16.0, 16.0, 24.0, 12.0, 11.0, 16.0, 16.0, 8.0, 9.0, 4.0, 4.0, 7.0, 1.0, 2.0, 5.0, 4.0, 2.0, 0.0, 1.0], "bins": [-77.93260192871094, -75.6983413696289, -73.46408081054688, -71.22982025146484, -68.99555969238281, -66.76129150390625, -64.52703094482422, -62.29277038574219, -60.058509826660156, -57.824249267578125, -55.589988708496094, -53.3557243347168, -51.121463775634766, -48.887203216552734, -46.65293884277344, -44.418678283691406, -42.184417724609375, -39.950157165527344, -37.71589660644531, -35.481632232666016, -33.247371673583984, -31.013111114501953, -28.77884864807129, -26.544586181640625, -24.310325622558594, -22.076065063476562, -19.8418025970459, -17.607540130615234, -15.373279571533203, -13.139018058776855, -10.904756546020508, -8.67049503326416, -6.436225891113281, -4.201964378356934, -1.967702865600586, 0.2665586471557617, 2.5008201599121094, 4.735081672668457, 6.969343185424805, 9.203604698181152, 11.4378662109375, 13.672127723693848, 15.906389236450195, 18.14065170288086, 20.37491226196289, 22.609172821044922, 24.843435287475586, 27.07769775390625, 29.31195831298828, 31.546218872070312, 33.780479431152344, 36.01474380493164, 38.24900436401367, 40.4832649230957, 42.717529296875, 44.95178985595703, 47.18605041503906, 49.420310974121094, 51.654571533203125, 53.88883590698242, 56.12309646606445, 58.357357025146484, 60.59162139892578, 62.82588195800781, 65.06014251708984]}, "gradients/decoder.transformer.h.2.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 7.0, 5.0, 7.0, 4.0, 7.0, 9.0, 10.0, 16.0, 23.0, 20.0, 18.0, 17.0, 36.0, 22.0, 45.0, 31.0, 34.0, 51.0, 53.0, 47.0, 39.0, 50.0, 48.0, 46.0, 39.0, 43.0, 36.0, 35.0, 44.0, 34.0, 26.0, 31.0, 18.0, 10.0, 9.0, 10.0, 9.0, 7.0, 5.0, 5.0, 3.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.6171875, -12.194580078125, -11.77197265625, -11.349365234375, -10.9267578125, -10.504150390625, -10.08154296875, -9.658935546875, -9.236328125, -8.813720703125, -8.39111328125, -7.968505859375, -7.5458984375, -7.123291015625, -6.70068359375, -6.278076171875, -5.85546875, -5.432861328125, -5.01025390625, -4.587646484375, -4.1650390625, -3.742431640625, -3.31982421875, -2.897216796875, -2.474609375, -2.052001953125, -1.62939453125, -1.206787109375, -0.7841796875, -0.361572265625, 0.06103515625, 0.483642578125, 0.90625, 1.328857421875, 1.75146484375, 2.174072265625, 2.5966796875, 3.019287109375, 3.44189453125, 3.864501953125, 4.287109375, 4.709716796875, 5.13232421875, 5.554931640625, 5.9775390625, 6.400146484375, 6.82275390625, 7.245361328125, 7.66796875, 8.090576171875, 8.51318359375, 8.935791015625, 9.3583984375, 9.781005859375, 10.20361328125, 10.626220703125, 11.048828125, 11.471435546875, 11.89404296875, 12.316650390625, 12.7392578125, 13.161865234375, 13.58447265625, 14.007080078125, 14.4296875]}, "gradients/decoder.transformer.h.2.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 2.0, 2.0, 5.0, 7.0, 7.0, 10.0, 22.0, 13.0, 32.0, 44.0, 45.0, 86.0, 87.0, 163.0, 229.0, 420.0, 876.0, 2376.0, 7993.0, 44617.0, 743685.0, 3003119.0, 354436.0, 26769.0, 5755.0, 1756.0, 751.0, 318.0, 172.0, 129.0, 93.0, 68.0, 43.0, 45.0, 22.0, 27.0, 18.0, 9.0, 9.0, 9.0, 7.0, 4.0, 1.0, 5.0, 1.0, 3.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-26.859375, -25.841064453125, -24.82275390625, -23.804443359375, -22.7861328125, -21.767822265625, -20.74951171875, -19.731201171875, -18.712890625, -17.694580078125, -16.67626953125, -15.657958984375, -14.6396484375, -13.621337890625, -12.60302734375, -11.584716796875, -10.56640625, -9.548095703125, -8.52978515625, -7.511474609375, -6.4931640625, -5.474853515625, -4.45654296875, -3.438232421875, -2.419921875, -1.401611328125, -0.38330078125, 0.635009765625, 1.6533203125, 2.671630859375, 3.68994140625, 4.708251953125, 5.7265625, 6.744873046875, 7.76318359375, 8.781494140625, 9.7998046875, 10.818115234375, 11.83642578125, 12.854736328125, 13.873046875, 14.891357421875, 15.90966796875, 16.927978515625, 17.9462890625, 18.964599609375, 19.98291015625, 21.001220703125, 22.01953125, 23.037841796875, 24.05615234375, 25.074462890625, 26.0927734375, 27.111083984375, 28.12939453125, 29.147705078125, 30.166015625, 31.184326171875, 32.20263671875, 33.220947265625, 34.2392578125, 35.257568359375, 36.27587890625, 37.294189453125, 38.3125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 2.0, 7.0, 7.0, 8.0, 7.0, 14.0, 19.0, 22.0, 29.0, 33.0, 57.0, 61.0, 87.0, 107.0, 137.0, 184.0, 255.0, 305.0, 445.0, 465.0, 455.0, 325.0, 230.0, 182.0, 123.0, 102.0, 93.0, 74.0, 52.0, 34.0, 37.0, 30.0, 25.0, 10.0, 13.0, 9.0, 5.0, 12.0, 4.0, 4.0, 0.0, 3.0, 1.0, 5.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-19.203125, -18.609619140625, -18.01611328125, -17.422607421875, -16.8291015625, -16.235595703125, -15.64208984375, -15.048583984375, -14.455078125, -13.861572265625, -13.26806640625, -12.674560546875, -12.0810546875, -11.487548828125, -10.89404296875, -10.300537109375, -9.70703125, -9.113525390625, -8.52001953125, -7.926513671875, -7.3330078125, -6.739501953125, -6.14599609375, -5.552490234375, -4.958984375, -4.365478515625, -3.77197265625, -3.178466796875, -2.5849609375, -1.991455078125, -1.39794921875, -0.804443359375, -0.2109375, 0.382568359375, 0.97607421875, 1.569580078125, 2.1630859375, 2.756591796875, 3.35009765625, 3.943603515625, 4.537109375, 5.130615234375, 5.72412109375, 6.317626953125, 6.9111328125, 7.504638671875, 8.09814453125, 8.691650390625, 9.28515625, 9.878662109375, 10.47216796875, 11.065673828125, 11.6591796875, 12.252685546875, 12.84619140625, 13.439697265625, 14.033203125, 14.626708984375, 15.22021484375, 15.813720703125, 16.4072265625, 17.000732421875, 17.59423828125, 18.187744140625, 18.78125]}, "gradients/decoder.transformer.h.2.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 2.0, 2.0, 9.0, 9.0, 13.0, 14.0, 21.0, 28.0, 47.0, 81.0, 96.0, 187.0, 313.0, 713.0, 2216.0, 17378.0, 1194920.0, 2941398.0, 32314.0, 2862.0, 841.0, 344.0, 196.0, 106.0, 55.0, 38.0, 29.0, 18.0, 9.0, 8.0, 10.0, 5.0, 2.0, 3.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-53.875, -51.95703125, -50.0390625, -48.12109375, -46.203125, -44.28515625, -42.3671875, -40.44921875, -38.53125, -36.61328125, -34.6953125, -32.77734375, -30.859375, -28.94140625, -27.0234375, -25.10546875, -23.1875, -21.26953125, -19.3515625, -17.43359375, -15.515625, -13.59765625, -11.6796875, -9.76171875, -7.84375, -5.92578125, -4.0078125, -2.08984375, -0.171875, 1.74609375, 3.6640625, 5.58203125, 7.5, 9.41796875, 11.3359375, 13.25390625, 15.171875, 17.08984375, 19.0078125, 20.92578125, 22.84375, 24.76171875, 26.6796875, 28.59765625, 30.515625, 32.43359375, 34.3515625, 36.26953125, 38.1875, 40.10546875, 42.0234375, 43.94140625, 45.859375, 47.77734375, 49.6953125, 51.61328125, 53.53125, 55.44921875, 57.3671875, 59.28515625, 61.203125, 63.12109375, 65.0390625, 66.95703125, 68.875]}, "gradients/decoder.transformer.h.2.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 960.0, 53.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1211.3843994140625, -1170.5318603515625, -1129.679443359375, -1088.826904296875, -1047.974365234375, -1007.1219482421875, -966.2694091796875, -925.4169311523438, -884.564453125, -843.7119750976562, -802.8594970703125, -762.0069580078125, -721.1544799804688, -680.302001953125, -639.449462890625, -598.5969848632812, -557.7445068359375, -516.8920288085938, -476.0395202636719, -435.18701171875, -394.33453369140625, -353.4820556640625, -312.6295471191406, -271.77703857421875, -230.924560546875, -190.0720672607422, -149.21957397460938, -108.36708068847656, -67.51458740234375, -26.662094116210938, 14.190399169921875, 55.04290771484375, 95.8955078125, 136.7480010986328, 177.60049438476562, 218.45298767089844, 259.30548095703125, 300.157958984375, 341.0104675292969, 381.86297607421875, 422.7154541015625, 463.56793212890625, 504.4204406738281, 545.27294921875, 586.1254272460938, 626.9779052734375, 667.8304443359375, 708.6829223632812, 749.535400390625, 790.3878784179688, 831.2403564453125, 872.0928955078125, 912.9453735351562, 953.7978515625, 994.650390625, 1035.5029296875, 1076.3553466796875, 1117.2078857421875, 1158.060302734375, 1198.912841796875, 1239.765380859375, 1280.6177978515625, 1321.4703369140625, 1362.32275390625, 1403.17529296875]}, "gradients/decoder.transformer.h.2.ln_2.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 1.0, 2.0, 1.0, 4.0, 2.0, 3.0, 10.0, 8.0, 9.0, 6.0, 10.0, 6.0, 19.0, 17.0, 12.0, 24.0, 30.0, 30.0, 35.0, 27.0, 34.0, 30.0, 31.0, 34.0, 43.0, 38.0, 43.0, 44.0, 46.0, 39.0, 38.0, 32.0, 35.0, 26.0, 32.0, 28.0, 27.0, 20.0, 24.0, 18.0, 16.0, 18.0, 11.0, 12.0, 6.0, 8.0, 7.0, 2.0, 2.0, 2.0, 0.0, 3.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0], "bins": [-75.8946533203125, -73.54013061523438, -71.18561553955078, -68.83109283447266, -66.47657775878906, -64.12205505371094, -61.76753616333008, -59.41301727294922, -57.058494567871094, -54.703975677490234, -52.349456787109375, -49.99493408203125, -47.64041519165039, -45.28589630126953, -42.93137741088867, -40.57685852050781, -38.22233963012695, -35.867820739746094, -33.513301849365234, -31.158781051635742, -28.80426025390625, -26.44974136352539, -24.09522247314453, -21.74070167541504, -19.38618278503418, -17.03166389465332, -14.677143096923828, -12.322624206542969, -9.968104362487793, -7.613584518432617, -5.259065628051758, -2.9045448303222656, -0.5500259399414062, 1.8044936656951904, 4.159013271331787, 6.513532638549805, 8.86805248260498, 11.222572326660156, 13.577091217041016, 15.931612014770508, 18.286130905151367, 20.640649795532227, 22.99517059326172, 25.349689483642578, 27.704208374023438, 30.05872917175293, 32.413246154785156, 34.76776885986328, 37.12228775024414, 39.476806640625, 41.83132553100586, 44.18584442138672, 46.540367126464844, 48.8948860168457, 51.24940490722656, 53.60392761230469, 55.95844268798828, 58.31296157836914, 60.66748046875, 63.022003173828125, 65.37651824951172, 67.73104095458984, 70.08555603027344, 72.44007873535156, 74.79460144042969]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 10.0, 9.0, 11.0, 11.0, 10.0, 13.0, 12.0, 24.0, 26.0, 30.0, 28.0, 29.0, 43.0, 40.0, 46.0, 33.0, 47.0, 45.0, 47.0, 49.0, 47.0, 39.0, 26.0, 39.0, 38.0, 31.0, 43.0, 22.0, 23.0, 20.0, 15.0, 28.0, 9.0, 11.0, 12.0, 4.0, 4.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.65478515625, -8.3408203125, -8.02685546875, -7.712890625, -7.39892578125, -7.0849609375, -6.77099609375, -6.45703125, -6.14306640625, -5.8291015625, -5.51513671875, -5.201171875, -4.88720703125, -4.5732421875, -4.25927734375, -3.9453125, -3.63134765625, -3.3173828125, -3.00341796875, -2.689453125, -2.37548828125, -2.0615234375, -1.74755859375, -1.43359375, -1.11962890625, -0.8056640625, -0.49169921875, -0.177734375, 0.13623046875, 0.4501953125, 0.76416015625, 1.078125, 1.39208984375, 1.7060546875, 2.02001953125, 2.333984375, 2.64794921875, 2.9619140625, 3.27587890625, 3.58984375, 3.90380859375, 4.2177734375, 4.53173828125, 4.845703125, 5.15966796875, 5.4736328125, 5.78759765625, 6.1015625, 6.41552734375, 6.7294921875, 7.04345703125, 7.357421875, 7.67138671875, 7.9853515625, 8.29931640625, 8.61328125, 8.92724609375, 9.2412109375, 9.55517578125, 9.869140625, 10.18310546875, 10.4970703125, 10.81103515625, 11.125]}, "gradients/decoder.transformer.h.2.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 3.0, 12.0, 9.0, 10.0, 20.0, 27.0, 43.0, 53.0, 62.0, 92.0, 157.0, 216.0, 311.0, 440.0, 618.0, 935.0, 1357.0, 1936.0, 2918.0, 4305.0, 6529.0, 9600.0, 14457.0, 22340.0, 34492.0, 53529.0, 82764.0, 126003.0, 169599.0, 165892.0, 121339.0, 80034.0, 51228.0, 33037.0, 21512.0, 14052.0, 9416.0, 6147.0, 4190.0, 2844.0, 1936.0, 1304.0, 915.0, 598.0, 410.0, 278.0, 188.0, 132.0, 73.0, 62.0, 48.0, 23.0, 18.0, 22.0, 11.0, 4.0, 7.0, 8.0, 5.0], "bins": [-0.7763671875, -0.7535018920898438, -0.7306365966796875, -0.7077713012695312, -0.684906005859375, -0.6620407104492188, -0.6391754150390625, -0.6163101196289062, -0.59344482421875, -0.5705795288085938, -0.5477142333984375, -0.5248489379882812, -0.501983642578125, -0.47911834716796875, -0.4562530517578125, -0.43338775634765625, -0.4105224609375, -0.38765716552734375, -0.3647918701171875, -0.34192657470703125, -0.319061279296875, -0.29619598388671875, -0.2733306884765625, -0.25046539306640625, -0.22760009765625, -0.20473480224609375, -0.1818695068359375, -0.15900421142578125, -0.136138916015625, -0.11327362060546875, -0.0904083251953125, -0.06754302978515625, -0.044677734375, -0.02181243896484375, 0.0010528564453125, 0.02391815185546875, 0.046783447265625, 0.06964874267578125, 0.0925140380859375, 0.11537933349609375, 0.13824462890625, 0.16110992431640625, 0.1839752197265625, 0.20684051513671875, 0.229705810546875, 0.25257110595703125, 0.2754364013671875, 0.29830169677734375, 0.3211669921875, 0.34403228759765625, 0.3668975830078125, 0.38976287841796875, 0.412628173828125, 0.43549346923828125, 0.4583587646484375, 0.48122406005859375, 0.50408935546875, 0.5269546508789062, 0.5498199462890625, 0.5726852416992188, 0.595550537109375, 0.6184158325195312, 0.6412811279296875, 0.6641464233398438, 0.68701171875]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 5.0, 7.0, 7.0, 8.0, 7.0, 14.0, 10.0, 17.0, 23.0, 24.0, 27.0, 26.0, 25.0, 27.0, 34.0, 46.0, 50.0, 32.0, 32.0, 33.0, 42.0, 1070.0, 42.0, 43.0, 43.0, 39.0, 37.0, 34.0, 35.0, 21.0, 24.0, 24.0, 26.0, 26.0, 6.0, 12.0, 15.0, 7.0, 7.0, 4.0, 6.0, 4.0, 8.0, 1.0, 2.0, 2.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.1484375, -5.95751953125, -5.7666015625, -5.57568359375, -5.384765625, -5.19384765625, -5.0029296875, -4.81201171875, -4.62109375, -4.43017578125, -4.2392578125, -4.04833984375, -3.857421875, -3.66650390625, -3.4755859375, -3.28466796875, -3.09375, -2.90283203125, -2.7119140625, -2.52099609375, -2.330078125, -2.13916015625, -1.9482421875, -1.75732421875, -1.56640625, -1.37548828125, -1.1845703125, -0.99365234375, -0.802734375, -0.61181640625, -0.4208984375, -0.22998046875, -0.0390625, 0.15185546875, 0.3427734375, 0.53369140625, 0.724609375, 0.91552734375, 1.1064453125, 1.29736328125, 1.48828125, 1.67919921875, 1.8701171875, 2.06103515625, 2.251953125, 2.44287109375, 2.6337890625, 2.82470703125, 3.015625, 3.20654296875, 3.3974609375, 3.58837890625, 3.779296875, 3.97021484375, 4.1611328125, 4.35205078125, 4.54296875, 4.73388671875, 4.9248046875, 5.11572265625, 5.306640625, 5.49755859375, 5.6884765625, 5.87939453125, 6.0703125]}, "gradients/decoder.transformer.h.2.crossattention.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 3.0, 5.0, 9.0, 11.0, 13.0, 34.0, 32.0, 48.0, 78.0, 127.0, 169.0, 209.0, 380.0, 501.0, 759.0, 1156.0, 1656.0, 2579.0, 4057.0, 5912.0, 9235.0, 14128.0, 21658.0, 32995.0, 49857.0, 75880.0, 109095.0, 144909.0, 1201762.0, 132302.0, 96312.0, 65622.0, 43421.0, 28611.0, 18546.0, 11996.0, 7915.0, 5052.0, 3355.0, 2232.0, 1490.0, 1006.0, 621.0, 448.0, 281.0, 219.0, 150.0, 109.0, 58.0, 52.0, 29.0, 15.0, 17.0, 11.0, 10.0, 4.0, 2.0, 1.0, 1.0, 0.0, 1.0], "bins": [-0.5546875, -0.5369796752929688, -0.5192718505859375, -0.5015640258789062, -0.483856201171875, -0.46614837646484375, -0.4484405517578125, -0.43073272705078125, -0.41302490234375, -0.39531707763671875, -0.3776092529296875, -0.35990142822265625, -0.342193603515625, -0.32448577880859375, -0.3067779541015625, -0.28907012939453125, -0.2713623046875, -0.25365447998046875, -0.2359466552734375, -0.21823883056640625, -0.200531005859375, -0.18282318115234375, -0.1651153564453125, -0.14740753173828125, -0.12969970703125, -0.11199188232421875, -0.0942840576171875, -0.07657623291015625, -0.058868408203125, -0.04116058349609375, -0.0234527587890625, -0.00574493408203125, 0.011962890625, 0.02967071533203125, 0.0473785400390625, 0.06508636474609375, 0.082794189453125, 0.10050201416015625, 0.1182098388671875, 0.13591766357421875, 0.15362548828125, 0.17133331298828125, 0.1890411376953125, 0.20674896240234375, 0.224456787109375, 0.24216461181640625, 0.2598724365234375, 0.27758026123046875, 0.2952880859375, 0.31299591064453125, 0.3307037353515625, 0.34841156005859375, 0.366119384765625, 0.38382720947265625, 0.4015350341796875, 0.41924285888671875, 0.43695068359375, 0.45465850830078125, 0.4723663330078125, 0.49007415771484375, 0.507781982421875, 0.5254898071289062, 0.5431976318359375, 0.5609054565429688, 0.57861328125]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 3.0, 2.0, 1.0, 2.0, 5.0, 8.0, 3.0, 4.0, 5.0, 9.0, 5.0, 6.0, 7.0, 13.0, 17.0, 16.0, 25.0, 38.0, 40.0, 58.0, 77.0, 81.0, 83.0, 56.0, 84.0, 68.0, 60.0, 43.0, 42.0, 34.0, 22.0, 20.0, 16.0, 6.0, 10.0, 6.0, 5.0, 7.0, 2.0, 5.0, 4.0, 3.0, 3.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0], "bins": [-0.00640106201171875, -0.006217479705810547, -0.006033897399902344, -0.005850315093994141, -0.0056667327880859375, -0.005483150482177734, -0.005299568176269531, -0.005115985870361328, -0.004932403564453125, -0.004748821258544922, -0.004565238952636719, -0.004381656646728516, -0.0041980743408203125, -0.004014492034912109, -0.0038309097290039062, -0.003647327423095703, -0.0034637451171875, -0.003280162811279297, -0.0030965805053710938, -0.0029129981994628906, -0.0027294158935546875, -0.0025458335876464844, -0.0023622512817382812, -0.002178668975830078, -0.001995086669921875, -0.0018115043640136719, -0.0016279220581054688, -0.0014443397521972656, -0.0012607574462890625, -0.0010771751403808594, -0.0008935928344726562, -0.0007100105285644531, -0.00052642822265625, -0.0003428459167480469, -0.00015926361083984375, 2.4318695068359375e-05, 0.0002079010009765625, 0.0003914833068847656, 0.0005750656127929688, 0.0007586479187011719, 0.000942230224609375, 0.0011258125305175781, 0.0013093948364257812, 0.0014929771423339844, 0.0016765594482421875, 0.0018601417541503906, 0.0020437240600585938, 0.002227306365966797, 0.002410888671875, 0.002594470977783203, 0.0027780532836914062, 0.0029616355895996094, 0.0031452178955078125, 0.0033288002014160156, 0.0035123825073242188, 0.003695964813232422, 0.003879547119140625, 0.004063129425048828, 0.004246711730957031, 0.004430294036865234, 0.0046138763427734375, 0.004797458648681641, 0.004981040954589844, 0.005164623260498047, 0.00534820556640625]}, "gradients/decoder.transformer.h.2.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 3.0, 5.0, 7.0, 5.0, 4.0, 7.0, 9.0, 8.0, 10.0, 12.0, 21.0, 20.0, 32.0, 45.0, 41.0, 69.0, 102.0, 154.0, 169.0, 316.0, 536.0, 1577.0, 139645.0, 899932.0, 4062.0, 618.0, 365.0, 225.0, 135.0, 102.0, 66.0, 50.0, 41.0, 26.0, 32.0, 17.0, 18.0, 16.0, 7.0, 6.0, 12.0, 10.0, 4.0, 3.0, 6.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 5.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.099365234375, -0.09607219696044922, -0.09277915954589844, -0.08948612213134766, -0.08619308471679688, -0.0829000473022461, -0.07960700988769531, -0.07631397247314453, -0.07302093505859375, -0.06972789764404297, -0.06643486022949219, -0.0631418228149414, -0.059848785400390625, -0.056555747985839844, -0.05326271057128906, -0.04996967315673828, -0.0466766357421875, -0.04338359832763672, -0.04009056091308594, -0.036797523498535156, -0.033504486083984375, -0.030211448669433594, -0.026918411254882812, -0.02362537384033203, -0.02033233642578125, -0.01703929901123047, -0.013746261596679688, -0.010453224182128906, -0.007160186767578125, -0.0038671493530273438, -0.0005741119384765625, 0.0027189254760742188, 0.006011962890625, 0.009305000305175781, 0.012598037719726562, 0.015891075134277344, 0.019184112548828125, 0.022477149963378906, 0.025770187377929688, 0.02906322479248047, 0.03235626220703125, 0.03564929962158203, 0.03894233703613281, 0.042235374450683594, 0.045528411865234375, 0.048821449279785156, 0.05211448669433594, 0.05540752410888672, 0.0587005615234375, 0.06199359893798828, 0.06528663635253906, 0.06857967376708984, 0.07187271118164062, 0.0751657485961914, 0.07845878601074219, 0.08175182342529297, 0.08504486083984375, 0.08833789825439453, 0.09163093566894531, 0.0949239730834961, 0.09821701049804688, 0.10151004791259766, 0.10480308532714844, 0.10809612274169922, 0.11138916015625]}, "gradients/decoder.transformer.h.2.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 6.0, 12.0, 47.0, 163.0, 336.0, 268.0, 127.0, 40.0, 9.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.014430073089897633, -0.014085158705711365, -0.013740244321525097, -0.013395329937338829, -0.013050415553152561, -0.012705501168966293, -0.0123605877161026, -0.012015673331916332, -0.011670758947730064, -0.011325844563543797, -0.010980930179357529, -0.01063601579517126, -0.010291101410984993, -0.0099461879581213, -0.009601272642612457, -0.009256359189748764, -0.008911443874239922, -0.008566529490053654, -0.008221615105867386, -0.007876700721681118, -0.0075317868031561375, -0.00718687241896987, -0.006841958034783602, -0.006497044116258621, -0.006152129732072353, -0.0058072153478860855, -0.005462300963699818, -0.00511738657951355, -0.004772472660988569, -0.004427558276802301, -0.0040826438926160336, -0.0037377297412604094, -0.003392815124243498, -0.00304790074005723, -0.002702986588701606, -0.002358072204515338, -0.0020131580531597137, -0.001668243668973446, -0.001323329284787178, -0.0009784151334315538, -0.000633500749245286, -0.0002885864523705095, 5.632784450426698e-05, 0.0004012421704828739, 0.0007461564382538199, 0.001091070706024766, 0.0014359850902110338, 0.001780899241566658, 0.002125813625752926, 0.0024707280099391937, 0.002815642161294818, 0.0031605565454810858, 0.00350547069683671, 0.003850385081022978, 0.004195299465209246, 0.004540213383734226, 0.004885127767920494, 0.005230042152106762, 0.00557495653629303, 0.005919870920479298, 0.006264784839004278, 0.006609699223190546, 0.006954613607376814, 0.007299527525901794, 0.00764444237574935]}, "gradients/decoder.transformer.h.2.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 2.0, 4.0, 3.0, 5.0, 3.0, 8.0, 4.0, 8.0, 13.0, 15.0, 12.0, 19.0, 18.0, 27.0, 27.0, 19.0, 34.0, 36.0, 41.0, 41.0, 33.0, 41.0, 32.0, 53.0, 41.0, 52.0, 50.0, 53.0, 46.0, 28.0, 42.0, 34.0, 29.0, 22.0, 21.0, 23.0, 14.0, 14.0, 10.0, 8.0, 9.0, 3.0, 9.0, 5.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.002740025520324707, -0.0026406217366456985, -0.00254121795296669, -0.0024418141692876816, -0.002342410385608673, -0.0022430066019296646, -0.002143602818250656, -0.0020441990345716476, -0.0019447952508926392, -0.0018453914672136307, -0.0017459876835346222, -0.0016465838998556137, -0.0015471801161766052, -0.0014477763324975967, -0.0013483725488185883, -0.0012489687651395798, -0.0011495649814605713, -0.0010501611977815628, -0.0009507574141025543, -0.0008513536304235458, -0.0007519498467445374, -0.0006525460630655289, -0.0005531422793865204, -0.0004537384957075119, -0.0003543347120285034, -0.00025493092834949493, -0.00015552714467048645, -5.6123360991477966e-05, 4.328042268753052e-05, 0.000142684206366539, 0.00024208799004554749, 0.00034149177372455597, 0.00044089555740356445, 0.0005402993410825729, 0.0006397031247615814, 0.0007391069084405899, 0.0008385106921195984, 0.0009379144757986069, 0.0010373182594776154, 0.0011367220431566238, 0.0012361258268356323, 0.0013355296105146408, 0.0014349333941936493, 0.0015343371778726578, 0.0016337409615516663, 0.0017331447452306747, 0.0018325485289096832, 0.0019319523125886917, 0.0020313560962677, 0.0021307598799467087, 0.002230163663625717, 0.0023295674473047256, 0.002428971230983734, 0.0025283750146627426, 0.002627778798341751, 0.0027271825820207596, 0.002826586365699768, 0.0029259901493787766, 0.003025393933057785, 0.0031247977167367935, 0.003224201500415802, 0.0033236052840948105, 0.003423009067773819, 0.0035224128514528275, 0.003621816635131836]}, "gradients/decoder.transformer.h.2.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 2.0, 2.0, 5.0, 5.0, 10.0, 9.0, 11.0, 11.0, 10.0, 13.0, 12.0, 25.0, 25.0, 31.0, 27.0, 30.0, 42.0, 40.0, 46.0, 33.0, 47.0, 45.0, 48.0, 48.0, 47.0, 41.0, 24.0, 39.0, 38.0, 32.0, 42.0, 22.0, 25.0, 18.0, 15.0, 28.0, 9.0, 11.0, 12.0, 4.0, 4.0, 6.0, 6.0, 3.0, 4.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.96875, -8.6546630859375, -8.340576171875, -8.0264892578125, -7.71240234375, -7.3983154296875, -7.084228515625, -6.7701416015625, -6.4560546875, -6.1419677734375, -5.827880859375, -5.5137939453125, -5.19970703125, -4.8856201171875, -4.571533203125, -4.2574462890625, -3.943359375, -3.6292724609375, -3.315185546875, -3.0010986328125, -2.68701171875, -2.3729248046875, -2.058837890625, -1.7447509765625, -1.4306640625, -1.1165771484375, -0.802490234375, -0.4884033203125, -0.17431640625, 0.1397705078125, 0.453857421875, 0.7679443359375, 1.08203125, 1.3961181640625, 1.710205078125, 2.0242919921875, 2.33837890625, 2.6524658203125, 2.966552734375, 3.2806396484375, 3.5947265625, 3.9088134765625, 4.222900390625, 4.5369873046875, 4.85107421875, 5.1651611328125, 5.479248046875, 5.7933349609375, 6.107421875, 6.4215087890625, 6.735595703125, 7.0496826171875, 7.36376953125, 7.6778564453125, 7.991943359375, 8.3060302734375, 8.6201171875, 8.9342041015625, 9.248291015625, 9.5623779296875, 9.87646484375, 10.1905517578125, 10.504638671875, 10.8187255859375, 11.1328125]}, "gradients/decoder.transformer.h.2.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 8.0, 3.0, 6.0, 10.0, 5.0, 18.0, 15.0, 29.0, 35.0, 45.0, 80.0, 91.0, 134.0, 169.0, 254.0, 407.0, 550.0, 867.0, 1302.0, 2141.0, 3991.0, 11200.0, 83071.0, 732706.0, 180886.0, 18353.0, 5144.0, 2448.0, 1584.0, 936.0, 620.0, 422.0, 304.0, 216.0, 154.0, 108.0, 66.0, 49.0, 35.0, 27.0, 22.0, 19.0, 10.0, 6.0, 3.0, 9.0, 3.0, 3.0, 2.0, 0.0, 0.0, 1.0, 3.0], "bins": [-28.921875, -28.087158203125, -27.25244140625, -26.417724609375, -25.5830078125, -24.748291015625, -23.91357421875, -23.078857421875, -22.244140625, -21.409423828125, -20.57470703125, -19.739990234375, -18.9052734375, -18.070556640625, -17.23583984375, -16.401123046875, -15.56640625, -14.731689453125, -13.89697265625, -13.062255859375, -12.2275390625, -11.392822265625, -10.55810546875, -9.723388671875, -8.888671875, -8.053955078125, -7.21923828125, -6.384521484375, -5.5498046875, -4.715087890625, -3.88037109375, -3.045654296875, -2.2109375, -1.376220703125, -0.54150390625, 0.293212890625, 1.1279296875, 1.962646484375, 2.79736328125, 3.632080078125, 4.466796875, 5.301513671875, 6.13623046875, 6.970947265625, 7.8056640625, 8.640380859375, 9.47509765625, 10.309814453125, 11.14453125, 11.979248046875, 12.81396484375, 13.648681640625, 14.4833984375, 15.318115234375, 16.15283203125, 16.987548828125, 17.822265625, 18.656982421875, 19.49169921875, 20.326416015625, 21.1611328125, 21.995849609375, 22.83056640625, 23.665283203125, 24.5]}, "gradients/decoder.transformer.h.2.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 3.0, 9.0, 8.0, 8.0, 4.0, 20.0, 7.0, 16.0, 21.0, 17.0, 24.0, 36.0, 42.0, 45.0, 46.0, 58.0, 78.0, 188.0, 1666.0, 245.0, 84.0, 59.0, 58.0, 39.0, 38.0, 35.0, 22.0, 28.0, 29.0, 16.0, 11.0, 6.0, 14.0, 13.0, 10.0, 12.0, 6.0, 6.0, 12.0, 3.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-26.546875, -25.7333984375, -24.919921875, -24.1064453125, -23.29296875, -22.4794921875, -21.666015625, -20.8525390625, -20.0390625, -19.2255859375, -18.412109375, -17.5986328125, -16.78515625, -15.9716796875, -15.158203125, -14.3447265625, -13.53125, -12.7177734375, -11.904296875, -11.0908203125, -10.27734375, -9.4638671875, -8.650390625, -7.8369140625, -7.0234375, -6.2099609375, -5.396484375, -4.5830078125, -3.76953125, -2.9560546875, -2.142578125, -1.3291015625, -0.515625, 0.2978515625, 1.111328125, 1.9248046875, 2.73828125, 3.5517578125, 4.365234375, 5.1787109375, 5.9921875, 6.8056640625, 7.619140625, 8.4326171875, 9.24609375, 10.0595703125, 10.873046875, 11.6865234375, 12.5, 13.3134765625, 14.126953125, 14.9404296875, 15.75390625, 16.5673828125, 17.380859375, 18.1943359375, 19.0078125, 19.8212890625, 20.634765625, 21.4482421875, 22.26171875, 23.0751953125, 23.888671875, 24.7021484375, 25.515625]}, "gradients/decoder.transformer.h.2.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 4.0, 1.0, 8.0, 14.0, 15.0, 12.0, 9.0, 13.0, 20.0, 23.0, 25.0, 32.0, 48.0, 76.0, 73.0, 97.0, 116.0, 171.0, 293.0, 526.0, 1218.0, 16863.0, 3118783.0, 4957.0, 973.0, 454.0, 247.0, 150.0, 109.0, 90.0, 52.0, 57.0, 36.0, 34.0, 26.0, 18.0, 19.0, 12.0, 11.0, 6.0, 5.0, 3.0, 3.0, 2.0, 3.0, 2.0, 4.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-70.75, -68.5654296875, -66.380859375, -64.1962890625, -62.01171875, -59.8271484375, -57.642578125, -55.4580078125, -53.2734375, -51.0888671875, -48.904296875, -46.7197265625, -44.53515625, -42.3505859375, -40.166015625, -37.9814453125, -35.796875, -33.6123046875, -31.427734375, -29.2431640625, -27.05859375, -24.8740234375, -22.689453125, -20.5048828125, -18.3203125, -16.1357421875, -13.951171875, -11.7666015625, -9.58203125, -7.3974609375, -5.212890625, -3.0283203125, -0.84375, 1.3408203125, 3.525390625, 5.7099609375, 7.89453125, 10.0791015625, 12.263671875, 14.4482421875, 16.6328125, 18.8173828125, 21.001953125, 23.1865234375, 25.37109375, 27.5556640625, 29.740234375, 31.9248046875, 34.109375, 36.2939453125, 38.478515625, 40.6630859375, 42.84765625, 45.0322265625, 47.216796875, 49.4013671875, 51.5859375, 53.7705078125, 55.955078125, 58.1396484375, 60.32421875, 62.5087890625, 64.693359375, 66.8779296875, 69.0625]}, "gradients/decoder.transformer.h.2.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 7.0, 24.0, 171.0, 418.0, 298.0, 79.0, 18.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-148.11790466308594, -143.9623260498047, -139.8067626953125, -135.65118408203125, -131.49562072753906, -127.34004211425781, -123.1844711303711, -119.02890014648438, -114.87332153320312, -110.7177505493164, -106.56217956542969, -102.40660095214844, -98.25102996826172, -94.095458984375, -89.93988800048828, -85.78431701660156, -81.62874603271484, -77.47317504882812, -73.3176040649414, -69.16203308105469, -65.00645446777344, -60.85088348388672, -56.6953125, -52.53974151611328, -48.3841667175293, -44.22859573364258, -40.073020935058594, -35.917449951171875, -31.761877059936523, -27.606304168701172, -23.450733184814453, -19.2951602935791, -15.139595031738281, -10.98402214050293, -6.8284502029418945, -2.6728782653808594, 1.4826946258544922, 5.638267517089844, 9.793838500976562, 13.949411392211914, 18.104984283447266, 22.260557174682617, 26.41613006591797, 30.571701049804688, 34.727272033691406, 38.88284683227539, 43.03841781616211, 47.193992614746094, 51.34956359863281, 55.50513458251953, 59.660709381103516, 63.816280364990234, 67.97185516357422, 72.12742614746094, 76.28299713134766, 80.43856811523438, 84.59414672851562, 88.74971771240234, 92.90528869628906, 97.06086730957031, 101.21643829345703, 105.37200927734375, 109.52758026123047, 113.68315124511719, 117.8387222290039]}, "gradients/decoder.transformer.h.2.ln_1.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 2.0, 1.0, 2.0, 1.0, 2.0, 2.0, 9.0, 1.0, 11.0, 6.0, 12.0, 12.0, 5.0, 15.0, 10.0, 26.0, 23.0, 24.0, 27.0, 27.0, 25.0, 39.0, 35.0, 27.0, 35.0, 41.0, 39.0, 41.0, 35.0, 44.0, 41.0, 37.0, 35.0, 35.0, 36.0, 27.0, 31.0, 27.0, 27.0, 18.0, 21.0, 13.0, 17.0, 17.0, 13.0, 6.0, 7.0, 6.0, 7.0, 3.0, 3.0, 7.0, 4.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-64.98450469970703, -62.85363006591797, -60.72275161743164, -58.59187698364258, -56.46099853515625, -54.33012390136719, -52.199249267578125, -50.06837463378906, -47.937496185302734, -45.80662155151367, -43.675743103027344, -41.54486846923828, -39.41399383544922, -37.28311538696289, -35.15224075317383, -33.0213623046875, -30.890487670898438, -28.759611129760742, -26.628734588623047, -24.497859954833984, -22.36698341369629, -20.236106872558594, -18.10523223876953, -15.974355697631836, -13.84347915649414, -11.712602615356445, -9.581727027893066, -7.450850963592529, -5.319974899291992, -3.189098358154297, -1.058222770690918, 1.072652816772461, 3.203521728515625, 5.334397792816162, 7.465273857116699, 9.596149444580078, 11.727025985717773, 13.857902526855469, 15.988778114318848, 18.119653701782227, 20.250530242919922, 22.381406784057617, 24.512283325195312, 26.643157958984375, 28.77403450012207, 30.904911041259766, 33.03578567504883, 35.166664123535156, 37.29753875732422, 39.42841339111328, 41.55929183959961, 43.69016647338867, 45.821044921875, 47.95191955566406, 50.082794189453125, 52.21366882324219, 54.344547271728516, 56.47542190551758, 58.606300354003906, 60.73717498779297, 62.86804962158203, 64.99893188476562, 67.12980651855469, 69.26068115234375, 71.39155578613281]}, "gradients/decoder.transformer.h.1.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 6.0, 1.0, 7.0, 9.0, 6.0, 5.0, 11.0, 13.0, 12.0, 12.0, 18.0, 24.0, 21.0, 29.0, 30.0, 25.0, 43.0, 49.0, 42.0, 61.0, 44.0, 53.0, 38.0, 45.0, 32.0, 39.0, 40.0, 40.0, 43.0, 28.0, 35.0, 29.0, 22.0, 15.0, 20.0, 16.0, 8.0, 9.0, 7.0, 8.0, 6.0, 5.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.15625, -9.8074951171875, -9.458740234375, -9.1099853515625, -8.76123046875, -8.4124755859375, -8.063720703125, -7.7149658203125, -7.3662109375, -7.0174560546875, -6.668701171875, -6.3199462890625, -5.97119140625, -5.6224365234375, -5.273681640625, -4.9249267578125, -4.576171875, -4.2274169921875, -3.878662109375, -3.5299072265625, -3.18115234375, -2.8323974609375, -2.483642578125, -2.1348876953125, -1.7861328125, -1.4373779296875, -1.088623046875, -0.7398681640625, -0.39111328125, -0.0423583984375, 0.306396484375, 0.6551513671875, 1.00390625, 1.3526611328125, 1.701416015625, 2.0501708984375, 2.39892578125, 2.7476806640625, 3.096435546875, 3.4451904296875, 3.7939453125, 4.1427001953125, 4.491455078125, 4.8402099609375, 5.18896484375, 5.5377197265625, 5.886474609375, 6.2352294921875, 6.583984375, 6.9327392578125, 7.281494140625, 7.6302490234375, 7.97900390625, 8.3277587890625, 8.676513671875, 9.0252685546875, 9.3740234375, 9.7227783203125, 10.071533203125, 10.4202880859375, 10.76904296875, 11.1177978515625, 11.466552734375, 11.8153076171875, 12.1640625]}, "gradients/decoder.transformer.h.1.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 8.0, 5.0, 12.0, 13.0, 14.0, 17.0, 27.0, 35.0, 41.0, 71.0, 91.0, 161.0, 219.0, 296.0, 490.0, 794.0, 1337.0, 2161.0, 3805.0, 7042.0, 15672.0, 51207.0, 277893.0, 1245943.0, 1862569.0, 572894.0, 104773.0, 24392.0, 9829.0, 5107.0, 2791.0, 1615.0, 1005.0, 659.0, 446.0, 272.0, 155.0, 127.0, 88.0, 63.0, 53.0, 29.0, 19.0, 17.0, 10.0, 7.0, 10.0, 1.0, 1.0, 2.0, 3.0, 4.0, 0.0, 2.0, 1.0, 1.0], "bins": [-14.328125, -13.8834228515625, -13.438720703125, -12.9940185546875, -12.54931640625, -12.1046142578125, -11.659912109375, -11.2152099609375, -10.7705078125, -10.3258056640625, -9.881103515625, -9.4364013671875, -8.99169921875, -8.5469970703125, -8.102294921875, -7.6575927734375, -7.212890625, -6.7681884765625, -6.323486328125, -5.8787841796875, -5.43408203125, -4.9893798828125, -4.544677734375, -4.0999755859375, -3.6552734375, -3.2105712890625, -2.765869140625, -2.3211669921875, -1.87646484375, -1.4317626953125, -0.987060546875, -0.5423583984375, -0.09765625, 0.3470458984375, 0.791748046875, 1.2364501953125, 1.68115234375, 2.1258544921875, 2.570556640625, 3.0152587890625, 3.4599609375, 3.9046630859375, 4.349365234375, 4.7940673828125, 5.23876953125, 5.6834716796875, 6.128173828125, 6.5728759765625, 7.017578125, 7.4622802734375, 7.906982421875, 8.3516845703125, 8.79638671875, 9.2410888671875, 9.685791015625, 10.1304931640625, 10.5751953125, 11.0198974609375, 11.464599609375, 11.9093017578125, 12.35400390625, 12.7987060546875, 13.243408203125, 13.6881103515625, 14.1328125]}, "gradients/decoder.transformer.h.1.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 1.0, 0.0, 7.0, 9.0, 18.0, 62.0, 157.0, 384.0, 923.0, 1394.0, 662.0, 302.0, 98.0, 43.0, 18.0, 6.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-55.625, -54.05029296875, -52.4755859375, -50.90087890625, -49.326171875, -47.75146484375, -46.1767578125, -44.60205078125, -43.02734375, -41.45263671875, -39.8779296875, -38.30322265625, -36.728515625, -35.15380859375, -33.5791015625, -32.00439453125, -30.4296875, -28.85498046875, -27.2802734375, -25.70556640625, -24.130859375, -22.55615234375, -20.9814453125, -19.40673828125, -17.83203125, -16.25732421875, -14.6826171875, -13.10791015625, -11.533203125, -9.95849609375, -8.3837890625, -6.80908203125, -5.234375, -3.65966796875, -2.0849609375, -0.51025390625, 1.064453125, 2.63916015625, 4.2138671875, 5.78857421875, 7.36328125, 8.93798828125, 10.5126953125, 12.08740234375, 13.662109375, 15.23681640625, 16.8115234375, 18.38623046875, 19.9609375, 21.53564453125, 23.1103515625, 24.68505859375, 26.259765625, 27.83447265625, 29.4091796875, 30.98388671875, 32.55859375, 34.13330078125, 35.7080078125, 37.28271484375, 38.857421875, 40.43212890625, 42.0068359375, 43.58154296875, 45.15625]}, "gradients/decoder.transformer.h.1.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 7.0, 5.0, 10.0, 21.0, 54.0, 128.0, 373.0, 1201.0, 7359.0, 4154677.0, 27934.0, 1731.0, 476.0, 167.0, 63.0, 30.0, 25.0, 10.0, 6.0, 5.0, 2.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-94.9375, -91.7333984375, -88.529296875, -85.3251953125, -82.12109375, -78.9169921875, -75.712890625, -72.5087890625, -69.3046875, -66.1005859375, -62.896484375, -59.6923828125, -56.48828125, -53.2841796875, -50.080078125, -46.8759765625, -43.671875, -40.4677734375, -37.263671875, -34.0595703125, -30.85546875, -27.6513671875, -24.447265625, -21.2431640625, -18.0390625, -14.8349609375, -11.630859375, -8.4267578125, -5.22265625, -2.0185546875, 1.185546875, 4.3896484375, 7.59375, 10.7978515625, 14.001953125, 17.2060546875, 20.41015625, 23.6142578125, 26.818359375, 30.0224609375, 33.2265625, 36.4306640625, 39.634765625, 42.8388671875, 46.04296875, 49.2470703125, 52.451171875, 55.6552734375, 58.859375, 62.0634765625, 65.267578125, 68.4716796875, 71.67578125, 74.8798828125, 78.083984375, 81.2880859375, 84.4921875, 87.6962890625, 90.900390625, 94.1044921875, 97.30859375, 100.5126953125, 103.716796875, 106.9208984375, 110.125]}, "gradients/decoder.transformer.h.1.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 9.0, 25.0, 38.0, 101.0, 179.0, 249.0, 178.0, 145.0, 53.0, 23.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-116.05976867675781, -112.28221130371094, -108.50465393066406, -104.72710418701172, -100.94954681396484, -97.17198944091797, -93.39443969726562, -89.61688232421875, -85.83932495117188, -82.061767578125, -78.28421020507812, -74.50666046142578, -70.7291030883789, -66.95154571533203, -63.17399215698242, -59.39643859863281, -55.61888122558594, -51.84132385253906, -48.06377029418945, -44.286216735839844, -40.50865936279297, -36.731101989746094, -32.953548431396484, -29.175992965698242, -25.3984375, -21.620882034301758, -17.843326568603516, -14.065771102905273, -10.288215637207031, -6.510660171508789, -2.733104705810547, 1.0444507598876953, 4.8220062255859375, 8.59956169128418, 12.377117156982422, 16.154672622680664, 19.932228088378906, 23.70978355407715, 27.48733901977539, 31.264894485473633, 35.042449951171875, 38.82000732421875, 42.59756088256836, 46.37511444091797, 50.152671813964844, 53.93022918701172, 57.70778274536133, 61.48533630371094, 65.26289367675781, 69.04045104980469, 72.81800842285156, 76.5955581665039, 80.37311553955078, 84.15067291259766, 87.92822265625, 91.70578002929688, 95.48333740234375, 99.26089477539062, 103.0384521484375, 106.81600189208984, 110.59355926513672, 114.3711166381836, 118.14866638183594, 121.92622375488281, 125.70378112792969]}, "gradients/decoder.transformer.h.1.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0, 3.0, 3.0, 3.0, 10.0, 11.0, 12.0, 10.0, 16.0, 19.0, 18.0, 22.0, 27.0, 22.0, 21.0, 32.0, 44.0, 28.0, 44.0, 45.0, 44.0, 42.0, 28.0, 45.0, 45.0, 37.0, 45.0, 36.0, 31.0, 37.0, 27.0, 18.0, 20.0, 23.0, 28.0, 17.0, 15.0, 16.0, 13.0, 6.0, 8.0, 8.0, 3.0, 7.0, 8.0, 1.0, 2.0, 1.0, 3.0, 0.0, 3.0, 0.0, 2.0, 1.0], "bins": [-72.61593627929688, -70.43852233886719, -68.2611083984375, -66.08369445800781, -63.90628433227539, -61.7288703918457, -59.55146026611328, -57.374046325683594, -55.196632385253906, -53.01921844482422, -50.84180450439453, -48.66439437866211, -46.48698043823242, -44.309566497802734, -42.13215637207031, -39.954742431640625, -37.77732849121094, -35.59991455078125, -33.42250061035156, -31.24509048461914, -29.067676544189453, -26.890262603759766, -24.71285057067871, -22.535438537597656, -20.35802459716797, -18.18061065673828, -16.003198623657227, -13.825785636901855, -11.648372650146484, -9.470959663391113, -7.293546676635742, -5.116133689880371, -2.938720703125, -0.7613077163696289, 1.4161052703857422, 3.5935182571411133, 5.770931243896484, 7.9483442306518555, 10.125757217407227, 12.303170204162598, 14.480583190917969, 16.657997131347656, 18.83540916442871, 21.012821197509766, 23.190235137939453, 25.36764907836914, 27.545061111450195, 29.72247314453125, 31.899887084960938, 34.077301025390625, 36.25471496582031, 38.432125091552734, 40.60953903198242, 42.78695297241211, 44.96436309814453, 47.14177703857422, 49.319190979003906, 51.496604919433594, 53.67401885986328, 55.8514289855957, 58.02884292602539, 60.20625686645508, 62.3836669921875, 64.56108093261719, 66.73849487304688]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 12.0, 11.0, 11.0, 17.0, 16.0, 15.0, 25.0, 24.0, 26.0, 29.0, 41.0, 32.0, 44.0, 41.0, 48.0, 35.0, 47.0, 49.0, 40.0, 43.0, 45.0, 40.0, 42.0, 34.0, 38.0, 34.0, 23.0, 17.0, 17.0, 13.0, 14.0, 16.0, 9.0, 10.0, 14.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.78125, -8.51922607421875, -8.2572021484375, -7.99517822265625, -7.733154296875, -7.47113037109375, -7.2091064453125, -6.94708251953125, -6.68505859375, -6.42303466796875, -6.1610107421875, -5.89898681640625, -5.636962890625, -5.37493896484375, -5.1129150390625, -4.85089111328125, -4.5888671875, -4.32684326171875, -4.0648193359375, -3.80279541015625, -3.540771484375, -3.27874755859375, -3.0167236328125, -2.75469970703125, -2.49267578125, -2.23065185546875, -1.9686279296875, -1.70660400390625, -1.444580078125, -1.18255615234375, -0.9205322265625, -0.65850830078125, -0.396484375, -0.13446044921875, 0.1275634765625, 0.38958740234375, 0.651611328125, 0.91363525390625, 1.1756591796875, 1.43768310546875, 1.69970703125, 1.96173095703125, 2.2237548828125, 2.48577880859375, 2.747802734375, 3.00982666015625, 3.2718505859375, 3.53387451171875, 3.7958984375, 4.05792236328125, 4.3199462890625, 4.58197021484375, 4.843994140625, 5.10601806640625, 5.3680419921875, 5.63006591796875, 5.89208984375, 6.15411376953125, 6.4161376953125, 6.67816162109375, 6.940185546875, 7.20220947265625, 7.4642333984375, 7.72625732421875, 7.98828125]}, "gradients/decoder.transformer.h.1.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 5.0, 8.0, 5.0, 9.0, 16.0, 21.0, 32.0, 67.0, 80.0, 123.0, 159.0, 239.0, 326.0, 399.0, 604.0, 847.0, 1153.0, 1796.0, 2639.0, 3725.0, 5374.0, 8077.0, 11589.0, 17239.0, 25922.0, 37887.0, 57266.0, 85429.0, 123137.0, 158701.0, 152920.0, 114445.0, 78417.0, 52081.0, 34787.0, 23217.0, 15657.0, 10606.0, 7266.0, 5064.0, 3365.0, 2354.0, 1754.0, 1034.0, 824.0, 584.0, 384.0, 271.0, 196.0, 141.0, 89.0, 83.0, 58.0, 35.0, 25.0, 13.0, 10.0, 7.0, 5.0, 4.0, 1.0, 2.0, 2.0], "bins": [-0.5673828125, -0.54901123046875, -0.5306396484375, -0.51226806640625, -0.493896484375, -0.47552490234375, -0.4571533203125, -0.43878173828125, -0.42041015625, -0.40203857421875, -0.3836669921875, -0.36529541015625, -0.346923828125, -0.32855224609375, -0.3101806640625, -0.29180908203125, -0.2734375, -0.25506591796875, -0.2366943359375, -0.21832275390625, -0.199951171875, -0.18157958984375, -0.1632080078125, -0.14483642578125, -0.12646484375, -0.10809326171875, -0.0897216796875, -0.07135009765625, -0.052978515625, -0.03460693359375, -0.0162353515625, 0.00213623046875, 0.0205078125, 0.03887939453125, 0.0572509765625, 0.07562255859375, 0.093994140625, 0.11236572265625, 0.1307373046875, 0.14910888671875, 0.16748046875, 0.18585205078125, 0.2042236328125, 0.22259521484375, 0.240966796875, 0.25933837890625, 0.2777099609375, 0.29608154296875, 0.314453125, 0.33282470703125, 0.3511962890625, 0.36956787109375, 0.387939453125, 0.40631103515625, 0.4246826171875, 0.44305419921875, 0.46142578125, 0.47979736328125, 0.4981689453125, 0.51654052734375, 0.534912109375, 0.55328369140625, 0.5716552734375, 0.59002685546875, 0.6083984375]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 2.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 3.0, 5.0, 6.0, 5.0, 3.0, 20.0, 11.0, 15.0, 15.0, 19.0, 13.0, 22.0, 29.0, 26.0, 42.0, 30.0, 39.0, 38.0, 31.0, 39.0, 39.0, 1062.0, 41.0, 44.0, 32.0, 35.0, 37.0, 53.0, 33.0, 30.0, 37.0, 32.0, 19.0, 23.0, 18.0, 18.0, 15.0, 4.0, 8.0, 16.0, 5.0, 4.0, 3.0, 7.0, 1.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-5.08203125, -4.92010498046875, -4.7581787109375, -4.59625244140625, -4.434326171875, -4.27239990234375, -4.1104736328125, -3.94854736328125, -3.78662109375, -3.62469482421875, -3.4627685546875, -3.30084228515625, -3.138916015625, -2.97698974609375, -2.8150634765625, -2.65313720703125, -2.4912109375, -2.32928466796875, -2.1673583984375, -2.00543212890625, -1.843505859375, -1.68157958984375, -1.5196533203125, -1.35772705078125, -1.19580078125, -1.03387451171875, -0.8719482421875, -0.71002197265625, -0.548095703125, -0.38616943359375, -0.2242431640625, -0.06231689453125, 0.099609375, 0.26153564453125, 0.4234619140625, 0.58538818359375, 0.747314453125, 0.90924072265625, 1.0711669921875, 1.23309326171875, 1.39501953125, 1.55694580078125, 1.7188720703125, 1.88079833984375, 2.042724609375, 2.20465087890625, 2.3665771484375, 2.52850341796875, 2.6904296875, 2.85235595703125, 3.0142822265625, 3.17620849609375, 3.338134765625, 3.50006103515625, 3.6619873046875, 3.82391357421875, 3.98583984375, 4.14776611328125, 4.3096923828125, 4.47161865234375, 4.633544921875, 4.79547119140625, 4.9573974609375, 5.11932373046875, 5.28125]}, "gradients/decoder.transformer.h.1.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 6.0, 10.0, 12.0, 17.0, 30.0, 40.0, 58.0, 99.0, 149.0, 217.0, 327.0, 492.0, 727.0, 1104.0, 1734.0, 2637.0, 3925.0, 5950.0, 9123.0, 14329.0, 22324.0, 34714.0, 52740.0, 80262.0, 118977.0, 189770.0, 1172307.0, 127635.0, 89885.0, 58566.0, 38151.0, 24603.0, 16120.0, 10553.0, 6733.0, 4364.0, 2902.0, 1909.0, 1269.0, 807.0, 558.0, 338.0, 214.0, 170.0, 91.0, 64.0, 38.0, 31.0, 24.0, 10.0, 10.0, 7.0, 3.0, 2.0, 1.0, 2.0], "bins": [-0.5556640625, -0.5393791198730469, -0.5230941772460938, -0.5068092346191406, -0.4905242919921875, -0.4742393493652344, -0.45795440673828125, -0.4416694641113281, -0.425384521484375, -0.4090995788574219, -0.39281463623046875, -0.3765296936035156, -0.3602447509765625, -0.3439598083496094, -0.32767486572265625, -0.3113899230957031, -0.29510498046875, -0.2788200378417969, -0.26253509521484375, -0.24625015258789062, -0.2299652099609375, -0.21368026733398438, -0.19739532470703125, -0.18111038208007812, -0.164825439453125, -0.14854049682617188, -0.13225555419921875, -0.11597061157226562, -0.0996856689453125, -0.08340072631835938, -0.06711578369140625, -0.050830841064453125, -0.0345458984375, -0.018260955810546875, -0.00197601318359375, 0.014308929443359375, 0.0305938720703125, 0.046878814697265625, 0.06316375732421875, 0.07944869995117188, 0.095733642578125, 0.11201858520507812, 0.12830352783203125, 0.14458847045898438, 0.1608734130859375, 0.17715835571289062, 0.19344329833984375, 0.20972824096679688, 0.22601318359375, 0.24229812622070312, 0.25858306884765625, 0.2748680114746094, 0.2911529541015625, 0.3074378967285156, 0.32372283935546875, 0.3400077819824219, 0.356292724609375, 0.3725776672363281, 0.38886260986328125, 0.4051475524902344, 0.4214324951171875, 0.4377174377441406, 0.45400238037109375, 0.4702873229980469, 0.486572265625]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 4.0, 1.0, 1.0, 2.0, 6.0, 8.0, 2.0, 11.0, 6.0, 13.0, 14.0, 24.0, 13.0, 38.0, 44.0, 43.0, 55.0, 71.0, 63.0, 83.0, 69.0, 63.0, 71.0, 60.0, 37.0, 31.0, 27.0, 28.0, 22.0, 13.0, 9.0, 11.0, 10.0, 12.0, 7.0, 8.0, 3.0, 4.0, 2.0, 4.0, 3.0, 1.0, 5.0, 0.0, 3.0, 1.0, 2.0, 0.0, 1.0, 2.0], "bins": [-0.005489349365234375, -0.0053269267082214355, -0.005164504051208496, -0.005002081394195557, -0.004839658737182617, -0.004677236080169678, -0.004514813423156738, -0.004352390766143799, -0.004189968109130859, -0.00402754545211792, -0.0038651227951049805, -0.003702700138092041, -0.0035402774810791016, -0.003377854824066162, -0.0032154321670532227, -0.003053009510040283, -0.0028905868530273438, -0.0027281641960144043, -0.002565741539001465, -0.0024033188819885254, -0.002240896224975586, -0.0020784735679626465, -0.001916050910949707, -0.0017536282539367676, -0.0015912055969238281, -0.0014287829399108887, -0.0012663602828979492, -0.0011039376258850098, -0.0009415149688720703, -0.0007790923118591309, -0.0006166696548461914, -0.00045424699783325195, -0.0002918243408203125, -0.00012940168380737305, 3.3020973205566406e-05, 0.00019544363021850586, 0.0003578662872314453, 0.0005202889442443848, 0.0006827116012573242, 0.0008451342582702637, 0.0010075569152832031, 0.0011699795722961426, 0.001332402229309082, 0.0014948248863220215, 0.001657247543334961, 0.0018196702003479004, 0.00198209285736084, 0.0021445155143737793, 0.0023069381713867188, 0.002469360828399658, 0.0026317834854125977, 0.002794206142425537, 0.0029566287994384766, 0.003119051456451416, 0.0032814741134643555, 0.003443896770477295, 0.0036063194274902344, 0.003768742084503174, 0.003931164741516113, 0.004093587398529053, 0.004256010055541992, 0.004418432712554932, 0.004580855369567871, 0.0047432780265808105, 0.00490570068359375]}, "gradients/decoder.transformer.h.1.crossattention.q_attn.weight": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 5.0, 5.0, 5.0, 10.0, 7.0, 10.0, 10.0, 18.0, 16.0, 24.0, 31.0, 35.0, 44.0, 55.0, 71.0, 82.0, 131.0, 194.0, 294.0, 526.0, 920.0, 16600.0, 1023462.0, 3932.0, 752.0, 430.0, 252.0, 178.0, 124.0, 83.0, 53.0, 36.0, 42.0, 18.0, 17.0, 10.0, 18.0, 10.0, 7.0, 4.0, 8.0, 6.0, 4.0, 7.0, 2.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.09210205078125, -0.08906936645507812, -0.08603668212890625, -0.08300399780273438, -0.0799713134765625, -0.07693862915039062, -0.07390594482421875, -0.07087326049804688, -0.067840576171875, -0.06480789184570312, -0.06177520751953125, -0.058742523193359375, -0.0557098388671875, -0.052677154541015625, -0.04964447021484375, -0.046611785888671875, -0.0435791015625, -0.040546417236328125, -0.03751373291015625, -0.034481048583984375, -0.0314483642578125, -0.028415679931640625, -0.02538299560546875, -0.022350311279296875, -0.019317626953125, -0.016284942626953125, -0.01325225830078125, -0.010219573974609375, -0.0071868896484375, -0.004154205322265625, -0.00112152099609375, 0.001911163330078125, 0.00494384765625, 0.007976531982421875, 0.01100921630859375, 0.014041900634765625, 0.0170745849609375, 0.020107269287109375, 0.02313995361328125, 0.026172637939453125, 0.029205322265625, 0.032238006591796875, 0.03527069091796875, 0.038303375244140625, 0.0413360595703125, 0.044368743896484375, 0.04740142822265625, 0.050434112548828125, 0.053466796875, 0.056499481201171875, 0.05953216552734375, 0.06256484985351562, 0.0655975341796875, 0.06863021850585938, 0.07166290283203125, 0.07469558715820312, 0.077728271484375, 0.08076095581054688, 0.08379364013671875, 0.08682632446289062, 0.0898590087890625, 0.09289169311523438, 0.09592437744140625, 0.09895706176757812, 0.10198974609375]}, "gradients/decoder.transformer.h.1.ln_cross_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 4.0, 15.0, 118.0, 409.0, 372.0, 76.0, 15.0, 5.0, 0.0, 1.0, 1.0, 1.0], "bins": [-0.018808776512742043, -0.018472231924533844, -0.018135687336325645, -0.017799142748117447, -0.01746259815990925, -0.01712605357170105, -0.01678950898349285, -0.016452964395284653, -0.016116419807076454, -0.015779875218868256, -0.015443330630660057, -0.015106786042451859, -0.01477024145424366, -0.014433696866035461, -0.014097152277827263, -0.013760607689619064, -0.013424063101410866, -0.013087518513202667, -0.012750973924994469, -0.01241442933678627, -0.012077884748578072, -0.011741340160369873, -0.011404795572161674, -0.011068250983953476, -0.010731706395745277, -0.010395161807537079, -0.01005861721932888, -0.009722072631120682, -0.009385528042912483, -0.009048983454704285, -0.008712438866496086, -0.008375894278287888, -0.008039349690079689, -0.0077028051018714905, -0.007366260513663292, -0.007029715925455093, -0.006693171337246895, -0.006356626749038696, -0.006020082160830498, -0.005683537572622299, -0.005346993450075388, -0.005010448861867189, -0.004673904273658991, -0.004337359685450792, -0.004000815097242594, -0.0036642705090343952, -0.0033277259208261967, -0.002991181332617998, -0.0026546367444097996, -0.002318092156201601, -0.0019815475679934025, -0.001645002979785204, -0.0013084583915770054, -0.0009719138033688068, -0.0006353692151606083, -0.00029882462695240974, 3.77199612557888e-05, 0.00037426454946398735, 0.0007108091376721859, 0.0010473537258803844, 0.001383898314088583, 0.0017204429022967815, 0.00205698749050498, 0.0023935320787131786, 0.002730076666921377]}, "gradients/decoder.transformer.h.1.ln_cross_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 4.0, 2.0, 2.0, 3.0, 7.0, 10.0, 15.0, 8.0, 14.0, 19.0, 22.0, 11.0, 29.0, 17.0, 20.0, 33.0, 35.0, 28.0, 48.0, 37.0, 41.0, 47.0, 44.0, 60.0, 51.0, 43.0, 38.0, 28.0, 46.0, 39.0, 25.0, 25.0, 22.0, 22.0, 23.0, 21.0, 20.0, 7.0, 13.0, 5.0, 13.0, 1.0, 5.0, 4.0, 2.0, 3.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0031191110610961914, -0.003028430975973606, -0.002937750890851021, -0.0028470708057284355, -0.0027563907206058502, -0.002665710635483265, -0.0025750305503606796, -0.0024843504652380943, -0.002393670380115509, -0.0023029902949929237, -0.0022123102098703384, -0.002121630124747753, -0.002030950039625168, -0.0019402699545025826, -0.0018495898693799973, -0.001758909784257412, -0.0016682296991348267, -0.0015775496140122414, -0.001486869528889656, -0.0013961894437670708, -0.0013055093586444855, -0.0012148292735219002, -0.0011241491883993149, -0.0010334691032767296, -0.0009427890181541443, -0.000852108933031559, -0.0007614288479089737, -0.0006707487627863884, -0.0005800686776638031, -0.0004893885925412178, -0.0003987085074186325, -0.0003080284222960472, -0.00021734833717346191, -0.00012666825205087662, -3.598816692829132e-05, 5.4691918194293976e-05, 0.00014537200331687927, 0.00023605208843946457, 0.00032673217356204987, 0.00041741225868463516, 0.0005080923438072205, 0.0005987724289298058, 0.000689452514052391, 0.0007801325991749763, 0.0008708126842975616, 0.0009614927694201469, 0.0010521728545427322, 0.0011428529396653175, 0.0012335330247879028, 0.0013242131099104881, 0.0014148931950330734, 0.0015055732801556587, 0.001596253365278244, 0.0016869334504008293, 0.0017776135355234146, 0.001868293620646, 0.001958973705768585, 0.0020496537908911705, 0.002140333876013756, 0.002231013961136341, 0.0023216940462589264, 0.0024123741313815117, 0.002503054216504097, 0.0025937343016266823, 0.0026844143867492676]}, "gradients/decoder.transformer.h.1.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 5.0, 5.0, 12.0, 11.0, 11.0, 17.0, 16.0, 15.0, 25.0, 24.0, 25.0, 30.0, 40.0, 33.0, 44.0, 41.0, 47.0, 36.0, 46.0, 50.0, 40.0, 43.0, 44.0, 41.0, 42.0, 34.0, 38.0, 34.0, 23.0, 17.0, 17.0, 13.0, 14.0, 15.0, 10.0, 10.0, 14.0, 10.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0], "bins": [-8.78125, -8.519287109375, -8.25732421875, -7.995361328125, -7.7333984375, -7.471435546875, -7.20947265625, -6.947509765625, -6.685546875, -6.423583984375, -6.16162109375, -5.899658203125, -5.6376953125, -5.375732421875, -5.11376953125, -4.851806640625, -4.58984375, -4.327880859375, -4.06591796875, -3.803955078125, -3.5419921875, -3.280029296875, -3.01806640625, -2.756103515625, -2.494140625, -2.232177734375, -1.97021484375, -1.708251953125, -1.4462890625, -1.184326171875, -0.92236328125, -0.660400390625, -0.3984375, -0.136474609375, 0.12548828125, 0.387451171875, 0.6494140625, 0.911376953125, 1.17333984375, 1.435302734375, 1.697265625, 1.959228515625, 2.22119140625, 2.483154296875, 2.7451171875, 3.007080078125, 3.26904296875, 3.531005859375, 3.79296875, 4.054931640625, 4.31689453125, 4.578857421875, 4.8408203125, 5.102783203125, 5.36474609375, 5.626708984375, 5.888671875, 6.150634765625, 6.41259765625, 6.674560546875, 6.9365234375, 7.198486328125, 7.46044921875, 7.722412109375, 7.984375]}, "gradients/decoder.transformer.h.1.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 1.0, 3.0, 1.0, 4.0, 6.0, 4.0, 13.0, 29.0, 26.0, 44.0, 58.0, 85.0, 112.0, 138.0, 168.0, 256.0, 405.0, 590.0, 976.0, 1793.0, 3814.0, 10469.0, 43394.0, 282742.0, 580630.0, 92381.0, 18698.0, 5715.0, 2413.0, 1256.0, 778.0, 520.0, 310.0, 191.0, 130.0, 104.0, 74.0, 60.0, 46.0, 29.0, 26.0, 13.0, 12.0, 12.0, 8.0, 8.0, 6.0, 3.0, 5.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 2.0], "bins": [-15.4609375, -14.9810791015625, -14.501220703125, -14.0213623046875, -13.54150390625, -13.0616455078125, -12.581787109375, -12.1019287109375, -11.6220703125, -11.1422119140625, -10.662353515625, -10.1824951171875, -9.70263671875, -9.2227783203125, -8.742919921875, -8.2630615234375, -7.783203125, -7.3033447265625, -6.823486328125, -6.3436279296875, -5.86376953125, -5.3839111328125, -4.904052734375, -4.4241943359375, -3.9443359375, -3.4644775390625, -2.984619140625, -2.5047607421875, -2.02490234375, -1.5450439453125, -1.065185546875, -0.5853271484375, -0.10546875, 0.3743896484375, 0.854248046875, 1.3341064453125, 1.81396484375, 2.2938232421875, 2.773681640625, 3.2535400390625, 3.7333984375, 4.2132568359375, 4.693115234375, 5.1729736328125, 5.65283203125, 6.1326904296875, 6.612548828125, 7.0924072265625, 7.572265625, 8.0521240234375, 8.531982421875, 9.0118408203125, 9.49169921875, 9.9715576171875, 10.451416015625, 10.9312744140625, 11.4111328125, 11.8909912109375, 12.370849609375, 12.8507080078125, 13.33056640625, 13.8104248046875, 14.290283203125, 14.7701416015625, 15.25]}, "gradients/decoder.transformer.h.1.attn.c_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 2.0, 7.0, 11.0, 8.0, 7.0, 21.0, 16.0, 29.0, 31.0, 28.0, 38.0, 44.0, 61.0, 91.0, 177.0, 1569.0, 366.0, 142.0, 94.0, 70.0, 45.0, 39.0, 32.0, 28.0, 23.0, 14.0, 27.0, 7.0, 4.0, 6.0, 4.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-27.875, -26.9716796875, -26.068359375, -25.1650390625, -24.26171875, -23.3583984375, -22.455078125, -21.5517578125, -20.6484375, -19.7451171875, -18.841796875, -17.9384765625, -17.03515625, -16.1318359375, -15.228515625, -14.3251953125, -13.421875, -12.5185546875, -11.615234375, -10.7119140625, -9.80859375, -8.9052734375, -8.001953125, -7.0986328125, -6.1953125, -5.2919921875, -4.388671875, -3.4853515625, -2.58203125, -1.6787109375, -0.775390625, 0.1279296875, 1.03125, 1.9345703125, 2.837890625, 3.7412109375, 4.64453125, 5.5478515625, 6.451171875, 7.3544921875, 8.2578125, 9.1611328125, 10.064453125, 10.9677734375, 11.87109375, 12.7744140625, 13.677734375, 14.5810546875, 15.484375, 16.3876953125, 17.291015625, 18.1943359375, 19.09765625, 20.0009765625, 20.904296875, 21.8076171875, 22.7109375, 23.6142578125, 24.517578125, 25.4208984375, 26.32421875, 27.2275390625, 28.130859375, 29.0341796875, 29.9375]}, "gradients/decoder.transformer.h.1.attn.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 3.0, 1.0, 3.0, 3.0, 15.0, 15.0, 19.0, 24.0, 35.0, 37.0, 73.0, 166.0, 285.0, 650.0, 2640.0, 3132158.0, 7973.0, 809.0, 351.0, 177.0, 94.0, 47.0, 24.0, 27.0, 22.0, 16.0, 10.0, 10.0, 5.0, 5.0, 4.0, 5.0, 3.0, 0.0, 0.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.5, -87.8095703125, -85.119140625, -82.4287109375, -79.73828125, -77.0478515625, -74.357421875, -71.6669921875, -68.9765625, -66.2861328125, -63.595703125, -60.9052734375, -58.21484375, -55.5244140625, -52.833984375, -50.1435546875, -47.453125, -44.7626953125, -42.072265625, -39.3818359375, -36.69140625, -34.0009765625, -31.310546875, -28.6201171875, -25.9296875, -23.2392578125, -20.548828125, -17.8583984375, -15.16796875, -12.4775390625, -9.787109375, -7.0966796875, -4.40625, -1.7158203125, 0.974609375, 3.6650390625, 6.35546875, 9.0458984375, 11.736328125, 14.4267578125, 17.1171875, 19.8076171875, 22.498046875, 25.1884765625, 27.87890625, 30.5693359375, 33.259765625, 35.9501953125, 38.640625, 41.3310546875, 44.021484375, 46.7119140625, 49.40234375, 52.0927734375, 54.783203125, 57.4736328125, 60.1640625, 62.8544921875, 65.544921875, 68.2353515625, 70.92578125, 73.6162109375, 76.306640625, 78.9970703125, 81.6875]}, "gradients/decoder.transformer.h.1.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 172.0, 827.0, 12.0, 2.0], "bins": [-472.2624206542969, -464.5577087402344, -456.8529968261719, -449.14825439453125, -441.44354248046875, -433.73883056640625, -426.03411865234375, -418.32940673828125, -410.6246643066406, -402.9199523925781, -395.2152404785156, -387.510498046875, -379.8057861328125, -372.10107421875, -364.3963623046875, -356.691650390625, -348.9869384765625, -341.2822265625, -333.5775146484375, -325.8727722167969, -318.1680603027344, -310.4633483886719, -302.7586364746094, -295.0539245605469, -287.34918212890625, -279.64447021484375, -271.93975830078125, -264.2350158691406, -256.5303039550781, -248.82559204101562, -241.12088012695312, -233.41615295410156, -225.71142578125, -218.0067138671875, -210.30198669433594, -202.59727478027344, -194.89254760742188, -187.18783569335938, -179.48312377929688, -171.7783966064453, -164.0736846923828, -156.3689727783203, -148.66424560546875, -140.95953369140625, -133.2548065185547, -125.55009460449219, -117.84537506103516, -110.14065551757812, -102.43594360351562, -94.7312240600586, -87.02650451660156, -79.32179260253906, -71.61707305908203, -63.912353515625, -56.20763397216797, -48.5029182434082, -40.79819869995117, -33.09347915649414, -25.388763427734375, -17.684043884277344, -9.979326248168945, -2.274608612060547, 5.430110931396484, 13.13482666015625, 20.83954620361328]}, "gradients/decoder.transformer.h.1.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 5.0, 6.0, 4.0, 4.0, 12.0, 5.0, 9.0, 9.0, 12.0, 16.0, 13.0, 22.0, 24.0, 21.0, 23.0, 34.0, 35.0, 34.0, 44.0, 37.0, 44.0, 45.0, 35.0, 52.0, 32.0, 39.0, 44.0, 30.0, 28.0, 36.0, 30.0, 22.0, 26.0, 28.0, 25.0, 23.0, 15.0, 13.0, 13.0, 7.0, 11.0, 8.0, 6.0, 7.0, 8.0, 4.0, 3.0, 1.0, 1.0, 4.0, 2.0, 1.0, 0.0, 2.0], "bins": [-51.977237701416016, -50.453521728515625, -48.929805755615234, -47.406089782714844, -45.88237380981445, -44.35865783691406, -42.83494186401367, -41.31122589111328, -39.78750991821289, -38.2637939453125, -36.74007797241211, -35.21636199951172, -33.69264602661133, -32.16893005371094, -30.645214080810547, -29.121498107910156, -27.597782135009766, -26.074066162109375, -24.550350189208984, -23.026634216308594, -21.502918243408203, -19.979202270507812, -18.455486297607422, -16.93177032470703, -15.40805435180664, -13.88433837890625, -12.36062240600586, -10.836906433105469, -9.313190460205078, -7.7894744873046875, -6.265758514404297, -4.742042541503906, -3.2183303833007812, -1.6946144104003906, -0.1708984375, 1.3528175354003906, 2.8765335083007812, 4.400249481201172, 5.9239654541015625, 7.447681427001953, 8.971397399902344, 10.495113372802734, 12.018829345703125, 13.542545318603516, 15.066261291503906, 16.589977264404297, 18.113693237304688, 19.637409210205078, 21.16112518310547, 22.68484115600586, 24.20855712890625, 25.73227310180664, 27.25598907470703, 28.779705047607422, 30.303421020507812, 31.827136993408203, 33.350852966308594, 34.874568939208984, 36.398284912109375, 37.922000885009766, 39.445716857910156, 40.96943283081055, 42.49314880371094, 44.01686477661133, 45.54058074951172]}, "gradients/decoder.transformer.h.0.mlp.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 3.0, 6.0, 3.0, 3.0, 6.0, 9.0, 8.0, 16.0, 14.0, 19.0, 26.0, 27.0, 23.0, 37.0, 36.0, 30.0, 34.0, 43.0, 41.0, 52.0, 42.0, 60.0, 40.0, 42.0, 53.0, 50.0, 44.0, 28.0, 27.0, 23.0, 27.0, 26.0, 16.0, 18.0, 18.0, 12.0, 12.0, 11.0, 5.0, 6.0, 4.0, 3.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-10.46875, -10.15576171875, -9.8427734375, -9.52978515625, -9.216796875, -8.90380859375, -8.5908203125, -8.27783203125, -7.96484375, -7.65185546875, -7.3388671875, -7.02587890625, -6.712890625, -6.39990234375, -6.0869140625, -5.77392578125, -5.4609375, -5.14794921875, -4.8349609375, -4.52197265625, -4.208984375, -3.89599609375, -3.5830078125, -3.27001953125, -2.95703125, -2.64404296875, -2.3310546875, -2.01806640625, -1.705078125, -1.39208984375, -1.0791015625, -0.76611328125, -0.453125, -0.14013671875, 0.1728515625, 0.48583984375, 0.798828125, 1.11181640625, 1.4248046875, 1.73779296875, 2.05078125, 2.36376953125, 2.6767578125, 2.98974609375, 3.302734375, 3.61572265625, 3.9287109375, 4.24169921875, 4.5546875, 4.86767578125, 5.1806640625, 5.49365234375, 5.806640625, 6.11962890625, 6.4326171875, 6.74560546875, 7.05859375, 7.37158203125, 7.6845703125, 7.99755859375, 8.310546875, 8.62353515625, 8.9365234375, 9.24951171875, 9.5625]}, "gradients/decoder.transformer.h.0.mlp.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 2.0, 9.0, 9.0, 11.0, 16.0, 23.0, 25.0, 19.0, 50.0, 55.0, 69.0, 69.0, 93.0, 104.0, 180.0, 215.0, 305.0, 441.0, 704.0, 1445.0, 4976.0, 145922.0, 3891797.0, 139015.0, 4895.0, 1451.0, 728.0, 455.0, 260.0, 219.0, 161.0, 109.0, 91.0, 76.0, 73.0, 39.0, 44.0, 28.0, 22.0, 18.0, 21.0, 10.0, 6.0, 10.0, 2.0, 3.0, 5.0, 5.0, 3.0, 3.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-53.25, -51.50390625, -49.7578125, -48.01171875, -46.265625, -44.51953125, -42.7734375, -41.02734375, -39.28125, -37.53515625, -35.7890625, -34.04296875, -32.296875, -30.55078125, -28.8046875, -27.05859375, -25.3125, -23.56640625, -21.8203125, -20.07421875, -18.328125, -16.58203125, -14.8359375, -13.08984375, -11.34375, -9.59765625, -7.8515625, -6.10546875, -4.359375, -2.61328125, -0.8671875, 0.87890625, 2.625, 4.37109375, 6.1171875, 7.86328125, 9.609375, 11.35546875, 13.1015625, 14.84765625, 16.59375, 18.33984375, 20.0859375, 21.83203125, 23.578125, 25.32421875, 27.0703125, 28.81640625, 30.5625, 32.30859375, 34.0546875, 35.80078125, 37.546875, 39.29296875, 41.0390625, 42.78515625, 44.53125, 46.27734375, 48.0234375, 49.76953125, 51.515625, 53.26171875, 55.0078125, 56.75390625, 58.5]}, "gradients/decoder.transformer.h.0.mlp.c_fc.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 5.0, 4.0, 8.0, 8.0, 7.0, 5.0, 23.0, 36.0, 46.0, 75.0, 95.0, 164.0, 249.0, 487.0, 687.0, 715.0, 507.0, 364.0, 227.0, 152.0, 68.0, 52.0, 28.0, 17.0, 16.0, 9.0, 7.0, 7.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.734375, -18.0927734375, -17.451171875, -16.8095703125, -16.16796875, -15.5263671875, -14.884765625, -14.2431640625, -13.6015625, -12.9599609375, -12.318359375, -11.6767578125, -11.03515625, -10.3935546875, -9.751953125, -9.1103515625, -8.46875, -7.8271484375, -7.185546875, -6.5439453125, -5.90234375, -5.2607421875, -4.619140625, -3.9775390625, -3.3359375, -2.6943359375, -2.052734375, -1.4111328125, -0.76953125, -0.1279296875, 0.513671875, 1.1552734375, 1.796875, 2.4384765625, 3.080078125, 3.7216796875, 4.36328125, 5.0048828125, 5.646484375, 6.2880859375, 6.9296875, 7.5712890625, 8.212890625, 8.8544921875, 9.49609375, 10.1376953125, 10.779296875, 11.4208984375, 12.0625, 12.7041015625, 13.345703125, 13.9873046875, 14.62890625, 15.2705078125, 15.912109375, 16.5537109375, 17.1953125, 17.8369140625, 18.478515625, 19.1201171875, 19.76171875, 20.4033203125, 21.044921875, 21.6865234375, 22.328125]}, "gradients/decoder.transformer.h.0.mlp.c_fc.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 0.0, 2.0, 1.0, 1.0, 3.0, 4.0, 7.0, 8.0, 14.0, 13.0, 47.0, 70.0, 144.0, 274.0, 580.0, 1805.0, 6456.0, 39857.0, 693182.0, 3256620.0, 173370.0, 16250.0, 3604.0, 1084.0, 452.0, 192.0, 110.0, 49.0, 30.0, 23.0, 12.0, 11.0, 9.0, 4.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.3125, -24.50341796875, -23.6943359375, -22.88525390625, -22.076171875, -21.26708984375, -20.4580078125, -19.64892578125, -18.83984375, -18.03076171875, -17.2216796875, -16.41259765625, -15.603515625, -14.79443359375, -13.9853515625, -13.17626953125, -12.3671875, -11.55810546875, -10.7490234375, -9.93994140625, -9.130859375, -8.32177734375, -7.5126953125, -6.70361328125, -5.89453125, -5.08544921875, -4.2763671875, -3.46728515625, -2.658203125, -1.84912109375, -1.0400390625, -0.23095703125, 0.578125, 1.38720703125, 2.1962890625, 3.00537109375, 3.814453125, 4.62353515625, 5.4326171875, 6.24169921875, 7.05078125, 7.85986328125, 8.6689453125, 9.47802734375, 10.287109375, 11.09619140625, 11.9052734375, 12.71435546875, 13.5234375, 14.33251953125, 15.1416015625, 15.95068359375, 16.759765625, 17.56884765625, 18.3779296875, 19.18701171875, 19.99609375, 20.80517578125, 21.6142578125, 22.42333984375, 23.232421875, 24.04150390625, 24.8505859375, 25.65966796875, 26.46875]}, "gradients/decoder.transformer.h.0.ln_2.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 5.0, 10.0, 10.0, 10.0, 18.0, 32.0, 41.0, 55.0, 68.0, 97.0, 118.0, 106.0, 123.0, 89.0, 76.0, 51.0, 40.0, 19.0, 15.0, 9.0, 7.0, 1.0, 2.0, 0.0, 4.0, 1.0, 2.0, 2.0], "bins": [-169.18980407714844, -165.64413452148438, -162.09848022460938, -158.5528106689453, -155.00714111328125, -151.4614715576172, -147.91580200195312, -144.37014770507812, -140.82447814941406, -137.27880859375, -133.733154296875, -130.18748474121094, -126.64181518554688, -123.09614562988281, -119.55048370361328, -116.00482177734375, -112.45915222167969, -108.91348266601562, -105.3678207397461, -101.82215881347656, -98.2764892578125, -94.73081970214844, -91.1851577758789, -87.63949584960938, -84.09382629394531, -80.54815673828125, -77.00249481201172, -73.45683288574219, -69.91116333007812, -66.36549377441406, -62.81983184814453, -59.274166107177734, -55.72850799560547, -52.18284225463867, -48.637176513671875, -45.09151077270508, -41.54584503173828, -38.000179290771484, -34.45451354980469, -30.90884780883789, -27.363182067871094, -23.817516326904297, -20.2718505859375, -16.726184844970703, -13.180519104003906, -9.63485336303711, -6.0891876220703125, -2.5435218811035156, 1.0021438598632812, 4.547809600830078, 8.093475341796875, 11.639141082763672, 15.184806823730469, 18.730472564697266, 22.276138305664062, 25.82180404663086, 29.367469787597656, 32.91313552856445, 36.45880126953125, 40.00446701049805, 43.550132751464844, 47.09579849243164, 50.64146423339844, 54.187129974365234, 57.73279571533203]}, "gradients/decoder.transformer.h.0.ln_2.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 5.0, 4.0, 3.0, 0.0, 6.0, 8.0, 6.0, 13.0, 16.0, 19.0, 16.0, 27.0, 33.0, 31.0, 34.0, 37.0, 44.0, 47.0, 46.0, 43.0, 48.0, 44.0, 30.0, 53.0, 47.0, 38.0, 31.0, 40.0, 27.0, 35.0, 23.0, 26.0, 21.0, 23.0, 15.0, 13.0, 12.0, 4.0, 8.0, 9.0, 4.0, 15.0, 5.0, 0.0, 1.0, 3.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-62.480873107910156, -60.58003234863281, -58.67919158935547, -56.77835464477539, -54.87751388549805, -52.9766731262207, -51.075836181640625, -49.17499542236328, -47.27415466308594, -45.373313903808594, -43.47247314453125, -41.57163619995117, -39.67079544067383, -37.769954681396484, -35.869117736816406, -33.96827697753906, -32.06743621826172, -30.166595458984375, -28.265756607055664, -26.364917755126953, -24.46407699584961, -22.563236236572266, -20.662397384643555, -18.761558532714844, -16.8607177734375, -14.959877967834473, -13.059038162231445, -11.158198356628418, -9.25735855102539, -7.356518745422363, -5.455678939819336, -3.5548391342163086, -1.6539993286132812, 0.2468404769897461, 2.1476802825927734, 4.048520088195801, 5.949359893798828, 7.8501996994018555, 9.751039505004883, 11.65187931060791, 13.552719116210938, 15.453558921813965, 17.354398727416992, 19.255237579345703, 21.156078338623047, 23.05691909790039, 24.9577579498291, 26.858596801757812, 28.759437561035156, 30.6602783203125, 32.561119079589844, 34.46195602416992, 36.362796783447266, 38.26363754272461, 40.16447448730469, 42.06531524658203, 43.966156005859375, 45.86699676513672, 47.76783752441406, 49.66867446899414, 51.569515228271484, 53.47035598754883, 55.371192932128906, 57.27203369140625, 59.172874450683594]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 10.0, 10.0, 11.0, 24.0, 24.0, 18.0, 25.0, 33.0, 24.0, 35.0, 42.0, 54.0, 41.0, 44.0, 59.0, 53.0, 36.0, 43.0, 41.0, 47.0, 41.0, 39.0, 27.0, 27.0, 27.0, 24.0, 21.0, 18.0, 15.0, 11.0, 9.0, 16.0, 8.0, 1.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-108.6875, -105.3935546875, -102.099609375, -98.8056640625, -95.51171875, -92.2177734375, -88.923828125, -85.6298828125, -82.3359375, -79.0419921875, -75.748046875, -72.4541015625, -69.16015625, -65.8662109375, -62.572265625, -59.2783203125, -55.984375, -52.6904296875, -49.396484375, -46.1025390625, -42.80859375, -39.5146484375, -36.220703125, -32.9267578125, -29.6328125, -26.3388671875, -23.044921875, -19.7509765625, -16.45703125, -13.1630859375, -9.869140625, -6.5751953125, -3.28125, 0.0126953125, 3.306640625, 6.6005859375, 9.89453125, 13.1884765625, 16.482421875, 19.7763671875, 23.0703125, 26.3642578125, 29.658203125, 32.9521484375, 36.24609375, 39.5400390625, 42.833984375, 46.1279296875, 49.421875, 52.7158203125, 56.009765625, 59.3037109375, 62.59765625, 65.8916015625, 69.185546875, 72.4794921875, 75.7734375, 79.0673828125, 82.361328125, 85.6552734375, 88.94921875, 92.2431640625, 95.537109375, 98.8310546875, 102.125]}, "gradients/decoder.transformer.h.0.crossattention.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 1.0, 1.0, 4.0, 10.0, 13.0, 29.0, 24.0, 49.0, 75.0, 93.0, 145.0, 221.0, 331.0, 464.0, 710.0, 1087.0, 1617.0, 2432.0, 3586.0, 5402.0, 8233.0, 12596.0, 19356.0, 28994.0, 45470.0, 69884.0, 106764.0, 148354.0, 167261.0, 140708.0, 98707.0, 64539.0, 42018.0, 27372.0, 17581.0, 11690.0, 7690.0, 4993.0, 3358.0, 2223.0, 1507.0, 1004.0, 667.0, 427.0, 289.0, 176.0, 121.0, 95.0, 62.0, 46.0, 33.0, 27.0, 8.0, 9.0, 6.0, 3.0, 2.0, 2.0, 1.0, 1.0], "bins": [-7.30078125, -7.07550048828125, -6.8502197265625, -6.62493896484375, -6.399658203125, -6.17437744140625, -5.9490966796875, -5.72381591796875, -5.49853515625, -5.27325439453125, -5.0479736328125, -4.82269287109375, -4.597412109375, -4.37213134765625, -4.1468505859375, -3.92156982421875, -3.6962890625, -3.47100830078125, -3.2457275390625, -3.02044677734375, -2.795166015625, -2.56988525390625, -2.3446044921875, -2.11932373046875, -1.89404296875, -1.66876220703125, -1.4434814453125, -1.21820068359375, -0.992919921875, -0.76763916015625, -0.5423583984375, -0.31707763671875, -0.091796875, 0.13348388671875, 0.3587646484375, 0.58404541015625, 0.809326171875, 1.03460693359375, 1.2598876953125, 1.48516845703125, 1.71044921875, 1.93572998046875, 2.1610107421875, 2.38629150390625, 2.611572265625, 2.83685302734375, 3.0621337890625, 3.28741455078125, 3.5126953125, 3.73797607421875, 3.9632568359375, 4.18853759765625, 4.413818359375, 4.63909912109375, 4.8643798828125, 5.08966064453125, 5.31494140625, 5.54022216796875, 5.7655029296875, 5.99078369140625, 6.216064453125, 6.44134521484375, 6.6666259765625, 6.89190673828125, 7.1171875]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 4.0, 5.0, 3.0, 9.0, 5.0, 8.0, 8.0, 8.0, 9.0, 13.0, 20.0, 14.0, 14.0, 25.0, 27.0, 34.0, 33.0, 37.0, 42.0, 43.0, 41.0, 39.0, 37.0, 32.0, 1057.0, 43.0, 27.0, 47.0, 42.0, 30.0, 36.0, 30.0, 31.0, 27.0, 27.0, 17.0, 22.0, 10.0, 12.0, 9.0, 9.0, 8.0, 12.0, 8.0, 4.0, 6.0, 6.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0], "bins": [-58.375, -56.5576171875, -54.740234375, -52.9228515625, -51.10546875, -49.2880859375, -47.470703125, -45.6533203125, -43.8359375, -42.0185546875, -40.201171875, -38.3837890625, -36.56640625, -34.7490234375, -32.931640625, -31.1142578125, -29.296875, -27.4794921875, -25.662109375, -23.8447265625, -22.02734375, -20.2099609375, -18.392578125, -16.5751953125, -14.7578125, -12.9404296875, -11.123046875, -9.3056640625, -7.48828125, -5.6708984375, -3.853515625, -2.0361328125, -0.21875, 1.5986328125, 3.416015625, 5.2333984375, 7.05078125, 8.8681640625, 10.685546875, 12.5029296875, 14.3203125, 16.1376953125, 17.955078125, 19.7724609375, 21.58984375, 23.4072265625, 25.224609375, 27.0419921875, 28.859375, 30.6767578125, 32.494140625, 34.3115234375, 36.12890625, 37.9462890625, 39.763671875, 41.5810546875, 43.3984375, 45.2158203125, 47.033203125, 48.8505859375, 50.66796875, 52.4853515625, 54.302734375, 56.1201171875, 57.9375]}, "gradients/decoder.transformer.h.0.crossattention.c_attn.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 10.0, 4.0, 12.0, 16.0, 23.0, 32.0, 78.0, 93.0, 164.0, 220.0, 347.0, 590.0, 950.0, 1406.0, 2388.0, 3623.0, 6158.0, 9821.0, 16320.0, 26628.0, 44435.0, 74160.0, 120135.0, 179429.0, 1233862.0, 144637.0, 90795.0, 55542.0, 33109.0, 20108.0, 12451.0, 7475.0, 4479.0, 2795.0, 1726.0, 1057.0, 744.0, 458.0, 291.0, 199.0, 134.0, 81.0, 45.0, 30.0, 30.0, 16.0, 12.0, 4.0, 4.0, 4.0, 3.0, 1.0, 1.0, 0.0, 2.0], "bins": [-7.9140625, -7.67578125, -7.4375, -7.19921875, -6.9609375, -6.72265625, -6.484375, -6.24609375, -6.0078125, -5.76953125, -5.53125, -5.29296875, -5.0546875, -4.81640625, -4.578125, -4.33984375, -4.1015625, -3.86328125, -3.625, -3.38671875, -3.1484375, -2.91015625, -2.671875, -2.43359375, -2.1953125, -1.95703125, -1.71875, -1.48046875, -1.2421875, -1.00390625, -0.765625, -0.52734375, -0.2890625, -0.05078125, 0.1875, 0.42578125, 0.6640625, 0.90234375, 1.140625, 1.37890625, 1.6171875, 1.85546875, 2.09375, 2.33203125, 2.5703125, 2.80859375, 3.046875, 3.28515625, 3.5234375, 3.76171875, 4.0, 4.23828125, 4.4765625, 4.71484375, 4.953125, 5.19140625, 5.4296875, 5.66796875, 5.90625, 6.14453125, 6.3828125, 6.62109375, 6.859375, 7.09765625, 7.3359375]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 3.0, 2.0, 2.0, 4.0, 4.0, 3.0, 5.0, 4.0, 11.0, 9.0, 13.0, 11.0, 16.0, 14.0, 26.0, 19.0, 19.0, 24.0, 22.0, 39.0, 32.0, 36.0, 31.0, 42.0, 43.0, 36.0, 49.0, 37.0, 33.0, 36.0, 44.0, 40.0, 38.0, 31.0, 35.0, 24.0, 16.0, 23.0, 19.0, 21.0, 24.0, 12.0, 6.0, 8.0, 9.0, 8.0, 7.0, 4.0, 8.0, 2.0, 2.0, 5.0, 3.0, 3.0, 1.0, 1.0, 1.0], "bins": [-0.049224853515625, -0.04775667190551758, -0.046288490295410156, -0.044820308685302734, -0.04335212707519531, -0.04188394546508789, -0.04041576385498047, -0.03894758224487305, -0.037479400634765625, -0.0360112190246582, -0.03454303741455078, -0.03307485580444336, -0.03160667419433594, -0.030138492584228516, -0.028670310974121094, -0.027202129364013672, -0.02573394775390625, -0.024265766143798828, -0.022797584533691406, -0.021329402923583984, -0.019861221313476562, -0.01839303970336914, -0.01692485809326172, -0.015456676483154297, -0.013988494873046875, -0.012520313262939453, -0.011052131652832031, -0.00958395004272461, -0.008115768432617188, -0.006647586822509766, -0.005179405212402344, -0.003711223602294922, -0.0022430419921875, -0.0007748603820800781, 0.0006933212280273438, 0.0021615028381347656, 0.0036296844482421875, 0.005097866058349609, 0.006566047668457031, 0.008034229278564453, 0.009502410888671875, 0.010970592498779297, 0.012438774108886719, 0.01390695571899414, 0.015375137329101562, 0.016843318939208984, 0.018311500549316406, 0.019779682159423828, 0.02124786376953125, 0.022716045379638672, 0.024184226989746094, 0.025652408599853516, 0.027120590209960938, 0.02858877182006836, 0.03005695343017578, 0.0315251350402832, 0.032993316650390625, 0.03446149826049805, 0.03592967987060547, 0.03739786148071289, 0.03886604309082031, 0.040334224700927734, 0.041802406311035156, 0.04327058792114258, 0.04473876953125]}, "gradients/decoder.transformer.h.0.crossattention.q_attn.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 7.0, 8.0, 11.0, 17.0, 21.0, 21.0, 25.0, 39.0, 50.0, 62.0, 101.0, 113.0, 183.0, 262.0, 438.0, 705.0, 1413.0, 2699.0, 6075.0, 15147.0, 40183.0, 114895.0, 315833.0, 343787.0, 130440.0, 45674.0, 16710.0, 6884.0, 2961.0, 1575.0, 806.0, 459.0, 293.0, 194.0, 117.0, 98.0, 65.0, 42.0, 33.0, 25.0, 26.0, 12.0, 10.0, 13.0, 10.0, 2.0, 2.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-0.336669921875, -0.325469970703125, -0.31427001953125, -0.303070068359375, -0.2918701171875, -0.280670166015625, -0.26947021484375, -0.258270263671875, -0.2470703125, -0.235870361328125, -0.22467041015625, -0.213470458984375, -0.2022705078125, -0.191070556640625, -0.17987060546875, -0.168670654296875, -0.157470703125, -0.146270751953125, -0.13507080078125, -0.123870849609375, -0.1126708984375, -0.101470947265625, -0.09027099609375, -0.079071044921875, -0.06787109375, -0.056671142578125, -0.04547119140625, -0.034271240234375, -0.0230712890625, -0.011871337890625, -0.00067138671875, 0.010528564453125, 0.021728515625, 0.032928466796875, 0.04412841796875, 0.055328369140625, 0.0665283203125, 0.077728271484375, 0.08892822265625, 0.100128173828125, 0.111328125, 0.122528076171875, 0.13372802734375, 0.144927978515625, 0.1561279296875, 0.167327880859375, 0.17852783203125, 0.189727783203125, 0.200927734375, 0.212127685546875, 0.22332763671875, 0.234527587890625, 0.2457275390625, 0.256927490234375, 0.26812744140625, 0.279327392578125, 0.29052734375, 0.301727294921875, 0.31292724609375, 0.324127197265625, 0.3353271484375, 0.346527099609375, 0.35772705078125, 0.368927001953125, 0.380126953125]}, "gradients/decoder.transformer.h.0.ln_cross_attn.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 5.0, 5.0, 6.0, 9.0, 17.0, 24.0, 31.0, 27.0, 41.0, 67.0, 68.0, 83.0, 72.0, 92.0, 77.0, 86.0, 61.0, 46.0, 48.0, 43.0, 30.0, 21.0, 17.0, 7.0, 9.0, 6.0, 3.0, 2.0, 2.0, 3.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.10573045164346695, -0.10330674797296524, -0.10088305175304413, -0.09845934808254242, -0.09603564441204071, -0.093611940741539, -0.09118823707103729, -0.08876454085111618, -0.08634083718061447, -0.08391713351011276, -0.08149343729019165, -0.07906973361968994, -0.07664602994918823, -0.07422232627868652, -0.07179862260818481, -0.0693749263882637, -0.066951222717762, -0.06452751904726028, -0.062103819102048874, -0.05968011915683746, -0.057256415486335754, -0.054832711815834045, -0.052409011870622635, -0.049985311925411224, -0.047561608254909515, -0.045137904584407806, -0.042714204639196396, -0.040290504693984985, -0.037866801023483276, -0.03544309735298157, -0.03301939740777016, -0.030595695599913597, -0.028171993792057037, -0.025748291984200478, -0.023324590176343918, -0.020900888368487358, -0.0184771865606308, -0.01605348475277424, -0.013629782944917679, -0.011206081137061119, -0.00878237932920456, -0.006358677521348, -0.00393497571349144, -0.00151127390563488, 0.0009124279022216797, 0.0033361297100782394, 0.005759831517934799, 0.008183533325791359, 0.010607235133647919, 0.013030936941504478, 0.015454638749361038, 0.017878340557217598, 0.020302042365074158, 0.022725744172930717, 0.025149445980787277, 0.027573147788643837, 0.029996849596500397, 0.032420553267002106, 0.034844253212213516, 0.03726795315742493, 0.039691656827926636, 0.042115360498428345, 0.044539060443639755, 0.046962760388851166, 0.049386464059352875]}, "gradients/decoder.transformer.h.0.ln_cross_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 2.0, 4.0, 2.0, 3.0, 7.0, 7.0, 12.0, 8.0, 10.0, 8.0, 20.0, 15.0, 27.0, 17.0, 25.0, 30.0, 25.0, 26.0, 43.0, 40.0, 29.0, 40.0, 47.0, 40.0, 32.0, 40.0, 43.0, 42.0, 36.0, 43.0, 36.0, 36.0, 30.0, 26.0, 23.0, 19.0, 18.0, 15.0, 16.0, 13.0, 10.0, 8.0, 7.0, 6.0, 4.0, 4.0, 2.0, 6.0, 5.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0], "bins": [-0.028862714767456055, -0.02783888950943947, -0.026815062388777733, -0.025791235268115997, -0.02476741001009941, -0.023743584752082825, -0.02271975763142109, -0.021695930510759354, -0.020672105252742767, -0.01964827999472618, -0.018624452874064445, -0.01760062575340271, -0.016576800495386124, -0.015552974306046963, -0.014529148116707802, -0.013505321927368641, -0.01248149573802948, -0.011457669548690319, -0.010433843359351158, -0.009410017170011997, -0.008386190980672836, -0.007362364791333675, -0.0063385386019945145, -0.0053147124126553535, -0.004290886223316193, -0.0032670600339770317, -0.002243233844637871, -0.0012194076552987099, -0.00019558146595954895, 0.000828244723379612, 0.0018520709127187729, 0.002875897102057934, 0.0038997232913970947, 0.004923549480736256, 0.0059473756700754166, 0.0069712018594145775, 0.007995028048753738, 0.0090188542380929, 0.01004268042743206, 0.011066506616771221, 0.012090332806110382, 0.013114158995449543, 0.014137985184788704, 0.015161811374127865, 0.016185637563467026, 0.017209462821483612, 0.018233289942145348, 0.019257117062807083, 0.02028094232082367, 0.021304767578840256, 0.02232859469950199, 0.023352421820163727, 0.024376247078180313, 0.0254000723361969, 0.026423899456858635, 0.02744772657752037, 0.028471551835536957, 0.029495377093553543, 0.03051920421421528, 0.031543031334877014, 0.0325668565928936, 0.03359068185091019, 0.03461451083421707, 0.03563833609223366, 0.036662161350250244]}, "gradients/decoder.transformer.h.0.attn.c_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 2.0, 4.0, 4.0, 6.0, 8.0, 9.0, 11.0, 11.0, 24.0, 23.0, 19.0, 26.0, 33.0, 23.0, 36.0, 42.0, 55.0, 38.0, 44.0, 60.0, 54.0, 35.0, 42.0, 42.0, 47.0, 41.0, 40.0, 27.0, 28.0, 26.0, 23.0, 21.0, 18.0, 15.0, 12.0, 8.0, 15.0, 9.0, 1.0, 8.0, 8.0, 6.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-108.75, -105.453125, -102.15625, -98.859375, -95.5625, -92.265625, -88.96875, -85.671875, -82.375, -79.078125, -75.78125, -72.484375, -69.1875, -65.890625, -62.59375, -59.296875, -56.0, -52.703125, -49.40625, -46.109375, -42.8125, -39.515625, -36.21875, -32.921875, -29.625, -26.328125, -23.03125, -19.734375, -16.4375, -13.140625, -9.84375, -6.546875, -3.25, 0.046875, 3.34375, 6.640625, 9.9375, 13.234375, 16.53125, 19.828125, 23.125, 26.421875, 29.71875, 33.015625, 36.3125, 39.609375, 42.90625, 46.203125, 49.5, 52.796875, 56.09375, 59.390625, 62.6875, 65.984375, 69.28125, 72.578125, 75.875, 79.171875, 82.46875, 85.765625, 89.0625, 92.359375, 95.65625, 98.953125, 102.25]}, "gradients/decoder.transformer.h.0.attn.c_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 0.0, 2.0, 5.0, 3.0, 7.0, 5.0, 1.0, 11.0, 14.0, 24.0, 27.0, 41.0, 39.0, 79.0, 120.0, 169.0, 277.0, 435.0, 735.0, 1280.0, 2269.0, 4528.0, 10340.0, 32787.0, 156858.0, 569239.0, 205508.0, 40925.0, 11969.0, 4928.0, 2432.0, 1281.0, 792.0, 524.0, 289.0, 189.0, 138.0, 70.0, 43.0, 54.0, 35.0, 21.0, 18.0, 20.0, 7.0, 6.0, 10.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.9375, -20.204833984375, -19.47216796875, -18.739501953125, -18.0068359375, -17.274169921875, -16.54150390625, -15.808837890625, -15.076171875, -14.343505859375, -13.61083984375, -12.878173828125, -12.1455078125, -11.412841796875, -10.68017578125, -9.947509765625, -9.21484375, -8.482177734375, -7.74951171875, -7.016845703125, -6.2841796875, -5.551513671875, -4.81884765625, -4.086181640625, -3.353515625, -2.620849609375, -1.88818359375, -1.155517578125, -0.4228515625, 0.309814453125, 1.04248046875, 1.775146484375, 2.5078125, 3.240478515625, 3.97314453125, 4.705810546875, 5.4384765625, 6.171142578125, 6.90380859375, 7.636474609375, 8.369140625, 9.101806640625, 9.83447265625, 10.567138671875, 11.2998046875, 12.032470703125, 12.76513671875, 13.497802734375, 14.23046875, 14.963134765625, 15.69580078125, 16.428466796875, 17.1611328125, 17.893798828125, 18.62646484375, 19.359130859375, 20.091796875, 20.824462890625, 21.55712890625, 22.289794921875, 23.0224609375, 23.755126953125, 24.48779296875, 25.220458984375, 25.953125]}, "gradients/decoder.transformer.h.0.attn.c_attn.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 8.0, 7.0, 2.0, 4.0, 8.0, 14.0, 17.0, 28.0, 20.0, 18.0, 31.0, 22.0, 28.0, 36.0, 27.0, 45.0, 43.0, 43.0, 49.0, 1799.0, 345.0, 41.0, 42.0, 47.0, 30.0, 43.0, 37.0, 37.0, 20.0, 22.0, 27.0, 20.0, 16.0, 16.0, 15.0, 12.0, 6.0, 12.0, 7.0, 6.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-110.5, -106.400390625, -102.30078125, -98.201171875, -94.1015625, -90.001953125, -85.90234375, -81.802734375, -77.703125, -73.603515625, -69.50390625, -65.404296875, -61.3046875, -57.205078125, -53.10546875, -49.005859375, -44.90625, -40.806640625, -36.70703125, -32.607421875, -28.5078125, -24.408203125, -20.30859375, -16.208984375, -12.109375, -8.009765625, -3.91015625, 0.189453125, 4.2890625, 8.388671875, 12.48828125, 16.587890625, 20.6875, 24.787109375, 28.88671875, 32.986328125, 37.0859375, 41.185546875, 45.28515625, 49.384765625, 53.484375, 57.583984375, 61.68359375, 65.783203125, 69.8828125, 73.982421875, 78.08203125, 82.181640625, 86.28125, 90.380859375, 94.48046875, 98.580078125, 102.6796875, 106.779296875, 110.87890625, 114.978515625, 119.078125, 123.177734375, 127.27734375, 131.376953125, 135.4765625, 139.576171875, 143.67578125, 147.775390625, 151.875]}, "gradients/decoder.transformer.h.0.attn.c_attn.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 6.0, 7.0, 9.0, 16.0, 20.0, 32.0, 37.0, 74.0, 104.0, 163.0, 255.0, 383.0, 746.0, 1478.0, 4893.0, 60375.0, 2903500.0, 160674.0, 8784.0, 1965.0, 880.0, 506.0, 269.0, 182.0, 113.0, 82.0, 46.0, 35.0, 19.0, 17.0, 9.0, 8.0, 4.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-43.59375, -42.21630859375, -40.8388671875, -39.46142578125, -38.083984375, -36.70654296875, -35.3291015625, -33.95166015625, -32.57421875, -31.19677734375, -29.8193359375, -28.44189453125, -27.064453125, -25.68701171875, -24.3095703125, -22.93212890625, -21.5546875, -20.17724609375, -18.7998046875, -17.42236328125, -16.044921875, -14.66748046875, -13.2900390625, -11.91259765625, -10.53515625, -9.15771484375, -7.7802734375, -6.40283203125, -5.025390625, -3.64794921875, -2.2705078125, -0.89306640625, 0.484375, 1.86181640625, 3.2392578125, 4.61669921875, 5.994140625, 7.37158203125, 8.7490234375, 10.12646484375, 11.50390625, 12.88134765625, 14.2587890625, 15.63623046875, 17.013671875, 18.39111328125, 19.7685546875, 21.14599609375, 22.5234375, 23.90087890625, 25.2783203125, 26.65576171875, 28.033203125, 29.41064453125, 30.7880859375, 32.16552734375, 33.54296875, 34.92041015625, 36.2978515625, 37.67529296875, 39.052734375, 40.43017578125, 41.8076171875, 43.18505859375, 44.5625]}, "gradients/decoder.transformer.h.0.ln_1.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 2.0, 2.0, 2.0, 6.0, 5.0, 6.0, 12.0, 21.0, 45.0, 115.0, 236.0, 249.0, 172.0, 73.0, 32.0, 11.0, 10.0, 4.0, 3.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0], "bins": [-582.6221313476562, -570.7791137695312, -558.9360961914062, -547.0930786132812, -535.25, -523.406982421875, -511.56396484375, -499.720947265625, -487.8779296875, -476.034912109375, -464.1918640136719, -452.3488464355469, -440.5058288574219, -428.6628112792969, -416.81976318359375, -404.97674560546875, -393.13372802734375, -381.29071044921875, -369.4476623535156, -357.6046447753906, -345.7616271972656, -333.9186096191406, -322.0755615234375, -310.2325439453125, -298.3894958496094, -286.5464782714844, -274.70343017578125, -262.86041259765625, -251.01739501953125, -239.1743621826172, -227.33132934570312, -215.48831176757812, -203.64527893066406, -191.80224609375, -179.959228515625, -168.11619567871094, -156.27317810058594, -144.43014526367188, -132.58712768554688, -120.74409484863281, -108.90106964111328, -97.05804443359375, -85.21501922607422, -73.37199401855469, -61.52896499633789, -49.68593978881836, -37.84291076660156, -25.99988555908203, -14.1568603515625, -2.3138341903686523, 9.529191970825195, 21.37221908569336, 33.21524429321289, 45.05826950073242, 56.90129852294922, 68.74432373046875, 80.58734893798828, 92.43037414550781, 104.27339935302734, 116.11642456054688, 127.95945739746094, 139.80247497558594, 151.6455078125, 163.488525390625, 175.33155822753906]}, "gradients/decoder.transformer.h.0.ln_1.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 8.0, 3.0, 10.0, 5.0, 9.0, 8.0, 11.0, 19.0, 21.0, 22.0, 27.0, 22.0, 30.0, 36.0, 37.0, 39.0, 35.0, 60.0, 46.0, 52.0, 61.0, 39.0, 46.0, 59.0, 33.0, 47.0, 31.0, 34.0, 36.0, 18.0, 21.0, 18.0, 14.0, 9.0, 8.0, 5.0, 6.0, 5.0, 5.0, 4.0, 3.0, 1.0, 5.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-170.09039306640625, -164.2017364501953, -158.31307983398438, -152.4244384765625, -146.53578186035156, -140.64712524414062, -134.7584686279297, -128.86981201171875, -122.98116302490234, -117.0925064086914, -111.203857421875, -105.31520080566406, -99.42654418945312, -93.53789520263672, -87.64923858642578, -81.76058959960938, -75.87193298339844, -69.9832763671875, -64.0946273803711, -58.205970764160156, -52.317317962646484, -46.42866516113281, -40.540008544921875, -34.6513557434082, -28.76270294189453, -22.87405014038086, -16.985395431518555, -11.09674072265625, -5.208087921142578, 0.6805648803710938, 6.569221496582031, 12.457874298095703, 18.346511840820312, 24.235164642333984, 30.12381935119629, 36.012474060058594, 41.901126861572266, 47.78977966308594, 53.678436279296875, 59.56708908081055, 65.45574188232422, 71.34439849853516, 77.23304748535156, 83.1217041015625, 89.01036071777344, 94.89900970458984, 100.78766632080078, 106.67631530761719, 112.56497192382812, 118.45362854003906, 124.34227752685547, 130.23092651367188, 136.1195831298828, 142.00823974609375, 147.8968963623047, 153.78555297851562, 159.6741943359375, 165.56285095214844, 171.45150756835938, 177.34014892578125, 183.2288055419922, 189.11746215820312, 195.00611877441406, 200.894775390625, 206.78343200683594]}, "gradients/decoder.transformer.wpe.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 3.0, 6.0, 3.0, 7.0, 7.0, 11.0, 18.0, 17.0, 34.0, 32.0, 43.0, 50.0, 67.0, 78.0, 95.0, 132.0, 153.0, 204.0, 228.0, 284.0, 358.0, 365.0, 531.0, 649.0, 1040830.0, 1142.0, 578.0, 490.0, 406.0, 323.0, 257.0, 232.0, 184.0, 133.0, 132.0, 106.0, 82.0, 69.0, 54.0, 42.0, 30.0, 27.0, 24.0, 15.0, 11.0, 9.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0], "bins": [-61.37311553955078, -59.66419982910156, -57.95528793334961, -56.24637222290039, -54.53746032714844, -52.82854461669922, -51.11962890625, -49.41071319580078, -47.70180130004883, -45.99288558959961, -44.283973693847656, -42.57505798339844, -40.86614227294922, -39.157230377197266, -37.44831466674805, -35.739402770996094, -34.030487060546875, -32.321571350097656, -30.612659454345703, -28.903743743896484, -27.1948299407959, -25.485916137695312, -23.777000427246094, -22.068086624145508, -20.359172821044922, -18.650259017944336, -16.94134521484375, -15.232429504394531, -13.523515701293945, -11.81460189819336, -10.105687141418457, -8.396772384643555, -6.687854766845703, -4.978940486907959, -3.270026206970215, -1.5611119270324707, 0.14780235290527344, 1.8567161560058594, 3.5656309127807617, 5.274545669555664, 6.98345947265625, 8.692373275756836, 10.401288032531738, 12.11020278930664, 13.819116592407227, 15.528030395507812, 17.23694610595703, 18.945859909057617, 20.654773712158203, 22.36368751525879, 24.072601318359375, 25.781517028808594, 27.49043083190918, 29.199344635009766, 30.908260345458984, 32.61717224121094, 34.326087951660156, 36.035003662109375, 37.74391555786133, 39.45283126831055, 41.1617431640625, 42.87065887451172, 44.57957458496094, 46.288490295410156, 47.99740219116211]}, "gradients/decoder.transformer.wte.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 2.0, 2.0, 1.0, 2.0, 3.0, 4.0, 3.0, 11.0, 5.0, 10.0, 6.0, 3.0, 16.0, 17.0, 34.0, 132.0, 28456.0, 51434396.0, 110.0, 30.0, 15.0, 12.0, 13.0, 8.0, 6.0, 5.0, 5.0, 0.0, 1.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5340.0, -5073.3935546875, -4806.78662109375, -4540.1796875, -4273.5732421875, -4006.966552734375, -3740.35986328125, -3473.753173828125, -3207.146484375, -2940.539794921875, -2673.93310546875, -2407.326416015625, -2140.7197265625, -1874.113037109375, -1607.50634765625, -1340.899658203125, -1074.29296875, -807.686279296875, -541.07958984375, -274.472900390625, -7.8662109375, 258.740478515625, 525.34716796875, 791.953857421875, 1058.560546875, 1325.167236328125, 1591.77392578125, 1858.380615234375, 2124.9873046875, 2391.593994140625, 2658.20068359375, 2924.807373046875, 3191.4140625, 3458.020751953125, 3724.62744140625, 3991.234130859375, 4257.8408203125, 4524.447265625, 4791.05419921875, 5057.6611328125, 5324.267578125, 5590.8740234375, 5857.48095703125, 6124.087890625, 6390.6943359375, 6657.30078125, 6923.90771484375, 7190.5146484375, 7457.12109375, 7723.7275390625, 7990.33447265625, 8256.94140625, 8523.5478515625, 8790.154296875, 9056.76171875, 9323.3681640625, 9589.974609375, 9856.5810546875, 10123.1875, 10389.794921875, 10656.4013671875, 10923.0078125, 11189.615234375, 11456.2216796875, 11722.828125]}, "gradients/encoder.adapter.layers.2.conv.weight": {"_type": "histogram", "values": [6.0, 6.0, 7.0, 8.0, 12.0, 15.0, 36.0, 47.0, 60.0, 85.0, 109.0, 194.0, 301.0, 472.0, 683.0, 1014.0, 1516.0, 2496.0, 3931.0, 6452.0, 10008.0, 15946.0, 26015.0, 41538.0, 68227.0, 109726.0, 175957.0, 275775.0, 412405.0, 3107569.0, 1009566.0, 369621.0, 244620.0, 154876.0, 95944.0, 59310.0, 36576.0, 22373.0, 14093.0, 8701.0, 5583.0, 3453.0, 2086.0, 1394.0, 932.0, 582.0, 366.0, 244.0, 178.0, 106.0, 74.0, 49.0, 34.0, 23.0, 12.0, 11.0, 8.0, 5.0, 5.0, 4.0, 2.0, 8.0, 0.0, 1.0], "bins": [-2.46875, -2.386077880859375, -2.30340576171875, -2.220733642578125, -2.1380615234375, -2.055389404296875, -1.97271728515625, -1.890045166015625, -1.807373046875, -1.724700927734375, -1.64202880859375, -1.559356689453125, -1.4766845703125, -1.394012451171875, -1.31134033203125, -1.228668212890625, -1.14599609375, -1.063323974609375, -0.98065185546875, -0.897979736328125, -0.8153076171875, -0.732635498046875, -0.64996337890625, -0.567291259765625, -0.484619140625, -0.401947021484375, -0.31927490234375, -0.236602783203125, -0.1539306640625, -0.071258544921875, 0.01141357421875, 0.094085693359375, 0.1767578125, 0.259429931640625, 0.34210205078125, 0.424774169921875, 0.5074462890625, 0.590118408203125, 0.67279052734375, 0.755462646484375, 0.838134765625, 0.920806884765625, 1.00347900390625, 1.086151123046875, 1.1688232421875, 1.251495361328125, 1.33416748046875, 1.416839599609375, 1.49951171875, 1.582183837890625, 1.66485595703125, 1.747528076171875, 1.8302001953125, 1.912872314453125, 1.99554443359375, 2.078216552734375, 2.160888671875, 2.243560791015625, 2.32623291015625, 2.408905029296875, 2.4915771484375, 2.574249267578125, 2.65692138671875, 2.739593505859375, 2.822265625]}, "gradients/encoder.adapter.layers.2.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 5.0, 4.0, 4.0, 8.0, 10.0, 15.0, 11.0, 15.0, 21.0, 32.0, 30.0, 31.0, 27.0, 35.0, 38.0, 28.0, 39.0, 54.0, 37.0, 99.0, 939.0, 135.0, 38.0, 55.0, 38.0, 32.0, 29.0, 45.0, 20.0, 27.0, 25.0, 24.0, 12.0, 9.0, 20.0, 12.0, 4.0, 3.0, 4.0, 5.0, 4.0, 3.0, 5.0, 7.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-25.421875, -24.666748046875, -23.91162109375, -23.156494140625, -22.4013671875, -21.646240234375, -20.89111328125, -20.135986328125, -19.380859375, -18.625732421875, -17.87060546875, -17.115478515625, -16.3603515625, -15.605224609375, -14.85009765625, -14.094970703125, -13.33984375, -12.584716796875, -11.82958984375, -11.074462890625, -10.3193359375, -9.564208984375, -8.80908203125, -8.053955078125, -7.298828125, -6.543701171875, -5.78857421875, -5.033447265625, -4.2783203125, -3.523193359375, -2.76806640625, -2.012939453125, -1.2578125, -0.502685546875, 0.25244140625, 1.007568359375, 1.7626953125, 2.517822265625, 3.27294921875, 4.028076171875, 4.783203125, 5.538330078125, 6.29345703125, 7.048583984375, 7.8037109375, 8.558837890625, 9.31396484375, 10.069091796875, 10.82421875, 11.579345703125, 12.33447265625, 13.089599609375, 13.8447265625, 14.599853515625, 15.35498046875, 16.110107421875, 16.865234375, 17.620361328125, 18.37548828125, 19.130615234375, 19.8857421875, 20.640869140625, 21.39599609375, 22.151123046875, 22.90625]}, "gradients/encoder.adapter.layers.1.conv.weight": {"_type": "histogram", "values": [2.0, 3.0, 2.0, 6.0, 10.0, 8.0, 21.0, 29.0, 50.0, 61.0, 120.0, 145.0, 205.0, 281.0, 472.0, 724.0, 1190.0, 1802.0, 2794.0, 4503.0, 7233.0, 11396.0, 18444.0, 29979.0, 49503.0, 81359.0, 136072.0, 225952.0, 364831.0, 807796.0, 3352760.0, 460852.0, 288806.0, 175153.0, 105332.0, 62691.0, 38254.0, 23380.0, 14454.0, 9189.0, 5789.0, 3553.0, 2216.0, 1454.0, 911.0, 566.0, 385.0, 227.0, 172.0, 112.0, 60.0, 43.0, 44.0, 15.0, 7.0, 11.0, 7.0, 4.0, 2.0, 4.0, 6.0, 0.0, 0.0, 4.0], "bins": [-2.6640625, -2.57598876953125, -2.4879150390625, -2.39984130859375, -2.311767578125, -2.22369384765625, -2.1356201171875, -2.04754638671875, -1.95947265625, -1.87139892578125, -1.7833251953125, -1.69525146484375, -1.607177734375, -1.51910400390625, -1.4310302734375, -1.34295654296875, -1.2548828125, -1.16680908203125, -1.0787353515625, -0.99066162109375, -0.902587890625, -0.81451416015625, -0.7264404296875, -0.63836669921875, -0.55029296875, -0.46221923828125, -0.3741455078125, -0.28607177734375, -0.197998046875, -0.10992431640625, -0.0218505859375, 0.06622314453125, 0.154296875, 0.24237060546875, 0.3304443359375, 0.41851806640625, 0.506591796875, 0.59466552734375, 0.6827392578125, 0.77081298828125, 0.85888671875, 0.94696044921875, 1.0350341796875, 1.12310791015625, 1.211181640625, 1.29925537109375, 1.3873291015625, 1.47540283203125, 1.5634765625, 1.65155029296875, 1.7396240234375, 1.82769775390625, 1.915771484375, 2.00384521484375, 2.0919189453125, 2.17999267578125, 2.26806640625, 2.35614013671875, 2.4442138671875, 2.53228759765625, 2.620361328125, 2.70843505859375, 2.7965087890625, 2.88458251953125, 2.97265625]}, "gradients/encoder.adapter.layers.1.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 0.0, 2.0, 2.0, 6.0, 3.0, 7.0, 4.0, 8.0, 14.0, 12.0, 13.0, 16.0, 23.0, 26.0, 32.0, 30.0, 31.0, 24.0, 37.0, 35.0, 38.0, 44.0, 55.0, 301.0, 790.0, 51.0, 49.0, 50.0, 39.0, 39.0, 40.0, 28.0, 26.0, 29.0, 16.0, 17.0, 25.0, 13.0, 9.0, 11.0, 12.0, 3.0, 5.0, 7.0, 4.0, 3.0, 5.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0], "bins": [-17.078125, -16.549072265625, -16.02001953125, -15.490966796875, -14.9619140625, -14.432861328125, -13.90380859375, -13.374755859375, -12.845703125, -12.316650390625, -11.78759765625, -11.258544921875, -10.7294921875, -10.200439453125, -9.67138671875, -9.142333984375, -8.61328125, -8.084228515625, -7.55517578125, -7.026123046875, -6.4970703125, -5.968017578125, -5.43896484375, -4.909912109375, -4.380859375, -3.851806640625, -3.32275390625, -2.793701171875, -2.2646484375, -1.735595703125, -1.20654296875, -0.677490234375, -0.1484375, 0.380615234375, 0.90966796875, 1.438720703125, 1.9677734375, 2.496826171875, 3.02587890625, 3.554931640625, 4.083984375, 4.613037109375, 5.14208984375, 5.671142578125, 6.2001953125, 6.729248046875, 7.25830078125, 7.787353515625, 8.31640625, 8.845458984375, 9.37451171875, 9.903564453125, 10.4326171875, 10.961669921875, 11.49072265625, 12.019775390625, 12.548828125, 13.077880859375, 13.60693359375, 14.135986328125, 14.6650390625, 15.194091796875, 15.72314453125, 16.252197265625, 16.78125]}, "gradients/encoder.adapter.layers.0.conv.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 4.0, 2.0, 2.0, 0.0, 3.0, 7.0, 5.0, 13.0, 11.0, 16.0, 20.0, 22.0, 29.0, 49.0, 70.0, 89.0, 126.0, 186.0, 279.0, 334.0, 502.0, 797.0, 1207.0, 1936.0, 3688.0, 7773.0, 21346.0, 84349.0, 5902716.0, 203896.0, 37777.0, 11969.0, 5085.0, 2581.0, 1474.0, 943.0, 656.0, 430.0, 285.0, 184.0, 166.0, 111.0, 95.0, 57.0, 28.0, 39.0, 19.0, 25.0, 11.0, 12.0, 3.0, 10.0, 0.0, 1.0, 4.0, 2.0, 5.0, 1.0, 1.0, 2.0], "bins": [-20.296875, -19.6767578125, -19.056640625, -18.4365234375, -17.81640625, -17.1962890625, -16.576171875, -15.9560546875, -15.3359375, -14.7158203125, -14.095703125, -13.4755859375, -12.85546875, -12.2353515625, -11.615234375, -10.9951171875, -10.375, -9.7548828125, -9.134765625, -8.5146484375, -7.89453125, -7.2744140625, -6.654296875, -6.0341796875, -5.4140625, -4.7939453125, -4.173828125, -3.5537109375, -2.93359375, -2.3134765625, -1.693359375, -1.0732421875, -0.453125, 0.1669921875, 0.787109375, 1.4072265625, 2.02734375, 2.6474609375, 3.267578125, 3.8876953125, 4.5078125, 5.1279296875, 5.748046875, 6.3681640625, 6.98828125, 7.6083984375, 8.228515625, 8.8486328125, 9.46875, 10.0888671875, 10.708984375, 11.3291015625, 11.94921875, 12.5693359375, 13.189453125, 13.8095703125, 14.4296875, 15.0498046875, 15.669921875, 16.2900390625, 16.91015625, 17.5302734375, 18.150390625, 18.7705078125, 19.390625]}, "gradients/encoder.adapter.layers.0.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 1.0, 6.0, 4.0, 10.0, 5.0, 7.0, 13.0, 20.0, 19.0, 27.0, 27.0, 24.0, 34.0, 36.0, 28.0, 45.0, 49.0, 39.0, 42.0, 112.0, 783.0, 267.0, 53.0, 38.0, 44.0, 34.0, 37.0, 30.0, 33.0, 30.0, 27.0, 21.0, 21.0, 16.0, 7.0, 11.0, 11.0, 4.0, 4.0, 5.0, 1.0, 4.0, 2.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-14.4609375, -14.032958984375, -13.60498046875, -13.177001953125, -12.7490234375, -12.321044921875, -11.89306640625, -11.465087890625, -11.037109375, -10.609130859375, -10.18115234375, -9.753173828125, -9.3251953125, -8.897216796875, -8.46923828125, -8.041259765625, -7.61328125, -7.185302734375, -6.75732421875, -6.329345703125, -5.9013671875, -5.473388671875, -5.04541015625, -4.617431640625, -4.189453125, -3.761474609375, -3.33349609375, -2.905517578125, -2.4775390625, -2.049560546875, -1.62158203125, -1.193603515625, -0.765625, -0.337646484375, 0.09033203125, 0.518310546875, 0.9462890625, 1.374267578125, 1.80224609375, 2.230224609375, 2.658203125, 3.086181640625, 3.51416015625, 3.942138671875, 4.3701171875, 4.798095703125, 5.22607421875, 5.654052734375, 6.08203125, 6.510009765625, 6.93798828125, 7.365966796875, 7.7939453125, 8.221923828125, 8.64990234375, 9.077880859375, 9.505859375, 9.933837890625, 10.36181640625, 10.789794921875, 11.2177734375, 11.645751953125, 12.07373046875, 12.501708984375, 12.9296875]}, "gradients/encoder.encoder.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 11.0, 54.0, 268.0, 497.0, 142.0, 30.0, 6.0, 4.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-177.8101806640625, -174.4757080078125, -171.14122009277344, -167.80674743652344, -164.47227478027344, -161.13778686523438, -157.80331420898438, -154.46884155273438, -151.1343536376953, -147.7998809814453, -144.46539306640625, -141.13092041015625, -137.79644775390625, -134.4619598388672, -131.1274871826172, -127.79301452636719, -124.45854187011719, -121.12406158447266, -117.78958892822266, -114.45510864257812, -111.1206283569336, -107.7861557006836, -104.45167541503906, -101.11720275878906, -97.78271484375, -94.44823455810547, -91.11376190185547, -87.77928161621094, -84.4448013305664, -81.1103286743164, -77.77584838867188, -74.44137573242188, -71.10689544677734, -67.77241516113281, -64.43794250488281, -61.10346221923828, -57.768985748291016, -54.43450927734375, -51.10002899169922, -47.76555252075195, -44.43107604980469, -41.09659957885742, -37.76211929321289, -34.427642822265625, -31.09316635131836, -27.75868797302246, -24.424209594726562, -21.089733123779297, -17.755252838134766, -14.420775413513184, -11.086297988891602, -7.751819610595703, -4.417342185974121, -1.082864761352539, 2.2516136169433594, 5.586090087890625, 8.920568466186523, 12.255045890808105, 15.589523315429688, 18.924001693725586, 22.258480072021484, 25.59295654296875, 28.92743492126465, 32.26190948486328, 35.59638977050781]}, "gradients/encoder.encoder.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 3.0, 8.0, 12.0, 11.0, 14.0, 15.0, 26.0, 31.0, 40.0, 52.0, 57.0, 58.0, 76.0, 68.0, 65.0, 55.0, 57.0, 59.0, 59.0, 53.0, 53.0, 43.0, 32.0, 23.0, 18.0, 12.0, 7.0, 4.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-20.64204216003418, -19.494304656982422, -18.346567153930664, -17.198829650878906, -16.05109405517578, -14.903356552124023, -13.755619049072266, -12.607882499694824, -11.460144996643066, -10.312407493591309, -9.164670944213867, -8.01693344116211, -6.86919641494751, -5.72145938873291, -4.573721885681152, -3.425985336303711, -2.278247833251953, -1.130510687828064, 0.017226457595825195, 1.164963722229004, 2.3127007484436035, 3.460437774658203, 4.608175277709961, 5.755911827087402, 6.90364933013916, 8.051386833190918, 9.19912338256836, 10.346860885620117, 11.494598388671875, 12.642334938049316, 13.790072441101074, 14.937808990478516, 16.08554458618164, 17.2332820892334, 18.381019592285156, 19.52875518798828, 20.67649269104004, 21.824230194091797, 22.971967697143555, 24.119705200195312, 25.267440795898438, 26.415178298950195, 27.562915802001953, 28.710651397705078, 29.858388900756836, 31.006126403808594, 32.15386199951172, 33.30160140991211, 34.4493408203125, 35.597076416015625, 36.744815826416016, 37.89255142211914, 39.04029083251953, 40.188026428222656, 41.33576202392578, 42.48350143432617, 43.6312370300293, 44.77897262573242, 45.92671203613281, 47.07444763183594, 48.22218704223633, 49.36992263793945, 50.517662048339844, 51.66539764404297, 52.813133239746094]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 4.0, 4.0, 5.0, 8.0, 8.0, 14.0, 20.0, 32.0, 38.0, 38.0, 68.0, 110.0, 170.0, 316.0, 533.0, 847.0, 1730.0, 3318.0, 7776.0, 22489.0, 174730.0, 3925999.0, 35588.0, 10599.0, 4389.0, 2216.0, 1163.0, 648.0, 430.0, 270.0, 188.0, 149.0, 85.0, 74.0, 53.0, 36.0, 19.0, 23.0, 20.0, 20.0, 13.0, 9.0, 3.0, 7.0, 6.0, 4.0, 4.0, 4.0, 2.0, 1.0, 1.0, 2.0, 2.0, 5.0, 2.0, 3.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5126953125, -0.49056243896484375, -0.4684295654296875, -0.44629669189453125, -0.424163818359375, -0.40203094482421875, -0.3798980712890625, -0.35776519775390625, -0.33563232421875, -0.31349945068359375, -0.2913665771484375, -0.26923370361328125, -0.247100830078125, -0.22496795654296875, -0.2028350830078125, -0.18070220947265625, -0.1585693359375, -0.13643646240234375, -0.1143035888671875, -0.09217071533203125, -0.070037841796875, -0.04790496826171875, -0.0257720947265625, -0.00363922119140625, 0.01849365234375, 0.04062652587890625, 0.0627593994140625, 0.08489227294921875, 0.107025146484375, 0.12915802001953125, 0.1512908935546875, 0.17342376708984375, 0.195556640625, 0.21768951416015625, 0.2398223876953125, 0.26195526123046875, 0.284088134765625, 0.30622100830078125, 0.3283538818359375, 0.35048675537109375, 0.37261962890625, 0.39475250244140625, 0.4168853759765625, 0.43901824951171875, 0.461151123046875, 0.48328399658203125, 0.5054168701171875, 0.5275497436523438, 0.5496826171875, 0.5718154907226562, 0.5939483642578125, 0.6160812377929688, 0.638214111328125, 0.6603469848632812, 0.6824798583984375, 0.7046127319335938, 0.72674560546875, 0.7488784790039062, 0.7710113525390625, 0.7931442260742188, 0.815277099609375, 0.8374099731445312, 0.8595428466796875, 0.8816757202148438, 0.90380859375]}, "gradients/encoder.encoder.layers.23.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 3.0, 9.0, 5.0, 8.0, 11.0, 12.0, 13.0, 22.0, 13.0, 315.0, 488.0, 17.0, 12.0, 13.0, 14.0, 11.0, 7.0, 5.0, 6.0, 4.0, 4.0, 2.0, 3.0, 4.0, 0.0, 1.0, 4.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.084716796875, -0.08087539672851562, -0.07703399658203125, -0.07319259643554688, -0.0693511962890625, -0.06550979614257812, -0.06166839599609375, -0.057826995849609375, -0.053985595703125, -0.050144195556640625, -0.04630279541015625, -0.042461395263671875, -0.0386199951171875, -0.034778594970703125, -0.03093719482421875, -0.027095794677734375, -0.02325439453125, -0.019412994384765625, -0.01557159423828125, -0.011730194091796875, -0.0078887939453125, -0.004047393798828125, -0.00020599365234375, 0.003635406494140625, 0.007476806640625, 0.011318206787109375, 0.01515960693359375, 0.019001007080078125, 0.0228424072265625, 0.026683807373046875, 0.03052520751953125, 0.034366607666015625, 0.0382080078125, 0.042049407958984375, 0.04589080810546875, 0.049732208251953125, 0.0535736083984375, 0.057415008544921875, 0.06125640869140625, 0.06509780883789062, 0.068939208984375, 0.07278060913085938, 0.07662200927734375, 0.08046340942382812, 0.0843048095703125, 0.08814620971679688, 0.09198760986328125, 0.09582901000976562, 0.09967041015625, 0.10351181030273438, 0.10735321044921875, 0.11119461059570312, 0.1150360107421875, 0.11887741088867188, 0.12271881103515625, 0.12656021118164062, 0.130401611328125, 0.13424301147460938, 0.13808441162109375, 0.14192581176757812, 0.1457672119140625, 0.14960861206054688, 0.15345001220703125, 0.15729141235351562, 0.1611328125]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 5.0, 9.0, 13.0, 12.0, 24.0, 28.0, 34.0, 63.0, 74.0, 115.0, 187.0, 308.0, 509.0, 937.0, 1921.0, 4305.0, 12019.0, 46891.0, 417325.0, 3480003.0, 181885.0, 31031.0, 9178.0, 3703.0, 1607.0, 849.0, 468.0, 259.0, 160.0, 106.0, 70.0, 61.0, 41.0, 34.0, 11.0, 8.0, 10.0, 8.0, 5.0, 3.0, 3.0, 2.0, 0.0, 0.0, 0.0, 5.0, 1.0], "bins": [-0.70703125, -0.6875762939453125, -0.668121337890625, -0.6486663818359375, -0.62921142578125, -0.6097564697265625, -0.590301513671875, -0.5708465576171875, -0.5513916015625, -0.5319366455078125, -0.512481689453125, -0.4930267333984375, -0.47357177734375, -0.4541168212890625, -0.434661865234375, -0.4152069091796875, -0.395751953125, -0.3762969970703125, -0.356842041015625, -0.3373870849609375, -0.31793212890625, -0.2984771728515625, -0.279022216796875, -0.2595672607421875, -0.2401123046875, -0.2206573486328125, -0.201202392578125, -0.1817474365234375, -0.16229248046875, -0.1428375244140625, -0.123382568359375, -0.1039276123046875, -0.08447265625, -0.0650177001953125, -0.045562744140625, -0.0261077880859375, -0.00665283203125, 0.0128021240234375, 0.032257080078125, 0.0517120361328125, 0.0711669921875, 0.0906219482421875, 0.110076904296875, 0.1295318603515625, 0.14898681640625, 0.1684417724609375, 0.187896728515625, 0.2073516845703125, 0.226806640625, 0.2462615966796875, 0.265716552734375, 0.2851715087890625, 0.30462646484375, 0.3240814208984375, 0.343536376953125, 0.3629913330078125, 0.3824462890625, 0.4019012451171875, 0.421356201171875, 0.4408111572265625, 0.46026611328125, 0.4797210693359375, 0.499176025390625, 0.5186309814453125, 0.5380859375]}, "gradients/encoder.encoder.layers.23.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 5.0, 8.0, 11.0, 16.0, 17.0, 21.0, 25.0, 50.0, 80.0, 124.0, 167.0, 356.0, 973.0, 1231.0, 375.0, 191.0, 123.0, 83.0, 53.0, 39.0, 23.0, 15.0, 25.0, 15.0, 5.0, 9.0, 5.0, 4.0, 2.0, 8.0, 5.0, 2.0, 2.0, 3.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.1385498046875, -0.13323402404785156, -0.12791824340820312, -0.12260246276855469, -0.11728668212890625, -0.11197090148925781, -0.10665512084960938, -0.10133934020996094, -0.0960235595703125, -0.09070777893066406, -0.08539199829101562, -0.08007621765136719, -0.07476043701171875, -0.06944465637207031, -0.06412887573242188, -0.05881309509277344, -0.053497314453125, -0.04818153381347656, -0.042865753173828125, -0.03754997253417969, -0.03223419189453125, -0.026918411254882812, -0.021602630615234375, -0.016286849975585938, -0.0109710693359375, -0.0056552886962890625, -0.000339508056640625, 0.0049762725830078125, 0.01029205322265625, 0.015607833862304688, 0.020923614501953125, 0.026239395141601562, 0.03155517578125, 0.03687095642089844, 0.042186737060546875, 0.04750251770019531, 0.05281829833984375, 0.05813407897949219, 0.06344985961914062, 0.06876564025878906, 0.0740814208984375, 0.07939720153808594, 0.08471298217773438, 0.09002876281738281, 0.09534454345703125, 0.10066032409667969, 0.10597610473632812, 0.11129188537597656, 0.116607666015625, 0.12192344665527344, 0.12723922729492188, 0.1325550079345703, 0.13787078857421875, 0.1431865692138672, 0.14850234985351562, 0.15381813049316406, 0.1591339111328125, 0.16444969177246094, 0.16976547241210938, 0.1750812530517578, 0.18039703369140625, 0.1857128143310547, 0.19102859497070312, 0.19634437561035156, 0.20166015625]}, "gradients/encoder.encoder.layers.23.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 6.0, 12.0, 110.0, 549.0, 269.0, 53.0, 8.0, 3.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.296167850494385, -5.166160583496094, -5.036153316497803, -4.906146049499512, -4.776138782501221, -4.64613151550293, -4.516124248504639, -4.386116981506348, -4.256110191345215, -4.126102924346924, -3.996095657348633, -3.866088390350342, -3.736081123352051, -3.6060738563537598, -3.476066827774048, -3.346059560775757, -3.2160520553588867, -3.0860447883605957, -2.9560375213623047, -2.8260302543640137, -2.6960229873657227, -2.5660157203674316, -2.4360086917877197, -2.3060014247894287, -2.1759941577911377, -2.0459868907928467, -1.9159796237945557, -1.7859724760055542, -1.6559652090072632, -1.5259579420089722, -1.3959507942199707, -1.2659435272216797, -1.1359362602233887, -1.0059289932250977, -0.8759217858314514, -0.7459145784378052, -0.6159073114395142, -0.48590004444122314, -0.3558928370475769, -0.22588562965393066, -0.09587836265563965, 0.03412887454032898, 0.1641361117362976, 0.29414334893226624, 0.42415058612823486, 0.5541578531265259, 0.6841650605201721, 0.8141722679138184, 0.9441795349121094, 1.0741868019104004, 1.2041940689086914, 1.3342012166976929, 1.4642084836959839, 1.594215750694275, 1.7242228984832764, 1.8542301654815674, 1.9842374324798584, 2.1142446994781494, 2.2442519664764404, 2.3742592334747314, 2.5042662620544434, 2.6342735290527344, 2.7642807960510254, 2.8942880630493164, 3.0242953300476074]}, "gradients/encoder.encoder.layers.23.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 13.0, 21.0, 21.0, 49.0, 61.0, 76.0, 83.0, 93.0, 102.0, 90.0, 101.0, 78.0, 55.0, 57.0, 35.0, 27.0, 18.0, 8.0, 5.0, 2.0, 2.0, 5.0, 1.0, 1.0, 3.0], "bins": [-1.8116366863250732, -1.7747716903686523, -1.737906575202942, -1.7010414600372314, -1.6641764640808105, -1.6273114681243896, -1.5904463529586792, -1.5535812377929688, -1.5167162418365479, -1.479851245880127, -1.4429861307144165, -1.406121015548706, -1.3692560195922852, -1.3323910236358643, -1.2955259084701538, -1.2586607933044434, -1.2217957973480225, -1.1849308013916016, -1.1480656862258911, -1.1112005710601807, -1.0743355751037598, -1.0374705791473389, -1.0006054639816284, -0.9637404084205627, -0.9268753528594971, -0.8900102972984314, -0.8531452417373657, -0.8162801861763, -0.7794151306152344, -0.7425500750541687, -0.705685019493103, -0.6688199639320374, -0.6319547891616821, -0.5950897336006165, -0.5582246780395508, -0.5213596224784851, -0.48449456691741943, -0.44762951135635376, -0.4107644557952881, -0.3738994002342224, -0.33703434467315674, -0.30016928911209106, -0.2633042335510254, -0.22643917798995972, -0.18957412242889404, -0.15270906686782837, -0.1158440113067627, -0.07897895574569702, -0.04211390018463135, -0.005248844623565674, 0.0316162109375, 0.06848126649856567, 0.10534632205963135, 0.14221137762069702, 0.1790764331817627, 0.21594148874282837, 0.25280654430389404, 0.2896715998649597, 0.3265366554260254, 0.36340171098709106, 0.40026676654815674, 0.4371318221092224, 0.4739968776702881, 0.5108619332313538, 0.5477269887924194]}, "gradients/encoder.encoder.layers.23.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 3.0, 1.0, 3.0, 0.0, 1.0, 4.0, 4.0, 4.0, 6.0, 7.0, 21.0, 19.0, 34.0, 43.0, 65.0, 75.0, 125.0, 160.0, 283.0, 494.0, 798.0, 1435.0, 2845.0, 5961.0, 14425.0, 48778.0, 886375.0, 57805.0, 15624.0, 6401.0, 2970.0, 1511.0, 874.0, 486.0, 303.0, 202.0, 136.0, 81.0, 57.0, 41.0, 27.0, 21.0, 15.0, 12.0, 10.0, 7.0, 8.0, 6.0, 0.0, 1.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6953125, -0.6709518432617188, -0.6465911865234375, -0.6222305297851562, -0.597869873046875, -0.5735092163085938, -0.5491485595703125, -0.5247879028320312, -0.50042724609375, -0.47606658935546875, -0.4517059326171875, -0.42734527587890625, -0.402984619140625, -0.37862396240234375, -0.3542633056640625, -0.32990264892578125, -0.3055419921875, -0.28118133544921875, -0.2568206787109375, -0.23246002197265625, -0.208099365234375, -0.18373870849609375, -0.1593780517578125, -0.13501739501953125, -0.11065673828125, -0.08629608154296875, -0.0619354248046875, -0.03757476806640625, -0.013214111328125, 0.01114654541015625, 0.0355072021484375, 0.05986785888671875, 0.084228515625, 0.10858917236328125, 0.1329498291015625, 0.15731048583984375, 0.181671142578125, 0.20603179931640625, 0.2303924560546875, 0.25475311279296875, 0.27911376953125, 0.30347442626953125, 0.3278350830078125, 0.35219573974609375, 0.376556396484375, 0.40091705322265625, 0.4252777099609375, 0.44963836669921875, 0.4739990234375, 0.49835968017578125, 0.5227203369140625, 0.5470809936523438, 0.571441650390625, 0.5958023071289062, 0.6201629638671875, 0.6445236206054688, 0.66888427734375, 0.6932449340820312, 0.7176055908203125, 0.7419662475585938, 0.766326904296875, 0.7906875610351562, 0.8150482177734375, 0.8394088745117188, 0.86376953125]}, "gradients/encoder.encoder.layers.23.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 4.0, 2.0, 4.0, 3.0, 7.0, 8.0, 6.0, 11.0, 11.0, 15.0, 13.0, 13.0, 105.0, 359.0, 290.0, 59.0, 20.0, 11.0, 8.0, 7.0, 9.0, 8.0, 7.0, 6.0, 7.0, 3.0, 3.0, 2.0, 1.0, 3.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.07769775390625, -0.07469844818115234, -0.07169914245605469, -0.06869983673095703, -0.06570053100585938, -0.06270122528076172, -0.05970191955566406, -0.056702613830566406, -0.05370330810546875, -0.050704002380371094, -0.04770469665527344, -0.04470539093017578, -0.041706085205078125, -0.03870677947998047, -0.03570747375488281, -0.032708168029785156, -0.0297088623046875, -0.026709556579589844, -0.023710250854492188, -0.02071094512939453, -0.017711639404296875, -0.014712333679199219, -0.011713027954101562, -0.008713722229003906, -0.00571441650390625, -0.0027151107788085938, 0.0002841949462890625, 0.0032835006713867188, 0.006282806396484375, 0.009282112121582031, 0.012281417846679688, 0.015280723571777344, 0.018280029296875, 0.021279335021972656, 0.024278640747070312, 0.02727794647216797, 0.030277252197265625, 0.03327655792236328, 0.03627586364746094, 0.039275169372558594, 0.04227447509765625, 0.045273780822753906, 0.04827308654785156, 0.05127239227294922, 0.054271697998046875, 0.05727100372314453, 0.06027030944824219, 0.06326961517333984, 0.0662689208984375, 0.06926822662353516, 0.07226753234863281, 0.07526683807373047, 0.07826614379882812, 0.08126544952392578, 0.08426475524902344, 0.0872640609741211, 0.09026336669921875, 0.0932626724243164, 0.09626197814941406, 0.09926128387451172, 0.10226058959960938, 0.10525989532470703, 0.10825920104980469, 0.11125850677490234, 0.1142578125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 2.0, 4.0, 6.0, 10.0, 10.0, 18.0, 20.0, 23.0, 35.0, 54.0, 76.0, 101.0, 180.0, 295.0, 510.0, 894.0, 2156.0, 5881.0, 30118.0, 578569.0, 396382.0, 23884.0, 5326.0, 1923.0, 812.0, 457.0, 276.0, 147.0, 101.0, 83.0, 60.0, 50.0, 30.0, 21.0, 13.0, 7.0, 5.0, 3.0, 5.0, 7.0, 4.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.841796875, -0.812713623046875, -0.78363037109375, -0.754547119140625, -0.7254638671875, -0.696380615234375, -0.66729736328125, -0.638214111328125, -0.609130859375, -0.580047607421875, -0.55096435546875, -0.521881103515625, -0.4927978515625, -0.463714599609375, -0.43463134765625, -0.405548095703125, -0.37646484375, -0.347381591796875, -0.31829833984375, -0.289215087890625, -0.2601318359375, -0.231048583984375, -0.20196533203125, -0.172882080078125, -0.143798828125, -0.114715576171875, -0.08563232421875, -0.056549072265625, -0.0274658203125, 0.001617431640625, 0.03070068359375, 0.059783935546875, 0.0888671875, 0.117950439453125, 0.14703369140625, 0.176116943359375, 0.2052001953125, 0.234283447265625, 0.26336669921875, 0.292449951171875, 0.321533203125, 0.350616455078125, 0.37969970703125, 0.408782958984375, 0.4378662109375, 0.466949462890625, 0.49603271484375, 0.525115966796875, 0.55419921875, 0.583282470703125, 0.61236572265625, 0.641448974609375, 0.6705322265625, 0.699615478515625, 0.72869873046875, 0.757781982421875, 0.786865234375, 0.815948486328125, 0.84503173828125, 0.874114990234375, 0.9031982421875, 0.932281494140625, 0.96136474609375, 0.990447998046875, 1.01953125]}, "gradients/encoder.encoder.layers.23.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 5.0, 9.0, 7.0, 8.0, 12.0, 20.0, 19.0, 16.0, 17.0, 24.0, 25.0, 34.0, 47.0, 43.0, 49.0, 53.0, 56.0, 49.0, 40.0, 46.0, 57.0, 48.0, 54.0, 40.0, 44.0, 40.0, 24.0, 24.0, 24.0, 14.0, 11.0, 8.0, 15.0, 4.0, 7.0, 5.0, 7.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.32666015625, -0.3145408630371094, -0.30242156982421875, -0.2903022766113281, -0.2781829833984375, -0.2660636901855469, -0.25394439697265625, -0.24182510375976562, -0.229705810546875, -0.21758651733398438, -0.20546722412109375, -0.19334793090820312, -0.1812286376953125, -0.16910934448242188, -0.15699005126953125, -0.14487075805664062, -0.13275146484375, -0.12063217163085938, -0.10851287841796875, -0.09639358520507812, -0.0842742919921875, -0.07215499877929688, -0.06003570556640625, -0.047916412353515625, -0.035797119140625, -0.023677825927734375, -0.01155853271484375, 0.000560760498046875, 0.0126800537109375, 0.024799346923828125, 0.03691864013671875, 0.049037933349609375, 0.0611572265625, 0.07327651977539062, 0.08539581298828125, 0.09751510620117188, 0.1096343994140625, 0.12175369262695312, 0.13387298583984375, 0.14599227905273438, 0.158111572265625, 0.17023086547851562, 0.18235015869140625, 0.19446945190429688, 0.2065887451171875, 0.21870803833007812, 0.23082733154296875, 0.24294662475585938, 0.25506591796875, 0.2671852111816406, 0.27930450439453125, 0.2914237976074219, 0.3035430908203125, 0.3156623840332031, 0.32778167724609375, 0.3399009704589844, 0.352020263671875, 0.3641395568847656, 0.37625885009765625, 0.3883781433105469, 0.4004974365234375, 0.4126167297363281, 0.42473602294921875, 0.4368553161621094, 0.448974609375]}, "gradients/encoder.encoder.layers.23.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 0.0, 3.0, 3.0, 5.0, 7.0, 7.0, 17.0, 26.0, 19.0, 41.0, 68.0, 128.0, 270.0, 599.0, 1947.0, 12358.0, 978381.0, 49369.0, 3597.0, 924.0, 360.0, 182.0, 97.0, 57.0, 22.0, 24.0, 19.0, 9.0, 5.0, 5.0, 1.0, 8.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.96484375, -1.902862548828125, -1.84088134765625, -1.778900146484375, -1.7169189453125, -1.654937744140625, -1.59295654296875, -1.530975341796875, -1.468994140625, -1.407012939453125, -1.34503173828125, -1.283050537109375, -1.2210693359375, -1.159088134765625, -1.09710693359375, -1.035125732421875, -0.97314453125, -0.911163330078125, -0.84918212890625, -0.787200927734375, -0.7252197265625, -0.663238525390625, -0.60125732421875, -0.539276123046875, -0.477294921875, -0.415313720703125, -0.35333251953125, -0.291351318359375, -0.2293701171875, -0.167388916015625, -0.10540771484375, -0.043426513671875, 0.0185546875, 0.080535888671875, 0.14251708984375, 0.204498291015625, 0.2664794921875, 0.328460693359375, 0.39044189453125, 0.452423095703125, 0.514404296875, 0.576385498046875, 0.63836669921875, 0.700347900390625, 0.7623291015625, 0.824310302734375, 0.88629150390625, 0.948272705078125, 1.01025390625, 1.072235107421875, 1.13421630859375, 1.196197509765625, 1.2581787109375, 1.320159912109375, 1.38214111328125, 1.444122314453125, 1.506103515625, 1.568084716796875, 1.63006591796875, 1.692047119140625, 1.7540283203125, 1.816009521484375, 1.87799072265625, 1.939971923828125, 2.001953125]}, "gradients/encoder.encoder.layers.23.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 1.0, 7.0, 7.0, 20.0, 21.0, 31.0, 53.0, 54.0, 102.0, 105.0, 135.0, 113.0, 113.0, 74.0, 59.0, 41.0, 31.0, 12.0, 11.0, 5.0, 4.0, 4.0, 1.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.5299530029296875e-05, -4.395097494125366e-05, -4.260241985321045e-05, -4.1253864765167236e-05, -3.9905309677124023e-05, -3.855675458908081e-05, -3.72081995010376e-05, -3.5859644412994385e-05, -3.451108932495117e-05, -3.316253423690796e-05, -3.1813979148864746e-05, -3.0465424060821533e-05, -2.911686897277832e-05, -2.7768313884735107e-05, -2.6419758796691895e-05, -2.507120370864868e-05, -2.372264862060547e-05, -2.2374093532562256e-05, -2.1025538444519043e-05, -1.967698335647583e-05, -1.8328428268432617e-05, -1.6979873180389404e-05, -1.563131809234619e-05, -1.4282763004302979e-05, -1.2934207916259766e-05, -1.1585652828216553e-05, -1.023709774017334e-05, -8.888542652130127e-06, -7.539987564086914e-06, -6.191432476043701e-06, -4.842877388000488e-06, -3.4943222999572754e-06, -2.1457672119140625e-06, -7.972121238708496e-07, 5.513429641723633e-07, 1.8998980522155762e-06, 3.248453140258789e-06, 4.597008228302002e-06, 5.945563316345215e-06, 7.294118404388428e-06, 8.64267349243164e-06, 9.991228580474854e-06, 1.1339783668518066e-05, 1.268833875656128e-05, 1.4036893844604492e-05, 1.5385448932647705e-05, 1.6734004020690918e-05, 1.808255910873413e-05, 1.9431114196777344e-05, 2.0779669284820557e-05, 2.212822437286377e-05, 2.3476779460906982e-05, 2.4825334548950195e-05, 2.6173889636993408e-05, 2.752244472503662e-05, 2.8870999813079834e-05, 3.0219554901123047e-05, 3.156810998916626e-05, 3.291666507720947e-05, 3.4265220165252686e-05, 3.56137752532959e-05, 3.696233034133911e-05, 3.8310885429382324e-05, 3.965944051742554e-05, 4.100799560546875e-05]}, "gradients/encoder.encoder.layers.23.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 7.0, 3.0, 3.0, 6.0, 8.0, 12.0, 21.0, 29.0, 43.0, 53.0, 87.0, 167.0, 211.0, 385.0, 646.0, 1245.0, 2521.0, 6165.0, 19179.0, 112460.0, 768168.0, 106796.0, 18954.0, 6000.0, 2528.0, 1224.0, 671.0, 370.0, 219.0, 130.0, 78.0, 56.0, 36.0, 29.0, 21.0, 8.0, 7.0, 7.0, 0.0, 4.0, 7.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.7470703125, -0.724761962890625, -0.70245361328125, -0.680145263671875, -0.6578369140625, -0.635528564453125, -0.61322021484375, -0.590911865234375, -0.568603515625, -0.546295166015625, -0.52398681640625, -0.501678466796875, -0.4793701171875, -0.457061767578125, -0.43475341796875, -0.412445068359375, -0.39013671875, -0.367828369140625, -0.34552001953125, -0.323211669921875, -0.3009033203125, -0.278594970703125, -0.25628662109375, -0.233978271484375, -0.211669921875, -0.189361572265625, -0.16705322265625, -0.144744873046875, -0.1224365234375, -0.100128173828125, -0.07781982421875, -0.055511474609375, -0.033203125, -0.010894775390625, 0.01141357421875, 0.033721923828125, 0.0560302734375, 0.078338623046875, 0.10064697265625, 0.122955322265625, 0.145263671875, 0.167572021484375, 0.18988037109375, 0.212188720703125, 0.2344970703125, 0.256805419921875, 0.27911376953125, 0.301422119140625, 0.32373046875, 0.346038818359375, 0.36834716796875, 0.390655517578125, 0.4129638671875, 0.435272216796875, 0.45758056640625, 0.479888916015625, 0.502197265625, 0.524505615234375, 0.54681396484375, 0.569122314453125, 0.5914306640625, 0.613739013671875, 0.63604736328125, 0.658355712890625, 0.6806640625]}, "gradients/encoder.encoder.layers.23.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 2.0, 4.0, 6.0, 11.0, 15.0, 19.0, 45.0, 59.0, 99.0, 145.0, 139.0, 143.0, 108.0, 70.0, 41.0, 29.0, 19.0, 13.0, 12.0, 6.0, 6.0, 5.0, 4.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.93896484375, -0.9169731140136719, -0.8949813842773438, -0.8729896545410156, -0.8509979248046875, -0.8290061950683594, -0.8070144653320312, -0.7850227355957031, -0.763031005859375, -0.7410392761230469, -0.7190475463867188, -0.6970558166503906, -0.6750640869140625, -0.6530723571777344, -0.6310806274414062, -0.6090888977050781, -0.58709716796875, -0.5651054382324219, -0.5431137084960938, -0.5211219787597656, -0.4991302490234375, -0.4771385192871094, -0.45514678955078125, -0.4331550598144531, -0.411163330078125, -0.3891716003417969, -0.36717987060546875, -0.3451881408691406, -0.3231964111328125, -0.3012046813964844, -0.27921295166015625, -0.2572212219238281, -0.2352294921875, -0.21323776245117188, -0.19124603271484375, -0.16925430297851562, -0.1472625732421875, -0.12527084350585938, -0.10327911376953125, -0.08128738403320312, -0.059295654296875, -0.037303924560546875, -0.01531219482421875, 0.006679534912109375, 0.0286712646484375, 0.050662994384765625, 0.07265472412109375, 0.09464645385742188, 0.11663818359375, 0.13862991333007812, 0.16062164306640625, 0.18261337280273438, 0.2046051025390625, 0.22659683227539062, 0.24858856201171875, 0.2705802917480469, 0.292572021484375, 0.3145637512207031, 0.33655548095703125, 0.3585472106933594, 0.3805389404296875, 0.4025306701660156, 0.42452239990234375, 0.4465141296386719, 0.468505859375]}, "gradients/encoder.encoder.layers.23.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 3.0, 6.0, 10.0, 20.0, 39.0, 202.0, 528.0, 147.0, 28.0, 14.0, 7.0, 4.0, 2.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.350286483764648, -12.983917236328125, -12.617548942565918, -12.251179695129395, -11.884811401367188, -11.518442153930664, -11.15207290649414, -10.785703659057617, -10.41933536529541, -10.052966117858887, -9.68659782409668, -9.320228576660156, -8.953859329223633, -8.587491035461426, -8.221121788024902, -7.854753017425537, -7.488384246826172, -7.122015476226807, -6.755646705627441, -6.389277458190918, -6.022908687591553, -5.6565399169921875, -5.290170669555664, -4.923801898956299, -4.557433128356934, -4.191064357757568, -3.824695348739624, -3.4583263397216797, -3.0919575691223145, -2.725588798522949, -2.359219789505005, -1.9928507804870605, -1.6264820098876953, -1.2601131200790405, -0.8937442302703857, -0.527375340461731, -0.16100645065307617, 0.2053624391555786, 0.5717313289642334, 0.9381003379821777, 1.304469108581543, 1.6708379983901978, 2.0372068881988525, 2.403575897216797, 2.769944667816162, 3.1363134384155273, 3.5026824474334717, 3.869051456451416, 4.235420227050781, 4.6017889976501465, 4.968157768249512, 5.334527015686035, 5.7008957862854, 6.067264556884766, 6.433633804321289, 6.800002574920654, 7.1663713455200195, 7.532740116119385, 7.89910888671875, 8.265478134155273, 8.631847381591797, 8.998215675354004, 9.364584922790527, 9.730953216552734, 10.097322463989258]}, "gradients/encoder.encoder.layers.23.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 3.0, 2.0, 1.0, 0.0, 2.0, 1.0, 2.0, 3.0, 4.0, 2.0, 5.0, 5.0, 4.0, 13.0, 22.0, 21.0, 23.0, 52.0, 87.0, 101.0, 119.0, 133.0, 100.0, 103.0, 69.0, 44.0, 24.0, 15.0, 12.0, 5.0, 5.0, 3.0, 2.0, 7.0, 6.0, 2.0, 0.0, 4.0, 4.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-6.68892240524292, -6.488001823425293, -6.287081718444824, -6.086161136627197, -5.88524055480957, -5.684320449829102, -5.483399868011475, -5.282479286193848, -5.081559181213379, -4.880638599395752, -4.679718494415283, -4.478797912597656, -4.2778778076171875, -4.0769572257995605, -3.8760366439819336, -3.6751163005828857, -3.474195957183838, -3.27327561378479, -3.072355270385742, -2.8714346885681152, -2.6705143451690674, -2.4695940017700195, -2.2686734199523926, -2.0677530765533447, -1.8668327331542969, -1.665912389755249, -1.4649919271469116, -1.2640714645385742, -1.0631511211395264, -0.8622307777404785, -0.6613103151321411, -0.4603898525238037, -0.25946950912475586, -0.05854910612106323, 0.1423712968826294, 0.343291699886322, 0.5442121028900146, 0.7451324462890625, 0.9460529088973999, 1.1469733715057373, 1.3478937149047852, 1.548814058303833, 1.7497345209121704, 1.9506549835205078, 2.1515753269195557, 2.3524956703186035, 2.5534162521362305, 2.7543365955352783, 2.955256938934326, 3.156177282333374, 3.357097625732422, 3.558018207550049, 3.7589385509490967, 3.9598588943481445, 4.1607794761657715, 4.361700057983398, 4.562620162963867, 4.763540744781494, 4.964460849761963, 5.16538143157959, 5.366301536560059, 5.5672221183776855, 5.7681427001953125, 5.969062805175781, 6.169983386993408]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 4.0, 3.0, 5.0, 5.0, 7.0, 21.0, 34.0, 50.0, 282.0, 20983.0, 4167917.0, 4318.0, 443.0, 135.0, 40.0, 20.0, 14.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.380859375, -3.126739501953125, -2.87261962890625, -2.618499755859375, -2.3643798828125, -2.110260009765625, -1.85614013671875, -1.602020263671875, -1.347900390625, -1.093780517578125, -0.83966064453125, -0.585540771484375, -0.3314208984375, -0.077301025390625, 0.17681884765625, 0.430938720703125, 0.68505859375, 0.939178466796875, 1.19329833984375, 1.447418212890625, 1.7015380859375, 1.955657958984375, 2.20977783203125, 2.463897705078125, 2.718017578125, 2.972137451171875, 3.22625732421875, 3.480377197265625, 3.7344970703125, 3.988616943359375, 4.24273681640625, 4.496856689453125, 4.7509765625, 5.005096435546875, 5.25921630859375, 5.513336181640625, 5.7674560546875, 6.021575927734375, 6.27569580078125, 6.529815673828125, 6.783935546875, 7.038055419921875, 7.29217529296875, 7.546295166015625, 7.8004150390625, 8.054534912109375, 8.30865478515625, 8.562774658203125, 8.81689453125, 9.071014404296875, 9.32513427734375, 9.579254150390625, 9.8333740234375, 10.087493896484375, 10.34161376953125, 10.595733642578125, 10.849853515625, 11.103973388671875, 11.35809326171875, 11.612213134765625, 11.8663330078125, 12.120452880859375, 12.37457275390625, 12.628692626953125, 12.8828125]}, "gradients/encoder.encoder.layers.22.feed_forward.output_dense.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 5.0, 7.0, 3.0, 10.0, 5.0, 10.0, 10.0, 18.0, 34.0, 110.0, 241.0, 260.0, 142.0, 51.0, 25.0, 11.0, 13.0, 9.0, 2.0, 7.0, 7.0, 2.0, 4.0, 7.0, 5.0, 1.0, 0.0, 2.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.04693603515625, -0.04436492919921875, -0.0417938232421875, -0.03922271728515625, -0.036651611328125, -0.03408050537109375, -0.0315093994140625, -0.02893829345703125, -0.0263671875, -0.02379608154296875, -0.0212249755859375, -0.01865386962890625, -0.016082763671875, -0.01351165771484375, -0.0109405517578125, -0.00836944580078125, -0.00579833984375, -0.00322723388671875, -0.0006561279296875, 0.00191497802734375, 0.004486083984375, 0.00705718994140625, 0.0096282958984375, 0.01219940185546875, 0.0147705078125, 0.01734161376953125, 0.0199127197265625, 0.02248382568359375, 0.025054931640625, 0.02762603759765625, 0.0301971435546875, 0.03276824951171875, 0.03533935546875, 0.03791046142578125, 0.0404815673828125, 0.04305267333984375, 0.045623779296875, 0.04819488525390625, 0.0507659912109375, 0.05333709716796875, 0.055908203125, 0.05847930908203125, 0.0610504150390625, 0.06362152099609375, 0.066192626953125, 0.06876373291015625, 0.0713348388671875, 0.07390594482421875, 0.07647705078125, 0.07904815673828125, 0.0816192626953125, 0.08419036865234375, 0.086761474609375, 0.08933258056640625, 0.0919036865234375, 0.09447479248046875, 0.0970458984375, 0.09961700439453125, 0.1021881103515625, 0.10475921630859375, 0.107330322265625, 0.10990142822265625, 0.1124725341796875, 0.11504364013671875, 0.11761474609375]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 9.0, 15.0, 20.0, 22.0, 26.0, 49.0, 66.0, 123.0, 209.0, 328.0, 635.0, 1778.0, 5277.0, 24364.0, 272254.0, 3772188.0, 97290.0, 13881.0, 3552.0, 1210.0, 464.0, 247.0, 98.0, 83.0, 33.0, 24.0, 22.0, 4.0, 5.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.33984375, -1.3057785034179688, -1.2717132568359375, -1.2376480102539062, -1.203582763671875, -1.1695175170898438, -1.1354522705078125, -1.1013870239257812, -1.06732177734375, -1.0332565307617188, -0.9991912841796875, -0.9651260375976562, -0.931060791015625, -0.8969955444335938, -0.8629302978515625, -0.8288650512695312, -0.7947998046875, -0.7607345581054688, -0.7266693115234375, -0.6926040649414062, -0.658538818359375, -0.6244735717773438, -0.5904083251953125, -0.5563430786132812, -0.52227783203125, -0.48821258544921875, -0.4541473388671875, -0.42008209228515625, -0.386016845703125, -0.35195159912109375, -0.3178863525390625, -0.28382110595703125, -0.249755859375, -0.21569061279296875, -0.1816253662109375, -0.14756011962890625, -0.113494873046875, -0.07942962646484375, -0.0453643798828125, -0.01129913330078125, 0.02276611328125, 0.05683135986328125, 0.0908966064453125, 0.12496185302734375, 0.159027099609375, 0.19309234619140625, 0.2271575927734375, 0.26122283935546875, 0.2952880859375, 0.32935333251953125, 0.3634185791015625, 0.39748382568359375, 0.431549072265625, 0.46561431884765625, 0.4996795654296875, 0.5337448120117188, 0.56781005859375, 0.6018753051757812, 0.6359405517578125, 0.6700057983398438, 0.704071044921875, 0.7381362915039062, 0.7722015380859375, 0.8062667846679688, 0.84033203125]}, "gradients/encoder.encoder.layers.22.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 4.0, 3.0, 1.0, 5.0, 3.0, 12.0, 5.0, 8.0, 8.0, 11.0, 9.0, 19.0, 25.0, 29.0, 36.0, 59.0, 84.0, 129.0, 271.0, 787.0, 1447.0, 523.0, 203.0, 118.0, 63.0, 44.0, 42.0, 30.0, 13.0, 19.0, 11.0, 10.0, 6.0, 7.0, 4.0, 9.0, 5.0, 2.0, 5.0, 2.0, 1.0, 5.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 2.0, 3.0, 0.0, 0.0, 1.0], "bins": [-0.08026123046875, -0.0775299072265625, -0.074798583984375, -0.0720672607421875, -0.0693359375, -0.0666046142578125, -0.063873291015625, -0.0611419677734375, -0.05841064453125, -0.0556793212890625, -0.052947998046875, -0.0502166748046875, -0.0474853515625, -0.0447540283203125, -0.042022705078125, -0.0392913818359375, -0.03656005859375, -0.0338287353515625, -0.031097412109375, -0.0283660888671875, -0.025634765625, -0.0229034423828125, -0.020172119140625, -0.0174407958984375, -0.01470947265625, -0.0119781494140625, -0.009246826171875, -0.0065155029296875, -0.0037841796875, -0.0010528564453125, 0.001678466796875, 0.0044097900390625, 0.00714111328125, 0.0098724365234375, 0.012603759765625, 0.0153350830078125, 0.01806640625, 0.0207977294921875, 0.023529052734375, 0.0262603759765625, 0.02899169921875, 0.0317230224609375, 0.034454345703125, 0.0371856689453125, 0.0399169921875, 0.0426483154296875, 0.045379638671875, 0.0481109619140625, 0.05084228515625, 0.0535736083984375, 0.056304931640625, 0.0590362548828125, 0.061767578125, 0.0644989013671875, 0.067230224609375, 0.0699615478515625, 0.07269287109375, 0.0754241943359375, 0.078155517578125, 0.0808868408203125, 0.0836181640625, 0.0863494873046875, 0.089080810546875, 0.0918121337890625, 0.09454345703125]}, "gradients/encoder.encoder.layers.22.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 15.0, 85.0, 850.0, 56.0, 6.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.9730353355407715, -7.801554203033447, -7.630073070526123, -7.458591461181641, -7.287110328674316, -7.115629196166992, -6.944148063659668, -6.772666931152344, -6.6011857986450195, -6.429704666137695, -6.258223533630371, -6.086742401123047, -5.9152607917785645, -5.74377965927124, -5.572298526763916, -5.400817394256592, -5.229335784912109, -5.057854652404785, -4.886373519897461, -4.714892387390137, -4.543410778045654, -4.37192964553833, -4.200448513031006, -4.028967380523682, -3.8574862480163574, -3.686005115509033, -3.51452374458313, -3.3430426120758057, -3.1715614795684814, -3.000080108642578, -2.828598976135254, -2.6571178436279297, -2.4856367111206055, -2.3141555786132812, -2.142674207687378, -1.9711930751800537, -1.7997119426727295, -1.6282306909561157, -1.456749439239502, -1.2852683067321777, -1.113787055015564, -0.942305862903595, -0.770824670791626, -0.5993434190750122, -0.4278622269630432, -0.2563810348510742, -0.08489978313446045, 0.08658134937286377, 0.25806260108947754, 0.42954379320144653, 0.6010249853134155, 0.7725062370300293, 0.9439874291419983, 1.1154686212539673, 1.286949872970581, 1.4584310054779053, 1.629912257194519, 1.8013935089111328, 1.972874641418457, 2.1443557739257812, 2.3158371448516846, 2.487318277359009, 2.658799648284912, 2.8302807807922363, 3.0017619132995605]}, "gradients/encoder.encoder.layers.22.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 0.0, 1.0, 3.0, 1.0, 0.0, 2.0, 8.0, 2.0, 12.0, 15.0, 19.0, 31.0, 47.0, 58.0, 87.0, 81.0, 97.0, 92.0, 101.0, 93.0, 79.0, 62.0, 42.0, 26.0, 14.0, 9.0, 8.0, 3.0, 7.0, 2.0, 5.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7158904075622559, -0.6941738128662109, -0.6724572777748108, -0.6507406830787659, -0.629024088382721, -0.6073075532913208, -0.5855909585952759, -0.563874363899231, -0.542157769203186, -0.5204411745071411, -0.4987246096134186, -0.47700804471969604, -0.4552914500236511, -0.4335748851299286, -0.41185832023620605, -0.39014172554016113, -0.368425190448761, -0.34670862555503845, -0.32499203085899353, -0.303275465965271, -0.2815588712692261, -0.25984230637550354, -0.238125741481781, -0.21640916168689728, -0.19469258189201355, -0.17297600209712982, -0.1512594223022461, -0.12954285740852356, -0.10782627761363983, -0.0861096978187561, -0.06439313292503357, -0.04267655313014984, -0.020959973335266113, 0.0007566027343273163, 0.022473178803920746, 0.04418975114822388, 0.0659063309431076, 0.08762291073799133, 0.10933947563171387, 0.1310560554265976, 0.15277263522148132, 0.17448921501636505, 0.19620579481124878, 0.2179223597049713, 0.23963893949985504, 0.26135551929473877, 0.2830720841884613, 0.30478864908218384, 0.32650524377822876, 0.3482218086719513, 0.3699384033679962, 0.39165496826171875, 0.41337156295776367, 0.4350881278514862, 0.45680469274520874, 0.47852128744125366, 0.5002378225326538, 0.5219544172286987, 0.5436709523200989, 0.5653875470161438, 0.5871041417121887, 0.6088206768035889, 0.6305372714996338, 0.6522538661956787, 0.6739704608917236]}, "gradients/encoder.encoder.layers.22.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 3.0, 3.0, 6.0, 11.0, 13.0, 19.0, 21.0, 41.0, 80.0, 113.0, 206.0, 417.0, 836.0, 1675.0, 3541.0, 7966.0, 20748.0, 112964.0, 754839.0, 109654.0, 20698.0, 7857.0, 3529.0, 1592.0, 816.0, 396.0, 214.0, 117.0, 74.0, 30.0, 33.0, 19.0, 6.0, 6.0, 5.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-0.82470703125, -0.8021087646484375, -0.779510498046875, -0.7569122314453125, -0.73431396484375, -0.7117156982421875, -0.689117431640625, -0.6665191650390625, -0.6439208984375, -0.6213226318359375, -0.598724365234375, -0.5761260986328125, -0.55352783203125, -0.5309295654296875, -0.508331298828125, -0.4857330322265625, -0.463134765625, -0.4405364990234375, -0.417938232421875, -0.3953399658203125, -0.37274169921875, -0.3501434326171875, -0.327545166015625, -0.3049468994140625, -0.2823486328125, -0.2597503662109375, -0.237152099609375, -0.2145538330078125, -0.19195556640625, -0.1693572998046875, -0.146759033203125, -0.1241607666015625, -0.1015625, -0.0789642333984375, -0.056365966796875, -0.0337677001953125, -0.01116943359375, 0.0114288330078125, 0.034027099609375, 0.0566253662109375, 0.0792236328125, 0.1018218994140625, 0.124420166015625, 0.1470184326171875, 0.16961669921875, 0.1922149658203125, 0.214813232421875, 0.2374114990234375, 0.260009765625, 0.2826080322265625, 0.305206298828125, 0.3278045654296875, 0.35040283203125, 0.3730010986328125, 0.395599365234375, 0.4181976318359375, 0.4407958984375, 0.4633941650390625, 0.485992431640625, 0.5085906982421875, 0.53118896484375, 0.5537872314453125, 0.576385498046875, 0.5989837646484375, 0.62158203125]}, "gradients/encoder.encoder.layers.22.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 1.0, 4.0, 1.0, 3.0, 4.0, 2.0, 6.0, 2.0, 8.0, 7.0, 5.0, 6.0, 11.0, 19.0, 36.0, 73.0, 94.0, 144.0, 195.0, 137.0, 93.0, 49.0, 31.0, 19.0, 11.0, 6.0, 7.0, 10.0, 2.0, 3.0, 4.0, 2.0, 2.0, 6.0, 1.0, 7.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.05706787109375, -0.05512809753417969, -0.053188323974609375, -0.05124855041503906, -0.04930877685546875, -0.04736900329589844, -0.045429229736328125, -0.04348945617675781, -0.0415496826171875, -0.03960990905761719, -0.037670135498046875, -0.03573036193847656, -0.03379058837890625, -0.03185081481933594, -0.029911041259765625, -0.027971267700195312, -0.026031494140625, -0.024091720581054688, -0.022151947021484375, -0.020212173461914062, -0.01827239990234375, -0.016332626342773438, -0.014392852783203125, -0.012453079223632812, -0.0105133056640625, -0.008573532104492188, -0.006633758544921875, -0.0046939849853515625, -0.00275421142578125, -0.0008144378662109375, 0.001125335693359375, 0.0030651092529296875, 0.0050048828125, 0.0069446563720703125, 0.008884429931640625, 0.010824203491210938, 0.01276397705078125, 0.014703750610351562, 0.016643524169921875, 0.018583297729492188, 0.0205230712890625, 0.022462844848632812, 0.024402618408203125, 0.026342391967773438, 0.02828216552734375, 0.030221939086914062, 0.032161712646484375, 0.03410148620605469, 0.036041259765625, 0.03798103332519531, 0.039920806884765625, 0.04186058044433594, 0.04380035400390625, 0.04574012756347656, 0.047679901123046875, 0.04961967468261719, 0.0515594482421875, 0.05349922180175781, 0.055438995361328125, 0.05737876892089844, 0.05931854248046875, 0.06125831604003906, 0.06319808959960938, 0.06513786315917969, 0.06707763671875]}, "gradients/encoder.encoder.layers.22.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 0.0, 2.0, 6.0, 2.0, 2.0, 7.0, 5.0, 6.0, 7.0, 12.0, 16.0, 24.0, 41.0, 149.0, 565.0, 5532.0, 290855.0, 737439.0, 12529.0, 990.0, 206.0, 73.0, 24.0, 14.0, 5.0, 7.0, 7.0, 6.0, 3.0, 4.0, 6.0, 1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.34765625, -1.3057098388671875, -1.263763427734375, -1.2218170166015625, -1.17987060546875, -1.1379241943359375, -1.095977783203125, -1.0540313720703125, -1.0120849609375, -0.9701385498046875, -0.928192138671875, -0.8862457275390625, -0.84429931640625, -0.8023529052734375, -0.760406494140625, -0.7184600830078125, -0.676513671875, -0.6345672607421875, -0.592620849609375, -0.5506744384765625, -0.50872802734375, -0.4667816162109375, -0.424835205078125, -0.3828887939453125, -0.3409423828125, -0.2989959716796875, -0.257049560546875, -0.2151031494140625, -0.17315673828125, -0.1312103271484375, -0.089263916015625, -0.0473175048828125, -0.00537109375, 0.0365753173828125, 0.078521728515625, 0.1204681396484375, 0.16241455078125, 0.2043609619140625, 0.246307373046875, 0.2882537841796875, 0.3302001953125, 0.3721466064453125, 0.414093017578125, 0.4560394287109375, 0.49798583984375, 0.5399322509765625, 0.581878662109375, 0.6238250732421875, 0.665771484375, 0.7077178955078125, 0.749664306640625, 0.7916107177734375, 0.83355712890625, 0.8755035400390625, 0.917449951171875, 0.9593963623046875, 1.0013427734375, 1.0432891845703125, 1.085235595703125, 1.1271820068359375, 1.16912841796875, 1.2110748291015625, 1.253021240234375, 1.2949676513671875, 1.3369140625]}, "gradients/encoder.encoder.layers.22.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 5.0, 1.0, 4.0, 5.0, 7.0, 3.0, 7.0, 2.0, 11.0, 9.0, 13.0, 18.0, 24.0, 23.0, 28.0, 27.0, 31.0, 23.0, 40.0, 43.0, 35.0, 44.0, 46.0, 38.0, 52.0, 40.0, 54.0, 58.0, 38.0, 35.0, 29.0, 29.0, 29.0, 22.0, 28.0, 20.0, 17.0, 25.0, 5.0, 11.0, 6.0, 8.0, 4.0, 1.0, 6.0, 2.0, 0.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0], "bins": [-0.21435546875, -0.2073955535888672, -0.20043563842773438, -0.19347572326660156, -0.18651580810546875, -0.17955589294433594, -0.17259597778320312, -0.1656360626220703, -0.1586761474609375, -0.1517162322998047, -0.14475631713867188, -0.13779640197753906, -0.13083648681640625, -0.12387657165527344, -0.11691665649414062, -0.10995674133300781, -0.102996826171875, -0.09603691101074219, -0.08907699584960938, -0.08211708068847656, -0.07515716552734375, -0.06819725036621094, -0.061237335205078125, -0.05427742004394531, -0.0473175048828125, -0.04035758972167969, -0.033397674560546875, -0.026437759399414062, -0.01947784423828125, -0.012517929077148438, -0.005558013916015625, 0.0014019012451171875, 0.00836181640625, 0.015321731567382812, 0.022281646728515625, 0.029241561889648438, 0.03620147705078125, 0.04316139221191406, 0.050121307373046875, 0.05708122253417969, 0.0640411376953125, 0.07100105285644531, 0.07796096801757812, 0.08492088317871094, 0.09188079833984375, 0.09884071350097656, 0.10580062866210938, 0.11276054382324219, 0.119720458984375, 0.1266803741455078, 0.13364028930664062, 0.14060020446777344, 0.14756011962890625, 0.15452003479003906, 0.16147994995117188, 0.1684398651123047, 0.1753997802734375, 0.1823596954345703, 0.18931961059570312, 0.19627952575683594, 0.20323944091796875, 0.21019935607910156, 0.21715927124023438, 0.2241191864013672, 0.2310791015625]}, "gradients/encoder.encoder.layers.22.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 4.0, 3.0, 4.0, 12.0, 14.0, 40.0, 147.0, 913.0, 59245.0, 985615.0, 2190.0, 243.0, 64.0, 21.0, 10.0, 5.0, 5.0, 4.0, 4.0, 1.0, 6.0, 0.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.298828125, -3.18572998046875, -3.0726318359375, -2.95953369140625, -2.846435546875, -2.73333740234375, -2.6202392578125, -2.50714111328125, -2.39404296875, -2.28094482421875, -2.1678466796875, -2.05474853515625, -1.941650390625, -1.82855224609375, -1.7154541015625, -1.60235595703125, -1.4892578125, -1.37615966796875, -1.2630615234375, -1.14996337890625, -1.036865234375, -0.92376708984375, -0.8106689453125, -0.69757080078125, -0.58447265625, -0.47137451171875, -0.3582763671875, -0.24517822265625, -0.132080078125, -0.01898193359375, 0.0941162109375, 0.20721435546875, 0.3203125, 0.43341064453125, 0.5465087890625, 0.65960693359375, 0.772705078125, 0.88580322265625, 0.9989013671875, 1.11199951171875, 1.22509765625, 1.33819580078125, 1.4512939453125, 1.56439208984375, 1.677490234375, 1.79058837890625, 1.9036865234375, 2.01678466796875, 2.1298828125, 2.24298095703125, 2.3560791015625, 2.46917724609375, 2.582275390625, 2.69537353515625, 2.8084716796875, 2.92156982421875, 3.03466796875, 3.14776611328125, 3.2608642578125, 3.37396240234375, 3.487060546875, 3.60015869140625, 3.7132568359375, 3.82635498046875, 3.939453125]}, "gradients/encoder.encoder.layers.22.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 3.0, 2.0, 7.0, 6.0, 9.0, 17.0, 27.0, 41.0, 87.0, 179.0, 243.0, 179.0, 100.0, 37.0, 27.0, 17.0, 7.0, 5.0, 4.0, 4.0, 5.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001590251922607422, -0.00015500467270612717, -0.00015098415315151215, -0.00014696363359689713, -0.0001429431140422821, -0.00013892259448766708, -0.00013490207493305206, -0.00013088155537843704, -0.00012686103582382202, -0.000122840516269207, -0.00011881999671459198, -0.00011479947715997696, -0.00011077895760536194, -0.00010675843805074692, -0.0001027379184961319, -9.871739894151688e-05, -9.469687938690186e-05, -9.067635983228683e-05, -8.665584027767181e-05, -8.263532072305679e-05, -7.861480116844177e-05, -7.459428161382675e-05, -7.057376205921173e-05, -6.655324250459671e-05, -6.253272294998169e-05, -5.851220339536667e-05, -5.449168384075165e-05, -5.047116428613663e-05, -4.6450644731521606e-05, -4.2430125176906586e-05, -3.8409605622291565e-05, -3.4389086067676544e-05, -3.0368566513061523e-05, -2.6348046958446503e-05, -2.2327527403831482e-05, -1.830700784921646e-05, -1.428648829460144e-05, -1.026596873998642e-05, -6.245449185371399e-06, -2.224929630756378e-06, 1.7955899238586426e-06, 5.816109478473663e-06, 9.836629033088684e-06, 1.3857148587703705e-05, 1.7877668142318726e-05, 2.1898187696933746e-05, 2.5918707251548767e-05, 2.9939226806163788e-05, 3.395974636077881e-05, 3.798026591539383e-05, 4.200078547000885e-05, 4.602130502462387e-05, 5.004182457923889e-05, 5.406234413385391e-05, 5.808286368846893e-05, 6.210338324308395e-05, 6.612390279769897e-05, 7.0144422352314e-05, 7.416494190692902e-05, 7.818546146154404e-05, 8.220598101615906e-05, 8.622650057077408e-05, 9.02470201253891e-05, 9.426753968000412e-05, 9.828805923461914e-05]}, "gradients/encoder.encoder.layers.22.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 6.0, 6.0, 12.0, 14.0, 26.0, 45.0, 43.0, 92.0, 150.0, 274.0, 539.0, 1174.0, 3070.0, 12045.0, 111530.0, 829849.0, 74278.0, 10219.0, 2799.0, 1131.0, 526.0, 298.0, 154.0, 94.0, 55.0, 40.0, 34.0, 24.0, 12.0, 7.0, 4.0, 4.0, 3.0, 0.0, 3.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.619140625, -0.5915374755859375, -0.563934326171875, -0.5363311767578125, -0.50872802734375, -0.4811248779296875, -0.453521728515625, -0.4259185791015625, -0.3983154296875, -0.3707122802734375, -0.343109130859375, -0.3155059814453125, -0.28790283203125, -0.2602996826171875, -0.232696533203125, -0.2050933837890625, -0.177490234375, -0.1498870849609375, -0.122283935546875, -0.0946807861328125, -0.06707763671875, -0.0394744873046875, -0.011871337890625, 0.0157318115234375, 0.0433349609375, 0.0709381103515625, 0.098541259765625, 0.1261444091796875, 0.15374755859375, 0.1813507080078125, 0.208953857421875, 0.2365570068359375, 0.26416015625, 0.2917633056640625, 0.319366455078125, 0.3469696044921875, 0.37457275390625, 0.4021759033203125, 0.429779052734375, 0.4573822021484375, 0.4849853515625, 0.5125885009765625, 0.540191650390625, 0.5677947998046875, 0.59539794921875, 0.6230010986328125, 0.650604248046875, 0.6782073974609375, 0.705810546875, 0.7334136962890625, 0.761016845703125, 0.7886199951171875, 0.81622314453125, 0.8438262939453125, 0.871429443359375, 0.8990325927734375, 0.9266357421875, 0.9542388916015625, 0.981842041015625, 1.0094451904296875, 1.03704833984375, 1.0646514892578125, 1.092254638671875, 1.1198577880859375, 1.1474609375]}, "gradients/encoder.encoder.layers.22.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 4.0, 11.0, 16.0, 15.0, 26.0, 34.0, 76.0, 87.0, 119.0, 138.0, 128.0, 116.0, 89.0, 45.0, 37.0, 19.0, 13.0, 7.0, 10.0, 7.0, 1.0, 3.0, 1.0, 2.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.257080078125, -0.24400711059570312, -0.23093414306640625, -0.21786117553710938, -0.2047882080078125, -0.19171524047851562, -0.17864227294921875, -0.16556930541992188, -0.152496337890625, -0.13942337036132812, -0.12635040283203125, -0.11327743530273438, -0.1002044677734375, -0.08713150024414062, -0.07405853271484375, -0.060985565185546875, -0.04791259765625, -0.034839630126953125, -0.02176666259765625, -0.008693695068359375, 0.0043792724609375, 0.017452239990234375, 0.03052520751953125, 0.043598175048828125, 0.056671142578125, 0.06974411010742188, 0.08281707763671875, 0.09589004516601562, 0.1089630126953125, 0.12203598022460938, 0.13510894775390625, 0.14818191528320312, 0.1612548828125, 0.17432785034179688, 0.18740081787109375, 0.20047378540039062, 0.2135467529296875, 0.22661972045898438, 0.23969268798828125, 0.2527656555175781, 0.265838623046875, 0.2789115905761719, 0.29198455810546875, 0.3050575256347656, 0.3181304931640625, 0.3312034606933594, 0.34427642822265625, 0.3573493957519531, 0.37042236328125, 0.3834953308105469, 0.39656829833984375, 0.4096412658691406, 0.4227142333984375, 0.4357872009277344, 0.44886016845703125, 0.4619331359863281, 0.475006103515625, 0.4880790710449219, 0.5011520385742188, 0.5142250061035156, 0.5272979736328125, 0.5403709411621094, 0.5534439086914062, 0.5665168762207031, 0.57958984375]}, "gradients/encoder.encoder.layers.22.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 2.0, 5.0, 11.0, 39.0, 127.0, 248.0, 324.0, 152.0, 57.0, 16.0, 6.0, 3.0, 4.0, 1.0, 4.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.7624757289886475, -2.618496894836426, -2.474518299102783, -2.3305397033691406, -2.186560869216919, -2.0425820350646973, -1.8986034393310547, -1.7546247243881226, -1.6106460094451904, -1.4666672945022583, -1.3226885795593262, -1.178709864616394, -1.034731149673462, -0.8907524347305298, -0.7467737197875977, -0.6027950048446655, -0.4588162899017334, -0.31483757495880127, -0.17085886001586914, -0.02688014507293701, 0.11709856986999512, 0.26107728481292725, 0.4050559997558594, 0.5490347146987915, 0.6930134296417236, 0.8369921445846558, 0.9809708595275879, 1.12494957447052, 1.2689282894134521, 1.4129070043563843, 1.5568857192993164, 1.7008644342422485, 1.8448429107666016, 1.9888216257095337, 2.132800340652466, 2.2767791748046875, 2.42075777053833, 2.5647363662719727, 2.7087152004241943, 2.852694034576416, 2.9966726303100586, 3.140651226043701, 3.284630060195923, 3.4286088943481445, 3.572587490081787, 3.7165660858154297, 3.8605449199676514, 4.004523754119873, 4.148502349853516, 4.292480945587158, 4.436459541320801, 4.580438613891602, 4.724417209625244, 4.868395805358887, 5.0123748779296875, 5.15635347366333, 5.300332069396973, 5.444310665130615, 5.588289260864258, 5.732268333435059, 5.876246929168701, 6.020225524902344, 6.1642045974731445, 6.308183193206787, 6.45216178894043]}, "gradients/encoder.encoder.layers.22.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 0.0, 2.0, 5.0, 3.0, 6.0, 7.0, 6.0, 12.0, 14.0, 30.0, 29.0, 37.0, 56.0, 64.0, 81.0, 86.0, 92.0, 95.0, 84.0, 83.0, 47.0, 50.0, 40.0, 21.0, 12.0, 13.0, 9.0, 4.0, 1.0, 8.0, 2.0, 2.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.517001152038574, -2.426503896713257, -2.3360066413879395, -2.245509386062622, -2.1550121307373047, -2.0645151138305664, -1.974017858505249, -1.8835206031799316, -1.7930233478546143, -1.7025260925292969, -1.6120288372039795, -1.5215317010879517, -1.4310344457626343, -1.340537190437317, -1.250040054321289, -1.1595427989959717, -1.0690455436706543, -0.9785482883453369, -0.8880510926246643, -0.7975538969039917, -0.7070566415786743, -0.6165593862533569, -0.5260621905326843, -0.4355649948120117, -0.34506773948669434, -0.25457051396369934, -0.16407328844070435, -0.07357606291770935, 0.016921162605285645, 0.10741838812828064, 0.19791561365127563, 0.28841280937194824, 0.3789100646972656, 0.4694072902202606, 0.5599045157432556, 0.6504017114639282, 0.7408989667892456, 0.831396222114563, 0.9218934178352356, 1.0123906135559082, 1.1028878688812256, 1.193385124206543, 1.2838823795318604, 1.3743795156478882, 1.4648767709732056, 1.555374026298523, 1.6458711624145508, 1.7363684177398682, 1.8268656730651855, 1.917362928390503, 2.0078601837158203, 2.0983574390411377, 2.188854694366455, 2.2793517112731934, 2.3698489665985107, 2.460346221923828, 2.5508434772491455, 2.641340732574463, 2.7318379878997803, 2.8223352432250977, 2.912832260131836, 3.0033295154571533, 3.0938267707824707, 3.184324026107788, 3.2748212814331055]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 4.0, 2.0, 4.0, 4.0, 6.0, 2.0, 2.0, 3.0, 7.0, 11.0, 12.0, 11.0, 45.0, 33.0, 57.0, 68.0, 107.0, 155.0, 215.0, 398.0, 663.0, 1255.0, 2942.0, 8802.0, 40576.0, 3441914.0, 657838.0, 27898.0, 6472.0, 2348.0, 1066.0, 538.0, 293.0, 182.0, 125.0, 75.0, 43.0, 30.0, 20.0, 13.0, 7.0, 6.0, 10.0, 4.0, 9.0, 2.0, 5.0, 0.0, 4.0, 3.0, 2.0, 0.0, 2.0, 0.0, 0.0, 5.0], "bins": [-1.400390625, -1.3590850830078125, -1.317779541015625, -1.2764739990234375, -1.23516845703125, -1.1938629150390625, -1.152557373046875, -1.1112518310546875, -1.0699462890625, -1.0286407470703125, -0.987335205078125, -0.9460296630859375, -0.90472412109375, -0.8634185791015625, -0.822113037109375, -0.7808074951171875, -0.739501953125, -0.6981964111328125, -0.656890869140625, -0.6155853271484375, -0.57427978515625, -0.5329742431640625, -0.491668701171875, -0.4503631591796875, -0.4090576171875, -0.3677520751953125, -0.326446533203125, -0.2851409912109375, -0.24383544921875, -0.2025299072265625, -0.161224365234375, -0.1199188232421875, -0.07861328125, -0.0373077392578125, 0.003997802734375, 0.0453033447265625, 0.08660888671875, 0.1279144287109375, 0.169219970703125, 0.2105255126953125, 0.2518310546875, 0.2931365966796875, 0.334442138671875, 0.3757476806640625, 0.41705322265625, 0.4583587646484375, 0.499664306640625, 0.5409698486328125, 0.582275390625, 0.6235809326171875, 0.664886474609375, 0.7061920166015625, 0.74749755859375, 0.7888031005859375, 0.830108642578125, 0.8714141845703125, 0.9127197265625, 0.9540252685546875, 0.995330810546875, 1.0366363525390625, 1.07794189453125, 1.1192474365234375, 1.160552978515625, 1.2018585205078125, 1.2431640625]}, "gradients/encoder.encoder.layers.21.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 2.0, 1.0, 0.0, 5.0, 2.0, 9.0, 4.0, 4.0, 7.0, 3.0, 14.0, 21.0, 33.0, 33.0, 40.0, 57.0, 67.0, 72.0, 112.0, 112.0, 89.0, 76.0, 69.0, 42.0, 34.0, 17.0, 18.0, 9.0, 10.0, 11.0, 8.0, 4.0, 1.0, 1.0, 1.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 2.0, 1.0, 2.0, 1.0, 1.0, 1.0], "bins": [-0.050140380859375, -0.048745155334472656, -0.04734992980957031, -0.04595470428466797, -0.044559478759765625, -0.04316425323486328, -0.04176902770996094, -0.040373802185058594, -0.03897857666015625, -0.037583351135253906, -0.03618812561035156, -0.03479290008544922, -0.033397674560546875, -0.03200244903564453, -0.030607223510742188, -0.029211997985839844, -0.0278167724609375, -0.026421546936035156, -0.025026321411132812, -0.02363109588623047, -0.022235870361328125, -0.02084064483642578, -0.019445419311523438, -0.018050193786621094, -0.01665496826171875, -0.015259742736816406, -0.013864517211914062, -0.012469291687011719, -0.011074066162109375, -0.009678840637207031, -0.008283615112304688, -0.006888389587402344, -0.0054931640625, -0.004097938537597656, -0.0027027130126953125, -0.0013074874877929688, 8.7738037109375e-05, 0.0014829635620117188, 0.0028781890869140625, 0.004273414611816406, 0.00566864013671875, 0.007063865661621094, 0.008459091186523438, 0.009854316711425781, 0.011249542236328125, 0.012644767761230469, 0.014039993286132812, 0.015435218811035156, 0.0168304443359375, 0.018225669860839844, 0.019620895385742188, 0.02101612091064453, 0.022411346435546875, 0.02380657196044922, 0.025201797485351562, 0.026597023010253906, 0.02799224853515625, 0.029387474060058594, 0.030782699584960938, 0.03217792510986328, 0.033573150634765625, 0.03496837615966797, 0.03636360168457031, 0.037758827209472656, 0.039154052734375]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 2.0, 23.0, 33.0, 108.0, 603.0, 35956.0, 4151394.0, 5754.0, 304.0, 71.0, 28.0, 9.0, 2.0, 2.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.115234375, -1.993194580078125, -1.87115478515625, -1.749114990234375, -1.6270751953125, -1.505035400390625, -1.38299560546875, -1.260955810546875, -1.138916015625, -1.016876220703125, -0.89483642578125, -0.772796630859375, -0.6507568359375, -0.528717041015625, -0.40667724609375, -0.284637451171875, -0.16259765625, -0.040557861328125, 0.08148193359375, 0.203521728515625, 0.3255615234375, 0.447601318359375, 0.56964111328125, 0.691680908203125, 0.813720703125, 0.935760498046875, 1.05780029296875, 1.179840087890625, 1.3018798828125, 1.423919677734375, 1.54595947265625, 1.667999267578125, 1.7900390625, 1.912078857421875, 2.03411865234375, 2.156158447265625, 2.2781982421875, 2.400238037109375, 2.52227783203125, 2.644317626953125, 2.766357421875, 2.888397216796875, 3.01043701171875, 3.132476806640625, 3.2545166015625, 3.376556396484375, 3.49859619140625, 3.620635986328125, 3.74267578125, 3.864715576171875, 3.98675537109375, 4.108795166015625, 4.2308349609375, 4.352874755859375, 4.47491455078125, 4.596954345703125, 4.718994140625, 4.841033935546875, 4.96307373046875, 5.085113525390625, 5.2071533203125, 5.329193115234375, 5.45123291015625, 5.573272705078125, 5.6953125]}, "gradients/encoder.encoder.layers.21.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 3.0, 5.0, 4.0, 4.0, 7.0, 8.0, 7.0, 4.0, 12.0, 13.0, 26.0, 29.0, 30.0, 62.0, 84.0, 119.0, 226.0, 477.0, 1287.0, 803.0, 326.0, 188.0, 118.0, 76.0, 34.0, 40.0, 25.0, 17.0, 15.0, 4.0, 4.0, 2.0, 5.0, 1.0, 5.0, 4.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.08917236328125, -0.08596038818359375, -0.0827484130859375, -0.07953643798828125, -0.076324462890625, -0.07311248779296875, -0.0699005126953125, -0.06668853759765625, -0.0634765625, -0.06026458740234375, -0.0570526123046875, -0.05384063720703125, -0.050628662109375, -0.04741668701171875, -0.0442047119140625, -0.04099273681640625, -0.03778076171875, -0.03456878662109375, -0.0313568115234375, -0.02814483642578125, -0.024932861328125, -0.02172088623046875, -0.0185089111328125, -0.01529693603515625, -0.0120849609375, -0.00887298583984375, -0.0056610107421875, -0.00244903564453125, 0.000762939453125, 0.00397491455078125, 0.0071868896484375, 0.01039886474609375, 0.01361083984375, 0.01682281494140625, 0.0200347900390625, 0.02324676513671875, 0.026458740234375, 0.02967071533203125, 0.0328826904296875, 0.03609466552734375, 0.039306640625, 0.04251861572265625, 0.0457305908203125, 0.04894256591796875, 0.052154541015625, 0.05536651611328125, 0.0585784912109375, 0.06179046630859375, 0.06500244140625, 0.06821441650390625, 0.0714263916015625, 0.07463836669921875, 0.077850341796875, 0.08106231689453125, 0.0842742919921875, 0.08748626708984375, 0.0906982421875, 0.09391021728515625, 0.0971221923828125, 0.10033416748046875, 0.103546142578125, 0.10675811767578125, 0.1099700927734375, 0.11318206787109375, 0.11639404296875]}, "gradients/encoder.encoder.layers.21.final_layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 4.0, 17.0, 797.0, 195.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.9089664220809937, -1.66550612449646, -1.4220457077026367, -1.1785852909088135, -0.9351249933242798, -0.6916645765304565, -0.44820427894592285, -0.20474398136138916, 0.03871643543243408, 0.28217679262161255, 0.525637149810791, 0.7690975069999695, 1.012557864189148, 1.2560182809829712, 1.4994785785675049, 1.7429388761520386, 1.9863992929458618, 2.2298595905303955, 2.4733200073242188, 2.716780424118042, 2.9602408409118652, 3.2037010192871094, 3.4471614360809326, 3.690621852874756, 3.93408203125, 4.177542209625244, 4.4210028648376465, 4.664463043212891, 4.907923698425293, 5.151383876800537, 5.394844055175781, 5.638304710388184, 5.881765365600586, 6.12522554397583, 6.368686199188232, 6.612146377563477, 6.855607032775879, 7.099067211151123, 7.342527389526367, 7.5859880447387695, 7.829448223114014, 8.072908401489258, 8.31636905670166, 8.559829711914062, 8.803289413452148, 9.04675006866455, 9.290210723876953, 9.533670425415039, 9.777131080627441, 10.020591735839844, 10.26405143737793, 10.507512092590332, 10.750972747802734, 10.99443244934082, 11.237893104553223, 11.481353759765625, 11.724813461303711, 11.968274116516113, 12.2117338180542, 12.455194473266602, 12.698655128479004, 12.942115783691406, 13.185575485229492, 13.429036140441895, 13.672496795654297]}, "gradients/encoder.encoder.layers.21.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 7.0, 6.0, 8.0, 20.0, 36.0, 56.0, 98.0, 117.0, 129.0, 152.0, 116.0, 116.0, 70.0, 36.0, 19.0, 11.0, 7.0, 8.0, 3.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.4736161231994629, -0.4380244314670563, -0.40243270993232727, -0.36684101819992065, -0.33124929666519165, -0.29565760493278503, -0.2600659132003784, -0.2244742065668106, -0.1888824999332428, -0.153290793299675, -0.11769909411668777, -0.08210739493370056, -0.04651568830013275, -0.010923981666564941, 0.024667710065841675, 0.060259416699409485, 0.0958511233329773, 0.1314428299665451, 0.16703453660011292, 0.20262622833251953, 0.23821793496608734, 0.27380964159965515, 0.30940133333206177, 0.34499305486679077, 0.3805847465991974, 0.416176438331604, 0.451768159866333, 0.4873598515987396, 0.5229515433311462, 0.5585432648658752, 0.5941349267959595, 0.6297266483306885, 0.6653183698654175, 0.7009100914001465, 0.7365017533302307, 0.7720934748649597, 0.8076851963996887, 0.843276858329773, 0.878868579864502, 0.914460301399231, 0.95005202293396, 0.985643744468689, 1.021235466003418, 1.0568270683288574, 1.0924187898635864, 1.1280105113983154, 1.1636022329330444, 1.1991939544677734, 1.234785556793213, 1.270377278327942, 1.305968999862671, 1.3415606021881104, 1.3771523237228394, 1.4127440452575684, 1.4483357667922974, 1.4839274883270264, 1.5195192098617554, 1.5551109313964844, 1.5907026529312134, 1.6262943744659424, 1.6618859767913818, 1.6974776983261108, 1.7330694198608398, 1.7686611413955688, 1.8042528629302979]}, "gradients/encoder.encoder.layers.21.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 6.0, 4.0, 4.0, 3.0, 9.0, 7.0, 10.0, 12.0, 21.0, 22.0, 21.0, 33.0, 30.0, 25.0, 36.0, 36.0, 38.0, 58.0, 249.0, 6277.0, 975793.0, 64667.0, 738.0, 81.0, 53.0, 46.0, 39.0, 27.0, 42.0, 27.0, 30.0, 20.0, 19.0, 11.0, 10.0, 12.0, 7.0, 6.0, 7.0, 3.0, 5.0, 2.0, 5.0, 2.0, 2.0, 3.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.365234375, -2.297088623046875, -2.22894287109375, -2.160797119140625, -2.0926513671875, -2.024505615234375, -1.95635986328125, -1.888214111328125, -1.820068359375, -1.751922607421875, -1.68377685546875, -1.615631103515625, -1.5474853515625, -1.479339599609375, -1.41119384765625, -1.343048095703125, -1.27490234375, -1.206756591796875, -1.13861083984375, -1.070465087890625, -1.0023193359375, -0.934173583984375, -0.86602783203125, -0.797882080078125, -0.729736328125, -0.661590576171875, -0.59344482421875, -0.525299072265625, -0.4571533203125, -0.389007568359375, -0.32086181640625, -0.252716064453125, -0.1845703125, -0.116424560546875, -0.04827880859375, 0.019866943359375, 0.0880126953125, 0.156158447265625, 0.22430419921875, 0.292449951171875, 0.360595703125, 0.428741455078125, 0.49688720703125, 0.565032958984375, 0.6331787109375, 0.701324462890625, 0.76947021484375, 0.837615966796875, 0.90576171875, 0.973907470703125, 1.04205322265625, 1.110198974609375, 1.1783447265625, 1.246490478515625, 1.31463623046875, 1.382781982421875, 1.450927734375, 1.519073486328125, 1.58721923828125, 1.655364990234375, 1.7235107421875, 1.791656494140625, 1.85980224609375, 1.927947998046875, 1.99609375]}, "gradients/encoder.encoder.layers.21.attention.out_proj.bias": {"_type": "histogram", "values": [4.0, 3.0, 11.0, 65.0, 233.0, 395.0, 241.0, 52.0, 14.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.041717529296875, -0.03418397903442383, -0.026650428771972656, -0.019116878509521484, -0.011583328247070312, -0.004049777984619141, 0.0034837722778320312, 0.011017322540283203, 0.018550872802734375, 0.026084423065185547, 0.03361797332763672, 0.04115152359008789, 0.04868507385253906, 0.056218624114990234, 0.0637521743774414, 0.07128572463989258, 0.07881927490234375, 0.08635282516479492, 0.0938863754272461, 0.10141992568969727, 0.10895347595214844, 0.11648702621459961, 0.12402057647705078, 0.13155412673950195, 0.13908767700195312, 0.1466212272644043, 0.15415477752685547, 0.16168832778930664, 0.1692218780517578, 0.17675542831420898, 0.18428897857666016, 0.19182252883911133, 0.1993560791015625, 0.20688962936401367, 0.21442317962646484, 0.22195672988891602, 0.2294902801513672, 0.23702383041381836, 0.24455738067626953, 0.2520909309387207, 0.2596244812011719, 0.26715803146362305, 0.2746915817260742, 0.2822251319885254, 0.28975868225097656, 0.29729223251342773, 0.3048257827758789, 0.3123593330383301, 0.31989288330078125, 0.3274264335632324, 0.3349599838256836, 0.34249353408813477, 0.35002708435058594, 0.3575606346130371, 0.3650941848754883, 0.37262773513793945, 0.3801612854003906, 0.3876948356628418, 0.39522838592529297, 0.40276193618774414, 0.4102954864501953, 0.4178290367126465, 0.42536258697509766, 0.43289613723754883, 0.4404296875]}, "gradients/encoder.encoder.layers.21.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 3.0, 6.0, 2.0, 8.0, 7.0, 13.0, 12.0, 19.0, 21.0, 45.0, 54.0, 70.0, 105.0, 197.0, 333.0, 706.0, 1776.0, 6284.0, 30119.0, 215130.0, 614218.0, 149105.0, 22351.0, 4973.0, 1529.0, 628.0, 289.0, 187.0, 114.0, 82.0, 39.0, 34.0, 32.0, 9.0, 16.0, 9.0, 7.0, 7.0, 6.0, 5.0, 3.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0], "bins": [-0.77880859375, -0.757415771484375, -0.73602294921875, -0.714630126953125, -0.6932373046875, -0.671844482421875, -0.65045166015625, -0.629058837890625, -0.607666015625, -0.586273193359375, -0.56488037109375, -0.543487548828125, -0.5220947265625, -0.500701904296875, -0.47930908203125, -0.457916259765625, -0.4365234375, -0.415130615234375, -0.39373779296875, -0.372344970703125, -0.3509521484375, -0.329559326171875, -0.30816650390625, -0.286773681640625, -0.265380859375, -0.243988037109375, -0.22259521484375, -0.201202392578125, -0.1798095703125, -0.158416748046875, -0.13702392578125, -0.115631103515625, -0.09423828125, -0.072845458984375, -0.05145263671875, -0.030059814453125, -0.0086669921875, 0.012725830078125, 0.03411865234375, 0.055511474609375, 0.076904296875, 0.098297119140625, 0.11968994140625, 0.141082763671875, 0.1624755859375, 0.183868408203125, 0.20526123046875, 0.226654052734375, 0.248046875, 0.269439697265625, 0.29083251953125, 0.312225341796875, 0.3336181640625, 0.355010986328125, 0.37640380859375, 0.397796630859375, 0.419189453125, 0.440582275390625, 0.46197509765625, 0.483367919921875, 0.5047607421875, 0.526153564453125, 0.54754638671875, 0.568939208984375, 0.59033203125]}, "gradients/encoder.encoder.layers.21.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 4.0, 3.0, 6.0, 5.0, 10.0, 10.0, 14.0, 6.0, 10.0, 21.0, 28.0, 28.0, 29.0, 40.0, 34.0, 32.0, 53.0, 58.0, 48.0, 55.0, 64.0, 62.0, 49.0, 44.0, 43.0, 40.0, 35.0, 28.0, 19.0, 27.0, 21.0, 10.0, 16.0, 11.0, 12.0, 9.0, 5.0, 3.0, 4.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.3740234375, -0.3628807067871094, -0.35173797607421875, -0.3405952453613281, -0.3294525146484375, -0.3183097839355469, -0.30716705322265625, -0.2960243225097656, -0.284881591796875, -0.2737388610839844, -0.26259613037109375, -0.2514533996582031, -0.2403106689453125, -0.22916793823242188, -0.21802520751953125, -0.20688247680664062, -0.19573974609375, -0.18459701538085938, -0.17345428466796875, -0.16231155395507812, -0.1511688232421875, -0.14002609252929688, -0.12888336181640625, -0.11774063110351562, -0.106597900390625, -0.09545516967773438, -0.08431243896484375, -0.07316970825195312, -0.0620269775390625, -0.050884246826171875, -0.03974151611328125, -0.028598785400390625, -0.0174560546875, -0.006313323974609375, 0.00482940673828125, 0.015972137451171875, 0.0271148681640625, 0.038257598876953125, 0.04940032958984375, 0.060543060302734375, 0.071685791015625, 0.08282852172851562, 0.09397125244140625, 0.10511398315429688, 0.1162567138671875, 0.12739944458007812, 0.13854217529296875, 0.14968490600585938, 0.16082763671875, 0.17197036743164062, 0.18311309814453125, 0.19425582885742188, 0.2053985595703125, 0.21654129028320312, 0.22768402099609375, 0.23882675170898438, 0.249969482421875, 0.2611122131347656, 0.27225494384765625, 0.2833976745605469, 0.2945404052734375, 0.3056831359863281, 0.31682586669921875, 0.3279685974121094, 0.339111328125]}, "gradients/encoder.encoder.layers.21.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 7.0, 2.0, 6.0, 6.0, 7.0, 11.0, 32.0, 48.0, 73.0, 111.0, 183.0, 300.0, 654.0, 1550.0, 4727.0, 22359.0, 189351.0, 677973.0, 127990.0, 16622.0, 3910.0, 1369.0, 563.0, 275.0, 156.0, 76.0, 56.0, 49.0, 28.0, 18.0, 5.0, 15.0, 8.0, 7.0, 4.0, 5.0, 3.0, 1.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.496337890625, -0.4794654846191406, -0.46259307861328125, -0.4457206726074219, -0.4288482666015625, -0.4119758605957031, -0.39510345458984375, -0.3782310485839844, -0.361358642578125, -0.3444862365722656, -0.32761383056640625, -0.3107414245605469, -0.2938690185546875, -0.2769966125488281, -0.26012420654296875, -0.24325180053710938, -0.22637939453125, -0.20950698852539062, -0.19263458251953125, -0.17576217651367188, -0.1588897705078125, -0.14201736450195312, -0.12514495849609375, -0.10827255249023438, -0.091400146484375, -0.07452774047851562, -0.05765533447265625, -0.040782928466796875, -0.0239105224609375, -0.007038116455078125, 0.00983428955078125, 0.026706695556640625, 0.0435791015625, 0.060451507568359375, 0.07732391357421875, 0.09419631958007812, 0.1110687255859375, 0.12794113159179688, 0.14481353759765625, 0.16168594360351562, 0.178558349609375, 0.19543075561523438, 0.21230316162109375, 0.22917556762695312, 0.2460479736328125, 0.2629203796386719, 0.27979278564453125, 0.2966651916503906, 0.31353759765625, 0.3304100036621094, 0.34728240966796875, 0.3641548156738281, 0.3810272216796875, 0.3978996276855469, 0.41477203369140625, 0.4316444396972656, 0.448516845703125, 0.4653892517089844, 0.48226165771484375, 0.4991340637207031, 0.5160064697265625, 0.5328788757324219, 0.5497512817382812, 0.5666236877441406, 0.58349609375]}, "gradients/encoder.encoder.layers.21.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 2.0, 3.0, 2.0, 6.0, 8.0, 13.0, 28.0, 40.0, 46.0, 63.0, 72.0, 109.0, 108.0, 115.0, 91.0, 94.0, 65.0, 33.0, 35.0, 23.0, 16.0, 14.0, 6.0, 5.0, 7.0, 2.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-7.009506225585938e-05, -6.834324449300766e-05, -6.659142673015594e-05, -6.483960896730423e-05, -6.308779120445251e-05, -6.13359734416008e-05, -5.9584155678749084e-05, -5.783233791589737e-05, -5.6080520153045654e-05, -5.432870239019394e-05, -5.2576884627342224e-05, -5.082506686449051e-05, -4.9073249101638794e-05, -4.732143133878708e-05, -4.5569613575935364e-05, -4.381779581308365e-05, -4.2065978050231934e-05, -4.031416028738022e-05, -3.8562342524528503e-05, -3.681052476167679e-05, -3.505870699882507e-05, -3.330688923597336e-05, -3.155507147312164e-05, -2.9803253710269928e-05, -2.8051435947418213e-05, -2.6299618184566498e-05, -2.4547800421714783e-05, -2.2795982658863068e-05, -2.1044164896011353e-05, -1.9292347133159637e-05, -1.7540529370307922e-05, -1.5788711607456207e-05, -1.4036893844604492e-05, -1.2285076081752777e-05, -1.0533258318901062e-05, -8.781440556049347e-06, -7.029622793197632e-06, -5.277805030345917e-06, -3.5259872674942017e-06, -1.7741695046424866e-06, -2.2351741790771484e-08, 1.7294660210609436e-06, 3.4812837839126587e-06, 5.233101546764374e-06, 6.984919309616089e-06, 8.736737072467804e-06, 1.0488554835319519e-05, 1.2240372598171234e-05, 1.399219036102295e-05, 1.5744008123874664e-05, 1.749582588672638e-05, 1.9247643649578094e-05, 2.099946141242981e-05, 2.2751279175281525e-05, 2.450309693813324e-05, 2.6254914700984955e-05, 2.800673246383667e-05, 2.9758550226688385e-05, 3.15103679895401e-05, 3.3262185752391815e-05, 3.501400351524353e-05, 3.6765821278095245e-05, 3.851763904094696e-05, 4.0269456803798676e-05, 4.202127456665039e-05]}, "gradients/encoder.encoder.layers.21.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 6.0, 8.0, 20.0, 20.0, 30.0, 61.0, 178.0, 410.0, 1217.0, 6162.0, 171451.0, 839457.0, 26074.0, 2359.0, 670.0, 209.0, 108.0, 52.0, 31.0, 10.0, 8.0, 7.0, 3.0, 6.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.1455078125, -1.113922119140625, -1.08233642578125, -1.050750732421875, -1.0191650390625, -0.987579345703125, -0.95599365234375, -0.924407958984375, -0.892822265625, -0.861236572265625, -0.82965087890625, -0.798065185546875, -0.7664794921875, -0.734893798828125, -0.70330810546875, -0.671722412109375, -0.64013671875, -0.608551025390625, -0.57696533203125, -0.545379638671875, -0.5137939453125, -0.482208251953125, -0.45062255859375, -0.419036865234375, -0.387451171875, -0.355865478515625, -0.32427978515625, -0.292694091796875, -0.2611083984375, -0.229522705078125, -0.19793701171875, -0.166351318359375, -0.134765625, -0.103179931640625, -0.07159423828125, -0.040008544921875, -0.0084228515625, 0.023162841796875, 0.05474853515625, 0.086334228515625, 0.117919921875, 0.149505615234375, 0.18109130859375, 0.212677001953125, 0.2442626953125, 0.275848388671875, 0.30743408203125, 0.339019775390625, 0.37060546875, 0.402191162109375, 0.43377685546875, 0.465362548828125, 0.4969482421875, 0.528533935546875, 0.56011962890625, 0.591705322265625, 0.623291015625, 0.654876708984375, 0.68646240234375, 0.718048095703125, 0.7496337890625, 0.781219482421875, 0.81280517578125, 0.844390869140625, 0.8759765625]}, "gradients/encoder.encoder.layers.21.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 3.0, 6.0, 5.0, 5.0, 12.0, 23.0, 26.0, 40.0, 69.0, 97.0, 140.0, 144.0, 152.0, 98.0, 76.0, 41.0, 30.0, 12.0, 11.0, 11.0, 7.0, 1.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.468505859375, -0.4566841125488281, -0.44486236572265625, -0.4330406188964844, -0.4212188720703125, -0.4093971252441406, -0.39757537841796875, -0.3857536315917969, -0.373931884765625, -0.3621101379394531, -0.35028839111328125, -0.3384666442871094, -0.3266448974609375, -0.3148231506347656, -0.30300140380859375, -0.2911796569824219, -0.27935791015625, -0.2675361633300781, -0.25571441650390625, -0.24389266967773438, -0.2320709228515625, -0.22024917602539062, -0.20842742919921875, -0.19660568237304688, -0.184783935546875, -0.17296218872070312, -0.16114044189453125, -0.14931869506835938, -0.1374969482421875, -0.12567520141601562, -0.11385345458984375, -0.10203170776367188, -0.0902099609375, -0.07838821411132812, -0.06656646728515625, -0.054744720458984375, -0.0429229736328125, -0.031101226806640625, -0.01927947998046875, -0.007457733154296875, 0.004364013671875, 0.016185760498046875, 0.02800750732421875, 0.039829254150390625, 0.0516510009765625, 0.06347274780273438, 0.07529449462890625, 0.08711624145507812, 0.09893798828125, 0.11075973510742188, 0.12258148193359375, 0.13440322875976562, 0.1462249755859375, 0.15804672241210938, 0.16986846923828125, 0.18169021606445312, 0.193511962890625, 0.20533370971679688, 0.21715545654296875, 0.22897720336914062, 0.2407989501953125, 0.2526206970214844, 0.26444244384765625, 0.2762641906738281, 0.2880859375]}, "gradients/encoder.encoder.layers.21.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 2.0, 8.0, 5.0, 13.0, 44.0, 478.0, 453.0, 10.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.3227763175964355, -6.718204498291016, -6.1136322021484375, -5.509060382843018, -4.904488563537598, -4.299916744232178, -3.6953446865081787, -3.0907726287841797, -2.4862008094787598, -1.8816288709640503, -1.2770569324493408, -0.6724849939346313, -0.06791305541992188, 0.536658763885498, 1.141230821609497, 1.745802879333496, 2.350374698638916, 2.954946517944336, 3.559518575668335, 4.164090633392334, 4.768662452697754, 5.373234272003174, 5.977806091308594, 6.582378387451172, 7.186950206756592, 7.791522026062012, 8.39609432220459, 9.000665664672852, 9.60523796081543, 10.209810256958008, 10.81438159942627, 11.418953895568848, 12.02352523803711, 12.628097534179688, 13.23266887664795, 13.837241172790527, 14.441812515258789, 15.046384811401367, 15.650957107543945, 16.255529403686523, 16.86009979248047, 17.464672088623047, 18.069244384765625, 18.67381477355957, 19.27838706970215, 19.882959365844727, 20.487531661987305, 21.092103958129883, 21.69667625427246, 22.30124855041504, 22.905820846557617, 23.510391235351562, 24.11496353149414, 24.71953582763672, 25.324108123779297, 25.928680419921875, 26.533252716064453, 27.13782501220703, 27.74239730834961, 28.346967697143555, 28.951539993286133, 29.55611228942871, 30.16068458557129, 30.765256881713867, 31.369827270507812]}, "gradients/encoder.encoder.layers.21.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 2.0, 1.0, 3.0, 6.0, 7.0, 7.0, 5.0, 11.0, 22.0, 19.0, 30.0, 23.0, 30.0, 32.0, 46.0, 36.0, 42.0, 58.0, 53.0, 62.0, 54.0, 53.0, 55.0, 55.0, 57.0, 33.0, 31.0, 41.0, 22.0, 22.0, 23.0, 16.0, 9.0, 10.0, 7.0, 4.0, 8.0, 8.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.47566556930542, -2.390188217163086, -2.304711103439331, -2.219233751296997, -2.133756637573242, -2.048279285430908, -1.9628020524978638, -1.8773248195648193, -1.791847586631775, -1.7063703536987305, -1.620893120765686, -1.5354158878326416, -1.4499385356903076, -1.3644614219665527, -1.2789840698242188, -1.1935068368911743, -1.1080296039581299, -1.0225523710250854, -0.937075138092041, -0.8515978455543518, -0.7661206126213074, -0.6806433796882629, -0.5951660871505737, -0.5096888542175293, -0.42421162128448486, -0.33873438835144043, -0.2532571256160736, -0.1677798628807068, -0.08230262994766235, 0.00317460298538208, 0.08865189552307129, 0.17412912845611572, 0.25960612297058105, 0.3450833559036255, 0.4305606186389923, 0.5160378813743591, 0.6015151143074036, 0.686992347240448, 0.7724696397781372, 0.8579468727111816, 0.9434241056442261, 1.0289013385772705, 1.114378571510315, 1.1998558044433594, 1.2853331565856934, 1.3708102703094482, 1.4562876224517822, 1.5417648553848267, 1.627242088317871, 1.7127193212509155, 1.79819655418396, 1.883673906326294, 1.9691510200500488, 2.054628372192383, 2.140105724334717, 2.2255828380584717, 2.3110599517822266, 2.3965373039245605, 2.4820144176483154, 2.5674917697906494, 2.6529688835144043, 2.7384462356567383, 2.8239235877990723, 2.909400701522827, 2.994878053665161]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 3.0, 4.0, 18.0, 44.0, 128.0, 2340.0, 4188016.0, 2887.0, 470.0, 184.0, 91.0, 43.0, 31.0, 17.0, 6.0, 5.0, 6.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.08203125, -2.75799560546875, -2.4339599609375, -2.10992431640625, -1.785888671875, -1.46185302734375, -1.1378173828125, -0.81378173828125, -0.48974609375, -0.16571044921875, 0.1583251953125, 0.48236083984375, 0.806396484375, 1.13043212890625, 1.4544677734375, 1.77850341796875, 2.1025390625, 2.42657470703125, 2.7506103515625, 3.07464599609375, 3.398681640625, 3.72271728515625, 4.0467529296875, 4.37078857421875, 4.69482421875, 5.01885986328125, 5.3428955078125, 5.66693115234375, 5.990966796875, 6.31500244140625, 6.6390380859375, 6.96307373046875, 7.287109375, 7.61114501953125, 7.9351806640625, 8.25921630859375, 8.583251953125, 8.90728759765625, 9.2313232421875, 9.55535888671875, 9.87939453125, 10.20343017578125, 10.5274658203125, 10.85150146484375, 11.175537109375, 11.49957275390625, 11.8236083984375, 12.14764404296875, 12.4716796875, 12.79571533203125, 13.1197509765625, 13.44378662109375, 13.767822265625, 14.09185791015625, 14.4158935546875, 14.73992919921875, 15.06396484375, 15.38800048828125, 15.7120361328125, 16.03607177734375, 16.360107421875, 16.68414306640625, 17.0081787109375, 17.33221435546875, 17.65625]}, "gradients/encoder.encoder.layers.20.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 4.0, 6.0, 22.0, 54.0, 131.0, 247.0, 293.0, 151.0, 70.0, 28.0, 8.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.08056640625, -0.07173919677734375, -0.0629119873046875, -0.05408477783203125, -0.045257568359375, -0.03643035888671875, -0.0276031494140625, -0.01877593994140625, -0.00994873046875, -0.00112152099609375, 0.0077056884765625, 0.01653289794921875, 0.025360107421875, 0.03418731689453125, 0.0430145263671875, 0.05184173583984375, 0.0606689453125, 0.06949615478515625, 0.0783233642578125, 0.08715057373046875, 0.095977783203125, 0.10480499267578125, 0.1136322021484375, 0.12245941162109375, 0.13128662109375, 0.14011383056640625, 0.1489410400390625, 0.15776824951171875, 0.166595458984375, 0.17542266845703125, 0.1842498779296875, 0.19307708740234375, 0.201904296875, 0.21073150634765625, 0.2195587158203125, 0.22838592529296875, 0.237213134765625, 0.24604034423828125, 0.2548675537109375, 0.26369476318359375, 0.27252197265625, 0.28134918212890625, 0.2901763916015625, 0.29900360107421875, 0.307830810546875, 0.31665802001953125, 0.3254852294921875, 0.33431243896484375, 0.3431396484375, 0.35196685791015625, 0.3607940673828125, 0.36962127685546875, 0.378448486328125, 0.38727569580078125, 0.3961029052734375, 0.40493011474609375, 0.41375732421875, 0.42258453369140625, 0.4314117431640625, 0.44023895263671875, 0.449066162109375, 0.45789337158203125, 0.4667205810546875, 0.47554779052734375, 0.484375]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 17.0, 44.0, 92.0, 142.0, 308.0, 20444.0, 4172240.0, 421.0, 236.0, 166.0, 102.0, 56.0, 20.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-14.3828125, -13.7864990234375, -13.190185546875, -12.5938720703125, -11.99755859375, -11.4012451171875, -10.804931640625, -10.2086181640625, -9.6123046875, -9.0159912109375, -8.419677734375, -7.8233642578125, -7.22705078125, -6.6307373046875, -6.034423828125, -5.4381103515625, -4.841796875, -4.2454833984375, -3.649169921875, -3.0528564453125, -2.45654296875, -1.8602294921875, -1.263916015625, -0.6676025390625, -0.0712890625, 0.5250244140625, 1.121337890625, 1.7176513671875, 2.31396484375, 2.9102783203125, 3.506591796875, 4.1029052734375, 4.69921875, 5.2955322265625, 5.891845703125, 6.4881591796875, 7.08447265625, 7.6807861328125, 8.277099609375, 8.8734130859375, 9.4697265625, 10.0660400390625, 10.662353515625, 11.2586669921875, 11.85498046875, 12.4512939453125, 13.047607421875, 13.6439208984375, 14.240234375, 14.8365478515625, 15.432861328125, 16.0291748046875, 16.62548828125, 17.2218017578125, 17.818115234375, 18.4144287109375, 19.0107421875, 19.6070556640625, 20.203369140625, 20.7996826171875, 21.39599609375, 21.9923095703125, 22.588623046875, 23.1849365234375, 23.78125]}, "gradients/encoder.encoder.layers.20.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 9.0, 18.0, 75.0, 3051.0, 913.0, 19.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6337890625, -0.5805206298828125, -0.527252197265625, -0.4739837646484375, -0.42071533203125, -0.3674468994140625, -0.314178466796875, -0.2609100341796875, -0.2076416015625, -0.1543731689453125, -0.101104736328125, -0.0478363037109375, 0.00543212890625, 0.0587005615234375, 0.111968994140625, 0.1652374267578125, 0.218505859375, 0.2717742919921875, 0.325042724609375, 0.3783111572265625, 0.43157958984375, 0.4848480224609375, 0.538116455078125, 0.5913848876953125, 0.6446533203125, 0.6979217529296875, 0.751190185546875, 0.8044586181640625, 0.85772705078125, 0.9109954833984375, 0.964263916015625, 1.0175323486328125, 1.07080078125, 1.1240692138671875, 1.177337646484375, 1.2306060791015625, 1.28387451171875, 1.3371429443359375, 1.390411376953125, 1.4436798095703125, 1.4969482421875, 1.5502166748046875, 1.603485107421875, 1.6567535400390625, 1.71002197265625, 1.7632904052734375, 1.816558837890625, 1.8698272705078125, 1.923095703125, 1.9763641357421875, 2.029632568359375, 2.0829010009765625, 2.13616943359375, 2.1894378662109375, 2.242706298828125, 2.2959747314453125, 2.3492431640625, 2.4025115966796875, 2.455780029296875, 2.5090484619140625, 2.56231689453125, 2.6155853271484375, 2.668853759765625, 2.7221221923828125, 2.775390625]}, "gradients/encoder.encoder.layers.20.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 1.0, 1.0, 9.0, 75.0, 846.0, 74.0, 8.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.254074573516846, -5.424280166625977, -4.594485282897949, -3.76469087600708, -2.934896469116211, -2.105102062225342, -1.2753071784973145, -0.4455127716064453, 0.38428163528442383, 1.2140761613845825, 2.043870687484741, 2.8736653327941895, 3.7034597396850586, 4.533254146575928, 5.363049030303955, 6.192843437194824, 7.022637844085693, 7.8524322509765625, 8.68222713470459, 9.512022018432617, 10.341815948486328, 11.171609878540039, 12.001405715942383, 12.831199645996094, 13.660993576049805, 14.490788459777832, 15.320582389831543, 16.15037727355957, 16.98017120361328, 17.809967041015625, 18.639760971069336, 19.469554901123047, 20.29935073852539, 21.1291446685791, 21.958940505981445, 22.788734436035156, 23.618528366088867, 24.448322296142578, 25.278118133544922, 26.107912063598633, 26.937705993652344, 27.767499923706055, 28.5972957611084, 29.42708969116211, 30.25688362121582, 31.08667755126953, 31.916473388671875, 32.74626922607422, 33.57606506347656, 34.405860900878906, 35.235652923583984, 36.06544876098633, 36.89524459838867, 37.72503662109375, 38.554832458496094, 39.38462829589844, 40.214420318603516, 41.04421615600586, 41.87400817871094, 42.70380401611328, 43.533599853515625, 44.3633918762207, 45.19318771362305, 46.02298355102539, 46.85277557373047]}, "gradients/encoder.encoder.layers.20.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 5.0, 14.0, 17.0, 43.0, 78.0, 102.0, 146.0, 155.0, 157.0, 120.0, 78.0, 40.0, 26.0, 15.0, 5.0, 4.0, 1.0, 1.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.333023071289062, -9.049577713012695, -8.766131401062012, -8.482686042785645, -8.199240684509277, -7.915794849395752, -7.632349014282227, -7.348903656005859, -7.065457820892334, -6.782011985778809, -6.498566627502441, -6.215120792388916, -5.931674957275391, -5.648229598999023, -5.364783763885498, -5.081337928771973, -4.7978925704956055, -4.51444673538208, -4.231001377105713, -3.9475555419921875, -3.664109945297241, -3.380664348602295, -3.0972185134887695, -2.8137729167938232, -2.530327320098877, -2.2468817234039307, -1.9634360074996948, -1.679990291595459, -1.3965446949005127, -1.1130990982055664, -0.8296533823013306, -0.5462076663970947, -0.26276111602783203, 0.020684540271759033, 0.3041301965713501, 0.5875758528709412, 0.8710215091705322, 1.1544671058654785, 1.4379128217697144, 1.7213585376739502, 2.0048041343688965, 2.2882497310638428, 2.571695327758789, 2.8551411628723145, 3.1385867595672607, 3.422032356262207, 3.7054781913757324, 3.9889237880706787, 4.272369384765625, 4.55581521987915, 4.839260578155518, 5.122706413269043, 5.40615177154541, 5.6895976066589355, 5.973043441772461, 6.256488800048828, 6.5399346351623535, 6.823380470275879, 7.106825828552246, 7.3902716636657715, 7.673717498779297, 7.957162857055664, 8.240608215332031, 8.524054527282715, 8.807499885559082]}, "gradients/encoder.encoder.layers.20.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 5.0, 1.0, 1.0, 6.0, 5.0, 16.0, 14.0, 12.0, 19.0, 20.0, 27.0, 47.0, 61.0, 106.0, 198.0, 360.0, 801.0, 2297.0, 13698.0, 320257.0, 682960.0, 22454.0, 3287.0, 954.0, 413.0, 182.0, 122.0, 80.0, 46.0, 34.0, 24.0, 18.0, 11.0, 6.0, 3.0, 4.0, 5.0, 2.0, 5.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0], "bins": [-3.8828125, -3.7752685546875, -3.667724609375, -3.5601806640625, -3.45263671875, -3.3450927734375, -3.237548828125, -3.1300048828125, -3.0224609375, -2.9149169921875, -2.807373046875, -2.6998291015625, -2.59228515625, -2.4847412109375, -2.377197265625, -2.2696533203125, -2.162109375, -2.0545654296875, -1.947021484375, -1.8394775390625, -1.73193359375, -1.6243896484375, -1.516845703125, -1.4093017578125, -1.3017578125, -1.1942138671875, -1.086669921875, -0.9791259765625, -0.87158203125, -0.7640380859375, -0.656494140625, -0.5489501953125, -0.44140625, -0.3338623046875, -0.226318359375, -0.1187744140625, -0.01123046875, 0.0963134765625, 0.203857421875, 0.3114013671875, 0.4189453125, 0.5264892578125, 0.634033203125, 0.7415771484375, 0.84912109375, 0.9566650390625, 1.064208984375, 1.1717529296875, 1.279296875, 1.3868408203125, 1.494384765625, 1.6019287109375, 1.70947265625, 1.8170166015625, 1.924560546875, 2.0321044921875, 2.1396484375, 2.2471923828125, 2.354736328125, 2.4622802734375, 2.56982421875, 2.6773681640625, 2.784912109375, 2.8924560546875, 3.0]}, "gradients/encoder.encoder.layers.20.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 3.0, 5.0, 9.0, 26.0, 55.0, 98.0, 148.0, 186.0, 183.0, 134.0, 86.0, 42.0, 18.0, 10.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.34033203125, -0.32405853271484375, -0.3077850341796875, -0.29151153564453125, -0.275238037109375, -0.25896453857421875, -0.2426910400390625, -0.22641754150390625, -0.21014404296875, -0.19387054443359375, -0.1775970458984375, -0.16132354736328125, -0.145050048828125, -0.12877655029296875, -0.1125030517578125, -0.09622955322265625, -0.0799560546875, -0.06368255615234375, -0.0474090576171875, -0.03113555908203125, -0.014862060546875, 0.00141143798828125, 0.0176849365234375, 0.03395843505859375, 0.05023193359375, 0.06650543212890625, 0.0827789306640625, 0.09905242919921875, 0.115325927734375, 0.13159942626953125, 0.1478729248046875, 0.16414642333984375, 0.180419921875, 0.19669342041015625, 0.2129669189453125, 0.22924041748046875, 0.245513916015625, 0.26178741455078125, 0.2780609130859375, 0.29433441162109375, 0.31060791015625, 0.32688140869140625, 0.3431549072265625, 0.35942840576171875, 0.375701904296875, 0.39197540283203125, 0.4082489013671875, 0.42452239990234375, 0.4407958984375, 0.45706939697265625, 0.4733428955078125, 0.48961639404296875, 0.505889892578125, 0.5221633911132812, 0.5384368896484375, 0.5547103881835938, 0.57098388671875, 0.5872573852539062, 0.6035308837890625, 0.6198043823242188, 0.636077880859375, 0.6523513793945312, 0.6686248779296875, 0.6848983764648438, 0.701171875]}, "gradients/encoder.encoder.layers.20.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 6.0, 7.0, 6.0, 15.0, 14.0, 16.0, 21.0, 29.0, 56.0, 71.0, 150.0, 249.0, 559.0, 1647.0, 7676.0, 80867.0, 857330.0, 88620.0, 8054.0, 1903.0, 584.0, 282.0, 142.0, 77.0, 47.0, 28.0, 32.0, 18.0, 16.0, 5.0, 12.0, 6.0, 8.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.900390625, -1.840087890625, -1.77978515625, -1.719482421875, -1.6591796875, -1.598876953125, -1.53857421875, -1.478271484375, -1.41796875, -1.357666015625, -1.29736328125, -1.237060546875, -1.1767578125, -1.116455078125, -1.05615234375, -0.995849609375, -0.935546875, -0.875244140625, -0.81494140625, -0.754638671875, -0.6943359375, -0.634033203125, -0.57373046875, -0.513427734375, -0.453125, -0.392822265625, -0.33251953125, -0.272216796875, -0.2119140625, -0.151611328125, -0.09130859375, -0.031005859375, 0.029296875, 0.089599609375, 0.14990234375, 0.210205078125, 0.2705078125, 0.330810546875, 0.39111328125, 0.451416015625, 0.51171875, 0.572021484375, 0.63232421875, 0.692626953125, 0.7529296875, 0.813232421875, 0.87353515625, 0.933837890625, 0.994140625, 1.054443359375, 1.11474609375, 1.175048828125, 1.2353515625, 1.295654296875, 1.35595703125, 1.416259765625, 1.4765625, 1.536865234375, 1.59716796875, 1.657470703125, 1.7177734375, 1.778076171875, 1.83837890625, 1.898681640625, 1.958984375]}, "gradients/encoder.encoder.layers.20.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 4.0, 2.0, 2.0, 4.0, 7.0, 9.0, 14.0, 5.0, 20.0, 18.0, 31.0, 22.0, 41.0, 43.0, 42.0, 47.0, 52.0, 61.0, 80.0, 62.0, 68.0, 61.0, 52.0, 52.0, 35.0, 33.0, 32.0, 23.0, 17.0, 16.0, 14.0, 9.0, 9.0, 4.0, 6.0, 3.0, 2.0, 0.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0], "bins": [-0.90869140625, -0.8810882568359375, -0.853485107421875, -0.8258819580078125, -0.79827880859375, -0.7706756591796875, -0.743072509765625, -0.7154693603515625, -0.6878662109375, -0.6602630615234375, -0.632659912109375, -0.6050567626953125, -0.57745361328125, -0.5498504638671875, -0.522247314453125, -0.4946441650390625, -0.467041015625, -0.4394378662109375, -0.411834716796875, -0.3842315673828125, -0.35662841796875, -0.3290252685546875, -0.301422119140625, -0.2738189697265625, -0.2462158203125, -0.2186126708984375, -0.191009521484375, -0.1634063720703125, -0.13580322265625, -0.1082000732421875, -0.080596923828125, -0.0529937744140625, -0.025390625, 0.0022125244140625, 0.029815673828125, 0.0574188232421875, 0.08502197265625, 0.1126251220703125, 0.140228271484375, 0.1678314208984375, 0.1954345703125, 0.2230377197265625, 0.250640869140625, 0.2782440185546875, 0.30584716796875, 0.3334503173828125, 0.361053466796875, 0.3886566162109375, 0.416259765625, 0.4438629150390625, 0.471466064453125, 0.4990692138671875, 0.52667236328125, 0.5542755126953125, 0.581878662109375, 0.6094818115234375, 0.6370849609375, 0.6646881103515625, 0.692291259765625, 0.7198944091796875, 0.74749755859375, 0.7751007080078125, 0.802703857421875, 0.8303070068359375, 0.85791015625]}, "gradients/encoder.encoder.layers.20.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 2.0, 6.0, 13.0, 25.0, 28.0, 89.0, 138.0, 445.0, 3335.0, 992827.0, 49929.0, 1225.0, 236.0, 106.0, 69.0, 39.0, 22.0, 14.0, 3.0, 0.0, 7.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.775390625, -2.642059326171875, -2.50872802734375, -2.375396728515625, -2.2420654296875, -2.108734130859375, -1.97540283203125, -1.842071533203125, -1.708740234375, -1.575408935546875, -1.44207763671875, -1.308746337890625, -1.1754150390625, -1.042083740234375, -0.90875244140625, -0.775421142578125, -0.64208984375, -0.508758544921875, -0.37542724609375, -0.242095947265625, -0.1087646484375, 0.024566650390625, 0.15789794921875, 0.291229248046875, 0.424560546875, 0.557891845703125, 0.69122314453125, 0.824554443359375, 0.9578857421875, 1.091217041015625, 1.22454833984375, 1.357879638671875, 1.4912109375, 1.624542236328125, 1.75787353515625, 1.891204833984375, 2.0245361328125, 2.157867431640625, 2.29119873046875, 2.424530029296875, 2.557861328125, 2.691192626953125, 2.82452392578125, 2.957855224609375, 3.0911865234375, 3.224517822265625, 3.35784912109375, 3.491180419921875, 3.62451171875, 3.757843017578125, 3.89117431640625, 4.024505615234375, 4.1578369140625, 4.291168212890625, 4.42449951171875, 4.557830810546875, 4.691162109375, 4.824493408203125, 4.95782470703125, 5.091156005859375, 5.2244873046875, 5.357818603515625, 5.49114990234375, 5.624481201171875, 5.7578125]}, "gradients/encoder.encoder.layers.20.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 5.0, 2.0, 4.0, 10.0, 7.0, 12.0, 16.0, 22.0, 40.0, 75.0, 85.0, 124.0, 130.0, 132.0, 95.0, 84.0, 45.0, 43.0, 28.0, 14.0, 10.0, 2.0, 5.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0], "bins": [-0.00011724233627319336, -0.0001145070418715477, -0.00011177174746990204, -0.00010903645306825638, -0.00010630115866661072, -0.00010356586426496506, -0.0001008305698633194, -9.809527546167374e-05, -9.535998106002808e-05, -9.262468665838242e-05, -8.988939225673676e-05, -8.71540978550911e-05, -8.441880345344543e-05, -8.168350905179977e-05, -7.894821465015411e-05, -7.621292024850845e-05, -7.347762584686279e-05, -7.074233144521713e-05, -6.800703704357147e-05, -6.527174264192581e-05, -6.253644824028015e-05, -5.980115383863449e-05, -5.706585943698883e-05, -5.433056503534317e-05, -5.159527063369751e-05, -4.885997623205185e-05, -4.612468183040619e-05, -4.338938742876053e-05, -4.065409302711487e-05, -3.791879862546921e-05, -3.518350422382355e-05, -3.244820982217789e-05, -2.9712915420532227e-05, -2.6977621018886566e-05, -2.4242326617240906e-05, -2.1507032215595245e-05, -1.8771737813949585e-05, -1.6036443412303925e-05, -1.3301149010658264e-05, -1.0565854609012604e-05, -7.830560207366943e-06, -5.095265805721283e-06, -2.3599714040756226e-06, 3.7532299757003784e-07, 3.1106173992156982e-06, 5.845911800861359e-06, 8.581206202507019e-06, 1.131650060415268e-05, 1.405179500579834e-05, 1.6787089407444e-05, 1.952238380908966e-05, 2.225767821073532e-05, 2.499297261238098e-05, 2.7728267014026642e-05, 3.0463561415672302e-05, 3.319885581731796e-05, 3.593415021896362e-05, 3.8669444620609283e-05, 4.1404739022254944e-05, 4.4140033423900604e-05, 4.6875327825546265e-05, 4.9610622227191925e-05, 5.2345916628837585e-05, 5.5081211030483246e-05, 5.7816505432128906e-05]}, "gradients/encoder.encoder.layers.20.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 5.0, 9.0, 9.0, 9.0, 14.0, 27.0, 43.0, 73.0, 114.0, 181.0, 474.0, 1652.0, 10954.0, 880248.0, 147482.0, 5402.0, 1035.0, 375.0, 168.0, 96.0, 60.0, 30.0, 29.0, 22.0, 16.0, 12.0, 6.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.931640625, -1.868988037109375, -1.80633544921875, -1.743682861328125, -1.6810302734375, -1.618377685546875, -1.55572509765625, -1.493072509765625, -1.430419921875, -1.367767333984375, -1.30511474609375, -1.242462158203125, -1.1798095703125, -1.117156982421875, -1.05450439453125, -0.991851806640625, -0.92919921875, -0.866546630859375, -0.80389404296875, -0.741241455078125, -0.6785888671875, -0.615936279296875, -0.55328369140625, -0.490631103515625, -0.427978515625, -0.365325927734375, -0.30267333984375, -0.240020751953125, -0.1773681640625, -0.114715576171875, -0.05206298828125, 0.010589599609375, 0.0732421875, 0.135894775390625, 0.19854736328125, 0.261199951171875, 0.3238525390625, 0.386505126953125, 0.44915771484375, 0.511810302734375, 0.574462890625, 0.637115478515625, 0.69976806640625, 0.762420654296875, 0.8250732421875, 0.887725830078125, 0.95037841796875, 1.013031005859375, 1.07568359375, 1.138336181640625, 1.20098876953125, 1.263641357421875, 1.3262939453125, 1.388946533203125, 1.45159912109375, 1.514251708984375, 1.576904296875, 1.639556884765625, 1.70220947265625, 1.764862060546875, 1.8275146484375, 1.890167236328125, 1.95281982421875, 2.015472412109375, 2.078125]}, "gradients/encoder.encoder.layers.20.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 2.0, 5.0, 6.0, 4.0, 12.0, 15.0, 32.0, 124.0, 248.0, 307.0, 124.0, 59.0, 21.0, 14.0, 10.0, 1.0, 4.0, 1.0, 7.0, 5.0, 1.0, 0.0, 0.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.80126953125, -0.7706222534179688, -0.7399749755859375, -0.7093276977539062, -0.678680419921875, -0.6480331420898438, -0.6173858642578125, -0.5867385864257812, -0.55609130859375, -0.5254440307617188, -0.4947967529296875, -0.46414947509765625, -0.433502197265625, -0.40285491943359375, -0.3722076416015625, -0.34156036376953125, -0.3109130859375, -0.28026580810546875, -0.2496185302734375, -0.21897125244140625, -0.188323974609375, -0.15767669677734375, -0.1270294189453125, -0.09638214111328125, -0.06573486328125, -0.03508758544921875, -0.0044403076171875, 0.02620697021484375, 0.056854248046875, 0.08750152587890625, 0.1181488037109375, 0.14879608154296875, 0.179443359375, 0.21009063720703125, 0.2407379150390625, 0.27138519287109375, 0.302032470703125, 0.33267974853515625, 0.3633270263671875, 0.39397430419921875, 0.42462158203125, 0.45526885986328125, 0.4859161376953125, 0.5165634155273438, 0.547210693359375, 0.5778579711914062, 0.6085052490234375, 0.6391525268554688, 0.6697998046875, 0.7004470825195312, 0.7310943603515625, 0.7617416381835938, 0.792388916015625, 0.8230361938476562, 0.8536834716796875, 0.8843307495117188, 0.91497802734375, 0.9456253051757812, 0.9762725830078125, 1.0069198608398438, 1.037567138671875, 1.0682144165039062, 1.0988616943359375, 1.1295089721679688, 1.16015625]}, "gradients/encoder.encoder.layers.20.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 13.0, 215.0, 742.0, 33.0, 5.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-39.22661590576172, -38.082000732421875, -36.93738555908203, -35.79277038574219, -34.648155212402344, -33.5035400390625, -32.358924865722656, -31.214305877685547, -30.069690704345703, -28.92507553100586, -27.780460357666016, -26.635845184326172, -25.491228103637695, -24.34661293029785, -23.201997756958008, -22.05738067626953, -20.91276741027832, -19.768152236938477, -18.623537063598633, -17.478919982910156, -16.334304809570312, -15.189689636230469, -14.045074462890625, -12.900458335876465, -11.755843162536621, -10.611227989196777, -9.466611862182617, -8.321996688842773, -7.1773810386657715, -6.0327653884887695, -4.888150215148926, -3.7435340881347656, -2.598918914794922, -1.4543033838272095, -0.30968785285949707, 0.8349275588989258, 1.9795432090759277, 3.1241588592529297, 4.268774032592773, 5.413390159606934, 6.558005332946777, 7.702620983123779, 8.847236633300781, 9.991851806640625, 11.136466979980469, 12.281083106994629, 13.425698280334473, 14.570314407348633, 15.714929580688477, 16.85954475402832, 18.004159927368164, 19.14877700805664, 20.293392181396484, 21.438007354736328, 22.582622528076172, 23.727237701416016, 24.87185287475586, 26.016468048095703, 27.161083221435547, 28.30569839477539, 29.450315475463867, 30.59493064880371, 31.739545822143555, 32.88416290283203, 34.028778076171875]}, "gradients/encoder.encoder.layers.20.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 3.0, 5.0, 5.0, 6.0, 6.0, 5.0, 8.0, 9.0, 15.0, 18.0, 19.0, 21.0, 22.0, 26.0, 36.0, 34.0, 49.0, 51.0, 50.0, 54.0, 53.0, 50.0, 51.0, 51.0, 50.0, 39.0, 49.0, 38.0, 30.0, 34.0, 11.0, 24.0, 21.0, 13.0, 16.0, 6.0, 9.0, 9.0, 5.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0], "bins": [-5.533768177032471, -5.3812642097473145, -5.228760242462158, -5.076256275177002, -4.923752307891846, -4.7712483406066895, -4.618744373321533, -4.466239929199219, -4.3137359619140625, -4.161231994628906, -4.00872802734375, -3.8562240600585938, -3.7037200927734375, -3.5512161254882812, -3.398711919784546, -3.2462079524993896, -3.0937042236328125, -2.9412002563476562, -2.7886962890625, -2.6361923217773438, -2.4836883544921875, -2.3311843872070312, -2.178680181503296, -2.0261762142181396, -1.8736722469329834, -1.7211682796478271, -1.568664312362671, -1.416160225868225, -1.2636562585830688, -1.1111522912979126, -0.9586482644081116, -0.8061442375183105, -0.6536407470703125, -0.5011367797851562, -0.3486327528953552, -0.1961287558078766, -0.04362475872039795, 0.1088792085647583, 0.2613832354545593, 0.41388726234436035, 0.5663912296295166, 0.7188951969146729, 0.8713992238044739, 1.023903250694275, 1.1764072179794312, 1.3289111852645874, 1.4814152717590332, 1.6339192390441895, 1.7864232063293457, 1.938927173614502, 2.091431140899658, 2.2439351081848145, 2.3964390754699707, 2.548943042755127, 2.7014472484588623, 2.8539512157440186, 3.006455183029175, 3.158959150314331, 3.3114631175994873, 3.4639670848846436, 3.616471290588379, 3.768975257873535, 3.9214792251586914, 4.073983192443848, 4.226487159729004]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 4.0, 1.0, 3.0, 8.0, 10.0, 18.0, 22.0, 36.0, 59.0, 152.0, 381.0, 778.0, 2138.0, 7883.0, 55087.0, 3773129.0, 326841.0, 20211.0, 4232.0, 1450.0, 690.0, 405.0, 216.0, 126.0, 87.0, 76.0, 51.0, 30.0, 29.0, 25.0, 23.0, 22.0, 18.0, 11.0, 11.0, 7.0, 4.0, 6.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-1.615234375, -1.524383544921875, -1.43353271484375, -1.342681884765625, -1.2518310546875, -1.160980224609375, -1.07012939453125, -0.979278564453125, -0.888427734375, -0.797576904296875, -0.70672607421875, -0.615875244140625, -0.5250244140625, -0.434173583984375, -0.34332275390625, -0.252471923828125, -0.16162109375, -0.070770263671875, 0.02008056640625, 0.110931396484375, 0.2017822265625, 0.292633056640625, 0.38348388671875, 0.474334716796875, 0.565185546875, 0.656036376953125, 0.74688720703125, 0.837738037109375, 0.9285888671875, 1.019439697265625, 1.11029052734375, 1.201141357421875, 1.2919921875, 1.382843017578125, 1.47369384765625, 1.564544677734375, 1.6553955078125, 1.746246337890625, 1.83709716796875, 1.927947998046875, 2.018798828125, 2.109649658203125, 2.20050048828125, 2.291351318359375, 2.3822021484375, 2.473052978515625, 2.56390380859375, 2.654754638671875, 2.74560546875, 2.836456298828125, 2.92730712890625, 3.018157958984375, 3.1090087890625, 3.199859619140625, 3.29071044921875, 3.381561279296875, 3.472412109375, 3.563262939453125, 3.65411376953125, 3.744964599609375, 3.8358154296875, 3.926666259765625, 4.01751708984375, 4.108367919921875, 4.19921875]}, "gradients/encoder.encoder.layers.19.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 1.0, 3.0, 2.0, 5.0, 12.0, 24.0, 39.0, 80.0, 92.0, 153.0, 175.0, 140.0, 112.0, 72.0, 51.0, 20.0, 21.0, 6.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.25, -0.23580169677734375, -0.2216033935546875, -0.20740509033203125, -0.193206787109375, -0.17900848388671875, -0.1648101806640625, -0.15061187744140625, -0.13641357421875, -0.12221527099609375, -0.1080169677734375, -0.09381866455078125, -0.079620361328125, -0.06542205810546875, -0.0512237548828125, -0.03702545166015625, -0.0228271484375, -0.00862884521484375, 0.0055694580078125, 0.01976776123046875, 0.033966064453125, 0.04816436767578125, 0.0623626708984375, 0.07656097412109375, 0.09075927734375, 0.10495758056640625, 0.1191558837890625, 0.13335418701171875, 0.147552490234375, 0.16175079345703125, 0.1759490966796875, 0.19014739990234375, 0.204345703125, 0.21854400634765625, 0.2327423095703125, 0.24694061279296875, 0.261138916015625, 0.27533721923828125, 0.2895355224609375, 0.30373382568359375, 0.31793212890625, 0.33213043212890625, 0.3463287353515625, 0.36052703857421875, 0.374725341796875, 0.38892364501953125, 0.4031219482421875, 0.41732025146484375, 0.4315185546875, 0.44571685791015625, 0.4599151611328125, 0.47411346435546875, 0.488311767578125, 0.5025100708007812, 0.5167083740234375, 0.5309066772460938, 0.54510498046875, 0.5593032836914062, 0.5735015869140625, 0.5876998901367188, 0.601898193359375, 0.6160964965820312, 0.6302947998046875, 0.6444931030273438, 0.65869140625]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 5.0, 13.0, 41.0, 124.0, 837.0, 4181111.0, 11450.0, 457.0, 160.0, 53.0, 20.0, 11.0, 4.0, 4.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.609375, -9.06884765625, -8.5283203125, -7.98779296875, -7.447265625, -6.90673828125, -6.3662109375, -5.82568359375, -5.28515625, -4.74462890625, -4.2041015625, -3.66357421875, -3.123046875, -2.58251953125, -2.0419921875, -1.50146484375, -0.9609375, -0.42041015625, 0.1201171875, 0.66064453125, 1.201171875, 1.74169921875, 2.2822265625, 2.82275390625, 3.36328125, 3.90380859375, 4.4443359375, 4.98486328125, 5.525390625, 6.06591796875, 6.6064453125, 7.14697265625, 7.6875, 8.22802734375, 8.7685546875, 9.30908203125, 9.849609375, 10.39013671875, 10.9306640625, 11.47119140625, 12.01171875, 12.55224609375, 13.0927734375, 13.63330078125, 14.173828125, 14.71435546875, 15.2548828125, 15.79541015625, 16.3359375, 16.87646484375, 17.4169921875, 17.95751953125, 18.498046875, 19.03857421875, 19.5791015625, 20.11962890625, 20.66015625, 21.20068359375, 21.7412109375, 22.28173828125, 22.822265625, 23.36279296875, 23.9033203125, 24.44384765625, 24.984375]}, "gradients/encoder.encoder.layers.19.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 8.0, 10.0, 29.0, 97.0, 854.0, 2827.0, 175.0, 45.0, 18.0, 10.0, 5.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.59423828125, -0.5522384643554688, -0.5102386474609375, -0.46823883056640625, -0.426239013671875, -0.38423919677734375, -0.3422393798828125, -0.30023956298828125, -0.25823974609375, -0.21623992919921875, -0.1742401123046875, -0.13224029541015625, -0.090240478515625, -0.04824066162109375, -0.0062408447265625, 0.03575897216796875, 0.0777587890625, 0.11975860595703125, 0.1617584228515625, 0.20375823974609375, 0.245758056640625, 0.28775787353515625, 0.3297576904296875, 0.37175750732421875, 0.41375732421875, 0.45575714111328125, 0.4977569580078125, 0.5397567749023438, 0.581756591796875, 0.6237564086914062, 0.6657562255859375, 0.7077560424804688, 0.749755859375, 0.7917556762695312, 0.8337554931640625, 0.8757553100585938, 0.917755126953125, 0.9597549438476562, 1.0017547607421875, 1.0437545776367188, 1.08575439453125, 1.1277542114257812, 1.1697540283203125, 1.2117538452148438, 1.253753662109375, 1.2957534790039062, 1.3377532958984375, 1.3797531127929688, 1.4217529296875, 1.4637527465820312, 1.5057525634765625, 1.5477523803710938, 1.589752197265625, 1.6317520141601562, 1.6737518310546875, 1.7157516479492188, 1.75775146484375, 1.7997512817382812, 1.8417510986328125, 1.8837509155273438, 1.925750732421875, 1.9677505493164062, 2.0097503662109375, 2.0517501831054688, 2.09375]}, "gradients/encoder.encoder.layers.19.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 11.0, 223.0, 721.0, 38.0, 10.0, 3.0, 3.0, 1.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.894742965698242, -21.288745880126953, -20.682748794555664, -20.076753616333008, -19.47075653076172, -18.86475944519043, -18.25876235961914, -17.65276527404785, -17.046768188476562, -16.440771102905273, -15.8347749710083, -15.228777885437012, -14.622781753540039, -14.01678466796875, -13.410787582397461, -12.804790496826172, -12.198795318603516, -11.592798233032227, -10.986802101135254, -10.380805015563965, -9.774808883666992, -9.168811798095703, -8.562814712524414, -7.956818103790283, -7.350821495056152, -6.7448248863220215, -6.138828277587891, -5.532831192016602, -4.926834583282471, -4.32083797454834, -3.71484112739563, -3.10884428024292, -2.502849578857422, -1.8968528509140015, -1.290856122970581, -0.6848593950271606, -0.07886266708374023, 0.5271339416503906, 1.1331307888031006, 1.7391276359558105, 2.3451242446899414, 2.9511208534240723, 3.5571177005767822, 4.163114547729492, 4.769111156463623, 5.375107765197754, 5.981104850769043, 6.587101459503174, 7.193098068237305, 7.7990946769714355, 8.405091285705566, 9.011088371276855, 9.617084503173828, 10.223081588745117, 10.829078674316406, 11.435075759887695, 12.041071891784668, 12.647068977355957, 13.25306510925293, 13.859062194824219, 14.465059280395508, 15.07105541229248, 15.67705249786377, 16.283048629760742, 16.88904571533203]}, "gradients/encoder.encoder.layers.19.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 3.0, 8.0, 12.0, 17.0, 35.0, 44.0, 75.0, 85.0, 101.0, 95.0, 101.0, 92.0, 88.0, 80.0, 61.0, 36.0, 28.0, 13.0, 17.0, 6.0, 3.0, 7.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-4.018214702606201, -3.871316909790039, -3.724419355392456, -3.577521562576294, -3.430624008178711, -3.283726215362549, -3.1368284225463867, -2.9899306297302246, -2.8430330753326416, -2.6961352825164795, -2.5492377281188965, -2.4023399353027344, -2.2554421424865723, -2.1085445880889893, -1.9616467952728271, -1.8147491216659546, -1.667851448059082, -1.5209537744522095, -1.374056100845337, -1.2271583080291748, -1.0802606344223022, -0.9333629608154297, -0.7864652276039124, -0.639567494392395, -0.49266982078552246, -0.3457721173763275, -0.19887441396713257, -0.05197671055793762, 0.09492099285125732, 0.24181866645812988, 0.3887163996696472, 0.5356141328811646, 0.6825122833251953, 0.8294099569320679, 0.9763076901435852, 1.1232054233551025, 1.270103096961975, 1.4170007705688477, 1.5638985633850098, 1.7107962369918823, 1.8576939105987549, 2.004591703414917, 2.1514892578125, 2.298387050628662, 2.445284843444824, 2.5921823978424072, 2.7390801906585693, 2.8859777450561523, 3.0328755378723145, 3.1797733306884766, 3.3266708850860596, 3.4735686779022217, 3.6204662322998047, 3.767364025115967, 3.914261817932129, 4.061159610748291, 4.208057403564453, 4.354955196380615, 4.501852989196777, 4.648750305175781, 4.795648097991943, 4.9425458908081055, 5.089443683624268, 5.23634147644043, 5.383238792419434]}, "gradients/encoder.encoder.layers.19.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 1.0, 3.0, 0.0, 1.0, 6.0, 3.0, 5.0, 11.0, 12.0, 15.0, 11.0, 21.0, 29.0, 37.0, 47.0, 75.0, 91.0, 131.0, 190.0, 277.0, 424.0, 752.0, 1428.0, 3683.0, 11884.0, 52723.0, 387425.0, 500107.0, 66723.0, 14207.0, 4328.0, 1694.0, 778.0, 471.0, 280.0, 181.0, 124.0, 99.0, 79.0, 52.0, 37.0, 28.0, 26.0, 14.0, 11.0, 16.0, 8.0, 7.0, 4.0, 2.0, 5.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-1.6650390625, -1.6096649169921875, -1.554290771484375, -1.4989166259765625, -1.44354248046875, -1.3881683349609375, -1.332794189453125, -1.2774200439453125, -1.2220458984375, -1.1666717529296875, -1.111297607421875, -1.0559234619140625, -1.00054931640625, -0.9451751708984375, -0.889801025390625, -0.8344268798828125, -0.779052734375, -0.7236785888671875, -0.668304443359375, -0.6129302978515625, -0.55755615234375, -0.5021820068359375, -0.446807861328125, -0.3914337158203125, -0.3360595703125, -0.2806854248046875, -0.225311279296875, -0.1699371337890625, -0.11456298828125, -0.0591888427734375, -0.003814697265625, 0.0515594482421875, 0.10693359375, 0.1623077392578125, 0.217681884765625, 0.2730560302734375, 0.32843017578125, 0.3838043212890625, 0.439178466796875, 0.4945526123046875, 0.5499267578125, 0.6053009033203125, 0.660675048828125, 0.7160491943359375, 0.77142333984375, 0.8267974853515625, 0.882171630859375, 0.9375457763671875, 0.992919921875, 1.0482940673828125, 1.103668212890625, 1.1590423583984375, 1.21441650390625, 1.2697906494140625, 1.325164794921875, 1.3805389404296875, 1.4359130859375, 1.4912872314453125, 1.546661376953125, 1.6020355224609375, 1.65740966796875, 1.7127838134765625, 1.768157958984375, 1.8235321044921875, 1.87890625]}, "gradients/encoder.encoder.layers.19.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 4.0, 5.0, 5.0, 8.0, 15.0, 26.0, 51.0, 74.0, 100.0, 110.0, 128.0, 114.0, 104.0, 101.0, 65.0, 41.0, 22.0, 15.0, 12.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.399658203125, -0.3842353820800781, -0.36881256103515625, -0.3533897399902344, -0.3379669189453125, -0.3225440979003906, -0.30712127685546875, -0.2916984558105469, -0.276275634765625, -0.2608528137207031, -0.24542999267578125, -0.23000717163085938, -0.2145843505859375, -0.19916152954101562, -0.18373870849609375, -0.16831588745117188, -0.15289306640625, -0.13747024536132812, -0.12204742431640625, -0.10662460327148438, -0.0912017822265625, -0.07577896118164062, -0.06035614013671875, -0.044933319091796875, -0.029510498046875, -0.014087677001953125, 0.00133514404296875, 0.016757965087890625, 0.0321807861328125, 0.047603607177734375, 0.06302642822265625, 0.07844924926757812, 0.0938720703125, 0.10929489135742188, 0.12471771240234375, 0.14014053344726562, 0.1555633544921875, 0.17098617553710938, 0.18640899658203125, 0.20183181762695312, 0.217254638671875, 0.23267745971679688, 0.24810028076171875, 0.2635231018066406, 0.2789459228515625, 0.2943687438964844, 0.30979156494140625, 0.3252143859863281, 0.34063720703125, 0.3560600280761719, 0.37148284912109375, 0.3869056701660156, 0.4023284912109375, 0.4177513122558594, 0.43317413330078125, 0.4485969543457031, 0.464019775390625, 0.4794425964355469, 0.49486541748046875, 0.5102882385253906, 0.5257110595703125, 0.5411338806152344, 0.5565567016601562, 0.5719795227050781, 0.58740234375]}, "gradients/encoder.encoder.layers.19.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 3.0, 3.0, 2.0, 8.0, 11.0, 13.0, 19.0, 23.0, 35.0, 45.0, 68.0, 111.0, 150.0, 297.0, 610.0, 1375.0, 3861.0, 14869.0, 101960.0, 693439.0, 199477.0, 23338.0, 5456.0, 1743.0, 712.0, 357.0, 195.0, 124.0, 88.0, 42.0, 28.0, 17.0, 17.0, 14.0, 16.0, 8.0, 7.0, 6.0, 3.0, 5.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0], "bins": [-1.685546875, -1.6395416259765625, -1.593536376953125, -1.5475311279296875, -1.50152587890625, -1.4555206298828125, -1.409515380859375, -1.3635101318359375, -1.3175048828125, -1.2714996337890625, -1.225494384765625, -1.1794891357421875, -1.13348388671875, -1.0874786376953125, -1.041473388671875, -0.9954681396484375, -0.949462890625, -0.9034576416015625, -0.857452392578125, -0.8114471435546875, -0.76544189453125, -0.7194366455078125, -0.673431396484375, -0.6274261474609375, -0.5814208984375, -0.5354156494140625, -0.489410400390625, -0.4434051513671875, -0.39739990234375, -0.3513946533203125, -0.305389404296875, -0.2593841552734375, -0.21337890625, -0.1673736572265625, -0.121368408203125, -0.0753631591796875, -0.02935791015625, 0.0166473388671875, 0.062652587890625, 0.1086578369140625, 0.1546630859375, 0.2006683349609375, 0.246673583984375, 0.2926788330078125, 0.33868408203125, 0.3846893310546875, 0.430694580078125, 0.4766998291015625, 0.522705078125, 0.5687103271484375, 0.614715576171875, 0.6607208251953125, 0.70672607421875, 0.7527313232421875, 0.798736572265625, 0.8447418212890625, 0.8907470703125, 0.9367523193359375, 0.982757568359375, 1.0287628173828125, 1.07476806640625, 1.1207733154296875, 1.166778564453125, 1.2127838134765625, 1.2587890625]}, "gradients/encoder.encoder.layers.19.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 5.0, 7.0, 11.0, 5.0, 4.0, 19.0, 18.0, 42.0, 23.0, 24.0, 43.0, 50.0, 56.0, 59.0, 68.0, 41.0, 66.0, 53.0, 63.0, 42.0, 52.0, 36.0, 35.0, 37.0, 29.0, 26.0, 18.0, 16.0, 13.0, 11.0, 8.0, 5.0, 7.0, 0.0, 4.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.1455078125, -1.1124343872070312, -1.0793609619140625, -1.0462875366210938, -1.013214111328125, -0.9801406860351562, -0.9470672607421875, -0.9139938354492188, -0.88092041015625, -0.8478469848632812, -0.8147735595703125, -0.7817001342773438, -0.748626708984375, -0.7155532836914062, -0.6824798583984375, -0.6494064331054688, -0.6163330078125, -0.5832595825195312, -0.5501861572265625, -0.5171127319335938, -0.484039306640625, -0.45096588134765625, -0.4178924560546875, -0.38481903076171875, -0.35174560546875, -0.31867218017578125, -0.2855987548828125, -0.25252532958984375, -0.219451904296875, -0.18637847900390625, -0.1533050537109375, -0.12023162841796875, -0.087158203125, -0.05408477783203125, -0.0210113525390625, 0.01206207275390625, 0.045135498046875, 0.07820892333984375, 0.1112823486328125, 0.14435577392578125, 0.17742919921875, 0.21050262451171875, 0.2435760498046875, 0.27664947509765625, 0.309722900390625, 0.34279632568359375, 0.3758697509765625, 0.40894317626953125, 0.4420166015625, 0.47509002685546875, 0.5081634521484375, 0.5412368774414062, 0.574310302734375, 0.6073837280273438, 0.6404571533203125, 0.6735305786132812, 0.70660400390625, 0.7396774291992188, 0.7727508544921875, 0.8058242797851562, 0.838897705078125, 0.8719711303710938, 0.9050445556640625, 0.9381179809570312, 0.97119140625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 1.0, 3.0, 5.0, 4.0, 0.0, 7.0, 13.0, 8.0, 4.0, 19.0, 26.0, 38.0, 44.0, 72.0, 115.0, 229.0, 538.0, 1347.0, 4041.0, 17891.0, 187296.0, 728758.0, 91668.0, 11663.0, 2913.0, 970.0, 385.0, 190.0, 108.0, 64.0, 44.0, 25.0, 10.0, 15.0, 8.0, 7.0, 6.0, 6.0, 6.0, 4.0, 1.0, 5.0, 5.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0], "bins": [-0.6611328125, -0.6424407958984375, -0.623748779296875, -0.6050567626953125, -0.58636474609375, -0.5676727294921875, -0.548980712890625, -0.5302886962890625, -0.5115966796875, -0.4929046630859375, -0.474212646484375, -0.4555206298828125, -0.43682861328125, -0.4181365966796875, -0.399444580078125, -0.3807525634765625, -0.362060546875, -0.3433685302734375, -0.324676513671875, -0.3059844970703125, -0.28729248046875, -0.2686004638671875, -0.249908447265625, -0.2312164306640625, -0.2125244140625, -0.1938323974609375, -0.175140380859375, -0.1564483642578125, -0.13775634765625, -0.1190643310546875, -0.100372314453125, -0.0816802978515625, -0.06298828125, -0.0442962646484375, -0.025604248046875, -0.0069122314453125, 0.01177978515625, 0.0304718017578125, 0.049163818359375, 0.0678558349609375, 0.0865478515625, 0.1052398681640625, 0.123931884765625, 0.1426239013671875, 0.16131591796875, 0.1800079345703125, 0.198699951171875, 0.2173919677734375, 0.236083984375, 0.2547760009765625, 0.273468017578125, 0.2921600341796875, 0.31085205078125, 0.3295440673828125, 0.348236083984375, 0.3669281005859375, 0.3856201171875, 0.4043121337890625, 0.423004150390625, 0.4416961669921875, 0.46038818359375, 0.4790802001953125, 0.497772216796875, 0.5164642333984375, 0.53515625]}, "gradients/encoder.encoder.layers.19.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 1.0, 2.0, 4.0, 7.0, 15.0, 8.0, 17.0, 21.0, 18.0, 17.0, 41.0, 44.0, 51.0, 59.0, 71.0, 80.0, 95.0, 77.0, 92.0, 54.0, 51.0, 47.0, 26.0, 24.0, 15.0, 13.0, 15.0, 9.0, 8.0, 10.0, 4.0, 0.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.3822994232177734e-05, -5.221273750066757e-05, -5.060248076915741e-05, -4.899222403764725e-05, -4.7381967306137085e-05, -4.577171057462692e-05, -4.416145384311676e-05, -4.25511971116066e-05, -4.0940940380096436e-05, -3.933068364858627e-05, -3.772042691707611e-05, -3.611017018556595e-05, -3.4499913454055786e-05, -3.2889656722545624e-05, -3.127939999103546e-05, -2.96691432595253e-05, -2.8058886528015137e-05, -2.6448629796504974e-05, -2.4838373064994812e-05, -2.322811633348465e-05, -2.1617859601974487e-05, -2.0007602870464325e-05, -1.8397346138954163e-05, -1.6787089407444e-05, -1.5176832675933838e-05, -1.3566575944423676e-05, -1.1956319212913513e-05, -1.034606248140335e-05, -8.735805749893188e-06, -7.125549018383026e-06, -5.515292286872864e-06, -3.905035555362701e-06, -2.294778823852539e-06, -6.845220923423767e-07, 9.257346391677856e-07, 2.535991370677948e-06, 4.14624810218811e-06, 5.756504833698273e-06, 7.366761565208435e-06, 8.977018296718597e-06, 1.058727502822876e-05, 1.2197531759738922e-05, 1.3807788491249084e-05, 1.5418045222759247e-05, 1.702830195426941e-05, 1.863855868577957e-05, 2.0248815417289734e-05, 2.1859072148799896e-05, 2.346932888031006e-05, 2.507958561182022e-05, 2.6689842343330383e-05, 2.8300099074840546e-05, 2.9910355806350708e-05, 3.152061253786087e-05, 3.313086926937103e-05, 3.4741126000881195e-05, 3.635138273239136e-05, 3.796163946390152e-05, 3.957189619541168e-05, 4.1182152926921844e-05, 4.279240965843201e-05, 4.440266638994217e-05, 4.601292312145233e-05, 4.7623179852962494e-05, 4.9233436584472656e-05]}, "gradients/encoder.encoder.layers.19.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 0.0, 3.0, 6.0, 5.0, 10.0, 18.0, 14.0, 17.0, 30.0, 41.0, 61.0, 120.0, 156.0, 342.0, 758.0, 2103.0, 7181.0, 34345.0, 362140.0, 567345.0, 58895.0, 10194.0, 2832.0, 977.0, 415.0, 218.0, 135.0, 68.0, 41.0, 29.0, 17.0, 8.0, 7.0, 6.0, 4.0, 4.0, 3.0, 4.0, 2.0, 4.0, 3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.469482421875, -0.4533653259277344, -0.43724822998046875, -0.4211311340332031, -0.4050140380859375, -0.3888969421386719, -0.37277984619140625, -0.3566627502441406, -0.340545654296875, -0.3244285583496094, -0.30831146240234375, -0.2921943664550781, -0.2760772705078125, -0.2599601745605469, -0.24384307861328125, -0.22772598266601562, -0.21160888671875, -0.19549179077148438, -0.17937469482421875, -0.16325759887695312, -0.1471405029296875, -0.13102340698242188, -0.11490631103515625, -0.09878921508789062, -0.082672119140625, -0.06655502319335938, -0.05043792724609375, -0.034320831298828125, -0.0182037353515625, -0.002086639404296875, 0.01403045654296875, 0.030147552490234375, 0.0462646484375, 0.062381744384765625, 0.07849884033203125, 0.09461593627929688, 0.1107330322265625, 0.12685012817382812, 0.14296722412109375, 0.15908432006835938, 0.175201416015625, 0.19131851196289062, 0.20743560791015625, 0.22355270385742188, 0.2396697998046875, 0.2557868957519531, 0.27190399169921875, 0.2880210876464844, 0.30413818359375, 0.3202552795410156, 0.33637237548828125, 0.3524894714355469, 0.3686065673828125, 0.3847236633300781, 0.40084075927734375, 0.4169578552246094, 0.433074951171875, 0.4491920471191406, 0.46530914306640625, 0.4814262390136719, 0.4975433349609375, 0.5136604309082031, 0.5297775268554688, 0.5458946228027344, 0.56201171875]}, "gradients/encoder.encoder.layers.19.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 4.0, 0.0, 4.0, 1.0, 3.0, 4.0, 8.0, 7.0, 11.0, 6.0, 24.0, 26.0, 29.0, 49.0, 51.0, 67.0, 83.0, 104.0, 94.0, 87.0, 79.0, 70.0, 60.0, 41.0, 20.0, 16.0, 13.0, 9.0, 4.0, 3.0, 5.0, 5.0, 0.0, 2.0, 4.0, 3.0, 3.0, 0.0, 1.0, 5.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.34326171875, -0.332977294921875, -0.32269287109375, -0.312408447265625, -0.3021240234375, -0.291839599609375, -0.28155517578125, -0.271270751953125, -0.260986328125, -0.250701904296875, -0.24041748046875, -0.230133056640625, -0.2198486328125, -0.209564208984375, -0.19927978515625, -0.188995361328125, -0.1787109375, -0.168426513671875, -0.15814208984375, -0.147857666015625, -0.1375732421875, -0.127288818359375, -0.11700439453125, -0.106719970703125, -0.096435546875, -0.086151123046875, -0.07586669921875, -0.065582275390625, -0.0552978515625, -0.045013427734375, -0.03472900390625, -0.024444580078125, -0.01416015625, -0.003875732421875, 0.00640869140625, 0.016693115234375, 0.0269775390625, 0.037261962890625, 0.04754638671875, 0.057830810546875, 0.068115234375, 0.078399658203125, 0.08868408203125, 0.098968505859375, 0.1092529296875, 0.119537353515625, 0.12982177734375, 0.140106201171875, 0.150390625, 0.160675048828125, 0.17095947265625, 0.181243896484375, 0.1915283203125, 0.201812744140625, 0.21209716796875, 0.222381591796875, 0.232666015625, 0.242950439453125, 0.25323486328125, 0.263519287109375, 0.2738037109375, 0.284088134765625, 0.29437255859375, 0.304656982421875, 0.31494140625]}, "gradients/encoder.encoder.layers.19.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 4.0, 7.0, 11.0, 18.0, 68.0, 250.0, 437.0, 164.0, 39.0, 5.0, 6.0, 3.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-8.110148429870605, -7.644254684448242, -7.178360462188721, -6.712466716766357, -6.246572494506836, -5.780678749084473, -5.314785003662109, -4.848891258239746, -4.382997035980225, -3.9171030521392822, -3.45120906829834, -2.9853153228759766, -2.519421339035034, -2.053527355194092, -1.5876336097717285, -1.1217396259307861, -0.6558456420898438, -0.18995171785354614, 0.27594220638275146, 0.7418360710144043, 1.2077300548553467, 1.673624038696289, 2.1395177841186523, 2.6054117679595947, 3.071305751800537, 3.5371997356414795, 4.003093719482422, 4.468987464904785, 4.934881210327148, 5.40077543258667, 5.866669178009033, 6.332563400268555, 6.798458099365234, 7.264351844787598, 7.730246067047119, 8.19614028930664, 8.662034034729004, 9.127927780151367, 9.59382152557373, 10.059715270996094, 10.525609970092773, 10.991503715515137, 11.4573974609375, 11.92329216003418, 12.389185905456543, 12.855079650878906, 13.32097339630127, 13.786867141723633, 14.252760887145996, 14.71865463256836, 15.184548377990723, 15.650442123413086, 16.116336822509766, 16.582229614257812, 17.048124313354492, 17.514019012451172, 17.97991180419922, 18.4458065032959, 18.911699295043945, 19.377593994140625, 19.843486785888672, 20.30938148498535, 20.77527618408203, 21.241168975830078, 21.707063674926758]}, "gradients/encoder.encoder.layers.19.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 8.0, 6.0, 11.0, 12.0, 9.0, 16.0, 16.0, 24.0, 30.0, 29.0, 39.0, 45.0, 47.0, 54.0, 64.0, 52.0, 80.0, 54.0, 55.0, 45.0, 47.0, 38.0, 43.0, 32.0, 35.0, 22.0, 24.0, 12.0, 20.0, 13.0, 6.0, 2.0, 8.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.703734874725342, -5.513448715209961, -5.323163032531738, -5.132876873016357, -4.942591190338135, -4.752305030822754, -4.562019348144531, -4.37173318862915, -4.1814470291137695, -3.9911611080169678, -3.800875186920166, -3.610589027404785, -3.4203033447265625, -3.2300171852111816, -3.03973126411438, -2.849445343017578, -2.6591596603393555, -2.4688737392425537, -2.278587818145752, -2.088301658630371, -1.8980158567428589, -1.7077299356460571, -1.5174438953399658, -1.327157974243164, -1.1368720531463623, -0.9465861320495605, -0.756300151348114, -0.5660141706466675, -0.3757282495498657, -0.18544232845306396, 0.004843711853027344, 0.1951296329498291, 0.38541603088378906, 0.5757019519805908, 0.7659879326820374, 0.9562739133834839, 1.1465598344802856, 1.3368457555770874, 1.5271317958831787, 1.7174177169799805, 1.9077036380767822, 2.097989559173584, 2.2882754802703857, 2.4785614013671875, 2.6688475608825684, 2.859133243560791, 3.049419403076172, 3.2397053241729736, 3.4299912452697754, 3.620277166366577, 3.810563087463379, 4.00084924697876, 4.191134929656982, 4.381421089172363, 4.571706771850586, 4.761992931365967, 4.952279090881348, 5.1425652503967285, 5.332850933074951, 5.523137092590332, 5.713422775268555, 5.9037089347839355, 6.093995094299316, 6.284280776977539, 6.474566459655762]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 6.0, 12.0, 13.0, 16.0, 25.0, 52.0, 65.0, 96.0, 153.0, 304.0, 591.0, 1269.0, 2942.0, 9081.0, 49760.0, 3485387.0, 604990.0, 27707.0, 6523.0, 2471.0, 1125.0, 648.0, 348.0, 189.0, 140.0, 100.0, 56.0, 38.0, 29.0, 18.0, 26.0, 16.0, 12.0, 15.0, 13.0, 8.0, 5.0, 7.0, 7.0, 4.0, 2.0, 3.0, 4.0, 1.0, 2.0, 1.0, 2.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.5615234375, -1.4961090087890625, -1.430694580078125, -1.3652801513671875, -1.29986572265625, -1.2344512939453125, -1.169036865234375, -1.1036224365234375, -1.0382080078125, -0.9727935791015625, -0.907379150390625, -0.8419647216796875, -0.77655029296875, -0.7111358642578125, -0.645721435546875, -0.5803070068359375, -0.514892578125, -0.4494781494140625, -0.384063720703125, -0.3186492919921875, -0.25323486328125, -0.1878204345703125, -0.122406005859375, -0.0569915771484375, 0.0084228515625, 0.0738372802734375, 0.139251708984375, 0.2046661376953125, 0.27008056640625, 0.3354949951171875, 0.400909423828125, 0.4663238525390625, 0.53173828125, 0.5971527099609375, 0.662567138671875, 0.7279815673828125, 0.79339599609375, 0.8588104248046875, 0.924224853515625, 0.9896392822265625, 1.0550537109375, 1.1204681396484375, 1.185882568359375, 1.2512969970703125, 1.31671142578125, 1.3821258544921875, 1.447540283203125, 1.5129547119140625, 1.578369140625, 1.6437835693359375, 1.709197998046875, 1.7746124267578125, 1.84002685546875, 1.9054412841796875, 1.970855712890625, 2.0362701416015625, 2.1016845703125, 2.1670989990234375, 2.232513427734375, 2.2979278564453125, 2.36334228515625, 2.4287567138671875, 2.494171142578125, 2.5595855712890625, 2.625]}, "gradients/encoder.encoder.layers.18.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 3.0, 7.0, 4.0, 6.0, 15.0, 27.0, 33.0, 44.0, 80.0, 89.0, 105.0, 105.0, 108.0, 108.0, 86.0, 61.0, 44.0, 32.0, 20.0, 11.0, 7.0, 4.0, 2.0, 3.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.302734375, -0.28887939453125, -0.2750244140625, -0.26116943359375, -0.247314453125, -0.23345947265625, -0.2196044921875, -0.20574951171875, -0.19189453125, -0.17803955078125, -0.1641845703125, -0.15032958984375, -0.136474609375, -0.12261962890625, -0.1087646484375, -0.09490966796875, -0.0810546875, -0.06719970703125, -0.0533447265625, -0.03948974609375, -0.025634765625, -0.01177978515625, 0.0020751953125, 0.01593017578125, 0.02978515625, 0.04364013671875, 0.0574951171875, 0.07135009765625, 0.085205078125, 0.09906005859375, 0.1129150390625, 0.12677001953125, 0.140625, 0.15447998046875, 0.1683349609375, 0.18218994140625, 0.196044921875, 0.20989990234375, 0.2237548828125, 0.23760986328125, 0.25146484375, 0.26531982421875, 0.2791748046875, 0.29302978515625, 0.306884765625, 0.32073974609375, 0.3345947265625, 0.34844970703125, 0.3623046875, 0.37615966796875, 0.3900146484375, 0.40386962890625, 0.417724609375, 0.43157958984375, 0.4454345703125, 0.45928955078125, 0.47314453125, 0.48699951171875, 0.5008544921875, 0.51470947265625, 0.528564453125, 0.54241943359375, 0.5562744140625, 0.57012939453125, 0.583984375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 11.0, 18.0, 32.0, 62.0, 124.0, 315.0, 1203.0, 622483.0, 3567648.0, 1538.0, 402.0, 223.0, 100.0, 58.0, 31.0, 15.0, 7.0, 7.0, 3.0, 2.0, 1.0, 0.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.25390625, -5.03533935546875, -4.8167724609375, -4.59820556640625, -4.379638671875, -4.16107177734375, -3.9425048828125, -3.72393798828125, -3.50537109375, -3.28680419921875, -3.0682373046875, -2.84967041015625, -2.631103515625, -2.41253662109375, -2.1939697265625, -1.97540283203125, -1.7568359375, -1.53826904296875, -1.3197021484375, -1.10113525390625, -0.882568359375, -0.66400146484375, -0.4454345703125, -0.22686767578125, -0.00830078125, 0.21026611328125, 0.4288330078125, 0.64739990234375, 0.865966796875, 1.08453369140625, 1.3031005859375, 1.52166748046875, 1.740234375, 1.95880126953125, 2.1773681640625, 2.39593505859375, 2.614501953125, 2.83306884765625, 3.0516357421875, 3.27020263671875, 3.48876953125, 3.70733642578125, 3.9259033203125, 4.14447021484375, 4.363037109375, 4.58160400390625, 4.8001708984375, 5.01873779296875, 5.2373046875, 5.45587158203125, 5.6744384765625, 5.89300537109375, 6.111572265625, 6.33013916015625, 6.5487060546875, 6.76727294921875, 6.98583984375, 7.20440673828125, 7.4229736328125, 7.64154052734375, 7.860107421875, 8.07867431640625, 8.2972412109375, 8.51580810546875, 8.734375]}, "gradients/encoder.encoder.layers.18.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 6.0, 2.0, 8.0, 12.0, 50.0, 316.0, 3023.0, 552.0, 78.0, 21.0, 13.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.775390625, -0.7394561767578125, -0.703521728515625, -0.6675872802734375, -0.63165283203125, -0.5957183837890625, -0.559783935546875, -0.5238494873046875, -0.4879150390625, -0.4519805908203125, -0.416046142578125, -0.3801116943359375, -0.34417724609375, -0.3082427978515625, -0.272308349609375, -0.2363739013671875, -0.200439453125, -0.1645050048828125, -0.128570556640625, -0.0926361083984375, -0.05670166015625, -0.0207672119140625, 0.015167236328125, 0.0511016845703125, 0.0870361328125, 0.1229705810546875, 0.158905029296875, 0.1948394775390625, 0.23077392578125, 0.2667083740234375, 0.302642822265625, 0.3385772705078125, 0.37451171875, 0.4104461669921875, 0.446380615234375, 0.4823150634765625, 0.51824951171875, 0.5541839599609375, 0.590118408203125, 0.6260528564453125, 0.6619873046875, 0.6979217529296875, 0.733856201171875, 0.7697906494140625, 0.80572509765625, 0.8416595458984375, 0.877593994140625, 0.9135284423828125, 0.949462890625, 0.9853973388671875, 1.021331787109375, 1.0572662353515625, 1.09320068359375, 1.1291351318359375, 1.165069580078125, 1.2010040283203125, 1.2369384765625, 1.2728729248046875, 1.308807373046875, 1.3447418212890625, 1.38067626953125, 1.4166107177734375, 1.452545166015625, 1.4884796142578125, 1.5244140625]}, "gradients/encoder.encoder.layers.18.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 5.0, 14.0, 149.0, 636.0, 176.0, 14.0, 6.0, 3.0, 2.0, 3.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.7808456420898438, -3.5183842182159424, -3.255922794342041, -2.9934611320495605, -2.730999708175659, -2.468538284301758, -2.2060766220092773, -1.943615198135376, -1.6811537742614746, -1.4186923503875732, -1.1562308073043823, -0.8937693238258362, -0.63130784034729, -0.36884641647338867, -0.10638487339019775, 0.15607666969299316, 0.41853809356689453, 0.6809995770454407, 0.9434610605239868, 1.2059226036071777, 1.468384027481079, 1.7308454513549805, 1.9933069944381714, 2.2557685375213623, 2.5182299613952637, 2.780691385269165, 3.0431528091430664, 3.305614471435547, 3.5680758953094482, 3.8305373191833496, 4.09299898147583, 4.355460166931152, 4.617920875549316, 4.880382537841797, 5.142843723297119, 5.4053053855896, 5.667766571044922, 5.930228233337402, 6.192689895629883, 6.455151557922363, 6.7176127433776855, 6.980074405670166, 7.242535591125488, 7.504997253417969, 7.767458915710449, 8.02992057800293, 8.292381286621094, 8.554842948913574, 8.817304611206055, 9.079766273498535, 9.342227935791016, 9.60468864440918, 9.86715030670166, 10.12961196899414, 10.392073631286621, 10.654535293579102, 10.916996002197266, 11.179457664489746, 11.441919326782227, 11.70438003540039, 11.966841697692871, 12.229303359985352, 12.491765022277832, 12.754226684570312, 13.016688346862793]}, "gradients/encoder.encoder.layers.18.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 0.0, 3.0, 3.0, 12.0, 11.0, 12.0, 13.0, 20.0, 34.0, 32.0, 42.0, 50.0, 57.0, 42.0, 70.0, 75.0, 71.0, 66.0, 71.0, 62.0, 52.0, 56.0, 36.0, 27.0, 26.0, 21.0, 12.0, 11.0, 6.0, 3.0, 6.0, 2.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1153998374938965, -2.047651767730713, -1.9799038171768188, -1.9121558666229248, -1.8444077968597412, -1.7766598463058472, -1.7089118957519531, -1.6411638259887695, -1.573415756225586, -1.505667805671692, -1.4379197359085083, -1.3701717853546143, -1.3024237155914307, -1.2346757650375366, -1.1669278144836426, -1.099179744720459, -1.031431794166565, -0.9636837840080261, -0.8959357738494873, -0.8281878232955933, -0.7604397535324097, -0.6926918029785156, -0.6249437928199768, -0.557195782661438, -0.48944777250289917, -0.42169976234436035, -0.35395175218582153, -0.2862037718296051, -0.21845576167106628, -0.15070775151252747, -0.08295977115631104, -0.015211760997772217, 0.0525362491607666, 0.12028425186872482, 0.18803225457668304, 0.25578024983406067, 0.3235282599925995, 0.3912762701511383, 0.45902425050735474, 0.5267722606658936, 0.5945202708244324, 0.6622682809829712, 0.73001629114151, 0.7977643013000488, 0.8655122518539429, 0.9332603216171265, 1.0010082721710205, 1.068756341934204, 1.1365042924880981, 1.2042522430419922, 1.2720003128051758, 1.3397482633590698, 1.4074963331222534, 1.4752442836761475, 1.542992353439331, 1.610740303993225, 1.6784882545471191, 1.7462362051010132, 1.8139842748641968, 1.8817322254180908, 1.9494802951812744, 2.017228364944458, 2.0849761962890625, 2.152724266052246, 2.2204723358154297]}, "gradients/encoder.encoder.layers.18.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 7.0, 9.0, 18.0, 27.0, 42.0, 65.0, 98.0, 142.0, 224.0, 413.0, 782.0, 1693.0, 4511.0, 18115.0, 127598.0, 719078.0, 147536.0, 19931.0, 4716.0, 1661.0, 734.0, 409.0, 263.0, 152.0, 100.0, 61.0, 53.0, 30.0, 25.0, 11.0, 12.0, 8.0, 10.0, 8.0, 2.0, 5.0, 3.0, 4.0, 1.0, 1.0, 2.0], "bins": [-2.50390625, -2.4389190673828125, -2.373931884765625, -2.3089447021484375, -2.24395751953125, -2.1789703369140625, -2.113983154296875, -2.0489959716796875, -1.9840087890625, -1.9190216064453125, -1.854034423828125, -1.7890472412109375, -1.72406005859375, -1.6590728759765625, -1.594085693359375, -1.5290985107421875, -1.464111328125, -1.3991241455078125, -1.334136962890625, -1.2691497802734375, -1.20416259765625, -1.1391754150390625, -1.074188232421875, -1.0092010498046875, -0.9442138671875, -0.8792266845703125, -0.814239501953125, -0.7492523193359375, -0.68426513671875, -0.6192779541015625, -0.554290771484375, -0.4893035888671875, -0.42431640625, -0.3593292236328125, -0.294342041015625, -0.2293548583984375, -0.16436767578125, -0.0993804931640625, -0.034393310546875, 0.0305938720703125, 0.0955810546875, 0.1605682373046875, 0.225555419921875, 0.2905426025390625, 0.35552978515625, 0.4205169677734375, 0.485504150390625, 0.5504913330078125, 0.615478515625, 0.6804656982421875, 0.745452880859375, 0.8104400634765625, 0.87542724609375, 0.9404144287109375, 1.005401611328125, 1.0703887939453125, 1.1353759765625, 1.2003631591796875, 1.265350341796875, 1.3303375244140625, 1.39532470703125, 1.4603118896484375, 1.525299072265625, 1.5902862548828125, 1.6552734375]}, "gradients/encoder.encoder.layers.18.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 4.0, 3.0, 3.0, 8.0, 12.0, 19.0, 22.0, 30.0, 50.0, 55.0, 78.0, 103.0, 83.0, 83.0, 82.0, 87.0, 69.0, 68.0, 33.0, 32.0, 25.0, 17.0, 13.0, 14.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.3125, -0.29920196533203125, -0.2859039306640625, -0.27260589599609375, -0.259307861328125, -0.24600982666015625, -0.2327117919921875, -0.21941375732421875, -0.20611572265625, -0.19281768798828125, -0.1795196533203125, -0.16622161865234375, -0.152923583984375, -0.13962554931640625, -0.1263275146484375, -0.11302947998046875, -0.0997314453125, -0.08643341064453125, -0.0731353759765625, -0.05983734130859375, -0.046539306640625, -0.03324127197265625, -0.0199432373046875, -0.00664520263671875, 0.00665283203125, 0.01995086669921875, 0.0332489013671875, 0.04654693603515625, 0.059844970703125, 0.07314300537109375, 0.0864410400390625, 0.09973907470703125, 0.113037109375, 0.12633514404296875, 0.1396331787109375, 0.15293121337890625, 0.166229248046875, 0.17952728271484375, 0.1928253173828125, 0.20612335205078125, 0.21942138671875, 0.23271942138671875, 0.2460174560546875, 0.25931549072265625, 0.272613525390625, 0.28591156005859375, 0.2992095947265625, 0.31250762939453125, 0.3258056640625, 0.33910369873046875, 0.3524017333984375, 0.36569976806640625, 0.378997802734375, 0.39229583740234375, 0.4055938720703125, 0.41889190673828125, 0.43218994140625, 0.44548797607421875, 0.4587860107421875, 0.47208404541015625, 0.485382080078125, 0.49868011474609375, 0.5119781494140625, 0.5252761840820312, 0.53857421875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 4.0, 4.0, 7.0, 8.0, 26.0, 22.0, 45.0, 61.0, 86.0, 175.0, 338.0, 719.0, 1893.0, 7265.0, 59786.0, 825012.0, 137053.0, 11570.0, 2631.0, 928.0, 397.0, 205.0, 101.0, 83.0, 43.0, 30.0, 15.0, 16.0, 6.0, 9.0, 6.0, 4.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.064453125, -1.98974609375, -1.9150390625, -1.84033203125, -1.765625, -1.69091796875, -1.6162109375, -1.54150390625, -1.466796875, -1.39208984375, -1.3173828125, -1.24267578125, -1.16796875, -1.09326171875, -1.0185546875, -0.94384765625, -0.869140625, -0.79443359375, -0.7197265625, -0.64501953125, -0.5703125, -0.49560546875, -0.4208984375, -0.34619140625, -0.271484375, -0.19677734375, -0.1220703125, -0.04736328125, 0.02734375, 0.10205078125, 0.1767578125, 0.25146484375, 0.326171875, 0.40087890625, 0.4755859375, 0.55029296875, 0.625, 0.69970703125, 0.7744140625, 0.84912109375, 0.923828125, 0.99853515625, 1.0732421875, 1.14794921875, 1.22265625, 1.29736328125, 1.3720703125, 1.44677734375, 1.521484375, 1.59619140625, 1.6708984375, 1.74560546875, 1.8203125, 1.89501953125, 1.9697265625, 2.04443359375, 2.119140625, 2.19384765625, 2.2685546875, 2.34326171875, 2.41796875, 2.49267578125, 2.5673828125, 2.64208984375, 2.716796875]}, "gradients/encoder.encoder.layers.18.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 5.0, 0.0, 1.0, 3.0, 6.0, 4.0, 10.0, 19.0, 16.0, 15.0, 25.0, 40.0, 35.0, 56.0, 72.0, 73.0, 83.0, 84.0, 91.0, 76.0, 73.0, 46.0, 41.0, 28.0, 36.0, 21.0, 6.0, 11.0, 10.0, 10.0, 3.0, 5.0, 4.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.32421875, -1.269989013671875, -1.21575927734375, -1.161529541015625, -1.1072998046875, -1.053070068359375, -0.99884033203125, -0.944610595703125, -0.890380859375, -0.836151123046875, -0.78192138671875, -0.727691650390625, -0.6734619140625, -0.619232177734375, -0.56500244140625, -0.510772705078125, -0.45654296875, -0.402313232421875, -0.34808349609375, -0.293853759765625, -0.2396240234375, -0.185394287109375, -0.13116455078125, -0.076934814453125, -0.022705078125, 0.031524658203125, 0.08575439453125, 0.139984130859375, 0.1942138671875, 0.248443603515625, 0.30267333984375, 0.356903076171875, 0.4111328125, 0.465362548828125, 0.51959228515625, 0.573822021484375, 0.6280517578125, 0.682281494140625, 0.73651123046875, 0.790740966796875, 0.844970703125, 0.899200439453125, 0.95343017578125, 1.007659912109375, 1.0618896484375, 1.116119384765625, 1.17034912109375, 1.224578857421875, 1.27880859375, 1.333038330078125, 1.38726806640625, 1.441497802734375, 1.4957275390625, 1.549957275390625, 1.60418701171875, 1.658416748046875, 1.712646484375, 1.766876220703125, 1.82110595703125, 1.875335693359375, 1.9295654296875, 1.983795166015625, 2.03802490234375, 2.092254638671875, 2.146484375]}, "gradients/encoder.encoder.layers.18.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 0.0, 2.0, 5.0, 4.0, 8.0, 8.0, 4.0, 21.0, 25.0, 25.0, 33.0, 70.0, 115.0, 204.0, 392.0, 764.0, 1810.0, 6238.0, 34816.0, 403030.0, 539303.0, 49861.0, 7814.0, 2239.0, 857.0, 398.0, 198.0, 119.0, 63.0, 42.0, 29.0, 13.0, 11.0, 13.0, 9.0, 6.0, 7.0, 3.0, 2.0, 2.0, 4.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5087890625, -0.49066925048828125, -0.4725494384765625, -0.45442962646484375, -0.436309814453125, -0.41819000244140625, -0.4000701904296875, -0.38195037841796875, -0.36383056640625, -0.34571075439453125, -0.3275909423828125, -0.30947113037109375, -0.291351318359375, -0.27323150634765625, -0.2551116943359375, -0.23699188232421875, -0.2188720703125, -0.20075225830078125, -0.1826324462890625, -0.16451263427734375, -0.146392822265625, -0.12827301025390625, -0.1101531982421875, -0.09203338623046875, -0.07391357421875, -0.05579376220703125, -0.0376739501953125, -0.01955413818359375, -0.001434326171875, 0.01668548583984375, 0.0348052978515625, 0.05292510986328125, 0.071044921875, 0.08916473388671875, 0.1072845458984375, 0.12540435791015625, 0.143524169921875, 0.16164398193359375, 0.1797637939453125, 0.19788360595703125, 0.21600341796875, 0.23412322998046875, 0.2522430419921875, 0.27036285400390625, 0.288482666015625, 0.30660247802734375, 0.3247222900390625, 0.34284210205078125, 0.3609619140625, 0.37908172607421875, 0.3972015380859375, 0.41532135009765625, 0.433441162109375, 0.45156097412109375, 0.4696807861328125, 0.48780059814453125, 0.50592041015625, 0.5240402221679688, 0.5421600341796875, 0.5602798461914062, 0.578399658203125, 0.5965194702148438, 0.6146392822265625, 0.6327590942382812, 0.65087890625]}, "gradients/encoder.encoder.layers.18.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 6.0, 7.0, 11.0, 21.0, 38.0, 56.0, 95.0, 173.0, 211.0, 180.0, 102.0, 60.0, 29.0, 12.0, 9.0, 0.0, 6.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00018477439880371094, -0.00018032174557447433, -0.00017586909234523773, -0.00017141643911600113, -0.00016696378588676453, -0.00016251113265752792, -0.00015805847942829132, -0.00015360582619905472, -0.00014915317296981812, -0.0001447005197405815, -0.0001402478665113449, -0.0001357952132821083, -0.0001313425600528717, -0.0001268899068236351, -0.0001224372535943985, -0.0001179846003651619, -0.00011353194713592529, -0.00010907929390668869, -0.00010462664067745209, -0.00010017398744821548, -9.572133421897888e-05, -9.126868098974228e-05, -8.681602776050568e-05, -8.236337453126907e-05, -7.791072130203247e-05, -7.345806807279587e-05, -6.900541484355927e-05, -6.455276161432266e-05, -6.010010838508606e-05, -5.564745515584946e-05, -5.1194801926612854e-05, -4.674214869737625e-05, -4.228949546813965e-05, -3.7836842238903046e-05, -3.338418900966644e-05, -2.893153578042984e-05, -2.4478882551193237e-05, -2.0026229321956635e-05, -1.5573576092720032e-05, -1.1120922863483429e-05, -6.668269634246826e-06, -2.2156164050102234e-06, 2.2370368242263794e-06, 6.689690053462982e-06, 1.1142343282699585e-05, 1.5594996511936188e-05, 2.004764974117279e-05, 2.4500302970409393e-05, 2.8952956199645996e-05, 3.34056094288826e-05, 3.78582626581192e-05, 4.2310915887355804e-05, 4.676356911659241e-05, 5.121622234582901e-05, 5.566887557506561e-05, 6.0121528804302216e-05, 6.457418203353882e-05, 6.902683526277542e-05, 7.347948849201202e-05, 7.793214172124863e-05, 8.238479495048523e-05, 8.683744817972183e-05, 9.129010140895844e-05, 9.574275463819504e-05, 0.00010019540786743164]}, "gradients/encoder.encoder.layers.18.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 4.0, 1.0, 5.0, 10.0, 11.0, 21.0, 22.0, 31.0, 67.0, 91.0, 202.0, 504.0, 1435.0, 5903.0, 50407.0, 762704.0, 209927.0, 13227.0, 2536.0, 792.0, 303.0, 163.0, 82.0, 41.0, 24.0, 16.0, 8.0, 10.0, 2.0, 7.0, 3.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.6416015625, -0.6192626953125, -0.596923828125, -0.5745849609375, -0.55224609375, -0.5299072265625, -0.507568359375, -0.4852294921875, -0.462890625, -0.4405517578125, -0.418212890625, -0.3958740234375, -0.37353515625, -0.3511962890625, -0.328857421875, -0.3065185546875, -0.2841796875, -0.2618408203125, -0.239501953125, -0.2171630859375, -0.19482421875, -0.1724853515625, -0.150146484375, -0.1278076171875, -0.10546875, -0.0831298828125, -0.060791015625, -0.0384521484375, -0.01611328125, 0.0062255859375, 0.028564453125, 0.0509033203125, 0.0732421875, 0.0955810546875, 0.117919921875, 0.1402587890625, 0.16259765625, 0.1849365234375, 0.207275390625, 0.2296142578125, 0.251953125, 0.2742919921875, 0.296630859375, 0.3189697265625, 0.34130859375, 0.3636474609375, 0.385986328125, 0.4083251953125, 0.4306640625, 0.4530029296875, 0.475341796875, 0.4976806640625, 0.52001953125, 0.5423583984375, 0.564697265625, 0.5870361328125, 0.609375, 0.6317138671875, 0.654052734375, 0.6763916015625, 0.69873046875, 0.7210693359375, 0.743408203125, 0.7657470703125, 0.7880859375]}, "gradients/encoder.encoder.layers.18.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 3.0, 3.0, 6.0, 6.0, 8.0, 9.0, 16.0, 22.0, 44.0, 50.0, 77.0, 115.0, 120.0, 161.0, 115.0, 95.0, 61.0, 32.0, 28.0, 7.0, 6.0, 6.0, 3.0, 4.0, 2.0, 6.0, 3.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.46533203125, -0.4508018493652344, -0.43627166748046875, -0.4217414855957031, -0.4072113037109375, -0.3926811218261719, -0.37815093994140625, -0.3636207580566406, -0.349090576171875, -0.3345603942871094, -0.32003021240234375, -0.3055000305175781, -0.2909698486328125, -0.2764396667480469, -0.26190948486328125, -0.24737930297851562, -0.23284912109375, -0.21831893920898438, -0.20378875732421875, -0.18925857543945312, -0.1747283935546875, -0.16019821166992188, -0.14566802978515625, -0.13113784790039062, -0.116607666015625, -0.10207748413085938, -0.08754730224609375, -0.07301712036132812, -0.0584869384765625, -0.043956756591796875, -0.02942657470703125, -0.014896392822265625, -0.0003662109375, 0.014163970947265625, 0.02869415283203125, 0.043224334716796875, 0.0577545166015625, 0.07228469848632812, 0.08681488037109375, 0.10134506225585938, 0.115875244140625, 0.13040542602539062, 0.14493560791015625, 0.15946578979492188, 0.1739959716796875, 0.18852615356445312, 0.20305633544921875, 0.21758651733398438, 0.23211669921875, 0.24664688110351562, 0.26117706298828125, 0.2757072448730469, 0.2902374267578125, 0.3047676086425781, 0.31929779052734375, 0.3338279724121094, 0.348358154296875, 0.3628883361816406, 0.37741851806640625, 0.3919486999511719, 0.4064788818359375, 0.4210090637207031, 0.43553924560546875, 0.4500694274902344, 0.464599609375]}, "gradients/encoder.encoder.layers.18.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 0.0, 13.0, 43.0, 130.0, 390.0, 303.0, 81.0, 31.0, 8.0, 6.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.776620864868164, -6.20587158203125, -5.635122299194336, -5.064373016357422, -4.493623733520508, -3.9228744506835938, -3.3521251678466797, -2.7813758850097656, -2.2106266021728516, -1.6398773193359375, -1.0691280364990234, -0.4983787536621094, 0.07237052917480469, 0.6431198120117188, 1.2138690948486328, 1.7846183776855469, 2.355367660522461, 2.926116943359375, 3.496866226196289, 4.067615509033203, 4.638364791870117, 5.209114074707031, 5.779863357543945, 6.350612640380859, 6.921361923217773, 7.4921112060546875, 8.062860488891602, 8.633609771728516, 9.20435905456543, 9.775108337402344, 10.345857620239258, 10.916606903076172, 11.487358093261719, 12.058107376098633, 12.628856658935547, 13.199605941772461, 13.770355224609375, 14.341104507446289, 14.911853790283203, 15.482603073120117, 16.05335235595703, 16.624101638793945, 17.19485092163086, 17.765600204467773, 18.336349487304688, 18.9070987701416, 19.477848052978516, 20.04859733581543, 20.619346618652344, 21.190095901489258, 21.760845184326172, 22.331594467163086, 22.90234375, 23.473093032836914, 24.043842315673828, 24.614591598510742, 25.185340881347656, 25.75609016418457, 26.326839447021484, 26.8975887298584, 27.468338012695312, 28.039087295532227, 28.60983657836914, 29.180585861206055, 29.75133514404297]}, "gradients/encoder.encoder.layers.18.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 1.0, 1.0, 3.0, 2.0, 6.0, 4.0, 8.0, 8.0, 13.0, 18.0, 24.0, 20.0, 30.0, 21.0, 34.0, 45.0, 48.0, 49.0, 50.0, 49.0, 58.0, 53.0, 50.0, 53.0, 62.0, 40.0, 41.0, 34.0, 36.0, 30.0, 24.0, 19.0, 22.0, 11.0, 11.0, 11.0, 2.0, 4.0, 3.0, 6.0, 2.0, 1.0, 5.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-7.640623569488525, -7.410745143890381, -7.180866241455078, -6.950987815856934, -6.721109390258789, -6.4912309646606445, -6.261352062225342, -6.031473636627197, -5.8015947341918945, -5.57171630859375, -5.341837406158447, -5.111958980560303, -4.882080554962158, -4.6522016525268555, -4.422323226928711, -4.192444801330566, -3.962566375732422, -3.7326877117156982, -3.5028092861175537, -3.27293062210083, -3.0430521965026855, -2.813173532485962, -2.5832948684692383, -2.3534164428710938, -2.12353777885437, -1.893659234046936, -1.663780689239502, -1.4339020252227783, -1.2040234804153442, -0.9741449356079102, -0.7442662715911865, -0.5143877267837524, -0.28450918197631836, -0.05463060736656189, 0.17524796724319458, 0.40512657165527344, 0.6350051164627075, 0.8648836612701416, 1.0947623252868652, 1.3246408700942993, 1.5545194149017334, 1.7843979597091675, 2.0142765045166016, 2.244155168533325, 2.474033832550049, 2.7039122581481934, 2.933790922164917, 3.1636695861816406, 3.393548011779785, 3.623426675796509, 3.8533051013946533, 4.083183765411377, 4.3130621910095215, 4.542941093444824, 4.772819519042969, 5.002697944641113, 5.232576370239258, 5.462454795837402, 5.692333698272705, 5.92221212387085, 6.152090549468994, 6.381969451904297, 6.611847877502441, 6.841726303100586, 7.071605205535889]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 2.0, 3.0, 6.0, 5.0, 11.0, 13.0, 16.0, 33.0, 26.0, 51.0, 76.0, 156.0, 247.0, 398.0, 806.0, 1415.0, 3273.0, 9134.0, 37121.0, 584785.0, 3463139.0, 70218.0, 13732.0, 4693.0, 2059.0, 1050.0, 622.0, 339.0, 250.0, 156.0, 117.0, 70.0, 57.0, 34.0, 40.0, 26.0, 31.0, 9.0, 10.0, 13.0, 10.0, 9.0, 3.0, 8.0, 5.0, 2.0, 2.0, 5.0, 4.0, 1.0, 0.0, 4.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.615234375, -1.5389404296875, -1.462646484375, -1.3863525390625, -1.31005859375, -1.2337646484375, -1.157470703125, -1.0811767578125, -1.0048828125, -0.9285888671875, -0.852294921875, -0.7760009765625, -0.69970703125, -0.6234130859375, -0.547119140625, -0.4708251953125, -0.39453125, -0.3182373046875, -0.241943359375, -0.1656494140625, -0.08935546875, -0.0130615234375, 0.063232421875, 0.1395263671875, 0.2158203125, 0.2921142578125, 0.368408203125, 0.4447021484375, 0.52099609375, 0.5972900390625, 0.673583984375, 0.7498779296875, 0.826171875, 0.9024658203125, 0.978759765625, 1.0550537109375, 1.13134765625, 1.2076416015625, 1.283935546875, 1.3602294921875, 1.4365234375, 1.5128173828125, 1.589111328125, 1.6654052734375, 1.74169921875, 1.8179931640625, 1.894287109375, 1.9705810546875, 2.046875, 2.1231689453125, 2.199462890625, 2.2757568359375, 2.35205078125, 2.4283447265625, 2.504638671875, 2.5809326171875, 2.6572265625, 2.7335205078125, 2.809814453125, 2.8861083984375, 2.96240234375, 3.0386962890625, 3.114990234375, 3.1912841796875, 3.267578125]}, "gradients/encoder.encoder.layers.17.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 4.0, 1.0, 0.0, 2.0, 3.0, 3.0, 6.0, 11.0, 17.0, 19.0, 28.0, 21.0, 54.0, 49.0, 73.0, 71.0, 83.0, 112.0, 74.0, 85.0, 65.0, 57.0, 45.0, 39.0, 26.0, 22.0, 16.0, 7.0, 5.0, 6.0, 3.0, 2.0, 2.0, 0.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.289306640625, -0.2765617370605469, -0.26381683349609375, -0.2510719299316406, -0.2383270263671875, -0.22558212280273438, -0.21283721923828125, -0.20009231567382812, -0.187347412109375, -0.17460250854492188, -0.16185760498046875, -0.14911270141601562, -0.1363677978515625, -0.12362289428710938, -0.11087799072265625, -0.09813308715820312, -0.08538818359375, -0.07264328002929688, -0.05989837646484375, -0.047153472900390625, -0.0344085693359375, -0.021663665771484375, -0.00891876220703125, 0.003826141357421875, 0.016571044921875, 0.029315948486328125, 0.04206085205078125, 0.054805755615234375, 0.0675506591796875, 0.08029556274414062, 0.09304046630859375, 0.10578536987304688, 0.1185302734375, 0.13127517700195312, 0.14402008056640625, 0.15676498413085938, 0.1695098876953125, 0.18225479125976562, 0.19499969482421875, 0.20774459838867188, 0.220489501953125, 0.23323440551757812, 0.24597930908203125, 0.2587242126464844, 0.2714691162109375, 0.2842140197753906, 0.29695892333984375, 0.3097038269042969, 0.32244873046875, 0.3351936340332031, 0.34793853759765625, 0.3606834411621094, 0.3734283447265625, 0.3861732482910156, 0.39891815185546875, 0.4116630554199219, 0.424407958984375, 0.4371528625488281, 0.44989776611328125, 0.4626426696777344, 0.4753875732421875, 0.4881324768066406, 0.5008773803710938, 0.5136222839355469, 0.5263671875]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 2.0, 2.0, 3.0, 5.0, 9.0, 9.0, 31.0, 39.0, 64.0, 173.0, 432.0, 1908.0, 16493.0, 4140130.0, 31004.0, 2851.0, 628.0, 240.0, 128.0, 50.0, 35.0, 27.0, 10.0, 6.0, 8.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.5, -7.28924560546875, -7.0784912109375, -6.86773681640625, -6.656982421875, -6.44622802734375, -6.2354736328125, -6.02471923828125, -5.81396484375, -5.60321044921875, -5.3924560546875, -5.18170166015625, -4.970947265625, -4.76019287109375, -4.5494384765625, -4.33868408203125, -4.1279296875, -3.91717529296875, -3.7064208984375, -3.49566650390625, -3.284912109375, -3.07415771484375, -2.8634033203125, -2.65264892578125, -2.44189453125, -2.23114013671875, -2.0203857421875, -1.80963134765625, -1.598876953125, -1.38812255859375, -1.1773681640625, -0.96661376953125, -0.755859375, -0.54510498046875, -0.3343505859375, -0.12359619140625, 0.087158203125, 0.29791259765625, 0.5086669921875, 0.71942138671875, 0.93017578125, 1.14093017578125, 1.3516845703125, 1.56243896484375, 1.773193359375, 1.98394775390625, 2.1947021484375, 2.40545654296875, 2.6162109375, 2.82696533203125, 3.0377197265625, 3.24847412109375, 3.459228515625, 3.66998291015625, 3.8807373046875, 4.09149169921875, 4.30224609375, 4.51300048828125, 4.7237548828125, 4.93450927734375, 5.145263671875, 5.35601806640625, 5.5667724609375, 5.77752685546875, 5.98828125]}, "gradients/encoder.encoder.layers.17.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 5.0, 2.0, 1.0, 1.0, 1.0, 2.0, 3.0, 6.0, 14.0, 13.0, 32.0, 54.0, 247.0, 2160.0, 1245.0, 186.0, 50.0, 18.0, 10.0, 8.0, 6.0, 6.0, 2.0, 3.0, 5.0, 2.0, 1.0, 3.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.00390625, -0.950775146484375, -0.89764404296875, -0.844512939453125, -0.7913818359375, -0.738250732421875, -0.68511962890625, -0.631988525390625, -0.578857421875, -0.525726318359375, -0.47259521484375, -0.419464111328125, -0.3663330078125, -0.313201904296875, -0.26007080078125, -0.206939697265625, -0.15380859375, -0.100677490234375, -0.04754638671875, 0.005584716796875, 0.0587158203125, 0.111846923828125, 0.16497802734375, 0.218109130859375, 0.271240234375, 0.324371337890625, 0.37750244140625, 0.430633544921875, 0.4837646484375, 0.536895751953125, 0.59002685546875, 0.643157958984375, 0.6962890625, 0.749420166015625, 0.80255126953125, 0.855682373046875, 0.9088134765625, 0.961944580078125, 1.01507568359375, 1.068206787109375, 1.121337890625, 1.174468994140625, 1.22760009765625, 1.280731201171875, 1.3338623046875, 1.386993408203125, 1.44012451171875, 1.493255615234375, 1.54638671875, 1.599517822265625, 1.65264892578125, 1.705780029296875, 1.7589111328125, 1.812042236328125, 1.86517333984375, 1.918304443359375, 1.971435546875, 2.024566650390625, 2.07769775390625, 2.130828857421875, 2.1839599609375, 2.237091064453125, 2.29022216796875, 2.343353271484375, 2.396484375]}, "gradients/encoder.encoder.layers.17.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 20.0, 731.0, 243.0, 9.0, 6.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-10.54916763305664, -9.574657440185547, -8.600146293640137, -7.625636100769043, -6.651125907897949, -5.676615238189697, -4.702104568481445, -3.7275943756103516, -2.7530837059020996, -1.7785732746124268, -0.8040627241134644, 0.17044782638549805, 1.144958257675171, 2.1194686889648438, 3.0939793586730957, 4.0684895515441895, 5.043000221252441, 6.017510890960693, 6.992021083831787, 7.966531753540039, 8.941041946411133, 9.915552139282227, 10.890063285827637, 11.86457347869873, 12.83908462524414, 13.813594818115234, 14.788105964660645, 15.762616157531738, 16.73712730407715, 17.711637496948242, 18.686147689819336, 19.66065788269043, 20.635168075561523, 21.609678268432617, 22.58418846130371, 23.558700561523438, 24.53321075439453, 25.507720947265625, 26.48223114013672, 27.456741333007812, 28.431251525878906, 29.40576171875, 30.380271911621094, 31.354782104492188, 32.32929229736328, 33.303802490234375, 34.27831268310547, 35.25282287597656, 36.22733688354492, 37.201847076416016, 38.17635726928711, 39.1508674621582, 40.1253776550293, 41.09988784790039, 42.07440185546875, 43.048912048339844, 44.02341842651367, 44.997928619384766, 45.97243881225586, 46.94694900512695, 47.92145919799805, 48.89596939086914, 49.8704833984375, 50.844993591308594, 51.81950378417969]}, "gradients/encoder.encoder.layers.17.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 4.0, 5.0, 5.0, 13.0, 14.0, 45.0, 60.0, 83.0, 109.0, 134.0, 126.0, 136.0, 113.0, 61.0, 43.0, 26.0, 17.0, 9.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.170922756195068, -6.939195156097412, -6.707467555999756, -6.4757399559021, -6.244012355804443, -6.012284755706787, -5.780557155609131, -5.548829555511475, -5.317101955413818, -5.085374355316162, -4.853646755218506, -4.62191915512085, -4.390191555023193, -4.158463954925537, -3.926736354827881, -3.6950087547302246, -3.4632811546325684, -3.231553554534912, -2.999825954437256, -2.7680983543395996, -2.5363707542419434, -2.304643154144287, -2.072915554046631, -1.8411879539489746, -1.6094603538513184, -1.377732753753662, -1.1460051536560059, -0.9142775535583496, -0.6825499534606934, -0.4508223533630371, -0.21909475326538086, 0.01263284683227539, 0.24435997009277344, 0.4760875701904297, 0.7078151702880859, 0.9395427703857422, 1.1712703704833984, 1.4029979705810547, 1.634725570678711, 1.8664531707763672, 2.0981807708740234, 2.3299083709716797, 2.561635971069336, 2.793363571166992, 3.0250911712646484, 3.2568187713623047, 3.488546371459961, 3.720273971557617, 3.9520015716552734, 4.18372917175293, 4.415456771850586, 4.647184371948242, 4.878911972045898, 5.110639572143555, 5.342367172241211, 5.574094772338867, 5.805822372436523, 6.03754997253418, 6.269277572631836, 6.501005172729492, 6.732732772827148, 6.964460372924805, 7.196187973022461, 7.427915573120117, 7.659643173217773]}, "gradients/encoder.encoder.layers.17.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 4.0, 4.0, 4.0, 6.0, 10.0, 8.0, 9.0, 24.0, 29.0, 42.0, 49.0, 94.0, 164.0, 263.0, 550.0, 1192.0, 3295.0, 16814.0, 281744.0, 698127.0, 37585.0, 5316.0, 1673.0, 722.0, 332.0, 170.0, 121.0, 73.0, 43.0, 26.0, 21.0, 12.0, 12.0, 9.0, 6.0, 4.0, 6.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.31640625, -2.2279052734375, -2.139404296875, -2.0509033203125, -1.96240234375, -1.8739013671875, -1.785400390625, -1.6968994140625, -1.6083984375, -1.5198974609375, -1.431396484375, -1.3428955078125, -1.25439453125, -1.1658935546875, -1.077392578125, -0.9888916015625, -0.900390625, -0.8118896484375, -0.723388671875, -0.6348876953125, -0.54638671875, -0.4578857421875, -0.369384765625, -0.2808837890625, -0.1923828125, -0.1038818359375, -0.015380859375, 0.0731201171875, 0.16162109375, 0.2501220703125, 0.338623046875, 0.4271240234375, 0.515625, 0.6041259765625, 0.692626953125, 0.7811279296875, 0.86962890625, 0.9581298828125, 1.046630859375, 1.1351318359375, 1.2236328125, 1.3121337890625, 1.400634765625, 1.4891357421875, 1.57763671875, 1.6661376953125, 1.754638671875, 1.8431396484375, 1.931640625, 2.0201416015625, 2.108642578125, 2.1971435546875, 2.28564453125, 2.3741455078125, 2.462646484375, 2.5511474609375, 2.6396484375, 2.7281494140625, 2.816650390625, 2.9051513671875, 2.99365234375, 3.0821533203125, 3.170654296875, 3.2591552734375, 3.34765625]}, "gradients/encoder.encoder.layers.17.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 4.0, 3.0, 2.0, 5.0, 3.0, 19.0, 37.0, 35.0, 71.0, 91.0, 132.0, 128.0, 137.0, 84.0, 102.0, 70.0, 40.0, 17.0, 7.0, 5.0, 6.0, 6.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.39892578125, -0.37984466552734375, -0.3607635498046875, -0.34168243408203125, -0.322601318359375, -0.30352020263671875, -0.2844390869140625, -0.26535797119140625, -0.24627685546875, -0.22719573974609375, -0.2081146240234375, -0.18903350830078125, -0.169952392578125, -0.15087127685546875, -0.1317901611328125, -0.11270904541015625, -0.0936279296875, -0.07454681396484375, -0.0554656982421875, -0.03638458251953125, -0.017303466796875, 0.00177764892578125, 0.0208587646484375, 0.03993988037109375, 0.05902099609375, 0.07810211181640625, 0.0971832275390625, 0.11626434326171875, 0.135345458984375, 0.15442657470703125, 0.1735076904296875, 0.19258880615234375, 0.211669921875, 0.23075103759765625, 0.2498321533203125, 0.26891326904296875, 0.287994384765625, 0.30707550048828125, 0.3261566162109375, 0.34523773193359375, 0.36431884765625, 0.38339996337890625, 0.4024810791015625, 0.42156219482421875, 0.440643310546875, 0.45972442626953125, 0.4788055419921875, 0.49788665771484375, 0.5169677734375, 0.5360488891601562, 0.5551300048828125, 0.5742111206054688, 0.593292236328125, 0.6123733520507812, 0.6314544677734375, 0.6505355834960938, 0.66961669921875, 0.6886978149414062, 0.7077789306640625, 0.7268600463867188, 0.745941162109375, 0.7650222778320312, 0.7841033935546875, 0.8031845092773438, 0.822265625]}, "gradients/encoder.encoder.layers.17.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 2.0, 1.0, 5.0, 16.0, 17.0, 27.0, 32.0, 49.0, 84.0, 120.0, 224.0, 434.0, 975.0, 2879.0, 13784.0, 108487.0, 662602.0, 226241.0, 25254.0, 4621.0, 1344.0, 603.0, 304.0, 190.0, 106.0, 50.0, 39.0, 33.0, 13.0, 13.0, 6.0, 5.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0], "bins": [-1.8037109375, -1.7558135986328125, -1.707916259765625, -1.6600189208984375, -1.61212158203125, -1.5642242431640625, -1.516326904296875, -1.4684295654296875, -1.4205322265625, -1.3726348876953125, -1.324737548828125, -1.2768402099609375, -1.22894287109375, -1.1810455322265625, -1.133148193359375, -1.0852508544921875, -1.037353515625, -0.9894561767578125, -0.941558837890625, -0.8936614990234375, -0.84576416015625, -0.7978668212890625, -0.749969482421875, -0.7020721435546875, -0.6541748046875, -0.6062774658203125, -0.558380126953125, -0.5104827880859375, -0.46258544921875, -0.4146881103515625, -0.366790771484375, -0.3188934326171875, -0.27099609375, -0.2230987548828125, -0.175201416015625, -0.1273040771484375, -0.07940673828125, -0.0315093994140625, 0.016387939453125, 0.0642852783203125, 0.1121826171875, 0.1600799560546875, 0.207977294921875, 0.2558746337890625, 0.30377197265625, 0.3516693115234375, 0.399566650390625, 0.4474639892578125, 0.495361328125, 0.5432586669921875, 0.591156005859375, 0.6390533447265625, 0.68695068359375, 0.7348480224609375, 0.782745361328125, 0.8306427001953125, 0.8785400390625, 0.9264373779296875, 0.974334716796875, 1.0222320556640625, 1.07012939453125, 1.1180267333984375, 1.165924072265625, 1.2138214111328125, 1.26171875]}, "gradients/encoder.encoder.layers.17.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 3.0, 3.0, 4.0, 10.0, 5.0, 12.0, 16.0, 19.0, 14.0, 19.0, 32.0, 31.0, 34.0, 35.0, 42.0, 27.0, 63.0, 41.0, 55.0, 49.0, 40.0, 59.0, 50.0, 57.0, 47.0, 40.0, 43.0, 30.0, 28.0, 23.0, 14.0, 14.0, 13.0, 12.0, 11.0, 3.0, 4.0, 2.0, 5.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.28125, -1.2464828491210938, -1.2117156982421875, -1.1769485473632812, -1.142181396484375, -1.1074142456054688, -1.0726470947265625, -1.0378799438476562, -1.00311279296875, -0.9683456420898438, -0.9335784912109375, -0.8988113403320312, -0.864044189453125, -0.8292770385742188, -0.7945098876953125, -0.7597427368164062, -0.7249755859375, -0.6902084350585938, -0.6554412841796875, -0.6206741333007812, -0.585906982421875, -0.5511398315429688, -0.5163726806640625, -0.48160552978515625, -0.44683837890625, -0.41207122802734375, -0.3773040771484375, -0.34253692626953125, -0.307769775390625, -0.27300262451171875, -0.2382354736328125, -0.20346832275390625, -0.168701171875, -0.13393402099609375, -0.0991668701171875, -0.06439971923828125, -0.029632568359375, 0.00513458251953125, 0.0399017333984375, 0.07466888427734375, 0.10943603515625, 0.14420318603515625, 0.1789703369140625, 0.21373748779296875, 0.248504638671875, 0.28327178955078125, 0.3180389404296875, 0.35280609130859375, 0.3875732421875, 0.42234039306640625, 0.4571075439453125, 0.49187469482421875, 0.526641845703125, 0.5614089965820312, 0.5961761474609375, 0.6309432983398438, 0.66571044921875, 0.7004776000976562, 0.7352447509765625, 0.7700119018554688, 0.804779052734375, 0.8395462036132812, 0.8743133544921875, 0.9090805053710938, 0.94384765625]}, "gradients/encoder.encoder.layers.17.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 4.0, 3.0, 6.0, 15.0, 25.0, 28.0, 60.0, 137.0, 491.0, 1947.0, 19531.0, 922232.0, 98767.0, 4165.0, 730.0, 224.0, 98.0, 35.0, 23.0, 11.0, 11.0, 7.0, 5.0, 5.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7685546875, -1.7239990234375, -1.679443359375, -1.6348876953125, -1.59033203125, -1.5457763671875, -1.501220703125, -1.4566650390625, -1.412109375, -1.3675537109375, -1.322998046875, -1.2784423828125, -1.23388671875, -1.1893310546875, -1.144775390625, -1.1002197265625, -1.0556640625, -1.0111083984375, -0.966552734375, -0.9219970703125, -0.87744140625, -0.8328857421875, -0.788330078125, -0.7437744140625, -0.69921875, -0.6546630859375, -0.610107421875, -0.5655517578125, -0.52099609375, -0.4764404296875, -0.431884765625, -0.3873291015625, -0.3427734375, -0.2982177734375, -0.253662109375, -0.2091064453125, -0.16455078125, -0.1199951171875, -0.075439453125, -0.0308837890625, 0.013671875, 0.0582275390625, 0.102783203125, 0.1473388671875, 0.19189453125, 0.2364501953125, 0.281005859375, 0.3255615234375, 0.3701171875, 0.4146728515625, 0.459228515625, 0.5037841796875, 0.54833984375, 0.5928955078125, 0.637451171875, 0.6820068359375, 0.7265625, 0.7711181640625, 0.815673828125, 0.8602294921875, 0.90478515625, 0.9493408203125, 0.993896484375, 1.0384521484375, 1.0830078125]}, "gradients/encoder.encoder.layers.17.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 7.0, 6.0, 6.0, 17.0, 21.0, 35.0, 43.0, 51.0, 86.0, 90.0, 93.0, 102.0, 103.0, 95.0, 79.0, 50.0, 41.0, 34.0, 14.0, 11.0, 5.0, 7.0, 7.0, 1.0, 3.0, 1.0, 1.0, 1.0, 2.0], "bins": [-0.00011086463928222656, -0.00010847579687833786, -0.00010608695447444916, -0.00010369811207056046, -0.00010130926966667175, -9.892042726278305e-05, -9.653158485889435e-05, -9.414274245500565e-05, -9.175390005111694e-05, -8.936505764722824e-05, -8.697621524333954e-05, -8.458737283945084e-05, -8.219853043556213e-05, -7.980968803167343e-05, -7.742084562778473e-05, -7.503200322389603e-05, -7.264316082000732e-05, -7.025431841611862e-05, -6.786547601222992e-05, -6.547663360834122e-05, -6.308779120445251e-05, -6.069894880056381e-05, -5.831010639667511e-05, -5.592126399278641e-05, -5.3532421588897705e-05, -5.1143579185009e-05, -4.87547367811203e-05, -4.63658943772316e-05, -4.3977051973342896e-05, -4.158820956945419e-05, -3.919936716556549e-05, -3.681052476167679e-05, -3.4421682357788086e-05, -3.2032839953899384e-05, -2.964399755001068e-05, -2.725515514612198e-05, -2.4866312742233276e-05, -2.2477470338344574e-05, -2.008862793445587e-05, -1.769978553056717e-05, -1.5310943126678467e-05, -1.2922100722789764e-05, -1.0533258318901062e-05, -8.14441591501236e-06, -5.755573511123657e-06, -3.366731107234955e-06, -9.778887033462524e-07, 1.41095370054245e-06, 3.7997961044311523e-06, 6.188638508319855e-06, 8.577480912208557e-06, 1.096632331609726e-05, 1.3355165719985962e-05, 1.5744008123874664e-05, 1.8132850527763367e-05, 2.052169293165207e-05, 2.291053533554077e-05, 2.5299377739429474e-05, 2.7688220143318176e-05, 3.007706254720688e-05, 3.246590495109558e-05, 3.4854747354984283e-05, 3.7243589758872986e-05, 3.963243216276169e-05, 4.202127456665039e-05]}, "gradients/encoder.encoder.layers.17.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 1.0, 5.0, 14.0, 14.0, 32.0, 52.0, 131.0, 298.0, 850.0, 4076.0, 52811.0, 901768.0, 81935.0, 4999.0, 988.0, 314.0, 149.0, 63.0, 35.0, 11.0, 1.0, 8.0, 4.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.037109375, -1.0062026977539062, -0.9752960205078125, -0.9443893432617188, -0.913482666015625, -0.8825759887695312, -0.8516693115234375, -0.8207626342773438, -0.78985595703125, -0.7589492797851562, -0.7280426025390625, -0.6971359252929688, -0.666229248046875, -0.6353225708007812, -0.6044158935546875, -0.5735092163085938, -0.5426025390625, -0.5116958618164062, -0.4807891845703125, -0.44988250732421875, -0.418975830078125, -0.38806915283203125, -0.3571624755859375, -0.32625579833984375, -0.29534912109375, -0.26444244384765625, -0.2335357666015625, -0.20262908935546875, -0.171722412109375, -0.14081573486328125, -0.1099090576171875, -0.07900238037109375, -0.048095703125, -0.01718902587890625, 0.0137176513671875, 0.04462432861328125, 0.075531005859375, 0.10643768310546875, 0.1373443603515625, 0.16825103759765625, 0.19915771484375, 0.23006439208984375, 0.2609710693359375, 0.29187774658203125, 0.322784423828125, 0.35369110107421875, 0.3845977783203125, 0.41550445556640625, 0.4464111328125, 0.47731781005859375, 0.5082244873046875, 0.5391311645507812, 0.570037841796875, 0.6009445190429688, 0.6318511962890625, 0.6627578735351562, 0.69366455078125, 0.7245712280273438, 0.7554779052734375, 0.7863845825195312, 0.817291259765625, 0.8481979370117188, 0.8791046142578125, 0.9100112915039062, 0.94091796875]}, "gradients/encoder.encoder.layers.17.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 5.0, 3.0, 6.0, 1.0, 11.0, 11.0, 19.0, 13.0, 39.0, 34.0, 71.0, 109.0, 108.0, 128.0, 112.0, 98.0, 87.0, 44.0, 31.0, 22.0, 19.0, 8.0, 8.0, 10.0, 4.0, 1.0, 4.0, 4.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.69287109375, -0.6766357421875, -0.660400390625, -0.6441650390625, -0.6279296875, -0.6116943359375, -0.595458984375, -0.5792236328125, -0.56298828125, -0.5467529296875, -0.530517578125, -0.5142822265625, -0.498046875, -0.4818115234375, -0.465576171875, -0.4493408203125, -0.43310546875, -0.4168701171875, -0.400634765625, -0.3843994140625, -0.3681640625, -0.3519287109375, -0.335693359375, -0.3194580078125, -0.30322265625, -0.2869873046875, -0.270751953125, -0.2545166015625, -0.23828125, -0.2220458984375, -0.205810546875, -0.1895751953125, -0.17333984375, -0.1571044921875, -0.140869140625, -0.1246337890625, -0.1083984375, -0.0921630859375, -0.075927734375, -0.0596923828125, -0.04345703125, -0.0272216796875, -0.010986328125, 0.0052490234375, 0.021484375, 0.0377197265625, 0.053955078125, 0.0701904296875, 0.08642578125, 0.1026611328125, 0.118896484375, 0.1351318359375, 0.1513671875, 0.1676025390625, 0.183837890625, 0.2000732421875, 0.21630859375, 0.2325439453125, 0.248779296875, 0.2650146484375, 0.28125, 0.2974853515625, 0.313720703125, 0.3299560546875, 0.34619140625]}, "gradients/encoder.encoder.layers.17.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 0.0, 2.0, 6.0, 18.0, 26.0, 41.0, 72.0, 135.0, 187.0, 226.0, 150.0, 69.0, 33.0, 17.0, 10.0, 5.0, 4.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.163978576660156, -10.886470794677734, -10.608963012695312, -10.33145523071289, -10.053947448730469, -9.776439666748047, -9.498931884765625, -9.221423149108887, -8.943915367126465, -8.666407585144043, -8.388899803161621, -8.1113920211792, -7.833883762359619, -7.556375980377197, -7.278868198394775, -7.0013604164123535, -6.723852634429932, -6.44634485244751, -6.168837070465088, -5.891328811645508, -5.613821029663086, -5.336313247680664, -5.058805465698242, -4.78129768371582, -4.503789901733398, -4.226282119750977, -3.9487740993499756, -3.6712663173675537, -3.3937582969665527, -3.116250514984131, -2.838742733001709, -2.561234951019287, -2.2837271690368652, -2.0062193870544434, -1.7287113666534424, -1.4512035846710205, -1.173695683479309, -0.8961877822875977, -0.6186800003051758, -0.34117209911346436, -0.06366419792175293, 0.2138436734676361, 0.49135154485702515, 0.7688593864440918, 1.0463672876358032, 1.3238751888275146, 1.6013829708099365, 1.878890872001648, 2.1563987731933594, 2.4339065551757812, 2.7114145755767822, 2.988922357559204, 3.266430377960205, 3.543938159942627, 3.821445941925049, 4.098953723907471, 4.376461982727051, 4.653969764709473, 4.9314775466918945, 5.208985328674316, 5.4864935874938965, 5.764001369476318, 6.04150915145874, 6.319016933441162, 6.596524715423584]}, "gradients/encoder.encoder.layers.17.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 4.0, 3.0, 0.0, 3.0, 3.0, 7.0, 4.0, 7.0, 10.0, 11.0, 12.0, 18.0, 19.0, 18.0, 29.0, 37.0, 33.0, 28.0, 33.0, 43.0, 38.0, 28.0, 42.0, 36.0, 46.0, 40.0, 39.0, 40.0, 41.0, 39.0, 33.0, 30.0, 37.0, 32.0, 25.0, 24.0, 22.0, 16.0, 15.0, 15.0, 12.0, 10.0, 6.0, 5.0, 3.0, 4.0, 5.0, 3.0, 2.0, 2.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.451428413391113, -5.280288219451904, -5.1091485023498535, -4.9380083084106445, -4.7668681144714355, -4.595727920532227, -4.424588203430176, -4.253448009490967, -4.082307815551758, -3.911167860031128, -3.740027666091919, -3.568887710571289, -3.39774751663208, -3.22660756111145, -3.0554676055908203, -2.8843274116516113, -2.7131876945495605, -2.5420477390289307, -2.3709075450897217, -2.199767589569092, -2.028627395629883, -1.857487440109253, -1.686347484588623, -1.5152074098587036, -1.3440673351287842, -1.1729272603988647, -1.0017871856689453, -0.8306472301483154, -0.659507155418396, -0.48836708068847656, -0.3172271251678467, -0.14608705043792725, 0.025053024291992188, 0.19619306921958923, 0.3673331141471863, 0.5384731292724609, 0.7096132040023804, 0.8807532787322998, 1.0518932342529297, 1.2230333089828491, 1.3941733837127686, 1.565313458442688, 1.7364535331726074, 1.9075934886932373, 2.078733444213867, 2.249873638153076, 2.421013593673706, 2.592153549194336, 2.763293743133545, 2.934433698654175, 3.105573892593384, 3.2767138481140137, 3.4478540420532227, 3.6189939975738525, 3.7901339530944824, 3.9612741470336914, 4.132413864135742, 4.303554058074951, 4.474693775177002, 4.645833969116211, 4.81697416305542, 4.988114356994629, 5.15925407409668, 5.330394268035889, 5.501534461975098]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 6.0, 3.0, 1.0, 3.0, 3.0, 9.0, 13.0, 20.0, 41.0, 49.0, 85.0, 138.0, 287.0, 570.0, 1329.0, 3816.0, 15534.0, 146691.0, 3884966.0, 120255.0, 13790.0, 3546.0, 1383.0, 693.0, 362.0, 225.0, 121.0, 89.0, 76.0, 49.0, 37.0, 25.0, 19.0, 12.0, 9.0, 8.0, 7.0, 6.0, 7.0, 4.0, 2.0, 2.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.6953125, -1.635772705078125, -1.57623291015625, -1.516693115234375, -1.4571533203125, -1.397613525390625, -1.33807373046875, -1.278533935546875, -1.218994140625, -1.159454345703125, -1.09991455078125, -1.040374755859375, -0.9808349609375, -0.921295166015625, -0.86175537109375, -0.802215576171875, -0.74267578125, -0.683135986328125, -0.62359619140625, -0.564056396484375, -0.5045166015625, -0.444976806640625, -0.38543701171875, -0.325897216796875, -0.266357421875, -0.206817626953125, -0.14727783203125, -0.087738037109375, -0.0281982421875, 0.031341552734375, 0.09088134765625, 0.150421142578125, 0.2099609375, 0.269500732421875, 0.32904052734375, 0.388580322265625, 0.4481201171875, 0.507659912109375, 0.56719970703125, 0.626739501953125, 0.686279296875, 0.745819091796875, 0.80535888671875, 0.864898681640625, 0.9244384765625, 0.983978271484375, 1.04351806640625, 1.103057861328125, 1.16259765625, 1.222137451171875, 1.28167724609375, 1.341217041015625, 1.4007568359375, 1.460296630859375, 1.51983642578125, 1.579376220703125, 1.638916015625, 1.698455810546875, 1.75799560546875, 1.817535400390625, 1.8770751953125, 1.936614990234375, 1.99615478515625, 2.055694580078125, 2.115234375]}, "gradients/encoder.encoder.layers.16.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 4.0, 2.0, 3.0, 5.0, 4.0, 9.0, 22.0, 24.0, 32.0, 59.0, 93.0, 92.0, 110.0, 119.0, 107.0, 81.0, 95.0, 63.0, 29.0, 28.0, 15.0, 6.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.427490234375, -0.4084587097167969, -0.38942718505859375, -0.3703956604003906, -0.3513641357421875, -0.3323326110839844, -0.31330108642578125, -0.2942695617675781, -0.275238037109375, -0.2562065124511719, -0.23717498779296875, -0.21814346313476562, -0.1991119384765625, -0.18008041381835938, -0.16104888916015625, -0.14201736450195312, -0.12298583984375, -0.10395431518554688, -0.08492279052734375, -0.06589126586914062, -0.0468597412109375, -0.027828216552734375, -0.00879669189453125, 0.010234832763671875, 0.029266357421875, 0.048297882080078125, 0.06732940673828125, 0.08636093139648438, 0.1053924560546875, 0.12442398071289062, 0.14345550537109375, 0.16248703002929688, 0.1815185546875, 0.20055007934570312, 0.21958160400390625, 0.23861312866210938, 0.2576446533203125, 0.2766761779785156, 0.29570770263671875, 0.3147392272949219, 0.333770751953125, 0.3528022766113281, 0.37183380126953125, 0.3908653259277344, 0.4098968505859375, 0.4289283752441406, 0.44795989990234375, 0.4669914245605469, 0.48602294921875, 0.5050544738769531, 0.5240859985351562, 0.5431175231933594, 0.5621490478515625, 0.5811805725097656, 0.6002120971679688, 0.6192436218261719, 0.638275146484375, 0.6573066711425781, 0.6763381958007812, 0.6953697204589844, 0.7144012451171875, 0.7334327697753906, 0.7524642944335938, 0.7714958190917969, 0.79052734375]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 2.0, 4.0, 7.0, 10.0, 18.0, 38.0, 50.0, 85.0, 175.0, 245.0, 466.0, 1113.0, 5777.0, 339842.0, 3829353.0, 13923.0, 1766.0, 640.0, 281.0, 194.0, 120.0, 60.0, 54.0, 30.0, 16.0, 10.0, 4.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.263671875, -2.16998291015625, -2.0762939453125, -1.98260498046875, -1.888916015625, -1.79522705078125, -1.7015380859375, -1.60784912109375, -1.51416015625, -1.42047119140625, -1.3267822265625, -1.23309326171875, -1.139404296875, -1.04571533203125, -0.9520263671875, -0.85833740234375, -0.7646484375, -0.67095947265625, -0.5772705078125, -0.48358154296875, -0.389892578125, -0.29620361328125, -0.2025146484375, -0.10882568359375, -0.01513671875, 0.07855224609375, 0.1722412109375, 0.26593017578125, 0.359619140625, 0.45330810546875, 0.5469970703125, 0.64068603515625, 0.734375, 0.82806396484375, 0.9217529296875, 1.01544189453125, 1.109130859375, 1.20281982421875, 1.2965087890625, 1.39019775390625, 1.48388671875, 1.57757568359375, 1.6712646484375, 1.76495361328125, 1.858642578125, 1.95233154296875, 2.0460205078125, 2.13970947265625, 2.2333984375, 2.32708740234375, 2.4207763671875, 2.51446533203125, 2.608154296875, 2.70184326171875, 2.7955322265625, 2.88922119140625, 2.98291015625, 3.07659912109375, 3.1702880859375, 3.26397705078125, 3.357666015625, 3.45135498046875, 3.5450439453125, 3.63873291015625, 3.732421875]}, "gradients/encoder.encoder.layers.16.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 1.0, 10.0, 10.0, 20.0, 48.0, 126.0, 422.0, 2558.0, 626.0, 148.0, 56.0, 28.0, 14.0, 5.0, 5.0, 1.0, 0.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.2119140625, -1.1805267333984375, -1.149139404296875, -1.1177520751953125, -1.08636474609375, -1.0549774169921875, -1.023590087890625, -0.9922027587890625, -0.9608154296875, -0.9294281005859375, -0.898040771484375, -0.8666534423828125, -0.83526611328125, -0.8038787841796875, -0.772491455078125, -0.7411041259765625, -0.709716796875, -0.6783294677734375, -0.646942138671875, -0.6155548095703125, -0.58416748046875, -0.5527801513671875, -0.521392822265625, -0.4900054931640625, -0.4586181640625, -0.4272308349609375, -0.395843505859375, -0.3644561767578125, -0.33306884765625, -0.3016815185546875, -0.270294189453125, -0.2389068603515625, -0.20751953125, -0.1761322021484375, -0.144744873046875, -0.1133575439453125, -0.08197021484375, -0.0505828857421875, -0.019195556640625, 0.0121917724609375, 0.0435791015625, 0.0749664306640625, 0.106353759765625, 0.1377410888671875, 0.16912841796875, 0.2005157470703125, 0.231903076171875, 0.2632904052734375, 0.294677734375, 0.3260650634765625, 0.357452392578125, 0.3888397216796875, 0.42022705078125, 0.4516143798828125, 0.483001708984375, 0.5143890380859375, 0.5457763671875, 0.5771636962890625, 0.608551025390625, 0.6399383544921875, 0.67132568359375, 0.7027130126953125, 0.734100341796875, 0.7654876708984375, 0.796875]}, "gradients/encoder.encoder.layers.16.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 7.0, 43.0, 513.0, 423.0, 21.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.56855583190918, -13.129997253417969, -12.691439628601074, -12.252881050109863, -11.814323425292969, -11.375764846801758, -10.937207221984863, -10.498648643493652, -10.060091018676758, -9.621532440185547, -9.182974815368652, -8.744416236877441, -8.305858612060547, -7.867300033569336, -7.428742408752441, -6.9901838302612305, -6.551625728607178, -6.113067626953125, -5.674509525299072, -5.2359514236450195, -4.797393321990967, -4.358835220336914, -3.9202768802642822, -3.4817187786102295, -3.0431606769561768, -2.604602575302124, -2.1660444736480713, -1.727486252784729, -1.2889281511306763, -0.850369930267334, -0.41181182861328125, 0.026746273040771484, 0.4653043746948242, 0.903862476348877, 1.3424205780029297, 1.780978798866272, 2.219536781311035, 2.658095121383667, 3.0966532230377197, 3.5352113246917725, 3.973769426345825, 4.412327766418457, 4.85088586807251, 5.2894439697265625, 5.728002071380615, 6.166560173034668, 6.605118274688721, 7.043676376342773, 7.482234477996826, 7.920792579650879, 8.35935115814209, 8.797908782958984, 9.236467361450195, 9.67502498626709, 10.1135835647583, 10.552141189575195, 10.990699768066406, 11.429258346557617, 11.867815971374512, 12.306374549865723, 12.744932174682617, 13.183490753173828, 13.622048377990723, 14.060606956481934, 14.499164581298828]}, "gradients/encoder.encoder.layers.16.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 4.0, 3.0, 5.0, 5.0, 5.0, 8.0, 6.0, 6.0, 16.0, 15.0, 15.0, 23.0, 27.0, 38.0, 30.0, 40.0, 33.0, 55.0, 45.0, 55.0, 69.0, 55.0, 66.0, 60.0, 48.0, 48.0, 33.0, 43.0, 20.0, 30.0, 17.0, 20.0, 14.0, 14.0, 13.0, 6.0, 7.0, 3.0, 8.0, 3.0, 4.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.477252721786499, -1.4193100929260254, -1.3613675832748413, -1.3034249544143677, -1.2454824447631836, -1.18753981590271, -1.1295971870422363, -1.0716546773910522, -1.0137121677398682, -0.9557695984840393, -0.8978270292282104, -0.8398844003677368, -0.7819418907165527, -0.7239992618560791, -0.6660566926002502, -0.6081141233444214, -0.5501714944839478, -0.4922289252281189, -0.43428635597229004, -0.3763437569141388, -0.31840118765830994, -0.2604586184024811, -0.20251601934432983, -0.14457345008850098, -0.08663088083267212, -0.028688304126262665, 0.02925427258014679, 0.08719685673713684, 0.1451394259929657, 0.20308199524879456, 0.2610245943069458, 0.31896716356277466, 0.3769097328186035, 0.4348523020744324, 0.49279487133026123, 0.5507375001907349, 0.608680009841919, 0.6666226387023926, 0.7245652079582214, 0.7825077772140503, 0.8404503464698792, 0.898392915725708, 0.9563354849815369, 1.0142780542373657, 1.0722206830978394, 1.1301631927490234, 1.188105821609497, 1.2460484504699707, 1.3039909601211548, 1.3619335889816284, 1.4198760986328125, 1.4778187274932861, 1.5357612371444702, 1.5937038660049438, 1.651646375656128, 1.7095890045166016, 1.7675316333770752, 1.8254742622375488, 1.883416771888733, 1.9413594007492065, 1.9993019104003906, 2.0572445392608643, 2.115187168121338, 2.1731295585632324, 2.231072187423706]}, "gradients/encoder.encoder.layers.16.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 5.0, 5.0, 8.0, 11.0, 10.0, 7.0, 16.0, 16.0, 29.0, 30.0, 54.0, 81.0, 122.0, 173.0, 235.0, 490.0, 880.0, 2070.0, 6512.0, 32780.0, 304317.0, 607739.0, 75331.0, 11570.0, 3174.0, 1252.0, 652.0, 348.0, 199.0, 129.0, 86.0, 65.0, 51.0, 28.0, 18.0, 19.0, 14.0, 14.0, 4.0, 3.0, 1.0, 8.0, 2.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-2.1875, -2.121612548828125, -2.05572509765625, -1.989837646484375, -1.9239501953125, -1.858062744140625, -1.79217529296875, -1.726287841796875, -1.660400390625, -1.594512939453125, -1.52862548828125, -1.462738037109375, -1.3968505859375, -1.330963134765625, -1.26507568359375, -1.199188232421875, -1.13330078125, -1.067413330078125, -1.00152587890625, -0.935638427734375, -0.8697509765625, -0.803863525390625, -0.73797607421875, -0.672088623046875, -0.606201171875, -0.540313720703125, -0.47442626953125, -0.408538818359375, -0.3426513671875, -0.276763916015625, -0.21087646484375, -0.144989013671875, -0.0791015625, -0.013214111328125, 0.05267333984375, 0.118560791015625, 0.1844482421875, 0.250335693359375, 0.31622314453125, 0.382110595703125, 0.447998046875, 0.513885498046875, 0.57977294921875, 0.645660400390625, 0.7115478515625, 0.777435302734375, 0.84332275390625, 0.909210205078125, 0.97509765625, 1.040985107421875, 1.10687255859375, 1.172760009765625, 1.2386474609375, 1.304534912109375, 1.37042236328125, 1.436309814453125, 1.502197265625, 1.568084716796875, 1.63397216796875, 1.699859619140625, 1.7657470703125, 1.831634521484375, 1.89752197265625, 1.963409423828125, 2.029296875]}, "gradients/encoder.encoder.layers.16.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 4.0, 2.0, 4.0, 4.0, 1.0, 6.0, 17.0, 28.0, 37.0, 55.0, 88.0, 92.0, 121.0, 124.0, 96.0, 95.0, 100.0, 52.0, 36.0, 23.0, 9.0, 2.0, 6.0, 3.0, 3.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.45458984375, -0.43524169921875, -0.4158935546875, -0.39654541015625, -0.377197265625, -0.35784912109375, -0.3385009765625, -0.31915283203125, -0.2998046875, -0.28045654296875, -0.2611083984375, -0.24176025390625, -0.222412109375, -0.20306396484375, -0.1837158203125, -0.16436767578125, -0.14501953125, -0.12567138671875, -0.1063232421875, -0.08697509765625, -0.067626953125, -0.04827880859375, -0.0289306640625, -0.00958251953125, 0.009765625, 0.02911376953125, 0.0484619140625, 0.06781005859375, 0.087158203125, 0.10650634765625, 0.1258544921875, 0.14520263671875, 0.16455078125, 0.18389892578125, 0.2032470703125, 0.22259521484375, 0.241943359375, 0.26129150390625, 0.2806396484375, 0.29998779296875, 0.3193359375, 0.33868408203125, 0.3580322265625, 0.37738037109375, 0.396728515625, 0.41607666015625, 0.4354248046875, 0.45477294921875, 0.47412109375, 0.49346923828125, 0.5128173828125, 0.53216552734375, 0.551513671875, 0.57086181640625, 0.5902099609375, 0.60955810546875, 0.62890625, 0.64825439453125, 0.6676025390625, 0.68695068359375, 0.706298828125, 0.72564697265625, 0.7449951171875, 0.76434326171875, 0.78369140625]}, "gradients/encoder.encoder.layers.16.attention.v_proj.weight": {"_type": "histogram", "values": [4.0, 3.0, 3.0, 2.0, 10.0, 6.0, 8.0, 8.0, 11.0, 19.0, 21.0, 31.0, 32.0, 44.0, 51.0, 73.0, 74.0, 106.0, 150.0, 207.0, 316.0, 484.0, 768.0, 1476.0, 2878.0, 6297.0, 14515.0, 37665.0, 114704.0, 331111.0, 345074.0, 122916.0, 40957.0, 15224.0, 6346.0, 2955.0, 1489.0, 866.0, 533.0, 298.0, 179.0, 146.0, 124.0, 84.0, 57.0, 49.0, 42.0, 32.0, 26.0, 21.0, 22.0, 14.0, 9.0, 5.0, 7.0, 5.0, 6.0, 6.0, 0.0, 1.0, 2.0, 1.0, 0.0, 3.0], "bins": [-0.76318359375, -0.7377700805664062, -0.7123565673828125, -0.6869430541992188, -0.661529541015625, -0.6361160278320312, -0.6107025146484375, -0.5852890014648438, -0.55987548828125, -0.5344619750976562, -0.5090484619140625, -0.48363494873046875, -0.458221435546875, -0.43280792236328125, -0.4073944091796875, -0.38198089599609375, -0.3565673828125, -0.33115386962890625, -0.3057403564453125, -0.28032684326171875, -0.254913330078125, -0.22949981689453125, -0.2040863037109375, -0.17867279052734375, -0.15325927734375, -0.12784576416015625, -0.1024322509765625, -0.07701873779296875, -0.051605224609375, -0.02619171142578125, -0.0007781982421875, 0.02463531494140625, 0.050048828125, 0.07546234130859375, 0.1008758544921875, 0.12628936767578125, 0.151702880859375, 0.17711639404296875, 0.2025299072265625, 0.22794342041015625, 0.25335693359375, 0.27877044677734375, 0.3041839599609375, 0.32959747314453125, 0.355010986328125, 0.38042449951171875, 0.4058380126953125, 0.43125152587890625, 0.4566650390625, 0.48207855224609375, 0.5074920654296875, 0.5329055786132812, 0.558319091796875, 0.5837326049804688, 0.6091461181640625, 0.6345596313476562, 0.65997314453125, 0.6853866577148438, 0.7108001708984375, 0.7362136840820312, 0.761627197265625, 0.7870407104492188, 0.8124542236328125, 0.8378677368164062, 0.86328125]}, "gradients/encoder.encoder.layers.16.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 1.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 4.0, 1.0, 2.0, 5.0, 9.0, 10.0, 8.0, 17.0, 24.0, 19.0, 22.0, 19.0, 32.0, 34.0, 29.0, 39.0, 33.0, 39.0, 55.0, 52.0, 51.0, 45.0, 38.0, 47.0, 44.0, 37.0, 46.0, 27.0, 24.0, 22.0, 26.0, 19.0, 37.0, 13.0, 10.0, 13.0, 10.0, 8.0, 9.0, 5.0, 5.0, 6.0, 5.0, 2.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.0224609375, -0.9888916015625, -0.955322265625, -0.9217529296875, -0.88818359375, -0.8546142578125, -0.821044921875, -0.7874755859375, -0.75390625, -0.7203369140625, -0.686767578125, -0.6531982421875, -0.61962890625, -0.5860595703125, -0.552490234375, -0.5189208984375, -0.4853515625, -0.4517822265625, -0.418212890625, -0.3846435546875, -0.35107421875, -0.3175048828125, -0.283935546875, -0.2503662109375, -0.216796875, -0.1832275390625, -0.149658203125, -0.1160888671875, -0.08251953125, -0.0489501953125, -0.015380859375, 0.0181884765625, 0.0517578125, 0.0853271484375, 0.118896484375, 0.1524658203125, 0.18603515625, 0.2196044921875, 0.253173828125, 0.2867431640625, 0.3203125, 0.3538818359375, 0.387451171875, 0.4210205078125, 0.45458984375, 0.4881591796875, 0.521728515625, 0.5552978515625, 0.5888671875, 0.6224365234375, 0.656005859375, 0.6895751953125, 0.72314453125, 0.7567138671875, 0.790283203125, 0.8238525390625, 0.857421875, 0.8909912109375, 0.924560546875, 0.9581298828125, 0.99169921875, 1.0252685546875, 1.058837890625, 1.0924072265625, 1.1259765625]}, "gradients/encoder.encoder.layers.16.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 0.0, 1.0, 1.0, 0.0, 4.0, 7.0, 5.0, 5.0, 10.0, 7.0, 14.0, 16.0, 33.0, 51.0, 97.0, 175.0, 341.0, 697.0, 1758.0, 6297.0, 47229.0, 480078.0, 458144.0, 44332.0, 6058.0, 1764.0, 698.0, 325.0, 150.0, 102.0, 54.0, 40.0, 28.0, 11.0, 4.0, 7.0, 5.0, 2.0, 4.0, 2.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 2.0], "bins": [-0.6142578125, -0.5961837768554688, -0.5781097412109375, -0.5600357055664062, -0.541961669921875, -0.5238876342773438, -0.5058135986328125, -0.48773956298828125, -0.46966552734375, -0.45159149169921875, -0.4335174560546875, -0.41544342041015625, -0.397369384765625, -0.37929534912109375, -0.3612213134765625, -0.34314727783203125, -0.3250732421875, -0.30699920654296875, -0.2889251708984375, -0.27085113525390625, -0.252777099609375, -0.23470306396484375, -0.2166290283203125, -0.19855499267578125, -0.18048095703125, -0.16240692138671875, -0.1443328857421875, -0.12625885009765625, -0.108184814453125, -0.09011077880859375, -0.0720367431640625, -0.05396270751953125, -0.035888671875, -0.01781463623046875, 0.0002593994140625, 0.01833343505859375, 0.036407470703125, 0.05448150634765625, 0.0725555419921875, 0.09062957763671875, 0.10870361328125, 0.12677764892578125, 0.1448516845703125, 0.16292572021484375, 0.180999755859375, 0.19907379150390625, 0.2171478271484375, 0.23522186279296875, 0.2532958984375, 0.27136993408203125, 0.2894439697265625, 0.30751800537109375, 0.325592041015625, 0.34366607666015625, 0.3617401123046875, 0.37981414794921875, 0.39788818359375, 0.41596221923828125, 0.4340362548828125, 0.45211029052734375, 0.470184326171875, 0.48825836181640625, 0.5063323974609375, 0.5244064331054688, 0.54248046875]}, "gradients/encoder.encoder.layers.16.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 6.0, 1.0, 2.0, 6.0, 6.0, 16.0, 7.0, 16.0, 29.0, 23.0, 34.0, 58.0, 56.0, 44.0, 77.0, 81.0, 91.0, 88.0, 95.0, 57.0, 56.0, 41.0, 30.0, 18.0, 20.0, 19.0, 8.0, 9.0, 6.0, 3.0, 7.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0], "bins": [-8.630752563476562e-05, -8.426979184150696e-05, -8.223205804824829e-05, -8.019432425498962e-05, -7.815659046173096e-05, -7.611885666847229e-05, -7.408112287521362e-05, -7.204338908195496e-05, -7.000565528869629e-05, -6.796792149543762e-05, -6.593018770217896e-05, -6.389245390892029e-05, -6.185472011566162e-05, -5.9816986322402954e-05, -5.777925252914429e-05, -5.574151873588562e-05, -5.370378494262695e-05, -5.1666051149368286e-05, -4.962831735610962e-05, -4.759058356285095e-05, -4.5552849769592285e-05, -4.351511597633362e-05, -4.147738218307495e-05, -3.9439648389816284e-05, -3.740191459655762e-05, -3.536418080329895e-05, -3.332644701004028e-05, -3.1288713216781616e-05, -2.925097942352295e-05, -2.7213245630264282e-05, -2.5175511837005615e-05, -2.3137778043746948e-05, -2.110004425048828e-05, -1.9062310457229614e-05, -1.7024576663970947e-05, -1.498684287071228e-05, -1.2949109077453613e-05, -1.0911375284194946e-05, -8.87364149093628e-06, -6.835907697677612e-06, -4.798173904418945e-06, -2.7604401111602783e-06, -7.227063179016113e-07, 1.3150274753570557e-06, 3.3527612686157227e-06, 5.39049506187439e-06, 7.428228855133057e-06, 9.465962648391724e-06, 1.150369644165039e-05, 1.3541430234909058e-05, 1.5579164028167725e-05, 1.761689782142639e-05, 1.965463161468506e-05, 2.1692365407943726e-05, 2.3730099201202393e-05, 2.576783299446106e-05, 2.7805566787719727e-05, 2.9843300580978394e-05, 3.188103437423706e-05, 3.391876816749573e-05, 3.5956501960754395e-05, 3.799423575401306e-05, 4.003196954727173e-05, 4.2069703340530396e-05, 4.410743713378906e-05]}, "gradients/encoder.encoder.layers.16.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 3.0, 2.0, 3.0, 2.0, 7.0, 6.0, 21.0, 23.0, 35.0, 66.0, 110.0, 218.0, 463.0, 1021.0, 2548.0, 9214.0, 55921.0, 406741.0, 482437.0, 73452.0, 11155.0, 2928.0, 1123.0, 452.0, 245.0, 143.0, 81.0, 46.0, 36.0, 20.0, 7.0, 12.0, 5.0, 4.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.5068359375, -0.4923820495605469, -0.47792816162109375, -0.4634742736816406, -0.4490203857421875, -0.4345664978027344, -0.42011260986328125, -0.4056587219238281, -0.391204833984375, -0.3767509460449219, -0.36229705810546875, -0.3478431701660156, -0.3333892822265625, -0.3189353942871094, -0.30448150634765625, -0.2900276184082031, -0.27557373046875, -0.2611198425292969, -0.24666595458984375, -0.23221206665039062, -0.2177581787109375, -0.20330429077148438, -0.18885040283203125, -0.17439651489257812, -0.159942626953125, -0.14548873901367188, -0.13103485107421875, -0.11658096313476562, -0.1021270751953125, -0.08767318725585938, -0.07321929931640625, -0.058765411376953125, -0.0443115234375, -0.029857635498046875, -0.01540374755859375, -0.000949859619140625, 0.0135040283203125, 0.027957916259765625, 0.04241180419921875, 0.056865692138671875, 0.071319580078125, 0.08577346801757812, 0.10022735595703125, 0.11468124389648438, 0.1291351318359375, 0.14358901977539062, 0.15804290771484375, 0.17249679565429688, 0.18695068359375, 0.20140457153320312, 0.21585845947265625, 0.23031234741210938, 0.2447662353515625, 0.2592201232910156, 0.27367401123046875, 0.2881278991699219, 0.302581787109375, 0.3170356750488281, 0.33148956298828125, 0.3459434509277344, 0.3603973388671875, 0.3748512268066406, 0.38930511474609375, 0.4037590026855469, 0.418212890625]}, "gradients/encoder.encoder.layers.16.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 3.0, 1.0, 4.0, 7.0, 8.0, 5.0, 14.0, 20.0, 24.0, 36.0, 47.0, 56.0, 62.0, 86.0, 96.0, 96.0, 93.0, 82.0, 52.0, 50.0, 46.0, 31.0, 30.0, 20.0, 5.0, 9.0, 7.0, 6.0, 5.0, 3.0, 0.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.4033203125, -0.3908958435058594, -0.37847137451171875, -0.3660469055175781, -0.3536224365234375, -0.3411979675292969, -0.32877349853515625, -0.3163490295410156, -0.303924560546875, -0.2915000915527344, -0.27907562255859375, -0.2666511535644531, -0.2542266845703125, -0.24180221557617188, -0.22937774658203125, -0.21695327758789062, -0.20452880859375, -0.19210433959960938, -0.17967987060546875, -0.16725540161132812, -0.1548309326171875, -0.14240646362304688, -0.12998199462890625, -0.11755752563476562, -0.105133056640625, -0.09270858764648438, -0.08028411865234375, -0.06785964965820312, -0.0554351806640625, -0.043010711669921875, -0.03058624267578125, -0.018161773681640625, -0.0057373046875, 0.006687164306640625, 0.01911163330078125, 0.031536102294921875, 0.0439605712890625, 0.056385040283203125, 0.06880950927734375, 0.08123397827148438, 0.093658447265625, 0.10608291625976562, 0.11850738525390625, 0.13093185424804688, 0.1433563232421875, 0.15578079223632812, 0.16820526123046875, 0.18062973022460938, 0.19305419921875, 0.20547866821289062, 0.21790313720703125, 0.23032760620117188, 0.2427520751953125, 0.2551765441894531, 0.26760101318359375, 0.2800254821777344, 0.292449951171875, 0.3048744201660156, 0.31729888916015625, 0.3297233581542969, 0.3421478271484375, 0.3545722961425781, 0.36699676513671875, 0.3794212341308594, 0.391845703125]}, "gradients/encoder.encoder.layers.16.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 5.0, 8.0, 11.0, 36.0, 42.0, 101.0, 138.0, 184.0, 200.0, 135.0, 53.0, 38.0, 25.0, 20.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.6469926834106445, -6.356942176818848, -6.066891670227051, -5.776841163635254, -5.486790657043457, -5.19674015045166, -4.906689167022705, -4.616638660430908, -4.326588153839111, -4.0365376472473145, -3.7464871406555176, -3.4564363956451416, -3.1663858890533447, -2.876335382461548, -2.586284637451172, -2.296234130859375, -2.006183624267578, -1.7161331176757812, -1.4260824918746948, -1.1360318660736084, -0.8459813594818115, -0.5559308528900146, -0.2658802270889282, 0.024170398712158203, 0.3142209053039551, 0.6042714715003967, 0.8943220376968384, 1.1843726634979248, 1.4744231700897217, 1.7644736766815186, 2.0545244216918945, 2.3445749282836914, 2.6346263885498047, 2.9246768951416016, 3.2147274017333984, 3.5047781467437744, 3.7948286533355713, 4.084878921508789, 4.374929904937744, 4.664980411529541, 4.955030918121338, 5.245081424713135, 5.535131931304932, 5.8251824378967285, 6.115233421325684, 6.4052839279174805, 6.695334434509277, 6.985384941101074, 7.275435447692871, 7.565485954284668, 7.855536460876465, 8.145586967468262, 8.435637474060059, 8.725687980651855, 9.015738487243652, 9.305789947509766, 9.595840454101562, 9.88589096069336, 10.175941467285156, 10.465991973876953, 10.75604248046875, 11.046092987060547, 11.336143493652344, 11.62619400024414, 11.916244506835938]}, "gradients/encoder.encoder.layers.16.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 2.0, 3.0, 5.0, 7.0, 4.0, 7.0, 11.0, 12.0, 17.0, 12.0, 14.0, 14.0, 25.0, 29.0, 31.0, 33.0, 32.0, 30.0, 38.0, 52.0, 55.0, 58.0, 49.0, 42.0, 48.0, 37.0, 46.0, 30.0, 37.0, 32.0, 32.0, 26.0, 21.0, 31.0, 13.0, 20.0, 13.0, 12.0, 7.0, 5.0, 6.0, 1.0, 1.0, 3.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.400047302246094, -6.196839332580566, -5.993630886077881, -5.7904229164123535, -5.587214469909668, -5.384006500244141, -5.180798530578613, -4.977590084075928, -4.774381637573242, -4.571173667907715, -4.367965221405029, -4.164757251739502, -3.9615488052368164, -3.758340835571289, -3.5551326274871826, -3.351924419403076, -3.148716449737549, -2.9455082416534424, -2.742300033569336, -2.5390920639038086, -2.335883617401123, -2.1326756477355957, -1.9294674396514893, -1.7262592315673828, -1.5230510234832764, -1.31984281539917, -1.1166346073150635, -0.9134265184402466, -0.7102183103561401, -0.5070101022720337, -0.3038020133972168, -0.10059380531311035, 0.1026144027709961, 0.30582258105278015, 0.5090307593345642, 0.7122389078140259, 0.9154471158981323, 1.1186553239822388, 1.3218634128570557, 1.525071620941162, 1.7282798290252686, 1.931488037109375, 2.1346962451934814, 2.337904453277588, 2.5411124229431152, 2.744320869445801, 2.947528839111328, 3.1507370471954346, 3.353945255279541, 3.5571534633636475, 3.760361671447754, 3.9635696411132812, 4.166778087615967, 4.369986057281494, 4.57319450378418, 4.776402473449707, 4.979610443115234, 5.182818412780762, 5.386026859283447, 5.589234828948975, 5.79244327545166, 5.9956512451171875, 6.198859214782715, 6.4020676612854, 6.605276107788086]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 7.0, 9.0, 12.0, 19.0, 28.0, 23.0, 56.0, 120.0, 190.0, 379.0, 825.0, 2146.0, 7458.0, 53103.0, 3913822.0, 196809.0, 13435.0, 3289.0, 1233.0, 559.0, 297.0, 157.0, 95.0, 63.0, 36.0, 29.0, 25.0, 15.0, 5.0, 9.0, 9.0, 10.0, 3.0, 3.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.935546875, -1.853851318359375, -1.77215576171875, -1.690460205078125, -1.6087646484375, -1.527069091796875, -1.44537353515625, -1.363677978515625, -1.281982421875, -1.200286865234375, -1.11859130859375, -1.036895751953125, -0.9552001953125, -0.873504638671875, -0.79180908203125, -0.710113525390625, -0.62841796875, -0.546722412109375, -0.46502685546875, -0.383331298828125, -0.3016357421875, -0.219940185546875, -0.13824462890625, -0.056549072265625, 0.025146484375, 0.106842041015625, 0.18853759765625, 0.270233154296875, 0.3519287109375, 0.433624267578125, 0.51531982421875, 0.597015380859375, 0.6787109375, 0.760406494140625, 0.84210205078125, 0.923797607421875, 1.0054931640625, 1.087188720703125, 1.16888427734375, 1.250579833984375, 1.332275390625, 1.413970947265625, 1.49566650390625, 1.577362060546875, 1.6590576171875, 1.740753173828125, 1.82244873046875, 1.904144287109375, 1.98583984375, 2.067535400390625, 2.14923095703125, 2.230926513671875, 2.3126220703125, 2.394317626953125, 2.47601318359375, 2.557708740234375, 2.639404296875, 2.721099853515625, 2.80279541015625, 2.884490966796875, 2.9661865234375, 3.047882080078125, 3.12957763671875, 3.211273193359375, 3.29296875]}, "gradients/encoder.encoder.layers.15.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 6.0, 3.0, 5.0, 1.0, 4.0, 8.0, 22.0, 25.0, 28.0, 49.0, 52.0, 64.0, 88.0, 104.0, 114.0, 91.0, 85.0, 69.0, 67.0, 47.0, 31.0, 22.0, 11.0, 5.0, 3.0, 3.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.53564453125, -0.51611328125, -0.49658203125, -0.47705078125, -0.45751953125, -0.43798828125, -0.41845703125, -0.39892578125, -0.37939453125, -0.35986328125, -0.34033203125, -0.32080078125, -0.30126953125, -0.28173828125, -0.26220703125, -0.24267578125, -0.22314453125, -0.20361328125, -0.18408203125, -0.16455078125, -0.14501953125, -0.12548828125, -0.10595703125, -0.08642578125, -0.06689453125, -0.04736328125, -0.02783203125, -0.00830078125, 0.01123046875, 0.03076171875, 0.05029296875, 0.06982421875, 0.08935546875, 0.10888671875, 0.12841796875, 0.14794921875, 0.16748046875, 0.18701171875, 0.20654296875, 0.22607421875, 0.24560546875, 0.26513671875, 0.28466796875, 0.30419921875, 0.32373046875, 0.34326171875, 0.36279296875, 0.38232421875, 0.40185546875, 0.42138671875, 0.44091796875, 0.46044921875, 0.47998046875, 0.49951171875, 0.51904296875, 0.53857421875, 0.55810546875, 0.57763671875, 0.59716796875, 0.61669921875, 0.63623046875, 0.65576171875, 0.67529296875, 0.69482421875, 0.71435546875]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 2.0, 2.0, 8.0, 1.0, 3.0, 5.0, 11.0, 11.0, 12.0, 22.0, 33.0, 59.0, 102.0, 174.0, 325.0, 552.0, 1150.0, 2723.0, 7903.0, 36922.0, 508804.0, 3506450.0, 105303.0, 15813.0, 4418.0, 1589.0, 832.0, 427.0, 246.0, 145.0, 90.0, 47.0, 38.0, 13.0, 15.0, 9.0, 6.0, 7.0, 7.0, 3.0, 3.0, 1.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.296875, -1.2509613037109375, -1.205047607421875, -1.1591339111328125, -1.11322021484375, -1.0673065185546875, -1.021392822265625, -0.9754791259765625, -0.9295654296875, -0.8836517333984375, -0.837738037109375, -0.7918243408203125, -0.74591064453125, -0.6999969482421875, -0.654083251953125, -0.6081695556640625, -0.562255859375, -0.5163421630859375, -0.470428466796875, -0.4245147705078125, -0.37860107421875, -0.3326873779296875, -0.286773681640625, -0.2408599853515625, -0.1949462890625, -0.1490325927734375, -0.103118896484375, -0.0572052001953125, -0.01129150390625, 0.0346221923828125, 0.080535888671875, 0.1264495849609375, 0.17236328125, 0.2182769775390625, 0.264190673828125, 0.3101043701171875, 0.35601806640625, 0.4019317626953125, 0.447845458984375, 0.4937591552734375, 0.5396728515625, 0.5855865478515625, 0.631500244140625, 0.6774139404296875, 0.72332763671875, 0.7692413330078125, 0.815155029296875, 0.8610687255859375, 0.906982421875, 0.9528961181640625, 0.998809814453125, 1.0447235107421875, 1.09063720703125, 1.1365509033203125, 1.182464599609375, 1.2283782958984375, 1.2742919921875, 1.3202056884765625, 1.366119384765625, 1.4120330810546875, 1.45794677734375, 1.5038604736328125, 1.549774169921875, 1.5956878662109375, 1.6416015625]}, "gradients/encoder.encoder.layers.15.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 2.0, 1.0, 4.0, 12.0, 8.0, 14.0, 27.0, 33.0, 57.0, 117.0, 248.0, 977.0, 1801.0, 387.0, 170.0, 75.0, 41.0, 33.0, 24.0, 13.0, 11.0, 6.0, 5.0, 3.0, 3.0, 1.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7490234375, -0.7233734130859375, -0.697723388671875, -0.6720733642578125, -0.64642333984375, -0.6207733154296875, -0.595123291015625, -0.5694732666015625, -0.5438232421875, -0.5181732177734375, -0.492523193359375, -0.4668731689453125, -0.44122314453125, -0.4155731201171875, -0.389923095703125, -0.3642730712890625, -0.338623046875, -0.3129730224609375, -0.287322998046875, -0.2616729736328125, -0.23602294921875, -0.2103729248046875, -0.184722900390625, -0.1590728759765625, -0.1334228515625, -0.1077728271484375, -0.082122802734375, -0.0564727783203125, -0.03082275390625, -0.0051727294921875, 0.020477294921875, 0.0461273193359375, 0.07177734375, 0.0974273681640625, 0.123077392578125, 0.1487274169921875, 0.17437744140625, 0.2000274658203125, 0.225677490234375, 0.2513275146484375, 0.2769775390625, 0.3026275634765625, 0.328277587890625, 0.3539276123046875, 0.37957763671875, 0.4052276611328125, 0.430877685546875, 0.4565277099609375, 0.482177734375, 0.5078277587890625, 0.533477783203125, 0.5591278076171875, 0.58477783203125, 0.6104278564453125, 0.636077880859375, 0.6617279052734375, 0.6873779296875, 0.7130279541015625, 0.738677978515625, 0.7643280029296875, 0.78997802734375, 0.8156280517578125, 0.841278076171875, 0.8669281005859375, 0.892578125]}, "gradients/encoder.encoder.layers.15.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 5.0, 7.0, 9.0, 28.0, 53.0, 168.0, 259.0, 222.0, 152.0, 63.0, 27.0, 9.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.8459692001342773, -2.6874990463256836, -2.52902889251709, -2.370558738708496, -2.2120885848999023, -2.0536184310913086, -1.8951480388641357, -1.736677885055542, -1.5782077312469482, -1.4197375774383545, -1.2612674236297607, -1.1027971506118774, -0.9443269968032837, -0.7858568429946899, -0.6273866295814514, -0.4689164161682129, -0.31044626235961914, -0.151976078748703, 0.006494104862213135, 0.16496428847312927, 0.3234344720840454, 0.48190462589263916, 0.6403748393058777, 0.7988450527191162, 0.95731520652771, 1.1157853603363037, 1.2742555141448975, 1.4327257871627808, 1.5911959409713745, 1.7496660947799683, 1.9081363677978516, 2.0666065216064453, 2.225076675415039, 2.383546829223633, 2.5420169830322266, 2.7004871368408203, 2.858957290649414, 3.017427444458008, 3.1758978366851807, 3.3343679904937744, 3.492838144302368, 3.651308298110962, 3.8097784519195557, 3.9682486057281494, 4.126718997955322, 4.285189151763916, 4.44365930557251, 4.6021294593811035, 4.760599613189697, 4.919069766998291, 5.077539920806885, 5.2360100746154785, 5.394480228424072, 5.552950382232666, 5.71142053604126, 5.869891166687012, 6.0283613204956055, 6.186831474304199, 6.345301628112793, 6.503771781921387, 6.6622419357299805, 6.820712089538574, 6.979182243347168, 7.137652397155762, 7.2961225509643555]}, "gradients/encoder.encoder.layers.15.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 10.0, 10.0, 23.0, 19.0, 35.0, 37.0, 56.0, 55.0, 71.0, 62.0, 73.0, 89.0, 74.0, 69.0, 73.0, 65.0, 45.0, 38.0, 25.0, 24.0, 19.0, 16.0, 7.0, 2.0, 3.0, 5.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.082407474517822, -3.9742565155029297, -3.866105318069458, -3.7579543590545654, -3.6498031616210938, -3.541652202606201, -3.4335012435913086, -3.325350046157837, -3.2171990871429443, -3.1090481281280518, -3.00089693069458, -2.8927459716796875, -2.784594774246216, -2.6764438152313232, -2.5682926177978516, -2.460141658782959, -2.3519906997680664, -2.243839740753174, -2.135688543319702, -2.0275375843048096, -1.9193865060806274, -1.8112354278564453, -1.7030843496322632, -1.594933271408081, -1.4867820739746094, -1.3786309957504272, -1.2704799175262451, -1.1623289585113525, -1.0541778802871704, -0.9460268020629883, -0.8378757238388062, -0.7297247052192688, -0.6215736865997314, -0.5134226083755493, -0.40527158975601196, -0.29712051153182983, -0.1889694631099701, -0.08081841468811035, 0.027332663536071777, 0.13548368215560913, 0.24363476037979126, 0.351785808801651, 0.45993685722351074, 0.5680879354476929, 0.676239013671875, 0.7843900322914124, 0.8925411105155945, 1.0006921291351318, 1.108843207359314, 1.216994285583496, 1.3251453638076782, 1.4332964420318604, 1.541447401046753, 1.649598479270935, 1.7577495574951172, 1.8659005165100098, 1.9740517139434814, 2.082202672958374, 2.1903538703918457, 2.2985048294067383, 2.40665602684021, 2.5148069858551025, 2.622958183288574, 2.731109142303467, 2.8392601013183594]}, "gradients/encoder.encoder.layers.15.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 3.0, 3.0, 3.0, 7.0, 8.0, 6.0, 12.0, 27.0, 31.0, 49.0, 101.0, 142.0, 334.0, 785.0, 2528.0, 12244.0, 227708.0, 767519.0, 30536.0, 4263.0, 1235.0, 533.0, 203.0, 101.0, 65.0, 40.0, 22.0, 14.0, 13.0, 9.0, 2.0, 7.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.7109375, -3.6024169921875, -3.493896484375, -3.3853759765625, -3.27685546875, -3.1683349609375, -3.059814453125, -2.9512939453125, -2.8427734375, -2.7342529296875, -2.625732421875, -2.5172119140625, -2.40869140625, -2.3001708984375, -2.191650390625, -2.0831298828125, -1.974609375, -1.8660888671875, -1.757568359375, -1.6490478515625, -1.54052734375, -1.4320068359375, -1.323486328125, -1.2149658203125, -1.1064453125, -0.9979248046875, -0.889404296875, -0.7808837890625, -0.67236328125, -0.5638427734375, -0.455322265625, -0.3468017578125, -0.23828125, -0.1297607421875, -0.021240234375, 0.0872802734375, 0.19580078125, 0.3043212890625, 0.412841796875, 0.5213623046875, 0.6298828125, 0.7384033203125, 0.846923828125, 0.9554443359375, 1.06396484375, 1.1724853515625, 1.281005859375, 1.3895263671875, 1.498046875, 1.6065673828125, 1.715087890625, 1.8236083984375, 1.93212890625, 2.0406494140625, 2.149169921875, 2.2576904296875, 2.3662109375, 2.4747314453125, 2.583251953125, 2.6917724609375, 2.80029296875, 2.9088134765625, 3.017333984375, 3.1258544921875, 3.234375]}, "gradients/encoder.encoder.layers.15.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 3.0, 1.0, 5.0, 3.0, 4.0, 3.0, 8.0, 13.0, 18.0, 39.0, 47.0, 55.0, 53.0, 108.0, 99.0, 114.0, 108.0, 80.0, 80.0, 54.0, 46.0, 23.0, 22.0, 12.0, 5.0, 2.0, 1.0, 1.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.54052734375, -0.52008056640625, -0.4996337890625, -0.47918701171875, -0.458740234375, -0.43829345703125, -0.4178466796875, -0.39739990234375, -0.376953125, -0.35650634765625, -0.3360595703125, -0.31561279296875, -0.295166015625, -0.27471923828125, -0.2542724609375, -0.23382568359375, -0.21337890625, -0.19293212890625, -0.1724853515625, -0.15203857421875, -0.131591796875, -0.11114501953125, -0.0906982421875, -0.07025146484375, -0.0498046875, -0.02935791015625, -0.0089111328125, 0.01153564453125, 0.031982421875, 0.05242919921875, 0.0728759765625, 0.09332275390625, 0.11376953125, 0.13421630859375, 0.1546630859375, 0.17510986328125, 0.195556640625, 0.21600341796875, 0.2364501953125, 0.25689697265625, 0.27734375, 0.29779052734375, 0.3182373046875, 0.33868408203125, 0.359130859375, 0.37957763671875, 0.4000244140625, 0.42047119140625, 0.44091796875, 0.46136474609375, 0.4818115234375, 0.50225830078125, 0.522705078125, 0.54315185546875, 0.5635986328125, 0.58404541015625, 0.6044921875, 0.62493896484375, 0.6453857421875, 0.66583251953125, 0.686279296875, 0.70672607421875, 0.7271728515625, 0.74761962890625, 0.76806640625]}, "gradients/encoder.encoder.layers.15.attention.v_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 6.0, 6.0, 5.0, 10.0, 16.0, 19.0, 14.0, 16.0, 29.0, 41.0, 51.0, 67.0, 102.0, 152.0, 248.0, 473.0, 1018.0, 3113.0, 12804.0, 79501.0, 638463.0, 270912.0, 31649.0, 6410.0, 1744.0, 732.0, 319.0, 197.0, 129.0, 74.0, 60.0, 54.0, 35.0, 23.0, 15.0, 9.0, 13.0, 10.0, 7.0, 4.0, 2.0, 5.0, 2.0, 3.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.681640625, -1.6287078857421875, -1.575775146484375, -1.5228424072265625, -1.46990966796875, -1.4169769287109375, -1.364044189453125, -1.3111114501953125, -1.2581787109375, -1.2052459716796875, -1.152313232421875, -1.0993804931640625, -1.04644775390625, -0.9935150146484375, -0.940582275390625, -0.8876495361328125, -0.834716796875, -0.7817840576171875, -0.728851318359375, -0.6759185791015625, -0.62298583984375, -0.5700531005859375, -0.517120361328125, -0.4641876220703125, -0.4112548828125, -0.3583221435546875, -0.305389404296875, -0.2524566650390625, -0.19952392578125, -0.1465911865234375, -0.093658447265625, -0.0407257080078125, 0.01220703125, 0.0651397705078125, 0.118072509765625, 0.1710052490234375, 0.22393798828125, 0.2768707275390625, 0.329803466796875, 0.3827362060546875, 0.4356689453125, 0.4886016845703125, 0.541534423828125, 0.5944671630859375, 0.64739990234375, 0.7003326416015625, 0.753265380859375, 0.8061981201171875, 0.859130859375, 0.9120635986328125, 0.964996337890625, 1.0179290771484375, 1.07086181640625, 1.1237945556640625, 1.176727294921875, 1.2296600341796875, 1.2825927734375, 1.3355255126953125, 1.388458251953125, 1.4413909912109375, 1.49432373046875, 1.5472564697265625, 1.600189208984375, 1.6531219482421875, 1.7060546875]}, "gradients/encoder.encoder.layers.15.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 2.0, 3.0, 4.0, 4.0, 4.0, 11.0, 11.0, 12.0, 22.0, 19.0, 29.0, 35.0, 33.0, 30.0, 27.0, 46.0, 41.0, 49.0, 48.0, 47.0, 63.0, 52.0, 51.0, 58.0, 44.0, 46.0, 37.0, 31.0, 28.0, 19.0, 18.0, 18.0, 12.0, 16.0, 8.0, 9.0, 9.0, 3.0, 1.0, 1.0, 4.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-1.46875, -1.425048828125, -1.38134765625, -1.337646484375, -1.2939453125, -1.250244140625, -1.20654296875, -1.162841796875, -1.119140625, -1.075439453125, -1.03173828125, -0.988037109375, -0.9443359375, -0.900634765625, -0.85693359375, -0.813232421875, -0.76953125, -0.725830078125, -0.68212890625, -0.638427734375, -0.5947265625, -0.551025390625, -0.50732421875, -0.463623046875, -0.419921875, -0.376220703125, -0.33251953125, -0.288818359375, -0.2451171875, -0.201416015625, -0.15771484375, -0.114013671875, -0.0703125, -0.026611328125, 0.01708984375, 0.060791015625, 0.1044921875, 0.148193359375, 0.19189453125, 0.235595703125, 0.279296875, 0.322998046875, 0.36669921875, 0.410400390625, 0.4541015625, 0.497802734375, 0.54150390625, 0.585205078125, 0.62890625, 0.672607421875, 0.71630859375, 0.760009765625, 0.8037109375, 0.847412109375, 0.89111328125, 0.934814453125, 0.978515625, 1.022216796875, 1.06591796875, 1.109619140625, 1.1533203125, 1.197021484375, 1.24072265625, 1.284423828125, 1.328125]}, "gradients/encoder.encoder.layers.15.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 1.0, 1.0, 0.0, 4.0, 3.0, 11.0, 10.0, 36.0, 102.0, 408.0, 5791.0, 1036576.0, 5065.0, 398.0, 110.0, 30.0, 9.0, 4.0, 2.0, 4.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.0234375, -3.903289794921875, -3.78314208984375, -3.662994384765625, -3.5428466796875, -3.422698974609375, -3.30255126953125, -3.182403564453125, -3.062255859375, -2.942108154296875, -2.82196044921875, -2.701812744140625, -2.5816650390625, -2.461517333984375, -2.34136962890625, -2.221221923828125, -2.10107421875, -1.980926513671875, -1.86077880859375, -1.740631103515625, -1.6204833984375, -1.500335693359375, -1.38018798828125, -1.260040283203125, -1.139892578125, -1.019744873046875, -0.89959716796875, -0.779449462890625, -0.6593017578125, -0.539154052734375, -0.41900634765625, -0.298858642578125, -0.1787109375, -0.058563232421875, 0.06158447265625, 0.181732177734375, 0.3018798828125, 0.422027587890625, 0.54217529296875, 0.662322998046875, 0.782470703125, 0.902618408203125, 1.02276611328125, 1.142913818359375, 1.2630615234375, 1.383209228515625, 1.50335693359375, 1.623504638671875, 1.74365234375, 1.863800048828125, 1.98394775390625, 2.104095458984375, 2.2242431640625, 2.344390869140625, 2.46453857421875, 2.584686279296875, 2.704833984375, 2.824981689453125, 2.94512939453125, 3.065277099609375, 3.1854248046875, 3.305572509765625, 3.42572021484375, 3.545867919921875, 3.666015625]}, "gradients/encoder.encoder.layers.15.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 2.0, 3.0, 2.0, 0.0, 4.0, 1.0, 2.0, 12.0, 15.0, 16.0, 42.0, 76.0, 117.0, 191.0, 189.0, 131.0, 93.0, 42.0, 23.0, 18.0, 9.0, 3.0, 3.0, 2.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 2.0, 2.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.459257125854492e-05, -9.080860763788223e-05, -8.702464401721954e-05, -8.324068039655685e-05, -7.945671677589417e-05, -7.567275315523148e-05, -7.188878953456879e-05, -6.81048259139061e-05, -6.432086229324341e-05, -6.053689867258072e-05, -5.675293505191803e-05, -5.296897143125534e-05, -4.918500781059265e-05, -4.540104418992996e-05, -4.161708056926727e-05, -3.7833116948604584e-05, -3.4049153327941895e-05, -3.0265189707279205e-05, -2.6481226086616516e-05, -2.2697262465953827e-05, -1.8913298845291138e-05, -1.5129335224628448e-05, -1.134537160396576e-05, -7.56140798330307e-06, -3.777444362640381e-06, 6.51925802230835e-09, 3.7904828786849976e-06, 7.574446499347687e-06, 1.1358410120010376e-05, 1.5142373740673065e-05, 1.8926337361335754e-05, 2.2710300981998444e-05, 2.6494264602661133e-05, 3.0278228223323822e-05, 3.406219184398651e-05, 3.78461554646492e-05, 4.163011908531189e-05, 4.541408270597458e-05, 4.919804632663727e-05, 5.298200994729996e-05, 5.6765973567962646e-05, 6.0549937188625336e-05, 6.433390080928802e-05, 6.811786442995071e-05, 7.19018280506134e-05, 7.568579167127609e-05, 7.946975529193878e-05, 8.325371891260147e-05, 8.703768253326416e-05, 9.082164615392685e-05, 9.460560977458954e-05, 9.838957339525223e-05, 0.00010217353701591492, 0.0001059575006365776, 0.0001097414642572403, 0.00011352542787790298, 0.00011730939149856567, 0.00012109335511922836, 0.00012487731873989105, 0.00012866128236055374, 0.00013244524598121643, 0.00013622920960187912, 0.0001400131732225418, 0.0001437971368432045, 0.0001475811004638672]}, "gradients/encoder.encoder.layers.15.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 1.0, 10.0, 11.0, 34.0, 114.0, 208.0, 745.0, 439178.0, 607071.0, 796.0, 215.0, 101.0, 36.0, 17.0, 9.0, 7.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.4140625, -3.29217529296875, -3.1702880859375, -3.04840087890625, -2.926513671875, -2.80462646484375, -2.6827392578125, -2.56085205078125, -2.43896484375, -2.31707763671875, -2.1951904296875, -2.07330322265625, -1.951416015625, -1.82952880859375, -1.7076416015625, -1.58575439453125, -1.4638671875, -1.34197998046875, -1.2200927734375, -1.09820556640625, -0.976318359375, -0.85443115234375, -0.7325439453125, -0.61065673828125, -0.48876953125, -0.36688232421875, -0.2449951171875, -0.12310791015625, -0.001220703125, 0.12066650390625, 0.2425537109375, 0.36444091796875, 0.486328125, 0.60821533203125, 0.7301025390625, 0.85198974609375, 0.973876953125, 1.09576416015625, 1.2176513671875, 1.33953857421875, 1.46142578125, 1.58331298828125, 1.7052001953125, 1.82708740234375, 1.948974609375, 2.07086181640625, 2.1927490234375, 2.31463623046875, 2.4365234375, 2.55841064453125, 2.6802978515625, 2.80218505859375, 2.924072265625, 3.04595947265625, 3.1678466796875, 3.28973388671875, 3.41162109375, 3.53350830078125, 3.6553955078125, 3.77728271484375, 3.899169921875, 4.02105712890625, 4.1429443359375, 4.26483154296875, 4.38671875]}, "gradients/encoder.encoder.layers.15.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 5.0, 11.0, 64.0, 301.0, 516.0, 91.0, 17.0, 11.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.40625, -2.320892333984375, -2.23553466796875, -2.150177001953125, -2.0648193359375, -1.979461669921875, -1.89410400390625, -1.808746337890625, -1.723388671875, -1.638031005859375, -1.55267333984375, -1.467315673828125, -1.3819580078125, -1.296600341796875, -1.21124267578125, -1.125885009765625, -1.04052734375, -0.955169677734375, -0.86981201171875, -0.784454345703125, -0.6990966796875, -0.613739013671875, -0.52838134765625, -0.443023681640625, -0.357666015625, -0.272308349609375, -0.18695068359375, -0.101593017578125, -0.0162353515625, 0.069122314453125, 0.15447998046875, 0.239837646484375, 0.3251953125, 0.410552978515625, 0.49591064453125, 0.581268310546875, 0.6666259765625, 0.751983642578125, 0.83734130859375, 0.922698974609375, 1.008056640625, 1.093414306640625, 1.17877197265625, 1.264129638671875, 1.3494873046875, 1.434844970703125, 1.52020263671875, 1.605560302734375, 1.69091796875, 1.776275634765625, 1.86163330078125, 1.946990966796875, 2.0323486328125, 2.117706298828125, 2.20306396484375, 2.288421630859375, 2.373779296875, 2.459136962890625, 2.54449462890625, 2.629852294921875, 2.7152099609375, 2.800567626953125, 2.88592529296875, 2.971282958984375, 3.056640625]}, "gradients/encoder.encoder.layers.15.layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 4.0, 9.0, 15.0, 59.0, 169.0, 354.0, 283.0, 85.0, 21.0, 9.0, 4.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.268885612487793, -5.632908821105957, -4.996932029724121, -4.360955715179443, -3.7249789237976074, -3.0890021324157715, -2.4530255794525146, -1.8170490264892578, -1.1810722351074219, -0.5450955629348755, 0.0908811092376709, 0.7268577814102173, 1.3628344535827637, 1.9988112449645996, 2.6347877979278564, 3.2707643508911133, 3.906741142272949, 4.542717933654785, 5.178694725036621, 5.814671039581299, 6.450647830963135, 7.086624622344971, 7.722600936889648, 8.358577728271484, 8.99455451965332, 9.630531311035156, 10.266508102416992, 10.902484893798828, 11.538461685180664, 12.1744384765625, 12.81041431427002, 13.446391105651855, 14.082366943359375, 14.718343734741211, 15.354320526123047, 15.990297317504883, 16.62627410888672, 17.262250900268555, 17.89822769165039, 18.534202575683594, 19.170181274414062, 19.8061580657959, 20.442134857177734, 21.07811164855957, 21.714088439941406, 22.350065231323242, 22.986042022705078, 23.62201690673828, 24.257993698120117, 24.893970489501953, 25.52994728088379, 26.165924072265625, 26.80190086364746, 27.437877655029297, 28.073854446411133, 28.70983123779297, 29.345806121826172, 29.981782913208008, 30.617759704589844, 31.25373649597168, 31.889713287353516, 32.52568817138672, 33.16166687011719, 33.79764175415039, 34.43362045288086]}, "gradients/encoder.encoder.layers.15.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 5.0, 9.0, 5.0, 18.0, 5.0, 11.0, 16.0, 14.0, 20.0, 22.0, 19.0, 28.0, 26.0, 29.0, 31.0, 36.0, 29.0, 45.0, 29.0, 29.0, 48.0, 54.0, 41.0, 38.0, 36.0, 42.0, 34.0, 28.0, 28.0, 22.0, 21.0, 26.0, 22.0, 28.0, 26.0, 15.0, 9.0, 17.0, 5.0, 10.0, 5.0, 6.0, 1.0, 3.0, 5.0, 3.0, 1.0, 2.0, 2.0, 2.0, 3.0], "bins": [-6.289222717285156, -6.104809284210205, -5.920395851135254, -5.735982418060303, -5.551568984985352, -5.3671555519104, -5.182742118835449, -4.998329162597656, -4.813915252685547, -4.629501819610596, -4.4450883865356445, -4.260674953460693, -4.076261520385742, -3.891848087310791, -3.707434892654419, -3.5230214595794678, -3.3386082649230957, -3.1541948318481445, -2.9697813987731934, -2.785367965698242, -2.600954532623291, -2.41654109954834, -2.2321279048919678, -2.0477144718170166, -1.8633010387420654, -1.6788876056671143, -1.494474172592163, -1.3100608587265015, -1.1256474256515503, -0.9412339925765991, -0.7568206787109375, -0.5724072456359863, -0.38799428939819336, -0.20358088612556458, -0.01916748285293579, 0.1652458906173706, 0.3496593236923218, 0.534072756767273, 0.7184860706329346, 0.9028995037078857, 1.087312936782837, 1.271726369857788, 1.4561398029327393, 1.6405531167984009, 1.824966549873352, 2.0093798637390137, 2.193793296813965, 2.378206729888916, 2.562620162963867, 2.7470335960388184, 2.9314470291137695, 3.1158604621887207, 3.300273895263672, 3.484687328338623, 3.669100522994995, 3.8535139560699463, 4.037927627563477, 4.222341060638428, 4.406754493713379, 4.59116792678833, 4.775581359863281, 4.959994792938232, 5.144408226013184, 5.328821182250977, 5.513234615325928]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 5.0, 3.0, 7.0, 10.0, 11.0, 20.0, 32.0, 42.0, 64.0, 103.0, 180.0, 359.0, 693.0, 1428.0, 3740.0, 12012.0, 69646.0, 3761034.0, 309566.0, 24643.0, 6157.0, 2241.0, 997.0, 476.0, 268.0, 166.0, 111.0, 70.0, 59.0, 34.0, 18.0, 20.0, 21.0, 16.0, 5.0, 4.0, 8.0, 7.0, 3.0, 3.0, 1.0, 3.0, 2.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.421875, -1.36199951171875, -1.3021240234375, -1.24224853515625, -1.182373046875, -1.12249755859375, -1.0626220703125, -1.00274658203125, -0.94287109375, -0.88299560546875, -0.8231201171875, -0.76324462890625, -0.703369140625, -0.64349365234375, -0.5836181640625, -0.52374267578125, -0.4638671875, -0.40399169921875, -0.3441162109375, -0.28424072265625, -0.224365234375, -0.16448974609375, -0.1046142578125, -0.04473876953125, 0.01513671875, 0.07501220703125, 0.1348876953125, 0.19476318359375, 0.254638671875, 0.31451416015625, 0.3743896484375, 0.43426513671875, 0.494140625, 0.55401611328125, 0.6138916015625, 0.67376708984375, 0.733642578125, 0.79351806640625, 0.8533935546875, 0.91326904296875, 0.97314453125, 1.03302001953125, 1.0928955078125, 1.15277099609375, 1.212646484375, 1.27252197265625, 1.3323974609375, 1.39227294921875, 1.4521484375, 1.51202392578125, 1.5718994140625, 1.63177490234375, 1.691650390625, 1.75152587890625, 1.8114013671875, 1.87127685546875, 1.93115234375, 1.99102783203125, 2.0509033203125, 2.11077880859375, 2.170654296875, 2.23052978515625, 2.2904052734375, 2.35028076171875, 2.41015625]}, "gradients/encoder.encoder.layers.14.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 3.0, 3.0, 5.0, 2.0, 8.0, 4.0, 18.0, 18.0, 22.0, 37.0, 44.0, 52.0, 98.0, 80.0, 91.0, 108.0, 90.0, 83.0, 72.0, 51.0, 29.0, 28.0, 27.0, 15.0, 10.0, 5.0, 2.0, 1.0, 2.0, 3.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.55126953125, -0.5302200317382812, -0.5091705322265625, -0.48812103271484375, -0.467071533203125, -0.44602203369140625, -0.4249725341796875, -0.40392303466796875, -0.38287353515625, -0.36182403564453125, -0.3407745361328125, -0.31972503662109375, -0.298675537109375, -0.27762603759765625, -0.2565765380859375, -0.23552703857421875, -0.2144775390625, -0.19342803955078125, -0.1723785400390625, -0.15132904052734375, -0.130279541015625, -0.10923004150390625, -0.0881805419921875, -0.06713104248046875, -0.04608154296875, -0.02503204345703125, -0.0039825439453125, 0.01706695556640625, 0.038116455078125, 0.05916595458984375, 0.0802154541015625, 0.10126495361328125, 0.122314453125, 0.14336395263671875, 0.1644134521484375, 0.18546295166015625, 0.206512451171875, 0.22756195068359375, 0.2486114501953125, 0.26966094970703125, 0.29071044921875, 0.31175994873046875, 0.3328094482421875, 0.35385894775390625, 0.374908447265625, 0.39595794677734375, 0.4170074462890625, 0.43805694580078125, 0.4591064453125, 0.48015594482421875, 0.5012054443359375, 0.5222549438476562, 0.543304443359375, 0.5643539428710938, 0.5854034423828125, 0.6064529418945312, 0.62750244140625, 0.6485519409179688, 0.6696014404296875, 0.6906509399414062, 0.711700439453125, 0.7327499389648438, 0.7537994384765625, 0.7748489379882812, 0.7958984375]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 12.0, 11.0, 23.0, 28.0, 58.0, 83.0, 210.0, 376.0, 1190.0, 4659.0, 56963.0, 4046698.0, 76143.0, 5546.0, 1341.0, 517.0, 207.0, 98.0, 56.0, 30.0, 13.0, 11.0, 3.0, 6.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4453125, -2.35650634765625, -2.2677001953125, -2.17889404296875, -2.090087890625, -2.00128173828125, -1.9124755859375, -1.82366943359375, -1.73486328125, -1.64605712890625, -1.5572509765625, -1.46844482421875, -1.379638671875, -1.29083251953125, -1.2020263671875, -1.11322021484375, -1.0244140625, -0.93560791015625, -0.8468017578125, -0.75799560546875, -0.669189453125, -0.58038330078125, -0.4915771484375, -0.40277099609375, -0.31396484375, -0.22515869140625, -0.1363525390625, -0.04754638671875, 0.041259765625, 0.13006591796875, 0.2188720703125, 0.30767822265625, 0.396484375, 0.48529052734375, 0.5740966796875, 0.66290283203125, 0.751708984375, 0.84051513671875, 0.9293212890625, 1.01812744140625, 1.10693359375, 1.19573974609375, 1.2845458984375, 1.37335205078125, 1.462158203125, 1.55096435546875, 1.6397705078125, 1.72857666015625, 1.8173828125, 1.90618896484375, 1.9949951171875, 2.08380126953125, 2.172607421875, 2.26141357421875, 2.3502197265625, 2.43902587890625, 2.52783203125, 2.61663818359375, 2.7054443359375, 2.79425048828125, 2.883056640625, 2.97186279296875, 3.0606689453125, 3.14947509765625, 3.23828125]}, "gradients/encoder.encoder.layers.14.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 3.0, 2.0, 4.0, 6.0, 5.0, 12.0, 16.0, 31.0, 68.0, 171.0, 471.0, 2319.0, 592.0, 186.0, 72.0, 42.0, 24.0, 21.0, 10.0, 7.0, 5.0, 6.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.869140625, -0.844696044921875, -0.82025146484375, -0.795806884765625, -0.7713623046875, -0.746917724609375, -0.72247314453125, -0.698028564453125, -0.673583984375, -0.649139404296875, -0.62469482421875, -0.600250244140625, -0.5758056640625, -0.551361083984375, -0.52691650390625, -0.502471923828125, -0.47802734375, -0.453582763671875, -0.42913818359375, -0.404693603515625, -0.3802490234375, -0.355804443359375, -0.33135986328125, -0.306915283203125, -0.282470703125, -0.258026123046875, -0.23358154296875, -0.209136962890625, -0.1846923828125, -0.160247802734375, -0.13580322265625, -0.111358642578125, -0.0869140625, -0.062469482421875, -0.03802490234375, -0.013580322265625, 0.0108642578125, 0.035308837890625, 0.05975341796875, 0.084197998046875, 0.108642578125, 0.133087158203125, 0.15753173828125, 0.181976318359375, 0.2064208984375, 0.230865478515625, 0.25531005859375, 0.279754638671875, 0.30419921875, 0.328643798828125, 0.35308837890625, 0.377532958984375, 0.4019775390625, 0.426422119140625, 0.45086669921875, 0.475311279296875, 0.499755859375, 0.524200439453125, 0.54864501953125, 0.573089599609375, 0.5975341796875, 0.621978759765625, 0.64642333984375, 0.670867919921875, 0.6953125]}, "gradients/encoder.encoder.layers.14.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 17.0, 27.0, 138.0, 375.0, 320.0, 86.0, 28.0, 5.0, 5.0, 1.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.6058623790740967, -2.3814826011657715, -2.1571028232574463, -1.9327229261398315, -1.7083431482315063, -1.4839633703231812, -1.2595834732055664, -1.0352036952972412, -0.810823917388916, -0.5864441394805908, -0.36206430196762085, -0.13768446445465088, 0.08669531345367432, 0.3110750913619995, 0.5354549884796143, 0.7598347663879395, 0.9842145442962646, 1.2085943222045898, 1.432974100112915, 1.6573539972305298, 1.881733775138855, 2.1061134338378906, 2.330493450164795, 2.55487322807312, 2.7792530059814453, 3.0036327838897705, 3.2280125617980957, 3.452392578125, 3.676772117614746, 3.9011521339416504, 4.125532150268555, 4.349911689758301, 4.574291229248047, 4.798671245574951, 5.023050785064697, 5.247430801391602, 5.471810340881348, 5.696190357208252, 5.920570373535156, 6.144949913024902, 6.369329452514648, 6.593709468841553, 6.818089008331299, 7.042469024658203, 7.266848564147949, 7.4912285804748535, 7.715608596801758, 7.939988136291504, 8.16436767578125, 8.388747215270996, 8.613127708435059, 8.837507247924805, 9.06188678741455, 9.286266326904297, 9.51064682006836, 9.735026359558105, 9.959406852722168, 10.183786392211914, 10.408166885375977, 10.632546424865723, 10.856925964355469, 11.081305503845215, 11.305685997009277, 11.530065536499023, 11.75444507598877]}, "gradients/encoder.encoder.layers.14.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 3.0, 2.0, 7.0, 8.0, 7.0, 21.0, 9.0, 16.0, 24.0, 20.0, 38.0, 51.0, 38.0, 56.0, 57.0, 54.0, 60.0, 61.0, 68.0, 56.0, 54.0, 49.0, 44.0, 28.0, 36.0, 26.0, 21.0, 22.0, 17.0, 18.0, 8.0, 7.0, 6.0, 5.0, 8.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0], "bins": [-2.2382194995880127, -2.172811269760132, -2.107403039932251, -2.04199481010437, -1.9765865802764893, -1.9111783504486084, -1.8457701206207275, -1.7803618907928467, -1.7149536609649658, -1.649545431137085, -1.584137201309204, -1.5187289714813232, -1.4533207416534424, -1.3879125118255615, -1.3225042819976807, -1.2570960521697998, -1.1916877031326294, -1.1262794733047485, -1.0608712434768677, -0.9954630136489868, -0.930054783821106, -0.8646465539932251, -0.7992382645606995, -0.7338300347328186, -0.6684218049049377, -0.6030135750770569, -0.537605345249176, -0.4721970856189728, -0.4067888557910919, -0.34138062596321106, -0.2759723663330078, -0.21056413650512695, -0.14515602588653564, -0.07974778860807419, -0.014339551329612732, 0.05106869339942932, 0.11647692322731018, 0.18188515305519104, 0.2472934126853943, 0.31270164251327515, 0.378109872341156, 0.44351810216903687, 0.5089263319969177, 0.5743346214294434, 0.6397428512573242, 0.7051510810852051, 0.7705593109130859, 0.8359675407409668, 0.9013757705688477, 0.9667840003967285, 1.0321922302246094, 1.0976004600524902, 1.163008689880371, 1.228416919708252, 1.2938251495361328, 1.3592333793640137, 1.4246416091918945, 1.4900498390197754, 1.5554580688476562, 1.620866298675537, 1.686274528503418, 1.7516827583312988, 1.8170909881591797, 1.8824992179870605, 1.947907567024231]}, "gradients/encoder.encoder.layers.14.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 0.0, 2.0, 1.0, 2.0, 0.0, 2.0, 9.0, 7.0, 7.0, 8.0, 16.0, 22.0, 37.0, 64.0, 112.0, 222.0, 448.0, 1241.0, 5676.0, 60284.0, 830182.0, 137819.0, 9408.0, 1856.0, 582.0, 238.0, 130.0, 77.0, 46.0, 24.0, 12.0, 12.0, 3.0, 5.0, 6.0, 2.0, 4.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.4921875, -2.38671875, -2.28125, -2.17578125, -2.0703125, -1.96484375, -1.859375, -1.75390625, -1.6484375, -1.54296875, -1.4375, -1.33203125, -1.2265625, -1.12109375, -1.015625, -0.91015625, -0.8046875, -0.69921875, -0.59375, -0.48828125, -0.3828125, -0.27734375, -0.171875, -0.06640625, 0.0390625, 0.14453125, 0.25, 0.35546875, 0.4609375, 0.56640625, 0.671875, 0.77734375, 0.8828125, 0.98828125, 1.09375, 1.19921875, 1.3046875, 1.41015625, 1.515625, 1.62109375, 1.7265625, 1.83203125, 1.9375, 2.04296875, 2.1484375, 2.25390625, 2.359375, 2.46484375, 2.5703125, 2.67578125, 2.78125, 2.88671875, 2.9921875, 3.09765625, 3.203125, 3.30859375, 3.4140625, 3.51953125, 3.625, 3.73046875, 3.8359375, 3.94140625, 4.046875, 4.15234375, 4.2578125]}, "gradients/encoder.encoder.layers.14.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 3.0, 3.0, 3.0, 6.0, 12.0, 14.0, 21.0, 27.0, 39.0, 46.0, 68.0, 90.0, 88.0, 101.0, 129.0, 93.0, 64.0, 67.0, 41.0, 30.0, 27.0, 15.0, 7.0, 6.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.5947265625, -0.5724945068359375, -0.550262451171875, -0.5280303955078125, -0.50579833984375, -0.4835662841796875, -0.461334228515625, -0.4391021728515625, -0.4168701171875, -0.3946380615234375, -0.372406005859375, -0.3501739501953125, -0.32794189453125, -0.3057098388671875, -0.283477783203125, -0.2612457275390625, -0.239013671875, -0.2167816162109375, -0.194549560546875, -0.1723175048828125, -0.15008544921875, -0.1278533935546875, -0.105621337890625, -0.0833892822265625, -0.0611572265625, -0.0389251708984375, -0.016693115234375, 0.0055389404296875, 0.02777099609375, 0.0500030517578125, 0.072235107421875, 0.0944671630859375, 0.11669921875, 0.1389312744140625, 0.161163330078125, 0.1833953857421875, 0.20562744140625, 0.2278594970703125, 0.250091552734375, 0.2723236083984375, 0.2945556640625, 0.3167877197265625, 0.339019775390625, 0.3612518310546875, 0.38348388671875, 0.4057159423828125, 0.427947998046875, 0.4501800537109375, 0.472412109375, 0.4946441650390625, 0.516876220703125, 0.5391082763671875, 0.56134033203125, 0.5835723876953125, 0.605804443359375, 0.6280364990234375, 0.6502685546875, 0.6725006103515625, 0.694732666015625, 0.7169647216796875, 0.73919677734375, 0.7614288330078125, 0.783660888671875, 0.8058929443359375, 0.828125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 2.0, 1.0, 4.0, 10.0, 9.0, 11.0, 9.0, 12.0, 25.0, 27.0, 36.0, 32.0, 47.0, 75.0, 91.0, 124.0, 224.0, 395.0, 841.0, 2223.0, 7356.0, 29496.0, 156122.0, 590485.0, 208783.0, 38212.0, 9060.0, 2658.0, 942.0, 443.0, 263.0, 148.0, 94.0, 54.0, 68.0, 37.0, 29.0, 28.0, 21.0, 11.0, 16.0, 4.0, 16.0, 5.0, 9.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3203125, -1.2756805419921875, -1.231048583984375, -1.1864166259765625, -1.14178466796875, -1.0971527099609375, -1.052520751953125, -1.0078887939453125, -0.9632568359375, -0.9186248779296875, -0.873992919921875, -0.8293609619140625, -0.78472900390625, -0.7400970458984375, -0.695465087890625, -0.6508331298828125, -0.606201171875, -0.5615692138671875, -0.516937255859375, -0.4723052978515625, -0.42767333984375, -0.3830413818359375, -0.338409423828125, -0.2937774658203125, -0.2491455078125, -0.2045135498046875, -0.159881591796875, -0.1152496337890625, -0.07061767578125, -0.0259857177734375, 0.018646240234375, 0.0632781982421875, 0.10791015625, 0.1525421142578125, 0.197174072265625, 0.2418060302734375, 0.28643798828125, 0.3310699462890625, 0.375701904296875, 0.4203338623046875, 0.4649658203125, 0.5095977783203125, 0.554229736328125, 0.5988616943359375, 0.64349365234375, 0.6881256103515625, 0.732757568359375, 0.7773895263671875, 0.822021484375, 0.8666534423828125, 0.911285400390625, 0.9559173583984375, 1.00054931640625, 1.0451812744140625, 1.089813232421875, 1.1344451904296875, 1.1790771484375, 1.2237091064453125, 1.268341064453125, 1.3129730224609375, 1.35760498046875, 1.4022369384765625, 1.446868896484375, 1.4915008544921875, 1.5361328125]}, "gradients/encoder.encoder.layers.14.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 6.0, 1.0, 4.0, 5.0, 1.0, 3.0, 10.0, 11.0, 10.0, 13.0, 15.0, 16.0, 17.0, 19.0, 23.0, 23.0, 29.0, 20.0, 43.0, 45.0, 43.0, 44.0, 38.0, 37.0, 55.0, 39.0, 37.0, 48.0, 35.0, 44.0, 55.0, 30.0, 32.0, 31.0, 30.0, 17.0, 21.0, 13.0, 10.0, 5.0, 6.0, 3.0, 2.0, 9.0, 6.0, 4.0, 2.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.29296875, -1.2508087158203125, -1.208648681640625, -1.1664886474609375, -1.12432861328125, -1.0821685791015625, -1.040008544921875, -0.9978485107421875, -0.9556884765625, -0.9135284423828125, -0.871368408203125, -0.8292083740234375, -0.78704833984375, -0.7448883056640625, -0.702728271484375, -0.6605682373046875, -0.618408203125, -0.5762481689453125, -0.534088134765625, -0.4919281005859375, -0.44976806640625, -0.4076080322265625, -0.365447998046875, -0.3232879638671875, -0.2811279296875, -0.2389678955078125, -0.196807861328125, -0.1546478271484375, -0.11248779296875, -0.0703277587890625, -0.028167724609375, 0.0139923095703125, 0.05615234375, 0.0983123779296875, 0.140472412109375, 0.1826324462890625, 0.22479248046875, 0.2669525146484375, 0.309112548828125, 0.3512725830078125, 0.3934326171875, 0.4355926513671875, 0.477752685546875, 0.5199127197265625, 0.56207275390625, 0.6042327880859375, 0.646392822265625, 0.6885528564453125, 0.730712890625, 0.7728729248046875, 0.815032958984375, 0.8571929931640625, 0.89935302734375, 0.9415130615234375, 0.983673095703125, 1.0258331298828125, 1.0679931640625, 1.1101531982421875, 1.152313232421875, 1.1944732666015625, 1.23663330078125, 1.2787933349609375, 1.320953369140625, 1.3631134033203125, 1.4052734375]}, "gradients/encoder.encoder.layers.14.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 2.0, 1.0, 2.0, 5.0, 9.0, 6.0, 15.0, 11.0, 24.0, 41.0, 71.0, 92.0, 146.0, 365.0, 1721.0, 22848.0, 934961.0, 84115.0, 3065.0, 576.0, 204.0, 84.0, 57.0, 54.0, 23.0, 30.0, 14.0, 9.0, 4.0, 4.0, 2.0, 4.0, 0.0, 0.0, 1.0, 0.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.27734375, -1.23822021484375, -1.1990966796875, -1.15997314453125, -1.120849609375, -1.08172607421875, -1.0426025390625, -1.00347900390625, -0.96435546875, -0.92523193359375, -0.8861083984375, -0.84698486328125, -0.807861328125, -0.76873779296875, -0.7296142578125, -0.69049072265625, -0.6513671875, -0.61224365234375, -0.5731201171875, -0.53399658203125, -0.494873046875, -0.45574951171875, -0.4166259765625, -0.37750244140625, -0.33837890625, -0.29925537109375, -0.2601318359375, -0.22100830078125, -0.181884765625, -0.14276123046875, -0.1036376953125, -0.06451416015625, -0.025390625, 0.01373291015625, 0.0528564453125, 0.09197998046875, 0.131103515625, 0.17022705078125, 0.2093505859375, 0.24847412109375, 0.28759765625, 0.32672119140625, 0.3658447265625, 0.40496826171875, 0.444091796875, 0.48321533203125, 0.5223388671875, 0.56146240234375, 0.6005859375, 0.63970947265625, 0.6788330078125, 0.71795654296875, 0.757080078125, 0.79620361328125, 0.8353271484375, 0.87445068359375, 0.91357421875, 0.95269775390625, 0.9918212890625, 1.03094482421875, 1.070068359375, 1.10919189453125, 1.1483154296875, 1.18743896484375, 1.2265625]}, "gradients/encoder.encoder.layers.14.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 7.0, 4.0, 14.0, 9.0, 6.0, 23.0, 34.0, 36.0, 60.0, 82.0, 98.0, 114.0, 111.0, 93.0, 80.0, 59.0, 40.0, 43.0, 20.0, 18.0, 21.0, 8.0, 4.0, 2.0, 6.0, 7.0, 4.0, 3.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.37905502319336e-05, -7.115211337804794e-05, -6.851367652416229e-05, -6.587523967027664e-05, -6.323680281639099e-05, -6.059836596250534e-05, -5.795992910861969e-05, -5.532149225473404e-05, -5.268305540084839e-05, -5.004461854696274e-05, -4.740618169307709e-05, -4.476774483919144e-05, -4.2129307985305786e-05, -3.9490871131420135e-05, -3.6852434277534485e-05, -3.4213997423648834e-05, -3.1575560569763184e-05, -2.8937123715877533e-05, -2.6298686861991882e-05, -2.366025000810623e-05, -2.102181315422058e-05, -1.838337630033493e-05, -1.574493944644928e-05, -1.3106502592563629e-05, -1.0468065738677979e-05, -7.829628884792328e-06, -5.191192030906677e-06, -2.5527551770210266e-06, 8.568167686462402e-08, 2.7241185307502747e-06, 5.362555384635925e-06, 8.000992238521576e-06, 1.0639429092407227e-05, 1.3277865946292877e-05, 1.5916302800178528e-05, 1.855473965406418e-05, 2.119317650794983e-05, 2.383161336183548e-05, 2.647005021572113e-05, 2.910848706960678e-05, 3.174692392349243e-05, 3.438536077737808e-05, 3.702379763126373e-05, 3.9662234485149384e-05, 4.2300671339035034e-05, 4.4939108192920685e-05, 4.7577545046806335e-05, 5.0215981900691986e-05, 5.285441875457764e-05, 5.549285560846329e-05, 5.813129246234894e-05, 6.076972931623459e-05, 6.340816617012024e-05, 6.604660302400589e-05, 6.868503987789154e-05, 7.132347673177719e-05, 7.396191358566284e-05, 7.660035043954849e-05, 7.923878729343414e-05, 8.18772241473198e-05, 8.451566100120544e-05, 8.71540978550911e-05, 8.979253470897675e-05, 9.24309715628624e-05, 9.506940841674805e-05]}, "gradients/encoder.encoder.layers.14.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 1.0, 4.0, 4.0, 11.0, 13.0, 49.0, 105.0, 300.0, 1086.0, 15824.0, 947835.0, 80542.0, 2073.0, 449.0, 154.0, 56.0, 24.0, 13.0, 8.0, 4.0, 6.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.7529296875, -1.7108612060546875, -1.668792724609375, -1.6267242431640625, -1.58465576171875, -1.5425872802734375, -1.500518798828125, -1.4584503173828125, -1.4163818359375, -1.3743133544921875, -1.332244873046875, -1.2901763916015625, -1.24810791015625, -1.2060394287109375, -1.163970947265625, -1.1219024658203125, -1.079833984375, -1.0377655029296875, -0.995697021484375, -0.9536285400390625, -0.91156005859375, -0.8694915771484375, -0.827423095703125, -0.7853546142578125, -0.7432861328125, -0.7012176513671875, -0.659149169921875, -0.6170806884765625, -0.57501220703125, -0.5329437255859375, -0.490875244140625, -0.4488067626953125, -0.40673828125, -0.3646697998046875, -0.322601318359375, -0.2805328369140625, -0.23846435546875, -0.1963958740234375, -0.154327392578125, -0.1122589111328125, -0.0701904296875, -0.0281219482421875, 0.013946533203125, 0.0560150146484375, 0.09808349609375, 0.1401519775390625, 0.182220458984375, 0.2242889404296875, 0.266357421875, 0.3084259033203125, 0.350494384765625, 0.3925628662109375, 0.43463134765625, 0.4766998291015625, 0.518768310546875, 0.5608367919921875, 0.6029052734375, 0.6449737548828125, 0.687042236328125, 0.7291107177734375, 0.77117919921875, 0.8132476806640625, 0.855316162109375, 0.8973846435546875, 0.939453125]}, "gradients/encoder.encoder.layers.14.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 7.0, 5.0, 14.0, 28.0, 54.0, 85.0, 154.0, 182.0, 171.0, 135.0, 71.0, 48.0, 29.0, 15.0, 7.0, 6.0, 2.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.455078125, -1.4259147644042969, -1.3967514038085938, -1.3675880432128906, -1.3384246826171875, -1.3092613220214844, -1.2800979614257812, -1.2509346008300781, -1.221771240234375, -1.1926078796386719, -1.1634445190429688, -1.1342811584472656, -1.1051177978515625, -1.0759544372558594, -1.0467910766601562, -1.0176277160644531, -0.98846435546875, -0.9593009948730469, -0.9301376342773438, -0.9009742736816406, -0.8718109130859375, -0.8426475524902344, -0.8134841918945312, -0.7843208312988281, -0.755157470703125, -0.7259941101074219, -0.6968307495117188, -0.6676673889160156, -0.6385040283203125, -0.6093406677246094, -0.5801773071289062, -0.5510139465332031, -0.5218505859375, -0.4926872253417969, -0.46352386474609375, -0.4343605041503906, -0.4051971435546875, -0.3760337829589844, -0.34687042236328125, -0.3177070617675781, -0.288543701171875, -0.2593803405761719, -0.23021697998046875, -0.20105361938476562, -0.1718902587890625, -0.14272689819335938, -0.11356353759765625, -0.08440017700195312, -0.05523681640625, -0.026073455810546875, 0.00308990478515625, 0.032253265380859375, 0.0614166259765625, 0.09057998657226562, 0.11974334716796875, 0.14890670776367188, 0.178070068359375, 0.20723342895507812, 0.23639678955078125, 0.2655601501464844, 0.2947235107421875, 0.3238868713378906, 0.35305023193359375, 0.3822135925292969, 0.411376953125]}, "gradients/encoder.encoder.layers.14.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 4.0, 7.0, 8.0, 20.0, 58.0, 179.0, 347.0, 248.0, 103.0, 24.0, 13.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.727996826171875, -19.127971649169922, -18.52794647216797, -17.927921295166016, -17.327898025512695, -16.727872848510742, -16.12784767150879, -15.527822494506836, -14.927797317504883, -14.32777214050293, -13.727747917175293, -13.12772274017334, -12.527697563171387, -11.92767333984375, -11.327648162841797, -10.727622985839844, -10.127598762512207, -9.527573585510254, -8.927549362182617, -8.327524185180664, -7.727499008178711, -7.127474308013916, -6.527449607849121, -5.927424430847168, -5.327399730682373, -4.727375030517578, -4.127349853515625, -3.52732515335083, -2.927300214767456, -2.327275276184082, -1.727250576019287, -1.127225399017334, -0.5272006988525391, 0.07282418012619019, 0.6728490591049194, 1.272873878479004, 1.872898817062378, 2.472923755645752, 3.072948455810547, 3.6729736328125, 4.272998332977295, 4.87302303314209, 5.473048210144043, 6.073072910308838, 6.673097610473633, 7.273122787475586, 7.873147487640381, 8.473173141479492, 9.073197364807129, 9.673222541809082, 10.273246765136719, 10.873271942138672, 11.473297119140625, 12.073322296142578, 12.673346519470215, 13.273371696472168, 13.873395919799805, 14.473421096801758, 15.073445320129395, 15.673470497131348, 16.273494720458984, 16.873519897460938, 17.47354507446289, 18.073570251464844, 18.673595428466797]}, "gradients/encoder.encoder.layers.14.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 5.0, 2.0, 2.0, 5.0, 11.0, 6.0, 16.0, 19.0, 34.0, 20.0, 37.0, 34.0, 34.0, 29.0, 50.0, 38.0, 47.0, 51.0, 50.0, 45.0, 39.0, 45.0, 50.0, 51.0, 40.0, 50.0, 36.0, 29.0, 25.0, 22.0, 20.0, 18.0, 8.0, 11.0, 3.0, 12.0, 8.0, 6.0, 1.0, 2.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.005902290344238, -8.745743751525879, -8.48558521270752, -8.225425720214844, -7.965267181396484, -7.705108642578125, -7.444950103759766, -7.184791088104248, -6.9246320724487305, -6.664473533630371, -6.4043145179748535, -6.144155979156494, -5.883996963500977, -5.623838424682617, -5.363679885864258, -5.10352087020874, -4.843362331390381, -4.5832037925720215, -4.323044776916504, -4.0628862380981445, -3.802727222442627, -3.5425686836242676, -3.282409906387329, -3.0222511291503906, -2.762092351913452, -2.5019335746765137, -2.241774797439575, -1.9816161394119263, -1.7214573621749878, -1.4612985849380493, -1.2011399269104004, -0.9409811496734619, -0.6808223724365234, -0.42066362500190735, -0.16050487756729126, 0.09965384006500244, 0.3598126173019409, 0.6199713945388794, 0.8801300525665283, 1.1402888298034668, 1.4004476070404053, 1.6606063842773438, 1.9207651615142822, 2.1809239387512207, 2.44108247756958, 2.7012414932250977, 2.961400032043457, 3.2215588092803955, 3.481717586517334, 3.7418763637542725, 4.002035140991211, 4.26219367980957, 4.522352695465088, 4.782511234283447, 5.042670249938965, 5.302828788757324, 5.562987327575684, 5.823145866394043, 6.0833048820495605, 6.34346342086792, 6.6036224365234375, 6.863780975341797, 7.123939514160156, 7.384098529815674, 7.644257545471191]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 3.0, 9.0, 16.0, 24.0, 50.0, 67.0, 93.0, 188.0, 331.0, 671.0, 1393.0, 3601.0, 10940.0, 53001.0, 3856557.0, 234831.0, 22155.0, 5992.0, 2208.0, 911.0, 451.0, 239.0, 174.0, 101.0, 67.0, 52.0, 28.0, 39.0, 24.0, 21.0, 9.0, 9.0, 8.0, 6.0, 5.0, 3.0, 3.0, 2.0, 4.0, 1.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.326171875, -2.235870361328125, -2.14556884765625, -2.055267333984375, -1.9649658203125, -1.874664306640625, -1.78436279296875, -1.694061279296875, -1.603759765625, -1.513458251953125, -1.42315673828125, -1.332855224609375, -1.2425537109375, -1.152252197265625, -1.06195068359375, -0.971649169921875, -0.88134765625, -0.791046142578125, -0.70074462890625, -0.610443115234375, -0.5201416015625, -0.429840087890625, -0.33953857421875, -0.249237060546875, -0.158935546875, -0.068634033203125, 0.02166748046875, 0.111968994140625, 0.2022705078125, 0.292572021484375, 0.38287353515625, 0.473175048828125, 0.5634765625, 0.653778076171875, 0.74407958984375, 0.834381103515625, 0.9246826171875, 1.014984130859375, 1.10528564453125, 1.195587158203125, 1.285888671875, 1.376190185546875, 1.46649169921875, 1.556793212890625, 1.6470947265625, 1.737396240234375, 1.82769775390625, 1.917999267578125, 2.00830078125, 2.098602294921875, 2.18890380859375, 2.279205322265625, 2.3695068359375, 2.459808349609375, 2.55010986328125, 2.640411376953125, 2.730712890625, 2.821014404296875, 2.91131591796875, 3.001617431640625, 3.0919189453125, 3.182220458984375, 3.27252197265625, 3.362823486328125, 3.453125]}, "gradients/encoder.encoder.layers.13.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 4.0, 0.0, 5.0, 3.0, 10.0, 7.0, 16.0, 21.0, 19.0, 37.0, 41.0, 45.0, 76.0, 89.0, 67.0, 93.0, 80.0, 88.0, 71.0, 59.0, 43.0, 38.0, 29.0, 20.0, 20.0, 10.0, 6.0, 4.0, 2.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.611328125, -0.5900497436523438, -0.5687713623046875, -0.5474929809570312, -0.526214599609375, -0.5049362182617188, -0.4836578369140625, -0.46237945556640625, -0.44110107421875, -0.41982269287109375, -0.3985443115234375, -0.37726593017578125, -0.355987548828125, -0.33470916748046875, -0.3134307861328125, -0.29215240478515625, -0.2708740234375, -0.24959564208984375, -0.2283172607421875, -0.20703887939453125, -0.185760498046875, -0.16448211669921875, -0.1432037353515625, -0.12192535400390625, -0.10064697265625, -0.07936859130859375, -0.0580902099609375, -0.03681182861328125, -0.015533447265625, 0.00574493408203125, 0.0270233154296875, 0.04830169677734375, 0.069580078125, 0.09085845947265625, 0.1121368408203125, 0.13341522216796875, 0.154693603515625, 0.17597198486328125, 0.1972503662109375, 0.21852874755859375, 0.23980712890625, 0.26108551025390625, 0.2823638916015625, 0.30364227294921875, 0.324920654296875, 0.34619903564453125, 0.3674774169921875, 0.38875579833984375, 0.4100341796875, 0.43131256103515625, 0.4525909423828125, 0.47386932373046875, 0.495147705078125, 0.5164260864257812, 0.5377044677734375, 0.5589828491210938, 0.58026123046875, 0.6015396118164062, 0.6228179931640625, 0.6440963745117188, 0.665374755859375, 0.6866531372070312, 0.7079315185546875, 0.7292098999023438, 0.75048828125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 4.0, 3.0, 4.0, 8.0, 7.0, 22.0, 27.0, 37.0, 55.0, 104.0, 175.0, 258.0, 451.0, 790.0, 1565.0, 3362.0, 7765.0, 24493.0, 124086.0, 3673059.0, 298725.0, 39336.0, 11232.0, 4364.0, 1940.0, 993.0, 554.0, 313.0, 208.0, 112.0, 82.0, 57.0, 30.0, 25.0, 18.0, 7.0, 9.0, 5.0, 0.0, 5.0, 1.0, 4.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4599609375, -1.4090423583984375, -1.358123779296875, -1.3072052001953125, -1.25628662109375, -1.2053680419921875, -1.154449462890625, -1.1035308837890625, -1.0526123046875, -1.0016937255859375, -0.950775146484375, -0.8998565673828125, -0.84893798828125, -0.7980194091796875, -0.747100830078125, -0.6961822509765625, -0.645263671875, -0.5943450927734375, -0.543426513671875, -0.4925079345703125, -0.44158935546875, -0.3906707763671875, -0.339752197265625, -0.2888336181640625, -0.2379150390625, -0.1869964599609375, -0.136077880859375, -0.0851593017578125, -0.03424072265625, 0.0166778564453125, 0.067596435546875, 0.1185150146484375, 0.16943359375, 0.2203521728515625, 0.271270751953125, 0.3221893310546875, 0.37310791015625, 0.4240264892578125, 0.474945068359375, 0.5258636474609375, 0.5767822265625, 0.6277008056640625, 0.678619384765625, 0.7295379638671875, 0.78045654296875, 0.8313751220703125, 0.882293701171875, 0.9332122802734375, 0.984130859375, 1.0350494384765625, 1.085968017578125, 1.1368865966796875, 1.18780517578125, 1.2387237548828125, 1.289642333984375, 1.3405609130859375, 1.3914794921875, 1.4423980712890625, 1.493316650390625, 1.5442352294921875, 1.59515380859375, 1.6460723876953125, 1.696990966796875, 1.7479095458984375, 1.798828125]}, "gradients/encoder.encoder.layers.13.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 2.0, 2.0, 0.0, 3.0, 1.0, 4.0, 3.0, 6.0, 2.0, 9.0, 7.0, 14.0, 21.0, 34.0, 46.0, 99.0, 204.0, 888.0, 2174.0, 258.0, 115.0, 49.0, 35.0, 29.0, 23.0, 12.0, 8.0, 4.0, 6.0, 6.0, 6.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 4.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.8291015625, -0.8040847778320312, -0.7790679931640625, -0.7540512084960938, -0.729034423828125, -0.7040176391601562, -0.6790008544921875, -0.6539840698242188, -0.62896728515625, -0.6039505004882812, -0.5789337158203125, -0.5539169311523438, -0.528900146484375, -0.5038833618164062, -0.4788665771484375, -0.45384979248046875, -0.4288330078125, -0.40381622314453125, -0.3787994384765625, -0.35378265380859375, -0.328765869140625, -0.30374908447265625, -0.2787322998046875, -0.25371551513671875, -0.22869873046875, -0.20368194580078125, -0.1786651611328125, -0.15364837646484375, -0.128631591796875, -0.10361480712890625, -0.0785980224609375, -0.05358123779296875, -0.028564453125, -0.00354766845703125, 0.0214691162109375, 0.04648590087890625, 0.071502685546875, 0.09651947021484375, 0.1215362548828125, 0.14655303955078125, 0.17156982421875, 0.19658660888671875, 0.2216033935546875, 0.24662017822265625, 0.271636962890625, 0.29665374755859375, 0.3216705322265625, 0.34668731689453125, 0.3717041015625, 0.39672088623046875, 0.4217376708984375, 0.44675445556640625, 0.471771240234375, 0.49678802490234375, 0.5218048095703125, 0.5468215942382812, 0.57183837890625, 0.5968551635742188, 0.6218719482421875, 0.6468887329101562, 0.671905517578125, 0.6969223022460938, 0.7219390869140625, 0.7469558715820312, 0.77197265625]}, "gradients/encoder.encoder.layers.13.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 5.0, 35.0, 325.0, 489.0, 117.0, 18.0, 5.0, 5.0, 3.0, 2.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.956040859222412, -6.613516330718994, -6.270991802215576, -5.928467750549316, -5.585943222045898, -5.2434186935424805, -4.9008941650390625, -4.5583696365356445, -4.215845108032227, -3.8733205795288086, -3.5307962894439697, -3.1882717609405518, -2.845747470855713, -2.503222942352295, -2.160698413848877, -1.818174123764038, -1.4756498336791992, -1.1331254243850708, -0.7906009554862976, -0.4480764865875244, -0.105552077293396, 0.23697233200073242, 0.5794968605041504, 0.9220211505889893, 1.2645456790924072, 1.6070700883865356, 1.949594497680664, 2.292119026184082, 2.6346435546875, 2.977167844772339, 3.319692373275757, 3.6622166633605957, 4.0047407150268555, 4.347265243530273, 4.689789772033691, 5.032314300537109, 5.374838352203369, 5.717362880706787, 6.059887409210205, 6.402411460876465, 6.744935989379883, 7.087460517883301, 7.429985046386719, 7.772509574890137, 8.115034103393555, 8.457557678222656, 8.80008316040039, 9.142606735229492, 9.485132217407227, 9.827656745910645, 10.170181274414062, 10.51270580291748, 10.855230331420898, 11.19775390625, 11.540279388427734, 11.882802963256836, 12.225327491760254, 12.567852020263672, 12.91037654876709, 13.252901077270508, 13.595425605773926, 13.937950134277344, 14.280473709106445, 14.622998237609863, 14.965522766113281]}, "gradients/encoder.encoder.layers.13.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 4.0, 6.0, 10.0, 20.0, 16.0, 26.0, 31.0, 31.0, 45.0, 52.0, 64.0, 55.0, 72.0, 70.0, 76.0, 82.0, 63.0, 70.0, 48.0, 35.0, 34.0, 27.0, 20.0, 15.0, 10.0, 8.0, 6.0, 1.0, 4.0, 1.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9553394317626953, -2.8630781173706055, -2.7708168029785156, -2.678555488586426, -2.586294174194336, -2.494032859802246, -2.4017715454101562, -2.3095102310180664, -2.2172489166259766, -2.1249876022338867, -2.032726287841797, -1.940464973449707, -1.8482036590576172, -1.7559423446655273, -1.6636810302734375, -1.5714197158813477, -1.4791582822799683, -1.3868969678878784, -1.2946356534957886, -1.2023743391036987, -1.1101130247116089, -1.017851710319519, -0.9255903363227844, -0.8333290219306946, -0.7410677075386047, -0.6488063931465149, -0.556545078754425, -0.4642837345600128, -0.372022420167923, -0.27976110577583313, -0.1874997615814209, -0.09523844718933105, -0.002977132797241211, 0.08928418904542923, 0.18154551088809967, 0.2738068401813507, 0.36606815457344055, 0.4583294689655304, 0.5505908131599426, 0.6428521275520325, 0.7351134419441223, 0.8273747563362122, 0.919636070728302, 1.0118974447250366, 1.1041587591171265, 1.1964200735092163, 1.2886813879013062, 1.380942702293396, 1.4732040166854858, 1.5654653310775757, 1.6577266454696655, 1.7499879598617554, 1.8422492742538452, 1.934510588645935, 2.0267720222473145, 2.1190333366394043, 2.211294651031494, 2.303555965423584, 2.395817279815674, 2.4880785942077637, 2.5803399085998535, 2.6726012229919434, 2.764862537384033, 2.857123851776123, 2.949385166168213]}, "gradients/encoder.encoder.layers.13.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 4.0, 8.0, 5.0, 7.0, 16.0, 21.0, 20.0, 30.0, 51.0, 74.0, 127.0, 229.0, 415.0, 986.0, 3017.0, 13409.0, 98872.0, 695968.0, 204869.0, 22971.0, 4726.0, 1519.0, 610.0, 247.0, 149.0, 78.0, 48.0, 26.0, 20.0, 9.0, 15.0, 4.0, 6.0, 5.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.9296875, -2.837127685546875, -2.74456787109375, -2.652008056640625, -2.5594482421875, -2.466888427734375, -2.37432861328125, -2.281768798828125, -2.189208984375, -2.096649169921875, -2.00408935546875, -1.911529541015625, -1.8189697265625, -1.726409912109375, -1.63385009765625, -1.541290283203125, -1.44873046875, -1.356170654296875, -1.26361083984375, -1.171051025390625, -1.0784912109375, -0.985931396484375, -0.89337158203125, -0.800811767578125, -0.708251953125, -0.615692138671875, -0.52313232421875, -0.430572509765625, -0.3380126953125, -0.245452880859375, -0.15289306640625, -0.060333251953125, 0.0322265625, 0.124786376953125, 0.21734619140625, 0.309906005859375, 0.4024658203125, 0.495025634765625, 0.58758544921875, 0.680145263671875, 0.772705078125, 0.865264892578125, 0.95782470703125, 1.050384521484375, 1.1429443359375, 1.235504150390625, 1.32806396484375, 1.420623779296875, 1.51318359375, 1.605743408203125, 1.69830322265625, 1.790863037109375, 1.8834228515625, 1.975982666015625, 2.06854248046875, 2.161102294921875, 2.253662109375, 2.346221923828125, 2.43878173828125, 2.531341552734375, 2.6239013671875, 2.716461181640625, 2.80902099609375, 2.901580810546875, 2.994140625]}, "gradients/encoder.encoder.layers.13.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 4.0, 3.0, 12.0, 22.0, 21.0, 31.0, 47.0, 56.0, 69.0, 78.0, 90.0, 80.0, 88.0, 94.0, 72.0, 70.0, 43.0, 34.0, 31.0, 18.0, 13.0, 8.0, 7.0, 5.0, 2.0, 2.0, 0.0, 2.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.68115234375, -0.65753173828125, -0.6339111328125, -0.61029052734375, -0.586669921875, -0.56304931640625, -0.5394287109375, -0.51580810546875, -0.4921875, -0.46856689453125, -0.4449462890625, -0.42132568359375, -0.397705078125, -0.37408447265625, -0.3504638671875, -0.32684326171875, -0.30322265625, -0.27960205078125, -0.2559814453125, -0.23236083984375, -0.208740234375, -0.18511962890625, -0.1614990234375, -0.13787841796875, -0.1142578125, -0.09063720703125, -0.0670166015625, -0.04339599609375, -0.019775390625, 0.00384521484375, 0.0274658203125, 0.05108642578125, 0.07470703125, 0.09832763671875, 0.1219482421875, 0.14556884765625, 0.169189453125, 0.19281005859375, 0.2164306640625, 0.24005126953125, 0.263671875, 0.28729248046875, 0.3109130859375, 0.33453369140625, 0.358154296875, 0.38177490234375, 0.4053955078125, 0.42901611328125, 0.45263671875, 0.47625732421875, 0.4998779296875, 0.52349853515625, 0.547119140625, 0.57073974609375, 0.5943603515625, 0.61798095703125, 0.6416015625, 0.66522216796875, 0.6888427734375, 0.71246337890625, 0.736083984375, 0.75970458984375, 0.7833251953125, 0.80694580078125, 0.83056640625]}, "gradients/encoder.encoder.layers.13.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 4.0, 6.0, 9.0, 5.0, 10.0, 8.0, 19.0, 26.0, 42.0, 56.0, 95.0, 132.0, 209.0, 376.0, 610.0, 1155.0, 2235.0, 4716.0, 11306.0, 31023.0, 98684.0, 320437.0, 385674.0, 127366.0, 39114.0, 13827.0, 5559.0, 2613.0, 1318.0, 745.0, 428.0, 263.0, 184.0, 99.0, 53.0, 51.0, 35.0, 23.0, 17.0, 6.0, 7.0, 4.0, 7.0, 3.0, 2.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0], "bins": [-1.318359375, -1.278533935546875, -1.23870849609375, -1.198883056640625, -1.1590576171875, -1.119232177734375, -1.07940673828125, -1.039581298828125, -0.999755859375, -0.959930419921875, -0.92010498046875, -0.880279541015625, -0.8404541015625, -0.800628662109375, -0.76080322265625, -0.720977783203125, -0.68115234375, -0.641326904296875, -0.60150146484375, -0.561676025390625, -0.5218505859375, -0.482025146484375, -0.44219970703125, -0.402374267578125, -0.362548828125, -0.322723388671875, -0.28289794921875, -0.243072509765625, -0.2032470703125, -0.163421630859375, -0.12359619140625, -0.083770751953125, -0.0439453125, -0.004119873046875, 0.03570556640625, 0.075531005859375, 0.1153564453125, 0.155181884765625, 0.19500732421875, 0.234832763671875, 0.274658203125, 0.314483642578125, 0.35430908203125, 0.394134521484375, 0.4339599609375, 0.473785400390625, 0.51361083984375, 0.553436279296875, 0.59326171875, 0.633087158203125, 0.67291259765625, 0.712738037109375, 0.7525634765625, 0.792388916015625, 0.83221435546875, 0.872039794921875, 0.911865234375, 0.951690673828125, 0.99151611328125, 1.031341552734375, 1.0711669921875, 1.110992431640625, 1.15081787109375, 1.190643310546875, 1.23046875]}, "gradients/encoder.encoder.layers.13.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 2.0, 4.0, 7.0, 5.0, 8.0, 6.0, 2.0, 14.0, 13.0, 26.0, 17.0, 18.0, 41.0, 34.0, 32.0, 38.0, 34.0, 46.0, 44.0, 48.0, 52.0, 53.0, 44.0, 53.0, 49.0, 50.0, 42.0, 44.0, 31.0, 25.0, 22.0, 17.0, 21.0, 15.0, 11.0, 14.0, 8.0, 8.0, 6.0, 3.0, 3.0, 5.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.5419921875, -1.4770355224609375, -1.412078857421875, -1.3471221923828125, -1.28216552734375, -1.2172088623046875, -1.152252197265625, -1.0872955322265625, -1.0223388671875, -0.9573822021484375, -0.892425537109375, -0.8274688720703125, -0.76251220703125, -0.6975555419921875, -0.632598876953125, -0.5676422119140625, -0.502685546875, -0.4377288818359375, -0.372772216796875, -0.3078155517578125, -0.24285888671875, -0.1779022216796875, -0.112945556640625, -0.0479888916015625, 0.0169677734375, 0.0819244384765625, 0.146881103515625, 0.2118377685546875, 0.27679443359375, 0.3417510986328125, 0.406707763671875, 0.4716644287109375, 0.53662109375, 0.6015777587890625, 0.666534423828125, 0.7314910888671875, 0.79644775390625, 0.8614044189453125, 0.926361083984375, 0.9913177490234375, 1.0562744140625, 1.1212310791015625, 1.186187744140625, 1.2511444091796875, 1.31610107421875, 1.3810577392578125, 1.446014404296875, 1.5109710693359375, 1.575927734375, 1.6408843994140625, 1.705841064453125, 1.7707977294921875, 1.83575439453125, 1.9007110595703125, 1.965667724609375, 2.0306243896484375, 2.0955810546875, 2.1605377197265625, 2.225494384765625, 2.2904510498046875, 2.35540771484375, 2.4203643798828125, 2.485321044921875, 2.5502777099609375, 2.615234375]}, "gradients/encoder.encoder.layers.13.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 1.0, 1.0, 8.0, 7.0, 14.0, 15.0, 25.0, 43.0, 67.0, 137.0, 330.0, 877.0, 3604.0, 32618.0, 766746.0, 229779.0, 11379.0, 1930.0, 550.0, 190.0, 107.0, 66.0, 19.0, 16.0, 12.0, 7.0, 6.0, 1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.126953125, -1.0891265869140625, -1.051300048828125, -1.0134735107421875, -0.97564697265625, -0.9378204345703125, -0.899993896484375, -0.8621673583984375, -0.8243408203125, -0.7865142822265625, -0.748687744140625, -0.7108612060546875, -0.67303466796875, -0.6352081298828125, -0.597381591796875, -0.5595550537109375, -0.521728515625, -0.4839019775390625, -0.446075439453125, -0.4082489013671875, -0.37042236328125, -0.3325958251953125, -0.294769287109375, -0.2569427490234375, -0.2191162109375, -0.1812896728515625, -0.143463134765625, -0.1056365966796875, -0.06781005859375, -0.0299835205078125, 0.007843017578125, 0.0456695556640625, 0.08349609375, 0.1213226318359375, 0.159149169921875, 0.1969757080078125, 0.23480224609375, 0.2726287841796875, 0.310455322265625, 0.3482818603515625, 0.3861083984375, 0.4239349365234375, 0.461761474609375, 0.4995880126953125, 0.53741455078125, 0.5752410888671875, 0.613067626953125, 0.6508941650390625, 0.688720703125, 0.7265472412109375, 0.764373779296875, 0.8022003173828125, 0.84002685546875, 0.8778533935546875, 0.915679931640625, 0.9535064697265625, 0.9913330078125, 1.0291595458984375, 1.066986083984375, 1.1048126220703125, 1.14263916015625, 1.1804656982421875, 1.218292236328125, 1.2561187744140625, 1.2939453125]}, "gradients/encoder.encoder.layers.13.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 3.0, 2.0, 5.0, 3.0, 6.0, 18.0, 28.0, 30.0, 47.0, 61.0, 108.0, 146.0, 134.0, 128.0, 86.0, 66.0, 47.0, 37.0, 15.0, 12.0, 9.0, 4.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0001380443572998047, -0.00013433396816253662, -0.00013062357902526855, -0.0001269131898880005, -0.00012320280075073242, -0.00011949241161346436, -0.00011578202247619629, -0.00011207163333892822, -0.00010836124420166016, -0.00010465085506439209, -0.00010094046592712402, -9.723007678985596e-05, -9.351968765258789e-05, -8.980929851531982e-05, -8.609890937805176e-05, -8.238852024078369e-05, -7.867813110351562e-05, -7.496774196624756e-05, -7.125735282897949e-05, -6.754696369171143e-05, -6.383657455444336e-05, -6.012618541717529e-05, -5.6415796279907227e-05, -5.270540714263916e-05, -4.8995018005371094e-05, -4.528462886810303e-05, -4.157423973083496e-05, -3.7863850593566895e-05, -3.415346145629883e-05, -3.0443072319030762e-05, -2.6732683181762695e-05, -2.302229404449463e-05, -1.9311904907226562e-05, -1.5601515769958496e-05, -1.189112663269043e-05, -8.180737495422363e-06, -4.470348358154297e-06, -7.599592208862305e-07, 2.950429916381836e-06, 6.660819053649902e-06, 1.0371208190917969e-05, 1.4081597328186035e-05, 1.77919864654541e-05, 2.1502375602722168e-05, 2.5212764739990234e-05, 2.89231538772583e-05, 3.263354301452637e-05, 3.6343932151794434e-05, 4.00543212890625e-05, 4.3764710426330566e-05, 4.747509956359863e-05, 5.11854887008667e-05, 5.4895877838134766e-05, 5.860626697540283e-05, 6.23166561126709e-05, 6.602704524993896e-05, 6.973743438720703e-05, 7.34478235244751e-05, 7.715821266174316e-05, 8.086860179901123e-05, 8.45789909362793e-05, 8.828938007354736e-05, 9.199976921081543e-05, 9.57101583480835e-05, 9.942054748535156e-05]}, "gradients/encoder.encoder.layers.13.attention.q_proj.weight": {"_type": "histogram", "values": [2.0, 2.0, 0.0, 2.0, 1.0, 1.0, 2.0, 3.0, 0.0, 2.0, 3.0, 6.0, 7.0, 11.0, 21.0, 20.0, 26.0, 49.0, 76.0, 132.0, 233.0, 413.0, 846.0, 1938.0, 5194.0, 16408.0, 67650.0, 347219.0, 472540.0, 101604.0, 22795.0, 6660.0, 2510.0, 1052.0, 488.0, 267.0, 147.0, 87.0, 46.0, 34.0, 14.0, 12.0, 9.0, 10.0, 6.0, 3.0, 6.0, 5.0, 4.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.495361328125, -0.4777488708496094, -0.46013641357421875, -0.4425239562988281, -0.4249114990234375, -0.4072990417480469, -0.38968658447265625, -0.3720741271972656, -0.354461669921875, -0.3368492126464844, -0.31923675537109375, -0.3016242980957031, -0.2840118408203125, -0.2663993835449219, -0.24878692626953125, -0.23117446899414062, -0.21356201171875, -0.19594955444335938, -0.17833709716796875, -0.16072463989257812, -0.1431121826171875, -0.12549972534179688, -0.10788726806640625, -0.09027481079101562, -0.072662353515625, -0.055049896240234375, -0.03743743896484375, -0.019824981689453125, -0.0022125244140625, 0.015399932861328125, 0.03301239013671875, 0.050624847412109375, 0.0682373046875, 0.08584976196289062, 0.10346221923828125, 0.12107467651367188, 0.1386871337890625, 0.15629959106445312, 0.17391204833984375, 0.19152450561523438, 0.209136962890625, 0.22674942016601562, 0.24436187744140625, 0.2619743347167969, 0.2795867919921875, 0.2971992492675781, 0.31481170654296875, 0.3324241638183594, 0.35003662109375, 0.3676490783691406, 0.38526153564453125, 0.4028739929199219, 0.4204864501953125, 0.4380989074707031, 0.45571136474609375, 0.4733238220214844, 0.490936279296875, 0.5085487365722656, 0.5261611938476562, 0.5437736511230469, 0.5613861083984375, 0.5789985656738281, 0.5966110229492188, 0.6142234802246094, 0.6318359375]}, "gradients/encoder.encoder.layers.13.attention.q_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 2.0, 3.0, 2.0, 3.0, 5.0, 5.0, 4.0, 4.0, 14.0, 13.0, 16.0, 17.0, 24.0, 35.0, 40.0, 55.0, 64.0, 62.0, 64.0, 83.0, 76.0, 78.0, 49.0, 65.0, 46.0, 39.0, 29.0, 25.0, 28.0, 5.0, 14.0, 13.0, 9.0, 7.0, 0.0, 1.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0], "bins": [-0.58837890625, -0.5673065185546875, -0.546234130859375, -0.5251617431640625, -0.50408935546875, -0.4830169677734375, -0.461944580078125, -0.4408721923828125, -0.4197998046875, -0.3987274169921875, -0.377655029296875, -0.3565826416015625, -0.33551025390625, -0.3144378662109375, -0.293365478515625, -0.2722930908203125, -0.251220703125, -0.2301483154296875, -0.209075927734375, -0.1880035400390625, -0.16693115234375, -0.1458587646484375, -0.124786376953125, -0.1037139892578125, -0.0826416015625, -0.0615692138671875, -0.040496826171875, -0.0194244384765625, 0.00164794921875, 0.0227203369140625, 0.043792724609375, 0.0648651123046875, 0.0859375, 0.1070098876953125, 0.128082275390625, 0.1491546630859375, 0.17022705078125, 0.1912994384765625, 0.212371826171875, 0.2334442138671875, 0.2545166015625, 0.2755889892578125, 0.296661376953125, 0.3177337646484375, 0.33880615234375, 0.3598785400390625, 0.380950927734375, 0.4020233154296875, 0.423095703125, 0.4441680908203125, 0.465240478515625, 0.4863128662109375, 0.50738525390625, 0.5284576416015625, 0.549530029296875, 0.5706024169921875, 0.5916748046875, 0.6127471923828125, 0.633819580078125, 0.6548919677734375, 0.67596435546875, 0.6970367431640625, 0.718109130859375, 0.7391815185546875, 0.76025390625]}, "gradients/encoder.encoder.layers.13.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 5.0, 5.0, 6.0, 9.0, 18.0, 26.0, 68.0, 97.0, 161.0, 195.0, 176.0, 116.0, 55.0, 36.0, 18.0, 12.0, 2.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-11.996576309204102, -11.492213249206543, -10.987850189208984, -10.483488082885742, -9.979125022888184, -9.474761962890625, -8.970399856567383, -8.466036796569824, -7.961673736572266, -7.457310676574707, -6.952948093414307, -6.448585510253906, -5.944222450256348, -5.439859390258789, -4.935496807098389, -4.431134223937988, -3.9267711639404297, -3.42240834236145, -2.9180455207824707, -2.413682699203491, -1.9093198776245117, -1.4049570560455322, -0.9005942344665527, -0.39623141288757324, 0.10813140869140625, 0.6124942302703857, 1.1168570518493652, 1.6212198734283447, 2.125582695007324, 2.6299455165863037, 3.134308338165283, 3.6386711597442627, 4.143033981323242, 4.647397041320801, 5.151759624481201, 5.656122207641602, 6.16048526763916, 6.664848327636719, 7.169210910797119, 7.6735734939575195, 8.177936553955078, 8.682299613952637, 9.186662673950195, 9.691024780273438, 10.195387840270996, 10.699750900268555, 11.204113006591797, 11.708476066589355, 12.212839126586914, 12.717202186584473, 13.221565246582031, 13.725927352905273, 14.230290412902832, 14.73465347290039, 15.239015579223633, 15.743378639221191, 16.24774169921875, 16.752103805541992, 17.256467819213867, 17.76082992553711, 18.265193939208984, 18.769556045532227, 19.27391815185547, 19.778282165527344, 20.282644271850586]}, "gradients/encoder.encoder.layers.13.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 4.0, 4.0, 4.0, 3.0, 5.0, 7.0, 13.0, 10.0, 7.0, 21.0, 25.0, 38.0, 22.0, 23.0, 35.0, 43.0, 41.0, 32.0, 49.0, 57.0, 41.0, 51.0, 44.0, 45.0, 50.0, 42.0, 48.0, 37.0, 28.0, 38.0, 31.0, 18.0, 18.0, 17.0, 10.0, 16.0, 8.0, 8.0, 8.0, 2.0, 4.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 4.0], "bins": [-13.998659133911133, -13.62474536895752, -13.250832557678223, -12.87691879272461, -12.503005981445312, -12.1290922164917, -11.755178451538086, -11.381265640258789, -11.007352828979492, -10.633439064025879, -10.259526252746582, -9.885612487792969, -9.511699676513672, -9.137785911560059, -8.763872146606445, -8.389959335327148, -8.016045570373535, -7.64213228225708, -7.268218994140625, -6.894305229187012, -6.520392417907715, -6.146478652954102, -5.7725653648376465, -5.398652076721191, -5.024738788604736, -4.650825500488281, -4.276912212371826, -3.902998685836792, -3.529085397720337, -3.155172109603882, -2.7812585830688477, -2.4073452949523926, -2.033432960510254, -1.6595196723937988, -1.2856062650680542, -0.9116928577423096, -0.5377795696258545, -0.16386628150939941, 0.21004724502563477, 0.5839605331420898, 0.9578738212585449, 1.331787109375, 1.7057005167007446, 2.0796139240264893, 2.4535272121429443, 2.8274405002593994, 3.2013540267944336, 3.5752673149108887, 3.9491806030273438, 4.323093891143799, 4.697007179260254, 5.070920944213867, 5.444833755493164, 5.818747520446777, 6.192660808563232, 6.5665740966796875, 6.940487384796143, 7.314400672912598, 7.688313961029053, 8.062227249145508, 8.436141014099121, 8.810053825378418, 9.183967590332031, 9.557880401611328, 9.931794166564941]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 3.0, 13.0, 15.0, 15.0, 32.0, 43.0, 97.0, 129.0, 236.0, 442.0, 840.0, 1693.0, 3580.0, 9193.0, 31111.0, 286038.0, 3767592.0, 67408.0, 15029.0, 5535.0, 2428.0, 1226.0, 626.0, 360.0, 206.0, 123.0, 78.0, 53.0, 41.0, 24.0, 18.0, 20.0, 10.0, 3.0, 4.0, 8.0, 6.0, 6.0, 2.0, 1.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.392578125, -2.304718017578125, -2.21685791015625, -2.128997802734375, -2.0411376953125, -1.953277587890625, -1.86541748046875, -1.777557373046875, -1.689697265625, -1.601837158203125, -1.51397705078125, -1.426116943359375, -1.3382568359375, -1.250396728515625, -1.16253662109375, -1.074676513671875, -0.98681640625, -0.898956298828125, -0.81109619140625, -0.723236083984375, -0.6353759765625, -0.547515869140625, -0.45965576171875, -0.371795654296875, -0.283935546875, -0.196075439453125, -0.10821533203125, -0.020355224609375, 0.0675048828125, 0.155364990234375, 0.24322509765625, 0.331085205078125, 0.4189453125, 0.506805419921875, 0.59466552734375, 0.682525634765625, 0.7703857421875, 0.858245849609375, 0.94610595703125, 1.033966064453125, 1.121826171875, 1.209686279296875, 1.29754638671875, 1.385406494140625, 1.4732666015625, 1.561126708984375, 1.64898681640625, 1.736846923828125, 1.82470703125, 1.912567138671875, 2.00042724609375, 2.088287353515625, 2.1761474609375, 2.264007568359375, 2.35186767578125, 2.439727783203125, 2.527587890625, 2.615447998046875, 2.70330810546875, 2.791168212890625, 2.8790283203125, 2.966888427734375, 3.05474853515625, 3.142608642578125, 3.23046875]}, "gradients/encoder.encoder.layers.12.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 3.0, 4.0, 2.0, 9.0, 9.0, 21.0, 20.0, 20.0, 26.0, 32.0, 35.0, 54.0, 58.0, 74.0, 73.0, 64.0, 82.0, 57.0, 72.0, 50.0, 56.0, 41.0, 38.0, 24.0, 23.0, 14.0, 12.0, 7.0, 6.0, 9.0, 4.0, 5.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.70849609375, -0.6848831176757812, -0.6612701416015625, -0.6376571655273438, -0.614044189453125, -0.5904312133789062, -0.5668182373046875, -0.5432052612304688, -0.51959228515625, -0.49597930908203125, -0.4723663330078125, -0.44875335693359375, -0.425140380859375, -0.40152740478515625, -0.3779144287109375, -0.35430145263671875, -0.3306884765625, -0.30707550048828125, -0.2834625244140625, -0.25984954833984375, -0.236236572265625, -0.21262359619140625, -0.1890106201171875, -0.16539764404296875, -0.14178466796875, -0.11817169189453125, -0.0945587158203125, -0.07094573974609375, -0.047332763671875, -0.02371978759765625, -0.0001068115234375, 0.02350616455078125, 0.047119140625, 0.07073211669921875, 0.0943450927734375, 0.11795806884765625, 0.141571044921875, 0.16518402099609375, 0.1887969970703125, 0.21240997314453125, 0.23602294921875, 0.25963592529296875, 0.2832489013671875, 0.30686187744140625, 0.330474853515625, 0.35408782958984375, 0.3777008056640625, 0.40131378173828125, 0.4249267578125, 0.44853973388671875, 0.4721527099609375, 0.49576568603515625, 0.519378662109375, 0.5429916381835938, 0.5666046142578125, 0.5902175903320312, 0.61383056640625, 0.6374435424804688, 0.6610565185546875, 0.6846694946289062, 0.708282470703125, 0.7318954467773438, 0.7555084228515625, 0.7791213989257812, 0.802734375]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 4.0, 11.0, 10.0, 17.0, 43.0, 79.0, 94.0, 152.0, 246.0, 501.0, 746.0, 1364.0, 2497.0, 4807.0, 10709.0, 29920.0, 137290.0, 3510351.0, 410790.0, 54040.0, 16346.0, 6709.0, 3308.0, 1777.0, 979.0, 626.0, 369.0, 206.0, 120.0, 69.0, 47.0, 19.0, 19.0, 8.0, 2.0, 6.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.912109375, -1.85540771484375, -1.7987060546875, -1.74200439453125, -1.685302734375, -1.62860107421875, -1.5718994140625, -1.51519775390625, -1.45849609375, -1.40179443359375, -1.3450927734375, -1.28839111328125, -1.231689453125, -1.17498779296875, -1.1182861328125, -1.06158447265625, -1.0048828125, -0.94818115234375, -0.8914794921875, -0.83477783203125, -0.778076171875, -0.72137451171875, -0.6646728515625, -0.60797119140625, -0.55126953125, -0.49456787109375, -0.4378662109375, -0.38116455078125, -0.324462890625, -0.26776123046875, -0.2110595703125, -0.15435791015625, -0.09765625, -0.04095458984375, 0.0157470703125, 0.07244873046875, 0.129150390625, 0.18585205078125, 0.2425537109375, 0.29925537109375, 0.35595703125, 0.41265869140625, 0.4693603515625, 0.52606201171875, 0.582763671875, 0.63946533203125, 0.6961669921875, 0.75286865234375, 0.8095703125, 0.86627197265625, 0.9229736328125, 0.97967529296875, 1.036376953125, 1.09307861328125, 1.1497802734375, 1.20648193359375, 1.26318359375, 1.31988525390625, 1.3765869140625, 1.43328857421875, 1.489990234375, 1.54669189453125, 1.6033935546875, 1.66009521484375, 1.716796875]}, "gradients/encoder.encoder.layers.12.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 0.0, 1.0, 1.0, 0.0, 7.0, 2.0, 4.0, 4.0, 6.0, 8.0, 4.0, 10.0, 13.0, 18.0, 45.0, 52.0, 127.0, 290.0, 2265.0, 785.0, 182.0, 99.0, 53.0, 40.0, 22.0, 12.0, 8.0, 1.0, 4.0, 3.0, 0.0, 2.0, 2.0, 4.0, 5.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.3115234375, -1.2702789306640625, -1.229034423828125, -1.1877899169921875, -1.14654541015625, -1.1053009033203125, -1.064056396484375, -1.0228118896484375, -0.9815673828125, -0.9403228759765625, -0.899078369140625, -0.8578338623046875, -0.81658935546875, -0.7753448486328125, -0.734100341796875, -0.6928558349609375, -0.651611328125, -0.6103668212890625, -0.569122314453125, -0.5278778076171875, -0.48663330078125, -0.4453887939453125, -0.404144287109375, -0.3628997802734375, -0.3216552734375, -0.2804107666015625, -0.239166259765625, -0.1979217529296875, -0.15667724609375, -0.1154327392578125, -0.074188232421875, -0.0329437255859375, 0.00830078125, 0.0495452880859375, 0.090789794921875, 0.1320343017578125, 0.17327880859375, 0.2145233154296875, 0.255767822265625, 0.2970123291015625, 0.3382568359375, 0.3795013427734375, 0.420745849609375, 0.4619903564453125, 0.50323486328125, 0.5444793701171875, 0.585723876953125, 0.6269683837890625, 0.668212890625, 0.7094573974609375, 0.750701904296875, 0.7919464111328125, 0.83319091796875, 0.8744354248046875, 0.915679931640625, 0.9569244384765625, 0.9981689453125, 1.0394134521484375, 1.080657958984375, 1.1219024658203125, 1.16314697265625, 1.2043914794921875, 1.245635986328125, 1.2868804931640625, 1.328125]}, "gradients/encoder.encoder.layers.12.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 13.0, 41.0, 183.0, 435.0, 259.0, 58.0, 13.0, 4.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-24.100658416748047, -23.58439826965332, -23.068138122558594, -22.551877975463867, -22.03561782836914, -21.519357681274414, -21.003097534179688, -20.48683738708496, -19.970577239990234, -19.454317092895508, -18.93805694580078, -18.421796798706055, -17.905536651611328, -17.3892765045166, -16.873016357421875, -16.35675621032715, -15.840496063232422, -15.324235916137695, -14.807975769042969, -14.291715621948242, -13.775455474853516, -13.259195327758789, -12.742935180664062, -12.226675033569336, -11.71041488647461, -11.194154739379883, -10.677894592285156, -10.16163444519043, -9.645374298095703, -9.129114151000977, -8.61285400390625, -8.096593856811523, -7.58033561706543, -7.064075469970703, -6.547815322875977, -6.03155517578125, -5.515295028686523, -4.999034881591797, -4.48277473449707, -3.9665145874023438, -3.450254440307617, -2.9339942932128906, -2.417734146118164, -1.9014739990234375, -1.385213851928711, -0.8689537048339844, -0.3526935577392578, 0.16356658935546875, 0.6798267364501953, 1.1960868835449219, 1.7123470306396484, 2.228607177734375, 2.7448673248291016, 3.261127471923828, 3.7773876190185547, 4.293647766113281, 4.809907913208008, 5.326168060302734, 5.842428207397461, 6.3586883544921875, 6.874948501586914, 7.391208648681641, 7.907468795776367, 8.423728942871094, 8.93998908996582]}, "gradients/encoder.encoder.layers.12.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 3.0, 6.0, 2.0, 15.0, 9.0, 5.0, 4.0, 11.0, 16.0, 35.0, 23.0, 41.0, 39.0, 43.0, 47.0, 40.0, 55.0, 61.0, 57.0, 81.0, 54.0, 51.0, 48.0, 55.0, 42.0, 33.0, 28.0, 20.0, 21.0, 17.0, 15.0, 8.0, 10.0, 2.0, 3.0, 4.0, 4.0, 2.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0510759353637695, -2.936291217803955, -2.8215062618255615, -2.706721544265747, -2.5919368267059326, -2.477151870727539, -2.3623671531677246, -2.24758243560791, -2.1327977180480957, -2.0180130004882812, -1.9032281637191772, -1.7884433269500732, -1.6736586093902588, -1.5588737726211548, -1.4440889358520508, -1.3293042182922363, -1.2145192623138428, -1.0997344255447388, -0.9849497079849243, -0.8701648712158203, -0.7553800940513611, -0.6405953168869019, -0.5258104801177979, -0.4110257029533386, -0.2962409257888794, -0.18145613372325897, -0.06667134165763855, 0.048113465309143066, 0.1628982424736023, 0.2776830196380615, 0.3924678564071655, 0.5072526335716248, 0.622037410736084, 0.7368221879005432, 0.8516069650650024, 0.9663918018341064, 1.081176519393921, 1.195961356163025, 1.310746192932129, 1.4255309104919434, 1.5403157472610474, 1.6551005840301514, 1.7698853015899658, 1.8846701383590698, 1.9994549751281738, 2.1142396926879883, 2.2290244102478027, 2.3438093662261963, 2.4585940837860107, 2.573378801345825, 2.6881637573242188, 2.802948474884033, 2.9177331924438477, 3.032517910003662, 3.1473028659820557, 3.26208758354187, 3.3768725395202637, 3.491657257080078, 3.6064422130584717, 3.721226930618286, 3.8360116481781006, 3.950796604156494, 4.065581321716309, 4.180366039276123, 4.2951507568359375]}, "gradients/encoder.encoder.layers.12.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 0.0, 5.0, 10.0, 10.0, 13.0, 12.0, 17.0, 36.0, 24.0, 47.0, 79.0, 143.0, 198.0, 406.0, 727.0, 1483.0, 3256.0, 8411.0, 25439.0, 99700.0, 449320.0, 352416.0, 74239.0, 20160.0, 6903.0, 2717.0, 1273.0, 652.0, 316.0, 190.0, 110.0, 68.0, 46.0, 42.0, 24.0, 24.0, 14.0, 4.0, 6.0, 5.0, 3.0, 2.0, 3.0, 2.0, 0.0, 1.0, 3.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.814453125, -2.726226806640625, -2.63800048828125, -2.549774169921875, -2.4615478515625, -2.373321533203125, -2.28509521484375, -2.196868896484375, -2.108642578125, -2.020416259765625, -1.93218994140625, -1.843963623046875, -1.7557373046875, -1.667510986328125, -1.57928466796875, -1.491058349609375, -1.40283203125, -1.314605712890625, -1.22637939453125, -1.138153076171875, -1.0499267578125, -0.961700439453125, -0.87347412109375, -0.785247802734375, -0.697021484375, -0.608795166015625, -0.52056884765625, -0.432342529296875, -0.3441162109375, -0.255889892578125, -0.16766357421875, -0.079437255859375, 0.0087890625, 0.097015380859375, 0.18524169921875, 0.273468017578125, 0.3616943359375, 0.449920654296875, 0.53814697265625, 0.626373291015625, 0.714599609375, 0.802825927734375, 0.89105224609375, 0.979278564453125, 1.0675048828125, 1.155731201171875, 1.24395751953125, 1.332183837890625, 1.42041015625, 1.508636474609375, 1.59686279296875, 1.685089111328125, 1.7733154296875, 1.861541748046875, 1.94976806640625, 2.037994384765625, 2.126220703125, 2.214447021484375, 2.30267333984375, 2.390899658203125, 2.4791259765625, 2.567352294921875, 2.65557861328125, 2.743804931640625, 2.83203125]}, "gradients/encoder.encoder.layers.12.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 4.0, 5.0, 6.0, 8.0, 7.0, 20.0, 23.0, 29.0, 22.0, 46.0, 56.0, 63.0, 67.0, 78.0, 74.0, 67.0, 77.0, 67.0, 51.0, 51.0, 49.0, 45.0, 18.0, 19.0, 17.0, 9.0, 11.0, 6.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.7685546875, -0.7430038452148438, -0.7174530029296875, -0.6919021606445312, -0.666351318359375, -0.6408004760742188, -0.6152496337890625, -0.5896987915039062, -0.56414794921875, -0.5385971069335938, -0.5130462646484375, -0.48749542236328125, -0.461944580078125, -0.43639373779296875, -0.4108428955078125, -0.38529205322265625, -0.3597412109375, -0.33419036865234375, -0.3086395263671875, -0.28308868408203125, -0.257537841796875, -0.23198699951171875, -0.2064361572265625, -0.18088531494140625, -0.15533447265625, -0.12978363037109375, -0.1042327880859375, -0.07868194580078125, -0.053131103515625, -0.02758026123046875, -0.0020294189453125, 0.02352142333984375, 0.049072265625, 0.07462310791015625, 0.1001739501953125, 0.12572479248046875, 0.151275634765625, 0.17682647705078125, 0.2023773193359375, 0.22792816162109375, 0.25347900390625, 0.27902984619140625, 0.3045806884765625, 0.33013153076171875, 0.355682373046875, 0.38123321533203125, 0.4067840576171875, 0.43233489990234375, 0.4578857421875, 0.48343658447265625, 0.5089874267578125, 0.5345382690429688, 0.560089111328125, 0.5856399536132812, 0.6111907958984375, 0.6367416381835938, 0.66229248046875, 0.6878433227539062, 0.7133941650390625, 0.7389450073242188, 0.764495849609375, 0.7900466918945312, 0.8155975341796875, 0.8411483764648438, 0.86669921875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 2.0, 6.0, 9.0, 9.0, 8.0, 8.0, 21.0, 36.0, 57.0, 91.0, 127.0, 198.0, 273.0, 465.0, 787.0, 1432.0, 2606.0, 4954.0, 10610.0, 24842.0, 66212.0, 213713.0, 437678.0, 184068.0, 58340.0, 22134.0, 9660.0, 4627.0, 2374.0, 1300.0, 685.0, 427.0, 276.0, 155.0, 112.0, 64.0, 54.0, 39.0, 30.0, 14.0, 18.0, 9.0, 6.0, 9.0, 5.0, 5.0, 4.0, 1.0, 2.0, 2.0, 1.0], "bins": [-2.078125, -2.0194854736328125, -1.960845947265625, -1.9022064208984375, -1.84356689453125, -1.7849273681640625, -1.726287841796875, -1.6676483154296875, -1.6090087890625, -1.5503692626953125, -1.491729736328125, -1.4330902099609375, -1.37445068359375, -1.3158111572265625, -1.257171630859375, -1.1985321044921875, -1.139892578125, -1.0812530517578125, -1.022613525390625, -0.9639739990234375, -0.90533447265625, -0.8466949462890625, -0.788055419921875, -0.7294158935546875, -0.6707763671875, -0.6121368408203125, -0.553497314453125, -0.4948577880859375, -0.43621826171875, -0.3775787353515625, -0.318939208984375, -0.2602996826171875, -0.20166015625, -0.1430206298828125, -0.084381103515625, -0.0257415771484375, 0.03289794921875, 0.0915374755859375, 0.150177001953125, 0.2088165283203125, 0.2674560546875, 0.3260955810546875, 0.384735107421875, 0.4433746337890625, 0.50201416015625, 0.5606536865234375, 0.619293212890625, 0.6779327392578125, 0.736572265625, 0.7952117919921875, 0.853851318359375, 0.9124908447265625, 0.97113037109375, 1.0297698974609375, 1.088409423828125, 1.1470489501953125, 1.2056884765625, 1.2643280029296875, 1.322967529296875, 1.3816070556640625, 1.44024658203125, 1.4988861083984375, 1.557525634765625, 1.6161651611328125, 1.6748046875]}, "gradients/encoder.encoder.layers.12.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 4.0, 3.0, 5.0, 7.0, 9.0, 9.0, 9.0, 11.0, 25.0, 25.0, 24.0, 21.0, 32.0, 47.0, 49.0, 56.0, 66.0, 68.0, 53.0, 50.0, 61.0, 61.0, 43.0, 39.0, 34.0, 37.0, 31.0, 19.0, 21.0, 21.0, 19.0, 12.0, 6.0, 11.0, 6.0, 3.0, 3.0, 3.0, 2.0, 3.0, 1.0, 4.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.62109375, -3.511383056640625, -3.40167236328125, -3.291961669921875, -3.1822509765625, -3.072540283203125, -2.96282958984375, -2.853118896484375, -2.743408203125, -2.633697509765625, -2.52398681640625, -2.414276123046875, -2.3045654296875, -2.194854736328125, -2.08514404296875, -1.975433349609375, -1.86572265625, -1.756011962890625, -1.64630126953125, -1.536590576171875, -1.4268798828125, -1.317169189453125, -1.20745849609375, -1.097747802734375, -0.988037109375, -0.878326416015625, -0.76861572265625, -0.658905029296875, -0.5491943359375, -0.439483642578125, -0.32977294921875, -0.220062255859375, -0.1103515625, -0.000640869140625, 0.10906982421875, 0.218780517578125, 0.3284912109375, 0.438201904296875, 0.54791259765625, 0.657623291015625, 0.767333984375, 0.877044677734375, 0.98675537109375, 1.096466064453125, 1.2061767578125, 1.315887451171875, 1.42559814453125, 1.535308837890625, 1.64501953125, 1.754730224609375, 1.86444091796875, 1.974151611328125, 2.0838623046875, 2.193572998046875, 2.30328369140625, 2.412994384765625, 2.522705078125, 2.632415771484375, 2.74212646484375, 2.851837158203125, 2.9615478515625, 3.071258544921875, 3.18096923828125, 3.290679931640625, 3.400390625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 6.0, 5.0, 4.0, 6.0, 7.0, 16.0, 35.0, 41.0, 83.0, 113.0, 269.0, 484.0, 1211.0, 3622.0, 15446.0, 106375.0, 673903.0, 212981.0, 25690.0, 5311.0, 1630.0, 611.0, 312.0, 183.0, 82.0, 43.0, 30.0, 15.0, 13.0, 10.0, 8.0, 5.0, 2.0, 1.0, 4.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0390625, -1.0027923583984375, -0.966522216796875, -0.9302520751953125, -0.89398193359375, -0.8577117919921875, -0.821441650390625, -0.7851715087890625, -0.7489013671875, -0.7126312255859375, -0.676361083984375, -0.6400909423828125, -0.60382080078125, -0.5675506591796875, -0.531280517578125, -0.4950103759765625, -0.458740234375, -0.4224700927734375, -0.386199951171875, -0.3499298095703125, -0.31365966796875, -0.2773895263671875, -0.241119384765625, -0.2048492431640625, -0.1685791015625, -0.1323089599609375, -0.096038818359375, -0.0597686767578125, -0.02349853515625, 0.0127716064453125, 0.049041748046875, 0.0853118896484375, 0.12158203125, 0.1578521728515625, 0.194122314453125, 0.2303924560546875, 0.26666259765625, 0.3029327392578125, 0.339202880859375, 0.3754730224609375, 0.4117431640625, 0.4480133056640625, 0.484283447265625, 0.5205535888671875, 0.55682373046875, 0.5930938720703125, 0.629364013671875, 0.6656341552734375, 0.701904296875, 0.7381744384765625, 0.774444580078125, 0.8107147216796875, 0.84698486328125, 0.8832550048828125, 0.919525146484375, 0.9557952880859375, 0.9920654296875, 1.0283355712890625, 1.064605712890625, 1.1008758544921875, 1.13714599609375, 1.1734161376953125, 1.209686279296875, 1.2459564208984375, 1.2822265625]}, "gradients/encoder.encoder.layers.12.attention.k_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 3.0, 6.0, 8.0, 4.0, 15.0, 15.0, 23.0, 25.0, 47.0, 71.0, 82.0, 95.0, 89.0, 111.0, 86.0, 91.0, 59.0, 50.0, 37.0, 27.0, 17.0, 6.0, 12.0, 4.0, 5.0, 7.0, 3.0, 2.0, 2.0, 3.0, 0.0, 3.0, 2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.250640869140625e-05, -8.836574852466583e-05, -8.422508835792542e-05, -8.0084428191185e-05, -7.594376802444458e-05, -7.180310785770416e-05, -6.766244769096375e-05, -6.352178752422333e-05, -5.938112735748291e-05, -5.524046719074249e-05, -5.1099807024002075e-05, -4.695914685726166e-05, -4.281848669052124e-05, -3.867782652378082e-05, -3.4537166357040405e-05, -3.0396506190299988e-05, -2.625584602355957e-05, -2.2115185856819153e-05, -1.7974525690078735e-05, -1.3833865523338318e-05, -9.6932053565979e-06, -5.552545189857483e-06, -1.4118850231170654e-06, 2.728775143623352e-06, 6.8694353103637695e-06, 1.1010095477104187e-05, 1.5150755643844604e-05, 1.9291415810585022e-05, 2.343207597732544e-05, 2.7572736144065857e-05, 3.1713396310806274e-05, 3.585405647754669e-05, 3.999471664428711e-05, 4.413537681102753e-05, 4.8276036977767944e-05, 5.241669714450836e-05, 5.655735731124878e-05, 6.06980174779892e-05, 6.483867764472961e-05, 6.897933781147003e-05, 7.311999797821045e-05, 7.726065814495087e-05, 8.140131831169128e-05, 8.55419784784317e-05, 8.968263864517212e-05, 9.382329881191254e-05, 9.796395897865295e-05, 0.00010210461914539337, 0.00010624527931213379, 0.0001103859394788742, 0.00011452659964561462, 0.00011866725981235504, 0.00012280791997909546, 0.00012694858014583588, 0.0001310892403125763, 0.0001352299004793167, 0.00013937056064605713, 0.00014351122081279755, 0.00014765188097953796, 0.00015179254114627838, 0.0001559332013130188, 0.00016007386147975922, 0.00016421452164649963, 0.00016835518181324005, 0.00017249584197998047]}, "gradients/encoder.encoder.layers.12.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 5.0, 5.0, 8.0, 9.0, 14.0, 50.0, 71.0, 164.0, 324.0, 838.0, 2954.0, 14626.0, 119410.0, 690601.0, 192739.0, 20939.0, 3930.0, 1086.0, 414.0, 162.0, 89.0, 53.0, 37.0, 17.0, 9.0, 3.0, 7.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0830078125, -1.046417236328125, -1.00982666015625, -0.973236083984375, -0.9366455078125, -0.900054931640625, -0.86346435546875, -0.826873779296875, -0.790283203125, -0.753692626953125, -0.71710205078125, -0.680511474609375, -0.6439208984375, -0.607330322265625, -0.57073974609375, -0.534149169921875, -0.49755859375, -0.460968017578125, -0.42437744140625, -0.387786865234375, -0.3511962890625, -0.314605712890625, -0.27801513671875, -0.241424560546875, -0.204833984375, -0.168243408203125, -0.13165283203125, -0.095062255859375, -0.0584716796875, -0.021881103515625, 0.01470947265625, 0.051300048828125, 0.087890625, 0.124481201171875, 0.16107177734375, 0.197662353515625, 0.2342529296875, 0.270843505859375, 0.30743408203125, 0.344024658203125, 0.380615234375, 0.417205810546875, 0.45379638671875, 0.490386962890625, 0.5269775390625, 0.563568115234375, 0.60015869140625, 0.636749267578125, 0.67333984375, 0.709930419921875, 0.74652099609375, 0.783111572265625, 0.8197021484375, 0.856292724609375, 0.89288330078125, 0.929473876953125, 0.966064453125, 1.002655029296875, 1.03924560546875, 1.075836181640625, 1.1124267578125, 1.149017333984375, 1.18560791015625, 1.222198486328125, 1.2587890625]}, "gradients/encoder.encoder.layers.12.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 5.0, 7.0, 11.0, 19.0, 22.0, 33.0, 55.0, 74.0, 104.0, 122.0, 134.0, 120.0, 94.0, 61.0, 48.0, 38.0, 16.0, 11.0, 10.0, 7.0, 10.0, 2.0, 3.0, 3.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.326171875, -1.2758331298828125, -1.225494384765625, -1.1751556396484375, -1.12481689453125, -1.0744781494140625, -1.024139404296875, -0.9738006591796875, -0.9234619140625, -0.8731231689453125, -0.822784423828125, -0.7724456787109375, -0.72210693359375, -0.6717681884765625, -0.621429443359375, -0.5710906982421875, -0.520751953125, -0.4704132080078125, -0.420074462890625, -0.3697357177734375, -0.31939697265625, -0.2690582275390625, -0.218719482421875, -0.1683807373046875, -0.1180419921875, -0.0677032470703125, -0.017364501953125, 0.0329742431640625, 0.08331298828125, 0.1336517333984375, 0.183990478515625, 0.2343292236328125, 0.28466796875, 0.3350067138671875, 0.385345458984375, 0.4356842041015625, 0.48602294921875, 0.5363616943359375, 0.586700439453125, 0.6370391845703125, 0.6873779296875, 0.7377166748046875, 0.788055419921875, 0.8383941650390625, 0.88873291015625, 0.9390716552734375, 0.989410400390625, 1.0397491455078125, 1.090087890625, 1.1404266357421875, 1.190765380859375, 1.2411041259765625, 1.29144287109375, 1.3417816162109375, 1.392120361328125, 1.4424591064453125, 1.4927978515625, 1.5431365966796875, 1.593475341796875, 1.6438140869140625, 1.69415283203125, 1.7444915771484375, 1.794830322265625, 1.8451690673828125, 1.8955078125]}, "gradients/encoder.encoder.layers.12.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 4.0, 1.0, 1.0, 1.0, 1.0, 5.0, 2.0, 12.0, 16.0, 18.0, 33.0, 57.0, 82.0, 134.0, 161.0, 163.0, 111.0, 80.0, 44.0, 26.0, 22.0, 12.0, 14.0, 5.0, 6.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.96710205078125, -12.323904037475586, -11.680706024169922, -11.037508010864258, -10.394309997558594, -9.75111198425293, -9.107913970947266, -8.464715957641602, -7.821517467498779, -7.178319454193115, -6.535121440887451, -5.891922950744629, -5.248724937438965, -4.605526924133301, -3.9623289108276367, -3.3191308975219727, -2.6759328842163086, -2.0327348709106445, -1.389536738395691, -0.7463386058807373, -0.10314059257507324, 0.5400574207305908, 1.183255672454834, 1.826453685760498, 2.469651699066162, 3.112849712371826, 3.7560477256774902, 4.3992462158203125, 5.042444229125977, 5.685642242431641, 6.328840255737305, 6.972038269042969, 7.615236282348633, 8.258434295654297, 8.901632308959961, 9.544830322265625, 10.188028335571289, 10.831226348876953, 11.474424362182617, 12.117622375488281, 12.760820388793945, 13.40401840209961, 14.047216415405273, 14.690414428710938, 15.333612442016602, 15.976810455322266, 16.62000846862793, 17.263206481933594, 17.90640640258789, 18.549604415893555, 19.19280242919922, 19.836000442504883, 20.479198455810547, 21.12239646911621, 21.765594482421875, 22.40879249572754, 23.051990509033203, 23.695188522338867, 24.33838653564453, 24.981584548950195, 25.62478256225586, 26.267980575561523, 26.911178588867188, 27.55437660217285, 28.197574615478516]}, "gradients/encoder.encoder.layers.12.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 6.0, 2.0, 0.0, 3.0, 3.0, 2.0, 9.0, 6.0, 7.0, 4.0, 14.0, 15.0, 11.0, 15.0, 23.0, 17.0, 29.0, 28.0, 32.0, 28.0, 33.0, 33.0, 41.0, 33.0, 47.0, 48.0, 41.0, 43.0, 43.0, 30.0, 42.0, 46.0, 34.0, 32.0, 27.0, 24.0, 25.0, 16.0, 17.0, 18.0, 15.0, 12.0, 9.0, 8.0, 10.0, 8.0, 6.0, 4.0, 4.0, 0.0, 2.0, 2.0, 3.0, 1.0, 1.0, 2.0, 1.0, 2.0], "bins": [-15.823076248168945, -15.334844589233398, -14.846612930297852, -14.358381271362305, -13.870148658752441, -13.381916999816895, -12.893685340881348, -12.4054536819458, -11.917221069335938, -11.42898941040039, -10.940757751464844, -10.452526092529297, -9.964293479919434, -9.476061820983887, -8.98783016204834, -8.499598503112793, -8.011366844177246, -7.523135185241699, -7.034903049468994, -6.546671390533447, -6.058439254760742, -5.570207595825195, -5.081975936889648, -4.593744277954102, -4.1055121421813965, -3.6172802448272705, -3.1290483474731445, -2.6408166885375977, -2.1525847911834717, -1.6643528938293457, -1.1761212348937988, -0.6878893375396729, -0.19965744018554688, 0.2885743975639343, 0.7768062353134155, 1.265038013458252, 1.753269910812378, 2.241501808166504, 2.729733467102051, 3.2179653644561768, 3.7061972618103027, 4.19442892074585, 4.682661056518555, 5.170892715454102, 5.659124374389648, 6.1473565101623535, 6.6355881690979, 7.1238203048706055, 7.612051963806152, 8.1002836227417, 8.588515281677246, 9.07674789428711, 9.564979553222656, 10.053211212158203, 10.54144287109375, 11.029674530029297, 11.517906188964844, 12.00613784790039, 12.494369506835938, 12.982601165771484, 13.470833778381348, 13.959065437316895, 14.447297096252441, 14.935528755187988, 15.423761367797852]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 3.0, 3.0, 10.0, 7.0, 10.0, 22.0, 37.0, 59.0, 91.0, 178.0, 299.0, 472.0, 922.0, 1766.0, 3903.0, 11945.0, 270217.0, 3883496.0, 12736.0, 4202.0, 1860.0, 887.0, 455.0, 277.0, 177.0, 86.0, 53.0, 32.0, 27.0, 22.0, 16.0, 6.0, 5.0, 4.0, 2.0, 3.0, 1.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-4.68359375, -4.54986572265625, -4.4161376953125, -4.28240966796875, -4.148681640625, -4.01495361328125, -3.8812255859375, -3.74749755859375, -3.61376953125, -3.48004150390625, -3.3463134765625, -3.21258544921875, -3.078857421875, -2.94512939453125, -2.8114013671875, -2.67767333984375, -2.5439453125, -2.41021728515625, -2.2764892578125, -2.14276123046875, -2.009033203125, -1.87530517578125, -1.7415771484375, -1.60784912109375, -1.47412109375, -1.34039306640625, -1.2066650390625, -1.07293701171875, -0.939208984375, -0.80548095703125, -0.6717529296875, -0.53802490234375, -0.404296875, -0.27056884765625, -0.1368408203125, -0.00311279296875, 0.130615234375, 0.26434326171875, 0.3980712890625, 0.53179931640625, 0.66552734375, 0.79925537109375, 0.9329833984375, 1.06671142578125, 1.200439453125, 1.33416748046875, 1.4678955078125, 1.60162353515625, 1.7353515625, 1.86907958984375, 2.0028076171875, 2.13653564453125, 2.270263671875, 2.40399169921875, 2.5377197265625, 2.67144775390625, 2.80517578125, 2.93890380859375, 3.0726318359375, 3.20635986328125, 3.340087890625, 3.47381591796875, 3.6075439453125, 3.74127197265625, 3.875]}, "gradients/encoder.encoder.layers.11.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 3.0, 4.0, 4.0, 5.0, 8.0, 14.0, 13.0, 16.0, 20.0, 18.0, 22.0, 36.0, 39.0, 47.0, 45.0, 60.0, 51.0, 69.0, 60.0, 67.0, 52.0, 64.0, 41.0, 44.0, 44.0, 26.0, 32.0, 26.0, 23.0, 14.0, 7.0, 6.0, 6.0, 7.0, 3.0, 1.0, 9.0, 1.0, 4.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.87255859375, -0.8419418334960938, -0.8113250732421875, -0.7807083129882812, -0.750091552734375, -0.7194747924804688, -0.6888580322265625, -0.6582412719726562, -0.62762451171875, -0.5970077514648438, -0.5663909912109375, -0.5357742309570312, -0.505157470703125, -0.47454071044921875, -0.4439239501953125, -0.41330718994140625, -0.3826904296875, -0.35207366943359375, -0.3214569091796875, -0.29084014892578125, -0.260223388671875, -0.22960662841796875, -0.1989898681640625, -0.16837310791015625, -0.13775634765625, -0.10713958740234375, -0.0765228271484375, -0.04590606689453125, -0.015289306640625, 0.01532745361328125, 0.0459442138671875, 0.07656097412109375, 0.107177734375, 0.13779449462890625, 0.1684112548828125, 0.19902801513671875, 0.229644775390625, 0.26026153564453125, 0.2908782958984375, 0.32149505615234375, 0.35211181640625, 0.38272857666015625, 0.4133453369140625, 0.44396209716796875, 0.474578857421875, 0.5051956176757812, 0.5358123779296875, 0.5664291381835938, 0.5970458984375, 0.6276626586914062, 0.6582794189453125, 0.6888961791992188, 0.719512939453125, 0.7501296997070312, 0.7807464599609375, 0.8113632202148438, 0.84197998046875, 0.8725967407226562, 0.9032135009765625, 0.9338302612304688, 0.964447021484375, 0.9950637817382812, 1.0256805419921875, 1.0562973022460938, 1.0869140625]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 5.0, 4.0, 6.0, 8.0, 14.0, 13.0, 27.0, 26.0, 44.0, 65.0, 82.0, 111.0, 158.0, 251.0, 363.0, 569.0, 894.0, 1675.0, 3423.0, 8670.0, 32594.0, 4038652.0, 82379.0, 13899.0, 4933.0, 2183.0, 1124.0, 702.0, 436.0, 266.0, 208.0, 142.0, 106.0, 82.0, 41.0, 33.0, 35.0, 19.0, 18.0, 11.0, 8.0, 6.0, 3.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.771484375, -2.667694091796875, -2.56390380859375, -2.460113525390625, -2.3563232421875, -2.252532958984375, -2.14874267578125, -2.044952392578125, -1.941162109375, -1.837371826171875, -1.73358154296875, -1.629791259765625, -1.5260009765625, -1.422210693359375, -1.31842041015625, -1.214630126953125, -1.11083984375, -1.007049560546875, -0.90325927734375, -0.799468994140625, -0.6956787109375, -0.591888427734375, -0.48809814453125, -0.384307861328125, -0.280517578125, -0.176727294921875, -0.07293701171875, 0.030853271484375, 0.1346435546875, 0.238433837890625, 0.34222412109375, 0.446014404296875, 0.5498046875, 0.653594970703125, 0.75738525390625, 0.861175537109375, 0.9649658203125, 1.068756103515625, 1.17254638671875, 1.276336669921875, 1.380126953125, 1.483917236328125, 1.58770751953125, 1.691497802734375, 1.7952880859375, 1.899078369140625, 2.00286865234375, 2.106658935546875, 2.21044921875, 2.314239501953125, 2.41802978515625, 2.521820068359375, 2.6256103515625, 2.729400634765625, 2.83319091796875, 2.936981201171875, 3.040771484375, 3.144561767578125, 3.24835205078125, 3.352142333984375, 3.4559326171875, 3.559722900390625, 3.66351318359375, 3.767303466796875, 3.87109375]}, "gradients/encoder.encoder.layers.11.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 10.0, 9.0, 10.0, 19.0, 29.0, 77.0, 3662.0, 173.0, 30.0, 21.0, 10.0, 6.0, 9.0, 2.0, 1.0, 5.0, 3.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.77783203125, -0.7487411499023438, -0.7196502685546875, -0.6905593872070312, -0.661468505859375, -0.6323776245117188, -0.6032867431640625, -0.5741958618164062, -0.54510498046875, -0.5160140991210938, -0.4869232177734375, -0.45783233642578125, -0.428741455078125, -0.39965057373046875, -0.3705596923828125, -0.34146881103515625, -0.3123779296875, -0.28328704833984375, -0.2541961669921875, -0.22510528564453125, -0.196014404296875, -0.16692352294921875, -0.1378326416015625, -0.10874176025390625, -0.07965087890625, -0.05055999755859375, -0.0214691162109375, 0.00762176513671875, 0.036712646484375, 0.06580352783203125, 0.0948944091796875, 0.12398529052734375, 0.153076171875, 0.18216705322265625, 0.2112579345703125, 0.24034881591796875, 0.269439697265625, 0.29853057861328125, 0.3276214599609375, 0.35671234130859375, 0.38580322265625, 0.41489410400390625, 0.4439849853515625, 0.47307586669921875, 0.502166748046875, 0.5312576293945312, 0.5603485107421875, 0.5894393920898438, 0.6185302734375, 0.6476211547851562, 0.6767120361328125, 0.7058029174804688, 0.734893798828125, 0.7639846801757812, 0.7930755615234375, 0.8221664428710938, 0.85125732421875, 0.8803482055664062, 0.9094390869140625, 0.9385299682617188, 0.967620849609375, 0.9967117309570312, 1.0258026123046875, 1.0548934936523438, 1.083984375]}, "gradients/encoder.encoder.layers.11.final_layer_norm.weight": {"_type": "histogram", "values": [3.0, 13.0, 26.0, 92.0, 213.0, 349.0, 204.0, 74.0, 26.0, 8.0, 5.0, 2.0, 2.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9026222229003906, -0.738679051399231, -0.5747358798980713, -0.41079264879226685, -0.24684947729110718, -0.08290630578994751, 0.08103692531585693, 0.2449800968170166, 0.40892326831817627, 0.5728664398193359, 0.7368096113204956, 0.9007528424263, 1.0646960735321045, 1.2286391258239746, 1.3925824165344238, 1.5565255880355835, 1.7204687595367432, 1.8844119310379028, 2.0483551025390625, 2.2122983932495117, 2.376241445541382, 2.540184736251831, 2.704127788543701, 2.8680710792541504, 3.0320143699645996, 3.195957660675049, 3.359900712966919, 3.523844003677368, 3.6877870559692383, 3.8517303466796875, 4.015673637390137, 4.179616928100586, 4.343559741973877, 4.507503032684326, 4.671446323394775, 4.835389137268066, 4.999332427978516, 5.163275718688965, 5.327219009399414, 5.491162300109863, 5.655105113983154, 5.8190484046936035, 5.982991695404053, 6.146934509277344, 6.310877799987793, 6.474821090698242, 6.638764381408691, 6.802707672119141, 6.96665096282959, 7.130594253540039, 7.294537544250488, 7.458480358123779, 7.6224236488342285, 7.786366939544678, 7.950310230255127, 8.114253044128418, 8.278196334838867, 8.442139625549316, 8.606082916259766, 8.770026206970215, 8.933969497680664, 9.097911834716797, 9.261855125427246, 9.425798416137695, 9.589741706848145]}, "gradients/encoder.encoder.layers.11.final_layer_norm.bias": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 3.0, 8.0, 10.0, 6.0, 7.0, 12.0, 7.0, 12.0, 17.0, 22.0, 22.0, 26.0, 30.0, 40.0, 27.0, 52.0, 37.0, 49.0, 59.0, 53.0, 41.0, 49.0, 53.0, 59.0, 40.0, 44.0, 40.0, 26.0, 27.0, 30.0, 23.0, 19.0, 8.0, 11.0, 11.0, 7.0, 4.0, 4.0, 5.0, 2.0, 2.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.9365293383598328, -0.8964431881904602, -0.8563570380210876, -0.8162708878517151, -0.7761847376823425, -0.73609858751297, -0.6960123777389526, -0.6559262275695801, -0.6158400774002075, -0.575753927230835, -0.5356677770614624, -0.49558162689208984, -0.4554954767227173, -0.4154093265533447, -0.3753231465816498, -0.3352369964122772, -0.29515087604522705, -0.2550647258758545, -0.21497857570648193, -0.17489241063594818, -0.13480626046657562, -0.09472011029720306, -0.05463394522666931, -0.014547795057296753, 0.025538355112075806, 0.06562450528144836, 0.10571066290140152, 0.14579682052135468, 0.18588297069072723, 0.2259691208600998, 0.26605528593063354, 0.3061414361000061, 0.3462275266647339, 0.38631367683410645, 0.426399827003479, 0.46648597717285156, 0.5065721273422241, 0.5466582775115967, 0.5867444276809692, 0.6268305778503418, 0.6669167280197144, 0.7070028781890869, 0.7470890283584595, 0.787175178527832, 0.8272613286972046, 0.8673474788665771, 0.9074336290359497, 0.9475197792053223, 0.9876059889793396, 1.027692198753357, 1.0677783489227295, 1.107864499092102, 1.1479506492614746, 1.1880367994308472, 1.2281229496002197, 1.2682090997695923, 1.3082952499389648, 1.3483814001083374, 1.38846755027771, 1.4285537004470825, 1.468639850616455, 1.5087260007858276, 1.5488121509552002, 1.5888983011245728, 1.6289844512939453]}, "gradients/encoder.encoder.layers.11.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 1.0, 2.0, 8.0, 7.0, 6.0, 7.0, 12.0, 12.0, 28.0, 42.0, 64.0, 81.0, 128.0, 190.0, 274.0, 435.0, 610.0, 1060.0, 1781.0, 3047.0, 5486.0, 10042.0, 20046.0, 44667.0, 107843.0, 253185.0, 315632.0, 160368.0, 65272.0, 28045.0, 13285.0, 7141.0, 3885.0, 2238.0, 1275.0, 781.0, 548.0, 362.0, 209.0, 146.0, 104.0, 65.0, 41.0, 28.0, 19.0, 14.0, 12.0, 9.0, 7.0, 2.0, 3.0, 3.0, 1.0, 4.0, 2.0, 2.0], "bins": [-2.109375, -2.0477294921875, -1.986083984375, -1.9244384765625, -1.86279296875, -1.8011474609375, -1.739501953125, -1.6778564453125, -1.6162109375, -1.5545654296875, -1.492919921875, -1.4312744140625, -1.36962890625, -1.3079833984375, -1.246337890625, -1.1846923828125, -1.123046875, -1.0614013671875, -0.999755859375, -0.9381103515625, -0.87646484375, -0.8148193359375, -0.753173828125, -0.6915283203125, -0.6298828125, -0.5682373046875, -0.506591796875, -0.4449462890625, -0.38330078125, -0.3216552734375, -0.260009765625, -0.1983642578125, -0.13671875, -0.0750732421875, -0.013427734375, 0.0482177734375, 0.10986328125, 0.1715087890625, 0.233154296875, 0.2947998046875, 0.3564453125, 0.4180908203125, 0.479736328125, 0.5413818359375, 0.60302734375, 0.6646728515625, 0.726318359375, 0.7879638671875, 0.849609375, 0.9112548828125, 0.972900390625, 1.0345458984375, 1.09619140625, 1.1578369140625, 1.219482421875, 1.2811279296875, 1.3427734375, 1.4044189453125, 1.466064453125, 1.5277099609375, 1.58935546875, 1.6510009765625, 1.712646484375, 1.7742919921875, 1.8359375]}, "gradients/encoder.encoder.layers.11.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 4.0, 7.0, 4.0, 11.0, 14.0, 10.0, 12.0, 15.0, 18.0, 21.0, 22.0, 32.0, 44.0, 46.0, 34.0, 46.0, 62.0, 51.0, 56.0, 59.0, 44.0, 46.0, 54.0, 58.0, 46.0, 30.0, 30.0, 24.0, 21.0, 20.0, 19.0, 11.0, 4.0, 6.0, 6.0, 3.0, 0.0, 5.0, 7.0, 2.0, 2.0, 4.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.91845703125, -0.8895950317382812, -0.8607330322265625, -0.8318710327148438, -0.803009033203125, -0.7741470336914062, -0.7452850341796875, -0.7164230346679688, -0.68756103515625, -0.6586990356445312, -0.6298370361328125, -0.6009750366210938, -0.572113037109375, -0.5432510375976562, -0.5143890380859375, -0.48552703857421875, -0.4566650390625, -0.42780303955078125, -0.3989410400390625, -0.37007904052734375, -0.341217041015625, -0.31235504150390625, -0.2834930419921875, -0.25463104248046875, -0.22576904296875, -0.19690704345703125, -0.1680450439453125, -0.13918304443359375, -0.110321044921875, -0.08145904541015625, -0.0525970458984375, -0.02373504638671875, 0.005126953125, 0.03398895263671875, 0.0628509521484375, 0.09171295166015625, 0.120574951171875, 0.14943695068359375, 0.1782989501953125, 0.20716094970703125, 0.23602294921875, 0.26488494873046875, 0.2937469482421875, 0.32260894775390625, 0.351470947265625, 0.38033294677734375, 0.4091949462890625, 0.43805694580078125, 0.4669189453125, 0.49578094482421875, 0.5246429443359375, 0.5535049438476562, 0.582366943359375, 0.6112289428710938, 0.6400909423828125, 0.6689529418945312, 0.69781494140625, 0.7266769409179688, 0.7555389404296875, 0.7844009399414062, 0.813262939453125, 0.8421249389648438, 0.8709869384765625, 0.8998489379882812, 0.9287109375]}, "gradients/encoder.encoder.layers.11.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 4.0, 4.0, 6.0, 10.0, 9.0, 7.0, 14.0, 32.0, 26.0, 35.0, 63.0, 83.0, 137.0, 256.0, 514.0, 919.0, 2190.0, 5142.0, 14393.0, 50659.0, 265627.0, 550698.0, 115714.0, 26923.0, 8608.0, 3364.0, 1490.0, 695.0, 379.0, 190.0, 107.0, 80.0, 61.0, 24.0, 32.0, 14.0, 9.0, 13.0, 10.0, 5.0, 5.0, 1.0, 8.0, 2.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0], "bins": [-3.416015625, -3.313323974609375, -3.21063232421875, -3.107940673828125, -3.0052490234375, -2.902557373046875, -2.79986572265625, -2.697174072265625, -2.594482421875, -2.491790771484375, -2.38909912109375, -2.286407470703125, -2.1837158203125, -2.081024169921875, -1.97833251953125, -1.875640869140625, -1.77294921875, -1.670257568359375, -1.56756591796875, -1.464874267578125, -1.3621826171875, -1.259490966796875, -1.15679931640625, -1.054107666015625, -0.951416015625, -0.848724365234375, -0.74603271484375, -0.643341064453125, -0.5406494140625, -0.437957763671875, -0.33526611328125, -0.232574462890625, -0.1298828125, -0.027191162109375, 0.07550048828125, 0.178192138671875, 0.2808837890625, 0.383575439453125, 0.48626708984375, 0.588958740234375, 0.691650390625, 0.794342041015625, 0.89703369140625, 0.999725341796875, 1.1024169921875, 1.205108642578125, 1.30780029296875, 1.410491943359375, 1.51318359375, 1.615875244140625, 1.71856689453125, 1.821258544921875, 1.9239501953125, 2.026641845703125, 2.12933349609375, 2.232025146484375, 2.334716796875, 2.437408447265625, 2.54010009765625, 2.642791748046875, 2.7454833984375, 2.848175048828125, 2.95086669921875, 3.053558349609375, 3.15625]}, "gradients/encoder.encoder.layers.11.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 3.0, 4.0, 3.0, 6.0, 5.0, 5.0, 6.0, 4.0, 13.0, 19.0, 16.0, 18.0, 22.0, 50.0, 38.0, 46.0, 52.0, 73.0, 69.0, 65.0, 64.0, 74.0, 64.0, 56.0, 41.0, 27.0, 34.0, 33.0, 31.0, 16.0, 14.0, 9.0, 6.0, 4.0, 5.0, 5.0, 6.0, 6.0, 3.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.4140625, -4.211669921875, -4.00927734375, -3.806884765625, -3.6044921875, -3.402099609375, -3.19970703125, -2.997314453125, -2.794921875, -2.592529296875, -2.39013671875, -2.187744140625, -1.9853515625, -1.782958984375, -1.58056640625, -1.378173828125, -1.17578125, -0.973388671875, -0.77099609375, -0.568603515625, -0.3662109375, -0.163818359375, 0.03857421875, 0.240966796875, 0.443359375, 0.645751953125, 0.84814453125, 1.050537109375, 1.2529296875, 1.455322265625, 1.65771484375, 1.860107421875, 2.0625, 2.264892578125, 2.46728515625, 2.669677734375, 2.8720703125, 3.074462890625, 3.27685546875, 3.479248046875, 3.681640625, 3.884033203125, 4.08642578125, 4.288818359375, 4.4912109375, 4.693603515625, 4.89599609375, 5.098388671875, 5.30078125, 5.503173828125, 5.70556640625, 5.907958984375, 6.1103515625, 6.312744140625, 6.51513671875, 6.717529296875, 6.919921875, 7.122314453125, 7.32470703125, 7.527099609375, 7.7294921875, 7.931884765625, 8.13427734375, 8.336669921875, 8.5390625]}, "gradients/encoder.encoder.layers.11.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 4.0, 7.0, 8.0, 11.0, 19.0, 45.0, 85.0, 211.0, 515.0, 2033.0, 25169.0, 1006940.0, 11402.0, 1366.0, 409.0, 162.0, 87.0, 32.0, 30.0, 10.0, 10.0, 8.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.2890625, -6.0201416015625, -5.751220703125, -5.4822998046875, -5.21337890625, -4.9444580078125, -4.675537109375, -4.4066162109375, -4.1376953125, -3.8687744140625, -3.599853515625, -3.3309326171875, -3.06201171875, -2.7930908203125, -2.524169921875, -2.2552490234375, -1.986328125, -1.7174072265625, -1.448486328125, -1.1795654296875, -0.91064453125, -0.6417236328125, -0.372802734375, -0.1038818359375, 0.1650390625, 0.4339599609375, 0.702880859375, 0.9718017578125, 1.24072265625, 1.5096435546875, 1.778564453125, 2.0474853515625, 2.31640625, 2.5853271484375, 2.854248046875, 3.1231689453125, 3.39208984375, 3.6610107421875, 3.929931640625, 4.1988525390625, 4.4677734375, 4.7366943359375, 5.005615234375, 5.2745361328125, 5.54345703125, 5.8123779296875, 6.081298828125, 6.3502197265625, 6.619140625, 6.8880615234375, 7.156982421875, 7.4259033203125, 7.69482421875, 7.9637451171875, 8.232666015625, 8.5015869140625, 8.7705078125, 9.0394287109375, 9.308349609375, 9.5772705078125, 9.84619140625, 10.1151123046875, 10.384033203125, 10.6529541015625, 10.921875]}, "gradients/encoder.encoder.layers.11.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 2.0, 2.0, 2.0, 1.0, 2.0, 3.0, 9.0, 11.0, 6.0, 15.0, 31.0, 32.0, 88.0, 110.0, 173.0, 154.0, 144.0, 83.0, 44.0, 37.0, 12.0, 17.0, 11.0, 9.0, 5.0, 2.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.0002753734588623047, -0.00026654452085494995, -0.0002577155828475952, -0.0002488866448402405, -0.00024005770683288574, -0.000231228768825531, -0.00022239983081817627, -0.00021357089281082153, -0.0002047419548034668, -0.00019591301679611206, -0.00018708407878875732, -0.0001782551407814026, -0.00016942620277404785, -0.00016059726476669312, -0.00015176832675933838, -0.00014293938875198364, -0.0001341104507446289, -0.00012528151273727417, -0.00011645257472991943, -0.0001076236367225647, -9.879469871520996e-05, -8.996576070785522e-05, -8.113682270050049e-05, -7.230788469314575e-05, -6.347894668579102e-05, -5.465000867843628e-05, -4.582107067108154e-05, -3.699213266372681e-05, -2.816319465637207e-05, -1.9334256649017334e-05, -1.0505318641662598e-05, -1.6763806343078613e-06, 7.152557373046875e-06, 1.598149538040161e-05, 2.4810433387756348e-05, 3.3639371395111084e-05, 4.246830940246582e-05, 5.129724740982056e-05, 6.012618541717529e-05, 6.895512342453003e-05, 7.778406143188477e-05, 8.66129994392395e-05, 9.544193744659424e-05, 0.00010427087545394897, 0.00011309981346130371, 0.00012192875146865845, 0.00013075768947601318, 0.00013958662748336792, 0.00014841556549072266, 0.0001572445034980774, 0.00016607344150543213, 0.00017490237951278687, 0.0001837313175201416, 0.00019256025552749634, 0.00020138919353485107, 0.0002102181315422058, 0.00021904706954956055, 0.00022787600755691528, 0.00023670494556427002, 0.00024553388357162476, 0.0002543628215789795, 0.00026319175958633423, 0.00027202069759368896, 0.0002808496356010437, 0.00028967857360839844]}, "gradients/encoder.encoder.layers.11.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 2.0, 5.0, 3.0, 4.0, 3.0, 8.0, 11.0, 18.0, 26.0, 44.0, 83.0, 141.0, 250.0, 548.0, 1339.0, 4008.0, 16189.0, 274219.0, 715354.0, 27591.0, 5565.0, 1733.0, 718.0, 307.0, 180.0, 69.0, 50.0, 31.0, 20.0, 20.0, 8.0, 5.0, 3.0, 3.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-3.080078125, -2.98712158203125, -2.8941650390625, -2.80120849609375, -2.708251953125, -2.61529541015625, -2.5223388671875, -2.42938232421875, -2.33642578125, -2.24346923828125, -2.1505126953125, -2.05755615234375, -1.964599609375, -1.87164306640625, -1.7786865234375, -1.68572998046875, -1.5927734375, -1.49981689453125, -1.4068603515625, -1.31390380859375, -1.220947265625, -1.12799072265625, -1.0350341796875, -0.94207763671875, -0.84912109375, -0.75616455078125, -0.6632080078125, -0.57025146484375, -0.477294921875, -0.38433837890625, -0.2913818359375, -0.19842529296875, -0.10546875, -0.01251220703125, 0.0804443359375, 0.17340087890625, 0.266357421875, 0.35931396484375, 0.4522705078125, 0.54522705078125, 0.63818359375, 0.73114013671875, 0.8240966796875, 0.91705322265625, 1.010009765625, 1.10296630859375, 1.1959228515625, 1.28887939453125, 1.3818359375, 1.47479248046875, 1.5677490234375, 1.66070556640625, 1.753662109375, 1.84661865234375, 1.9395751953125, 2.03253173828125, 2.12548828125, 2.21844482421875, 2.3114013671875, 2.40435791015625, 2.497314453125, 2.59027099609375, 2.6832275390625, 2.77618408203125, 2.869140625]}, "gradients/encoder.encoder.layers.11.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 5.0, 3.0, 4.0, 5.0, 1.0, 1.0, 6.0, 11.0, 23.0, 27.0, 57.0, 105.0, 203.0, 256.0, 154.0, 70.0, 29.0, 20.0, 7.0, 8.0, 7.0, 1.0, 0.0, 1.0, 2.0, 2.0, 3.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.849609375, -3.675384521484375, -3.50115966796875, -3.326934814453125, -3.1527099609375, -2.978485107421875, -2.80426025390625, -2.630035400390625, -2.455810546875, -2.281585693359375, -2.10736083984375, -1.933135986328125, -1.7589111328125, -1.584686279296875, -1.41046142578125, -1.236236572265625, -1.06201171875, -0.887786865234375, -0.71356201171875, -0.539337158203125, -0.3651123046875, -0.190887451171875, -0.01666259765625, 0.157562255859375, 0.331787109375, 0.506011962890625, 0.68023681640625, 0.854461669921875, 1.0286865234375, 1.202911376953125, 1.37713623046875, 1.551361083984375, 1.7255859375, 1.899810791015625, 2.07403564453125, 2.248260498046875, 2.4224853515625, 2.596710205078125, 2.77093505859375, 2.945159912109375, 3.119384765625, 3.293609619140625, 3.46783447265625, 3.642059326171875, 3.8162841796875, 3.990509033203125, 4.16473388671875, 4.338958740234375, 4.51318359375, 4.687408447265625, 4.86163330078125, 5.035858154296875, 5.2100830078125, 5.384307861328125, 5.55853271484375, 5.732757568359375, 5.906982421875, 6.081207275390625, 6.25543212890625, 6.429656982421875, 6.6038818359375, 6.778106689453125, 6.95233154296875, 7.126556396484375, 7.30078125]}, "gradients/encoder.encoder.layers.11.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 4.0, 9.0, 22.0, 59.0, 160.0, 337.0, 274.0, 97.0, 35.0, 12.0, 6.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-72.20555877685547, -69.6031494140625, -67.000732421875, -64.39832305908203, -61.7959098815918, -59.19349670410156, -56.59108352661133, -53.988670349121094, -51.386260986328125, -48.78384780883789, -46.181434631347656, -43.57902526855469, -40.97661209106445, -38.37419891357422, -35.771785736083984, -33.16937255859375, -30.566959381103516, -27.96454620361328, -25.36213493347168, -22.759721755981445, -20.157310485839844, -17.55489730834961, -14.952484130859375, -12.350072860717773, -9.747659683227539, -7.145247459411621, -4.542834758758545, -1.9404220581054688, 0.6619901657104492, 3.264402389526367, 5.866815567016602, 8.469226837158203, 11.071640014648438, 13.674052238464355, 16.276464462280273, 18.878877639770508, 21.48128890991211, 24.083702087402344, 26.686115264892578, 29.28852653503418, 31.890939712524414, 34.493350982666016, 37.09576416015625, 39.698177337646484, 42.30059051513672, 44.90299987792969, 47.50541687011719, 50.107826232910156, 52.71023941040039, 55.312652587890625, 57.91506576538086, 60.517478942871094, 63.11988830566406, 65.72230529785156, 68.32471466064453, 70.9271240234375, 73.529541015625, 76.13195037841797, 78.73436737060547, 81.33677673339844, 83.93919372558594, 86.5416030883789, 89.14401245117188, 91.74642944335938, 94.34883880615234]}, "gradients/encoder.encoder.layers.11.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 3.0, 0.0, 2.0, 1.0, 0.0, 1.0, 0.0, 5.0, 5.0, 6.0, 12.0, 19.0, 16.0, 28.0, 21.0, 30.0, 33.0, 27.0, 53.0, 55.0, 62.0, 65.0, 59.0, 61.0, 66.0, 58.0, 57.0, 32.0, 41.0, 48.0, 21.0, 24.0, 20.0, 13.0, 11.0, 9.0, 7.0, 13.0, 6.0, 9.0, 7.0, 2.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-34.153141021728516, -33.114498138427734, -32.07585525512695, -31.037214279174805, -29.998571395874023, -28.959928512573242, -27.921287536621094, -26.882644653320312, -25.84400177001953, -24.80535888671875, -23.76671600341797, -22.72807502746582, -21.68943214416504, -20.650789260864258, -19.61214828491211, -18.573505401611328, -17.534862518310547, -16.496219635009766, -15.4575777053833, -14.418935775756836, -13.380292892456055, -12.341650009155273, -11.303008079528809, -10.264366149902344, -9.225723266601562, -8.187080383300781, -7.148438453674316, -6.109796047210693, -5.07115364074707, -4.032511234283447, -2.993868827819824, -1.9552264213562012, -0.9165802001953125, 0.12206220626831055, 1.1607046127319336, 2.1993470191955566, 3.2379894256591797, 4.276631832122803, 5.315274238586426, 6.353916645050049, 7.392559051513672, 8.431201934814453, 9.469843864440918, 10.508485794067383, 11.547128677368164, 12.585771560668945, 13.62441349029541, 14.663055419921875, 15.701698303222656, 16.740341186523438, 17.77898406982422, 18.817625045776367, 19.85626792907715, 20.89491081237793, 21.933551788330078, 22.97219467163086, 24.01083755493164, 25.049480438232422, 26.088123321533203, 27.12676429748535, 28.165407180786133, 29.204050064086914, 30.242691040039062, 31.281333923339844, 32.319976806640625]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 3.0, 7.0, 3.0, 7.0, 14.0, 12.0, 12.0, 21.0, 23.0, 27.0, 38.0, 50.0, 88.0, 129.0, 188.0, 343.0, 596.0, 1151.0, 2644.0, 7322.0, 41235.0, 4080213.0, 46483.0, 8149.0, 2776.0, 1281.0, 611.0, 349.0, 176.0, 109.0, 81.0, 49.0, 34.0, 14.0, 14.0, 13.0, 5.0, 11.0, 1.0, 2.0, 1.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.23828125, -5.06085205078125, -4.8834228515625, -4.70599365234375, -4.528564453125, -4.35113525390625, -4.1737060546875, -3.99627685546875, -3.81884765625, -3.64141845703125, -3.4639892578125, -3.28656005859375, -3.109130859375, -2.93170166015625, -2.7542724609375, -2.57684326171875, -2.3994140625, -2.22198486328125, -2.0445556640625, -1.86712646484375, -1.689697265625, -1.51226806640625, -1.3348388671875, -1.15740966796875, -0.97998046875, -0.80255126953125, -0.6251220703125, -0.44769287109375, -0.270263671875, -0.09283447265625, 0.0845947265625, 0.26202392578125, 0.439453125, 0.61688232421875, 0.7943115234375, 0.97174072265625, 1.149169921875, 1.32659912109375, 1.5040283203125, 1.68145751953125, 1.85888671875, 2.03631591796875, 2.2137451171875, 2.39117431640625, 2.568603515625, 2.74603271484375, 2.9234619140625, 3.10089111328125, 3.2783203125, 3.45574951171875, 3.6331787109375, 3.81060791015625, 3.988037109375, 4.16546630859375, 4.3428955078125, 4.52032470703125, 4.69775390625, 4.87518310546875, 5.0526123046875, 5.23004150390625, 5.407470703125, 5.58489990234375, 5.7623291015625, 5.93975830078125, 6.1171875]}, "gradients/encoder.encoder.layers.10.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 1.0, 2.0, 4.0, 6.0, 2.0, 12.0, 7.0, 15.0, 22.0, 36.0, 36.0, 74.0, 78.0, 100.0, 110.0, 106.0, 99.0, 83.0, 52.0, 42.0, 27.0, 26.0, 19.0, 20.0, 7.0, 6.0, 6.0, 2.0, 1.0, 5.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.107421875, -2.0435333251953125, -1.979644775390625, -1.9157562255859375, -1.85186767578125, -1.7879791259765625, -1.724090576171875, -1.6602020263671875, -1.5963134765625, -1.5324249267578125, -1.468536376953125, -1.4046478271484375, -1.34075927734375, -1.2768707275390625, -1.212982177734375, -1.1490936279296875, -1.085205078125, -1.0213165283203125, -0.957427978515625, -0.8935394287109375, -0.82965087890625, -0.7657623291015625, -0.701873779296875, -0.6379852294921875, -0.5740966796875, -0.5102081298828125, -0.446319580078125, -0.3824310302734375, -0.31854248046875, -0.2546539306640625, -0.190765380859375, -0.1268768310546875, -0.06298828125, 0.0009002685546875, 0.064788818359375, 0.1286773681640625, 0.19256591796875, 0.2564544677734375, 0.320343017578125, 0.3842315673828125, 0.4481201171875, 0.5120086669921875, 0.575897216796875, 0.6397857666015625, 0.70367431640625, 0.7675628662109375, 0.831451416015625, 0.8953399658203125, 0.959228515625, 1.0231170654296875, 1.087005615234375, 1.1508941650390625, 1.21478271484375, 1.2786712646484375, 1.342559814453125, 1.4064483642578125, 1.4703369140625, 1.5342254638671875, 1.598114013671875, 1.6620025634765625, 1.72589111328125, 1.7897796630859375, 1.853668212890625, 1.9175567626953125, 1.9814453125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 1.0, 1.0, 4.0, 3.0, 5.0, 10.0, 9.0, 10.0, 18.0, 16.0, 28.0, 33.0, 61.0, 69.0, 85.0, 145.0, 183.0, 248.0, 312.0, 464.0, 703.0, 930.0, 1487.0, 2338.0, 3673.0, 6816.0, 12865.0, 29776.0, 109406.0, 3813287.0, 143944.0, 34189.0, 14337.0, 7309.0, 3966.0, 2483.0, 1608.0, 965.0, 724.0, 520.0, 346.0, 258.0, 157.0, 143.0, 93.0, 66.0, 58.0, 38.0, 28.0, 24.0, 16.0, 12.0, 9.0, 2.0, 4.0, 2.0, 5.0, 2.0, 1.0, 3.0, 3.0], "bins": [-3.24609375, -3.14642333984375, -3.0467529296875, -2.94708251953125, -2.847412109375, -2.74774169921875, -2.6480712890625, -2.54840087890625, -2.44873046875, -2.34906005859375, -2.2493896484375, -2.14971923828125, -2.050048828125, -1.95037841796875, -1.8507080078125, -1.75103759765625, -1.6513671875, -1.55169677734375, -1.4520263671875, -1.35235595703125, -1.252685546875, -1.15301513671875, -1.0533447265625, -0.95367431640625, -0.85400390625, -0.75433349609375, -0.6546630859375, -0.55499267578125, -0.455322265625, -0.35565185546875, -0.2559814453125, -0.15631103515625, -0.056640625, 0.04302978515625, 0.1427001953125, 0.24237060546875, 0.342041015625, 0.44171142578125, 0.5413818359375, 0.64105224609375, 0.74072265625, 0.84039306640625, 0.9400634765625, 1.03973388671875, 1.139404296875, 1.23907470703125, 1.3387451171875, 1.43841552734375, 1.5380859375, 1.63775634765625, 1.7374267578125, 1.83709716796875, 1.936767578125, 2.03643798828125, 2.1361083984375, 2.23577880859375, 2.33544921875, 2.43511962890625, 2.5347900390625, 2.63446044921875, 2.734130859375, 2.83380126953125, 2.9334716796875, 3.03314208984375, 3.1328125]}, "gradients/encoder.encoder.layers.10.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 0.0, 0.0, 2.0, 5.0, 2.0, 2.0, 6.0, 4.0, 11.0, 8.0, 13.0, 16.0, 19.0, 30.0, 54.0, 96.0, 454.0, 3011.0, 151.0, 59.0, 36.0, 19.0, 20.0, 11.0, 10.0, 8.0, 12.0, 4.0, 3.0, 3.0, 1.0, 3.0, 5.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0], "bins": [-1.228515625, -1.191436767578125, -1.15435791015625, -1.117279052734375, -1.0802001953125, -1.043121337890625, -1.00604248046875, -0.968963623046875, -0.931884765625, -0.894805908203125, -0.85772705078125, -0.820648193359375, -0.7835693359375, -0.746490478515625, -0.70941162109375, -0.672332763671875, -0.63525390625, -0.598175048828125, -0.56109619140625, -0.524017333984375, -0.4869384765625, -0.449859619140625, -0.41278076171875, -0.375701904296875, -0.338623046875, -0.301544189453125, -0.26446533203125, -0.227386474609375, -0.1903076171875, -0.153228759765625, -0.11614990234375, -0.079071044921875, -0.0419921875, -0.004913330078125, 0.03216552734375, 0.069244384765625, 0.1063232421875, 0.143402099609375, 0.18048095703125, 0.217559814453125, 0.254638671875, 0.291717529296875, 0.32879638671875, 0.365875244140625, 0.4029541015625, 0.440032958984375, 0.47711181640625, 0.514190673828125, 0.55126953125, 0.588348388671875, 0.62542724609375, 0.662506103515625, 0.6995849609375, 0.736663818359375, 0.77374267578125, 0.810821533203125, 0.847900390625, 0.884979248046875, 0.92205810546875, 0.959136962890625, 0.9962158203125, 1.033294677734375, 1.07037353515625, 1.107452392578125, 1.14453125]}, "gradients/encoder.encoder.layers.10.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 4.0, 4.0, 9.0, 24.0, 55.0, 90.0, 145.0, 199.0, 178.0, 131.0, 68.0, 37.0, 26.0, 15.0, 6.0, 9.0, 3.0, 5.0, 2.0, 2.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.453207492828369, -4.201204299926758, -3.9492008686065674, -3.697197437286377, -3.4451942443847656, -3.193190813064575, -2.9411873817443848, -2.6891841888427734, -2.437180757522583, -2.1851773262023926, -1.9331741333007812, -1.6811707019805908, -1.42916738986969, -1.177164077758789, -0.9251606464385986, -0.6731573343276978, -0.4211540222167969, -0.1691506803035736, 0.08285266160964966, 0.3348560333251953, 0.5868593454360962, 0.8388626575469971, 1.0908660888671875, 1.3428694009780884, 1.5948727130889893, 1.8468760251998901, 2.098879337310791, 2.3508827686309814, 2.602886199951172, 2.854889392852783, 3.1068928241729736, 3.358896255493164, 3.6108999252319336, 3.862903356552124, 4.1149067878723145, 4.366909980773926, 4.618913173675537, 4.870916366577148, 5.122920036315918, 5.374923229217529, 5.626926422119141, 5.878929615020752, 6.1309332847595215, 6.382936477661133, 6.634939670562744, 6.8869428634643555, 7.138946533203125, 7.390949726104736, 7.642953395843506, 7.894956588745117, 8.146960258483887, 8.398963928222656, 8.65096664428711, 8.902970314025879, 9.154973983764648, 9.406976699829102, 9.658980369567871, 9.91098403930664, 10.162986755371094, 10.414990425109863, 10.666994094848633, 10.918996810913086, 11.171000480651855, 11.423004150390625, 11.675006866455078]}, "gradients/encoder.encoder.layers.10.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 2.0, 0.0, 0.0, 4.0, 0.0, 4.0, 1.0, 4.0, 9.0, 10.0, 4.0, 12.0, 14.0, 11.0, 19.0, 19.0, 20.0, 23.0, 24.0, 30.0, 28.0, 43.0, 32.0, 39.0, 50.0, 34.0, 56.0, 51.0, 42.0, 31.0, 28.0, 45.0, 36.0, 46.0, 28.0, 24.0, 37.0, 31.0, 29.0, 16.0, 18.0, 17.0, 12.0, 5.0, 7.0, 3.0, 5.0, 5.0, 2.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.00634765625, -2.904017925262451, -2.8016879558563232, -2.6993582248687744, -2.5970282554626465, -2.4946985244750977, -2.392368793487549, -2.2900390625, -2.187709093093872, -2.0853793621063232, -1.9830493927001953, -1.8807196617126465, -1.778389811515808, -1.6760599613189697, -1.573730230331421, -1.4714003801345825, -1.3690705299377441, -1.2667406797409058, -1.1644108295440674, -1.0620810985565186, -0.9597512483596802, -0.8574213981628418, -0.7550916075706482, -0.6527618169784546, -0.5504319667816162, -0.4481021463871002, -0.34577232599258423, -0.24344250559806824, -0.14111268520355225, -0.03878283500671387, 0.06354695558547974, 0.16587674617767334, 0.2682068347930908, 0.3705366551876068, 0.4728664755821228, 0.5751962661743164, 0.6775261163711548, 0.7798559665679932, 0.8821857571601868, 0.9845155477523804, 1.0868453979492188, 1.1891752481460571, 1.2915050983428955, 1.3938348293304443, 1.4961646795272827, 1.598494529724121, 1.70082426071167, 1.8031541109085083, 1.9054839611053467, 2.0078136920928955, 2.1101436614990234, 2.2124733924865723, 2.314803123474121, 2.417133092880249, 2.519462823867798, 2.621792793273926, 2.7241225242614746, 2.8264522552490234, 2.9287822246551514, 3.0311119556427, 3.133441925048828, 3.235771656036377, 3.338101387023926, 3.4404311180114746, 3.5427610874176025]}, "gradients/encoder.encoder.layers.10.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 3.0, 5.0, 10.0, 8.0, 15.0, 15.0, 17.0, 43.0, 57.0, 76.0, 98.0, 170.0, 235.0, 400.0, 605.0, 1060.0, 1973.0, 4018.0, 9196.0, 23491.0, 69331.0, 213637.0, 410239.0, 206894.0, 66358.0, 23177.0, 8952.0, 3920.0, 1886.0, 991.0, 581.0, 349.0, 236.0, 153.0, 112.0, 71.0, 46.0, 45.0, 17.0, 17.0, 16.0, 8.0, 9.0, 7.0, 2.0, 5.0, 6.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-2.365234375, -2.282196044921875, -2.19915771484375, -2.116119384765625, -2.0330810546875, -1.950042724609375, -1.86700439453125, -1.783966064453125, -1.700927734375, -1.617889404296875, -1.53485107421875, -1.451812744140625, -1.3687744140625, -1.285736083984375, -1.20269775390625, -1.119659423828125, -1.03662109375, -0.953582763671875, -0.87054443359375, -0.787506103515625, -0.7044677734375, -0.621429443359375, -0.53839111328125, -0.455352783203125, -0.372314453125, -0.289276123046875, -0.20623779296875, -0.123199462890625, -0.0401611328125, 0.042877197265625, 0.12591552734375, 0.208953857421875, 0.2919921875, 0.375030517578125, 0.45806884765625, 0.541107177734375, 0.6241455078125, 0.707183837890625, 0.79022216796875, 0.873260498046875, 0.956298828125, 1.039337158203125, 1.12237548828125, 1.205413818359375, 1.2884521484375, 1.371490478515625, 1.45452880859375, 1.537567138671875, 1.62060546875, 1.703643798828125, 1.78668212890625, 1.869720458984375, 1.9527587890625, 2.035797119140625, 2.11883544921875, 2.201873779296875, 2.284912109375, 2.367950439453125, 2.45098876953125, 2.534027099609375, 2.6170654296875, 2.700103759765625, 2.78314208984375, 2.866180419921875, 2.94921875]}, "gradients/encoder.encoder.layers.10.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 3.0, 1.0, 3.0, 5.0, 4.0, 8.0, 18.0, 20.0, 34.0, 45.0, 44.0, 54.0, 69.0, 69.0, 93.0, 98.0, 84.0, 62.0, 50.0, 56.0, 52.0, 36.0, 33.0, 9.0, 23.0, 10.0, 6.0, 8.0, 4.0, 1.0, 3.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.19140625, -2.1310882568359375, -2.070770263671875, -2.0104522705078125, -1.95013427734375, -1.8898162841796875, -1.829498291015625, -1.7691802978515625, -1.7088623046875, -1.6485443115234375, -1.588226318359375, -1.5279083251953125, -1.46759033203125, -1.4072723388671875, -1.346954345703125, -1.2866363525390625, -1.226318359375, -1.1660003662109375, -1.105682373046875, -1.0453643798828125, -0.98504638671875, -0.9247283935546875, -0.864410400390625, -0.8040924072265625, -0.7437744140625, -0.6834564208984375, -0.623138427734375, -0.5628204345703125, -0.50250244140625, -0.4421844482421875, -0.381866455078125, -0.3215484619140625, -0.26123046875, -0.2009124755859375, -0.140594482421875, -0.0802764892578125, -0.01995849609375, 0.0403594970703125, 0.100677490234375, 0.1609954833984375, 0.2213134765625, 0.2816314697265625, 0.341949462890625, 0.4022674560546875, 0.46258544921875, 0.5229034423828125, 0.583221435546875, 0.6435394287109375, 0.703857421875, 0.7641754150390625, 0.824493408203125, 0.8848114013671875, 0.94512939453125, 1.0054473876953125, 1.065765380859375, 1.1260833740234375, 1.1864013671875, 1.2467193603515625, 1.307037353515625, 1.3673553466796875, 1.42767333984375, 1.4879913330078125, 1.548309326171875, 1.6086273193359375, 1.6689453125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 4.0, 3.0, 2.0, 4.0, 2.0, 8.0, 5.0, 12.0, 37.0, 44.0, 81.0, 147.0, 294.0, 625.0, 1668.0, 5985.0, 30959.0, 336257.0, 602547.0, 56834.0, 9063.0, 2382.0, 849.0, 364.0, 157.0, 99.0, 53.0, 25.0, 14.0, 14.0, 9.0, 4.0, 7.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0], "bins": [-7.09765625, -6.8897705078125, -6.681884765625, -6.4739990234375, -6.26611328125, -6.0582275390625, -5.850341796875, -5.6424560546875, -5.4345703125, -5.2266845703125, -5.018798828125, -4.8109130859375, -4.60302734375, -4.3951416015625, -4.187255859375, -3.9793701171875, -3.771484375, -3.5635986328125, -3.355712890625, -3.1478271484375, -2.93994140625, -2.7320556640625, -2.524169921875, -2.3162841796875, -2.1083984375, -1.9005126953125, -1.692626953125, -1.4847412109375, -1.27685546875, -1.0689697265625, -0.861083984375, -0.6531982421875, -0.4453125, -0.2374267578125, -0.029541015625, 0.1783447265625, 0.38623046875, 0.5941162109375, 0.802001953125, 1.0098876953125, 1.2177734375, 1.4256591796875, 1.633544921875, 1.8414306640625, 2.04931640625, 2.2572021484375, 2.465087890625, 2.6729736328125, 2.880859375, 3.0887451171875, 3.296630859375, 3.5045166015625, 3.71240234375, 3.9202880859375, 4.128173828125, 4.3360595703125, 4.5439453125, 4.7518310546875, 4.959716796875, 5.1676025390625, 5.37548828125, 5.5833740234375, 5.791259765625, 5.9991455078125, 6.20703125]}, "gradients/encoder.encoder.layers.10.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 3.0, 4.0, 5.0, 7.0, 5.0, 7.0, 6.0, 10.0, 14.0, 13.0, 15.0, 17.0, 21.0, 31.0, 26.0, 29.0, 33.0, 44.0, 49.0, 49.0, 49.0, 54.0, 57.0, 58.0, 60.0, 42.0, 46.0, 42.0, 35.0, 39.0, 27.0, 20.0, 23.0, 16.0, 15.0, 9.0, 8.0, 6.0, 1.0, 1.0, 4.0, 2.0, 1.0, 2.0, 3.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-6.72265625, -6.5030517578125, -6.283447265625, -6.0638427734375, -5.84423828125, -5.6246337890625, -5.405029296875, -5.1854248046875, -4.9658203125, -4.7462158203125, -4.526611328125, -4.3070068359375, -4.08740234375, -3.8677978515625, -3.648193359375, -3.4285888671875, -3.208984375, -2.9893798828125, -2.769775390625, -2.5501708984375, -2.33056640625, -2.1109619140625, -1.891357421875, -1.6717529296875, -1.4521484375, -1.2325439453125, -1.012939453125, -0.7933349609375, -0.57373046875, -0.3541259765625, -0.134521484375, 0.0850830078125, 0.3046875, 0.5242919921875, 0.743896484375, 0.9635009765625, 1.18310546875, 1.4027099609375, 1.622314453125, 1.8419189453125, 2.0615234375, 2.2811279296875, 2.500732421875, 2.7203369140625, 2.93994140625, 3.1595458984375, 3.379150390625, 3.5987548828125, 3.818359375, 4.0379638671875, 4.257568359375, 4.4771728515625, 4.69677734375, 4.9163818359375, 5.135986328125, 5.3555908203125, 5.5751953125, 5.7947998046875, 6.014404296875, 6.2340087890625, 6.45361328125, 6.6732177734375, 6.892822265625, 7.1124267578125, 7.33203125]}, "gradients/encoder.encoder.layers.10.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 6.0, 11.0, 11.0, 14.0, 37.0, 70.0, 131.0, 292.0, 877.0, 3872.0, 92575.0, 930700.0, 17065.0, 1901.0, 561.0, 203.0, 103.0, 55.0, 26.0, 19.0, 16.0, 7.0, 2.0, 3.0, 3.0, 2.0, 1.0, 2.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.80859375, -6.62603759765625, -6.4434814453125, -6.26092529296875, -6.078369140625, -5.89581298828125, -5.7132568359375, -5.53070068359375, -5.34814453125, -5.16558837890625, -4.9830322265625, -4.80047607421875, -4.617919921875, -4.43536376953125, -4.2528076171875, -4.07025146484375, -3.8876953125, -3.70513916015625, -3.5225830078125, -3.34002685546875, -3.157470703125, -2.97491455078125, -2.7923583984375, -2.60980224609375, -2.42724609375, -2.24468994140625, -2.0621337890625, -1.87957763671875, -1.697021484375, -1.51446533203125, -1.3319091796875, -1.14935302734375, -0.966796875, -0.78424072265625, -0.6016845703125, -0.41912841796875, -0.236572265625, -0.05401611328125, 0.1285400390625, 0.31109619140625, 0.49365234375, 0.67620849609375, 0.8587646484375, 1.04132080078125, 1.223876953125, 1.40643310546875, 1.5889892578125, 1.77154541015625, 1.9541015625, 2.13665771484375, 2.3192138671875, 2.50177001953125, 2.684326171875, 2.86688232421875, 3.0494384765625, 3.23199462890625, 3.41455078125, 3.59710693359375, 3.7796630859375, 3.96221923828125, 4.144775390625, 4.32733154296875, 4.5098876953125, 4.69244384765625, 4.875]}, "gradients/encoder.encoder.layers.10.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 4.0, 7.0, 9.0, 15.0, 31.0, 64.0, 110.0, 202.0, 224.0, 162.0, 76.0, 59.0, 24.0, 16.0, 9.0, 7.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0006542205810546875, -0.0006339848041534424, -0.0006137490272521973, -0.0005935132503509521, -0.000573277473449707, -0.0005530416965484619, -0.0005328059196472168, -0.0005125701427459717, -0.0004923343658447266, -0.00047209858894348145, -0.00045186281204223633, -0.0004316270351409912, -0.0004113912582397461, -0.000391155481338501, -0.00037091970443725586, -0.00035068392753601074, -0.0003304481506347656, -0.0003102123737335205, -0.0002899765968322754, -0.0002697408199310303, -0.00024950504302978516, -0.00022926926612854004, -0.00020903348922729492, -0.0001887977123260498, -0.0001685619354248047, -0.00014832615852355957, -0.00012809038162231445, -0.00010785460472106934, -8.761882781982422e-05, -6.73830509185791e-05, -4.7147274017333984e-05, -2.6911497116088867e-05, -6.67572021484375e-06, 1.3560056686401367e-05, 3.3795833587646484e-05, 5.40316104888916e-05, 7.426738739013672e-05, 9.450316429138184e-05, 0.00011473894119262695, 0.00013497471809387207, 0.0001552104949951172, 0.0001754462718963623, 0.00019568204879760742, 0.00021591782569885254, 0.00023615360260009766, 0.0002563893795013428, 0.0002766251564025879, 0.000296860933303833, 0.0003170967102050781, 0.00033733248710632324, 0.00035756826400756836, 0.0003778040409088135, 0.0003980398178100586, 0.0004182755947113037, 0.00043851137161254883, 0.00045874714851379395, 0.00047898292541503906, 0.0004992187023162842, 0.0005194544792175293, 0.0005396902561187744, 0.0005599260330200195, 0.0005801618099212646, 0.0006003975868225098, 0.0006206333637237549, 0.000640869140625]}, "gradients/encoder.encoder.layers.10.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 2.0, 4.0, 4.0, 5.0, 16.0, 20.0, 38.0, 87.0, 280.0, 948.0, 6211.0, 473213.0, 559489.0, 6770.0, 1024.0, 266.0, 87.0, 47.0, 22.0, 12.0, 3.0, 7.0, 4.0, 2.0, 2.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.625, -6.4552001953125, -6.285400390625, -6.1156005859375, -5.94580078125, -5.7760009765625, -5.606201171875, -5.4364013671875, -5.2666015625, -5.0968017578125, -4.927001953125, -4.7572021484375, -4.58740234375, -4.4176025390625, -4.247802734375, -4.0780029296875, -3.908203125, -3.7384033203125, -3.568603515625, -3.3988037109375, -3.22900390625, -3.0592041015625, -2.889404296875, -2.7196044921875, -2.5498046875, -2.3800048828125, -2.210205078125, -2.0404052734375, -1.87060546875, -1.7008056640625, -1.531005859375, -1.3612060546875, -1.19140625, -1.0216064453125, -0.851806640625, -0.6820068359375, -0.51220703125, -0.3424072265625, -0.172607421875, -0.0028076171875, 0.1669921875, 0.3367919921875, 0.506591796875, 0.6763916015625, 0.84619140625, 1.0159912109375, 1.185791015625, 1.3555908203125, 1.525390625, 1.6951904296875, 1.864990234375, 2.0347900390625, 2.20458984375, 2.3743896484375, 2.544189453125, 2.7139892578125, 2.8837890625, 3.0535888671875, 3.223388671875, 3.3931884765625, 3.56298828125, 3.7327880859375, 3.902587890625, 4.0723876953125, 4.2421875]}, "gradients/encoder.encoder.layers.10.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 3.0, 6.0, 2.0, 7.0, 11.0, 16.0, 21.0, 43.0, 57.0, 74.0, 116.0, 122.0, 130.0, 97.0, 90.0, 77.0, 41.0, 26.0, 22.0, 19.0, 9.0, 12.0, 2.0, 4.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-4.19140625, -4.0869140625, -3.982421875, -3.8779296875, -3.7734375, -3.6689453125, -3.564453125, -3.4599609375, -3.35546875, -3.2509765625, -3.146484375, -3.0419921875, -2.9375, -2.8330078125, -2.728515625, -2.6240234375, -2.51953125, -2.4150390625, -2.310546875, -2.2060546875, -2.1015625, -1.9970703125, -1.892578125, -1.7880859375, -1.68359375, -1.5791015625, -1.474609375, -1.3701171875, -1.265625, -1.1611328125, -1.056640625, -0.9521484375, -0.84765625, -0.7431640625, -0.638671875, -0.5341796875, -0.4296875, -0.3251953125, -0.220703125, -0.1162109375, -0.01171875, 0.0927734375, 0.197265625, 0.3017578125, 0.40625, 0.5107421875, 0.615234375, 0.7197265625, 0.82421875, 0.9287109375, 1.033203125, 1.1376953125, 1.2421875, 1.3466796875, 1.451171875, 1.5556640625, 1.66015625, 1.7646484375, 1.869140625, 1.9736328125, 2.078125, 2.1826171875, 2.287109375, 2.3916015625, 2.49609375]}, "gradients/encoder.encoder.layers.10.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 2.0, 12.0, 23.0, 58.0, 120.0, 205.0, 219.0, 183.0, 104.0, 37.0, 21.0, 14.0, 4.0, 2.0, 2.0, 1.0, 0.0, 3.0, 2.0], "bins": [-101.10289001464844, -99.13160705566406, -97.16031646728516, -95.18903350830078, -93.2177505493164, -91.2464599609375, -89.27517700195312, -87.30389404296875, -85.33261108398438, -83.361328125, -81.3900375366211, -79.41875457763672, -77.44747161865234, -75.47618103027344, -73.50489807128906, -71.53361511230469, -69.56232452392578, -67.5910415649414, -65.6197509765625, -63.648468017578125, -61.67718505859375, -59.70589828491211, -57.73461151123047, -55.763328552246094, -53.79204177856445, -51.82075500488281, -49.84947204589844, -47.8781852722168, -45.906898498535156, -43.93561553955078, -41.96432876586914, -39.9930419921875, -38.02176284790039, -36.05047607421875, -34.079193115234375, -32.107906341552734, -30.136621475219727, -28.16533660888672, -26.194049835205078, -24.22276496887207, -22.251480102539062, -20.280195236206055, -18.308910369873047, -16.337623596191406, -14.366338729858398, -12.39505386352539, -10.423768043518066, -8.452482223510742, -6.481197357177734, -4.509912014007568, -2.5386266708374023, -0.5673413276672363, 1.4039440155029297, 3.3752288818359375, 5.346514701843262, 7.317800521850586, 9.289085388183594, 11.260370254516602, 13.231656074523926, 15.20294189453125, 17.174226760864258, 19.145511627197266, 21.116798400878906, 23.088083267211914, 25.059368133544922]}, "gradients/encoder.encoder.layers.10.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 5.0, 2.0, 4.0, 5.0, 3.0, 11.0, 11.0, 11.0, 13.0, 12.0, 21.0, 18.0, 18.0, 18.0, 26.0, 35.0, 31.0, 38.0, 41.0, 68.0, 50.0, 50.0, 56.0, 45.0, 51.0, 52.0, 47.0, 36.0, 27.0, 32.0, 32.0, 30.0, 16.0, 13.0, 13.0, 13.0, 13.0, 8.0, 7.0, 3.0, 8.0, 4.0, 4.0, 2.0, 2.0, 3.0, 1.0, 2.0, 1.0, 3.0], "bins": [-32.41179656982422, -31.51688003540039, -30.621965408325195, -29.72705078125, -28.832134246826172, -27.937217712402344, -27.04230308532715, -26.147388458251953, -25.252471923828125, -24.357555389404297, -23.4626407623291, -22.567726135253906, -21.672809600830078, -20.77789306640625, -19.882978439331055, -18.98806381225586, -18.09314727783203, -17.198230743408203, -16.303316116333008, -15.408400535583496, -14.513484954833984, -13.618569374084473, -12.723653793334961, -11.82873821258545, -10.933822631835938, -10.038907051086426, -9.143991470336914, -8.249075889587402, -7.354160308837891, -6.459244728088379, -5.564329147338867, -4.6694135665893555, -3.774496078491211, -2.879580497741699, -1.9846649169921875, -1.0897493362426758, -0.19483375549316406, 0.7000818252563477, 1.5949974060058594, 2.489912986755371, 3.384828567504883, 4.2797441482543945, 5.174659729003906, 6.069575309753418, 6.96449089050293, 7.859406471252441, 8.754322052001953, 9.649237632751465, 10.544153213500977, 11.439068794250488, 12.333984375, 13.228899955749512, 14.123815536499023, 15.018731117248535, 15.913646697998047, 16.808563232421875, 17.70347785949707, 18.598392486572266, 19.493309020996094, 20.388225555419922, 21.283140182495117, 22.178054809570312, 23.07297134399414, 23.96788787841797, 24.862802505493164]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 0.0, 2.0, 4.0, 5.0, 1.0, 3.0, 2.0, 7.0, 6.0, 15.0, 17.0, 21.0, 35.0, 55.0, 91.0, 191.0, 394.0, 1223.0, 8189.0, 4173585.0, 8234.0, 1380.0, 424.0, 204.0, 92.0, 41.0, 25.0, 20.0, 14.0, 8.0, 1.0, 2.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.375, -17.885009765625, -17.39501953125, -16.905029296875, -16.4150390625, -15.925048828125, -15.43505859375, -14.945068359375, -14.455078125, -13.965087890625, -13.47509765625, -12.985107421875, -12.4951171875, -12.005126953125, -11.51513671875, -11.025146484375, -10.53515625, -10.045166015625, -9.55517578125, -9.065185546875, -8.5751953125, -8.085205078125, -7.59521484375, -7.105224609375, -6.615234375, -6.125244140625, -5.63525390625, -5.145263671875, -4.6552734375, -4.165283203125, -3.67529296875, -3.185302734375, -2.6953125, -2.205322265625, -1.71533203125, -1.225341796875, -0.7353515625, -0.245361328125, 0.24462890625, 0.734619140625, 1.224609375, 1.714599609375, 2.20458984375, 2.694580078125, 3.1845703125, 3.674560546875, 4.16455078125, 4.654541015625, 5.14453125, 5.634521484375, 6.12451171875, 6.614501953125, 7.1044921875, 7.594482421875, 8.08447265625, 8.574462890625, 9.064453125, 9.554443359375, 10.04443359375, 10.534423828125, 11.0244140625, 11.514404296875, 12.00439453125, 12.494384765625, 12.984375]}, "gradients/encoder.encoder.layers.9.feed_forward.output_dense.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 5.0, 4.0, 1.0, 4.0, 4.0, 8.0, 8.0, 7.0, 13.0, 28.0, 37.0, 48.0, 65.0, 86.0, 80.0, 107.0, 102.0, 87.0, 80.0, 54.0, 57.0, 39.0, 19.0, 20.0, 11.0, 14.0, 7.0, 3.0, 3.0, 5.0, 1.0, 2.0, 3.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.302734375, -2.225677490234375, -2.14862060546875, -2.071563720703125, -1.9945068359375, -1.917449951171875, -1.84039306640625, -1.763336181640625, -1.686279296875, -1.609222412109375, -1.53216552734375, -1.455108642578125, -1.3780517578125, -1.300994873046875, -1.22393798828125, -1.146881103515625, -1.06982421875, -0.992767333984375, -0.91571044921875, -0.838653564453125, -0.7615966796875, -0.684539794921875, -0.60748291015625, -0.530426025390625, -0.453369140625, -0.376312255859375, -0.29925537109375, -0.222198486328125, -0.1451416015625, -0.068084716796875, 0.00897216796875, 0.086029052734375, 0.1630859375, 0.240142822265625, 0.31719970703125, 0.394256591796875, 0.4713134765625, 0.548370361328125, 0.62542724609375, 0.702484130859375, 0.779541015625, 0.856597900390625, 0.93365478515625, 1.010711669921875, 1.0877685546875, 1.164825439453125, 1.24188232421875, 1.318939208984375, 1.39599609375, 1.473052978515625, 1.55010986328125, 1.627166748046875, 1.7042236328125, 1.781280517578125, 1.85833740234375, 1.935394287109375, 2.012451171875, 2.089508056640625, 2.16656494140625, 2.243621826171875, 2.3206787109375, 2.397735595703125, 2.47479248046875, 2.551849365234375, 2.62890625]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 3.0, 3.0, 1.0, 2.0, 7.0, 7.0, 12.0, 16.0, 18.0, 29.0, 28.0, 39.0, 51.0, 64.0, 91.0, 116.0, 182.0, 216.0, 358.0, 542.0, 844.0, 1504.0, 2537.0, 5293.0, 13827.0, 135871.0, 4002343.0, 16931.0, 6025.0, 2913.0, 1576.0, 931.0, 583.0, 387.0, 264.0, 184.0, 132.0, 96.0, 63.0, 49.0, 44.0, 21.0, 18.0, 16.0, 13.0, 9.0, 10.0, 4.0, 7.0, 6.0, 5.0, 4.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-7.14453125, -6.921875, -6.69921875, -6.4765625, -6.25390625, -6.03125, -5.80859375, -5.5859375, -5.36328125, -5.140625, -4.91796875, -4.6953125, -4.47265625, -4.25, -4.02734375, -3.8046875, -3.58203125, -3.359375, -3.13671875, -2.9140625, -2.69140625, -2.46875, -2.24609375, -2.0234375, -1.80078125, -1.578125, -1.35546875, -1.1328125, -0.91015625, -0.6875, -0.46484375, -0.2421875, -0.01953125, 0.203125, 0.42578125, 0.6484375, 0.87109375, 1.09375, 1.31640625, 1.5390625, 1.76171875, 1.984375, 2.20703125, 2.4296875, 2.65234375, 2.875, 3.09765625, 3.3203125, 3.54296875, 3.765625, 3.98828125, 4.2109375, 4.43359375, 4.65625, 4.87890625, 5.1015625, 5.32421875, 5.546875, 5.76953125, 5.9921875, 6.21484375, 6.4375, 6.66015625, 6.8828125, 7.10546875]}, "gradients/encoder.encoder.layers.9.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 3.0, 2.0, 4.0, 1.0, 2.0, 4.0, 7.0, 8.0, 11.0, 18.0, 66.0, 3811.0, 81.0, 27.0, 12.0, 9.0, 6.0, 5.0, 2.0, 3.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.515625, -2.438262939453125, -2.36090087890625, -2.283538818359375, -2.2061767578125, -2.128814697265625, -2.05145263671875, -1.974090576171875, -1.896728515625, -1.819366455078125, -1.74200439453125, -1.664642333984375, -1.5872802734375, -1.509918212890625, -1.43255615234375, -1.355194091796875, -1.27783203125, -1.200469970703125, -1.12310791015625, -1.045745849609375, -0.9683837890625, -0.891021728515625, -0.81365966796875, -0.736297607421875, -0.658935546875, -0.581573486328125, -0.50421142578125, -0.426849365234375, -0.3494873046875, -0.272125244140625, -0.19476318359375, -0.117401123046875, -0.0400390625, 0.037322998046875, 0.11468505859375, 0.192047119140625, 0.2694091796875, 0.346771240234375, 0.42413330078125, 0.501495361328125, 0.578857421875, 0.656219482421875, 0.73358154296875, 0.810943603515625, 0.8883056640625, 0.965667724609375, 1.04302978515625, 1.120391845703125, 1.19775390625, 1.275115966796875, 1.35247802734375, 1.429840087890625, 1.5072021484375, 1.584564208984375, 1.66192626953125, 1.739288330078125, 1.816650390625, 1.894012451171875, 1.97137451171875, 2.048736572265625, 2.1260986328125, 2.203460693359375, 2.28082275390625, 2.358184814453125, 2.435546875]}, "gradients/encoder.encoder.layers.9.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 1.0, 7.0, 8.0, 18.0, 22.0, 45.0, 78.0, 108.0, 161.0, 179.0, 136.0, 91.0, 52.0, 47.0, 24.0, 13.0, 2.0, 6.0, 2.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.41562557220459, -4.199612617492676, -3.98360013961792, -3.767587423324585, -3.55157470703125, -3.335561752319336, -3.11954927444458, -2.903536319732666, -2.68752384185791, -2.471511125564575, -2.2554984092712402, -2.0394856929779053, -1.8234729766845703, -1.6074601411819458, -1.3914474248886108, -1.1754347085952759, -0.9594218730926514, -0.7434091567993164, -0.5273964405059814, -0.3113836646080017, -0.09537094831466675, 0.12064182758331299, 0.33665454387664795, 0.5526672601699829, 0.7686799764633179, 0.9846926927566528, 1.2007054090499878, 1.4167182445526123, 1.6327309608459473, 1.8487436771392822, 2.064756393432617, 2.280769109725952, 2.496781826019287, 2.712794542312622, 2.928807258605957, 3.144819974899292, 3.360832691192627, 3.576845645904541, 3.792858123779297, 4.008871078491211, 4.224883556365967, 4.440896511077881, 4.656908988952637, 4.872921943664551, 5.088934421539307, 5.304947376251221, 5.520959854125977, 5.736972808837891, 5.952985763549805, 6.168998718261719, 6.385011196136475, 6.601024150848389, 6.8170366287231445, 7.033049583435059, 7.2490620613098145, 7.4650750160217285, 7.681087493896484, 7.897100448608398, 8.113113403320312, 8.32912540435791, 8.545138359069824, 8.761151313781738, 8.977164268493652, 9.19317626953125, 9.409189224243164]}, "gradients/encoder.encoder.layers.9.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 4.0, 3.0, 3.0, 3.0, 7.0, 12.0, 10.0, 12.0, 13.0, 23.0, 19.0, 18.0, 23.0, 29.0, 28.0, 33.0, 22.0, 28.0, 36.0, 39.0, 41.0, 40.0, 41.0, 49.0, 40.0, 28.0, 44.0, 34.0, 37.0, 28.0, 29.0, 38.0, 27.0, 22.0, 24.0, 14.0, 16.0, 19.0, 12.0, 10.0, 9.0, 6.0, 5.0, 9.0, 7.0, 5.0, 2.0, 4.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 1.0, 1.0], "bins": [-2.6977663040161133, -2.6127142906188965, -2.5276622772216797, -2.442610263824463, -2.357558250427246, -2.27250599861145, -2.1874539852142334, -2.1024019718170166, -2.0173499584198, -1.932297945022583, -1.8472459316253662, -1.7621937990188599, -1.677141785621643, -1.5920897722244263, -1.50703763961792, -1.4219856262207031, -1.3369336128234863, -1.2518815994262695, -1.1668295860290527, -1.0817774534225464, -0.9967254400253296, -0.9116734266281128, -0.8266213536262512, -0.7415692806243896, -0.6565172672271729, -0.571465253829956, -0.4864131808280945, -0.4013611376285553, -0.3163090944290161, -0.23125705122947693, -0.14620500802993774, -0.06115293502807617, 0.023899078369140625, 0.10895112156867981, 0.194003164768219, 0.2790552079677582, 0.36410725116729736, 0.44915929436683655, 0.5342113375663757, 0.6192634105682373, 0.7043154239654541, 0.7893674373626709, 0.8744195103645325, 0.959471583366394, 1.0445235967636108, 1.1295756101608276, 1.214627742767334, 1.2996797561645508, 1.3847317695617676, 1.4697837829589844, 1.5548357963562012, 1.6398879289627075, 1.7249399423599243, 1.8099919557571411, 1.8950440883636475, 1.9800961017608643, 2.065148115158081, 2.150200128555298, 2.2352521419525146, 2.3203041553497314, 2.4053564071655273, 2.490408420562744, 2.575460433959961, 2.6605124473571777, 2.7455644607543945]}, "gradients/encoder.encoder.layers.9.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 2.0, 2.0, 0.0, 2.0, 3.0, 6.0, 4.0, 10.0, 6.0, 14.0, 14.0, 18.0, 29.0, 51.0, 57.0, 109.0, 187.0, 295.0, 545.0, 1267.0, 3575.0, 11530.0, 53305.0, 362240.0, 513143.0, 78689.0, 15763.0, 4509.0, 1642.0, 668.0, 353.0, 206.0, 123.0, 72.0, 30.0, 25.0, 16.0, 22.0, 6.0, 4.0, 8.0, 6.0, 3.0, 3.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.90234375, -5.7388916015625, -5.575439453125, -5.4119873046875, -5.24853515625, -5.0850830078125, -4.921630859375, -4.7581787109375, -4.5947265625, -4.4312744140625, -4.267822265625, -4.1043701171875, -3.94091796875, -3.7774658203125, -3.614013671875, -3.4505615234375, -3.287109375, -3.1236572265625, -2.960205078125, -2.7967529296875, -2.63330078125, -2.4698486328125, -2.306396484375, -2.1429443359375, -1.9794921875, -1.8160400390625, -1.652587890625, -1.4891357421875, -1.32568359375, -1.1622314453125, -0.998779296875, -0.8353271484375, -0.671875, -0.5084228515625, -0.344970703125, -0.1815185546875, -0.01806640625, 0.1453857421875, 0.308837890625, 0.4722900390625, 0.6357421875, 0.7991943359375, 0.962646484375, 1.1260986328125, 1.28955078125, 1.4530029296875, 1.616455078125, 1.7799072265625, 1.943359375, 2.1068115234375, 2.270263671875, 2.4337158203125, 2.59716796875, 2.7606201171875, 2.924072265625, 3.0875244140625, 3.2509765625, 3.4144287109375, 3.577880859375, 3.7413330078125, 3.90478515625, 4.0682373046875, 4.231689453125, 4.3951416015625, 4.55859375]}, "gradients/encoder.encoder.layers.9.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 2.0, 3.0, 4.0, 3.0, 5.0, 7.0, 14.0, 13.0, 8.0, 18.0, 40.0, 29.0, 47.0, 39.0, 77.0, 78.0, 65.0, 85.0, 82.0, 70.0, 57.0, 52.0, 41.0, 34.0, 28.0, 24.0, 20.0, 13.0, 15.0, 8.0, 6.0, 2.0, 10.0, 4.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.185546875, -2.1203460693359375, -2.055145263671875, -1.9899444580078125, -1.92474365234375, -1.8595428466796875, -1.794342041015625, -1.7291412353515625, -1.6639404296875, -1.5987396240234375, -1.533538818359375, -1.4683380126953125, -1.40313720703125, -1.3379364013671875, -1.272735595703125, -1.2075347900390625, -1.142333984375, -1.0771331787109375, -1.011932373046875, -0.9467315673828125, -0.88153076171875, -0.8163299560546875, -0.751129150390625, -0.6859283447265625, -0.6207275390625, -0.5555267333984375, -0.490325927734375, -0.4251251220703125, -0.35992431640625, -0.2947235107421875, -0.229522705078125, -0.1643218994140625, -0.09912109375, -0.0339202880859375, 0.031280517578125, 0.0964813232421875, 0.16168212890625, 0.2268829345703125, 0.292083740234375, 0.3572845458984375, 0.4224853515625, 0.4876861572265625, 0.552886962890625, 0.6180877685546875, 0.68328857421875, 0.7484893798828125, 0.813690185546875, 0.8788909912109375, 0.944091796875, 1.0092926025390625, 1.074493408203125, 1.1396942138671875, 1.20489501953125, 1.2700958251953125, 1.335296630859375, 1.4004974365234375, 1.4656982421875, 1.5308990478515625, 1.596099853515625, 1.6613006591796875, 1.72650146484375, 1.7917022705078125, 1.856903076171875, 1.9221038818359375, 1.9873046875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 4.0, 7.0, 9.0, 9.0, 17.0, 19.0, 27.0, 59.0, 75.0, 135.0, 314.0, 663.0, 1882.0, 7877.0, 50052.0, 543069.0, 398045.0, 37294.0, 6158.0, 1594.0, 633.0, 277.0, 142.0, 56.0, 34.0, 35.0, 22.0, 22.0, 8.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 1.0, 2.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.44140625, -6.233154296875, -6.02490234375, -5.816650390625, -5.6083984375, -5.400146484375, -5.19189453125, -4.983642578125, -4.775390625, -4.567138671875, -4.35888671875, -4.150634765625, -3.9423828125, -3.734130859375, -3.52587890625, -3.317626953125, -3.109375, -2.901123046875, -2.69287109375, -2.484619140625, -2.2763671875, -2.068115234375, -1.85986328125, -1.651611328125, -1.443359375, -1.235107421875, -1.02685546875, -0.818603515625, -0.6103515625, -0.402099609375, -0.19384765625, 0.014404296875, 0.22265625, 0.430908203125, 0.63916015625, 0.847412109375, 1.0556640625, 1.263916015625, 1.47216796875, 1.680419921875, 1.888671875, 2.096923828125, 2.30517578125, 2.513427734375, 2.7216796875, 2.929931640625, 3.13818359375, 3.346435546875, 3.5546875, 3.762939453125, 3.97119140625, 4.179443359375, 4.3876953125, 4.595947265625, 4.80419921875, 5.012451171875, 5.220703125, 5.428955078125, 5.63720703125, 5.845458984375, 6.0537109375, 6.261962890625, 6.47021484375, 6.678466796875, 6.88671875]}, "gradients/encoder.encoder.layers.9.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 2.0, 3.0, 1.0, 2.0, 4.0, 7.0, 7.0, 9.0, 16.0, 14.0, 23.0, 22.0, 44.0, 44.0, 35.0, 51.0, 53.0, 64.0, 82.0, 71.0, 51.0, 63.0, 54.0, 50.0, 48.0, 42.0, 37.0, 24.0, 24.0, 28.0, 8.0, 13.0, 9.0, 5.0, 2.0, 2.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-7.0546875, -6.7564697265625, -6.458251953125, -6.1600341796875, -5.86181640625, -5.5635986328125, -5.265380859375, -4.9671630859375, -4.6689453125, -4.3707275390625, -4.072509765625, -3.7742919921875, -3.47607421875, -3.1778564453125, -2.879638671875, -2.5814208984375, -2.283203125, -1.9849853515625, -1.686767578125, -1.3885498046875, -1.09033203125, -0.7921142578125, -0.493896484375, -0.1956787109375, 0.1025390625, 0.4007568359375, 0.698974609375, 0.9971923828125, 1.29541015625, 1.5936279296875, 1.891845703125, 2.1900634765625, 2.48828125, 2.7864990234375, 3.084716796875, 3.3829345703125, 3.68115234375, 3.9793701171875, 4.277587890625, 4.5758056640625, 4.8740234375, 5.1722412109375, 5.470458984375, 5.7686767578125, 6.06689453125, 6.3651123046875, 6.663330078125, 6.9615478515625, 7.259765625, 7.5579833984375, 7.856201171875, 8.1544189453125, 8.45263671875, 8.7508544921875, 9.049072265625, 9.3472900390625, 9.6455078125, 9.9437255859375, 10.241943359375, 10.5401611328125, 10.83837890625, 11.1365966796875, 11.434814453125, 11.7330322265625, 12.03125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 4.0, 3.0, 7.0, 6.0, 15.0, 15.0, 18.0, 34.0, 33.0, 91.0, 113.0, 219.0, 549.0, 1618.0, 12106.0, 583326.0, 437547.0, 10163.0, 1638.0, 501.0, 227.0, 119.0, 77.0, 54.0, 26.0, 13.0, 16.0, 9.0, 6.0, 5.0, 1.0, 3.0, 1.0, 0.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.88671875, -4.74285888671875, -4.5989990234375, -4.45513916015625, -4.311279296875, -4.16741943359375, -4.0235595703125, -3.87969970703125, -3.73583984375, -3.59197998046875, -3.4481201171875, -3.30426025390625, -3.160400390625, -3.01654052734375, -2.8726806640625, -2.72882080078125, -2.5849609375, -2.44110107421875, -2.2972412109375, -2.15338134765625, -2.009521484375, -1.86566162109375, -1.7218017578125, -1.57794189453125, -1.43408203125, -1.29022216796875, -1.1463623046875, -1.00250244140625, -0.858642578125, -0.71478271484375, -0.5709228515625, -0.42706298828125, -0.283203125, -0.13934326171875, 0.0045166015625, 0.14837646484375, 0.292236328125, 0.43609619140625, 0.5799560546875, 0.72381591796875, 0.86767578125, 1.01153564453125, 1.1553955078125, 1.29925537109375, 1.443115234375, 1.58697509765625, 1.7308349609375, 1.87469482421875, 2.0185546875, 2.16241455078125, 2.3062744140625, 2.45013427734375, 2.593994140625, 2.73785400390625, 2.8817138671875, 3.02557373046875, 3.16943359375, 3.31329345703125, 3.4571533203125, 3.60101318359375, 3.744873046875, 3.88873291015625, 4.0325927734375, 4.17645263671875, 4.3203125]}, "gradients/encoder.encoder.layers.9.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 7.0, 3.0, 4.0, 4.0, 10.0, 12.0, 16.0, 16.0, 18.0, 29.0, 43.0, 65.0, 66.0, 89.0, 92.0, 95.0, 74.0, 83.0, 68.0, 57.0, 40.0, 28.0, 26.0, 13.0, 16.0, 10.0, 11.0, 4.0, 1.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.0003323554992675781, -0.00032315775752067566, -0.0003139600157737732, -0.00030476227402687073, -0.00029556453227996826, -0.0002863667905330658, -0.00027716904878616333, -0.00026797130703926086, -0.0002587735652923584, -0.00024957582354545593, -0.00024037808179855347, -0.000231180340051651, -0.00022198259830474854, -0.00021278485655784607, -0.0002035871148109436, -0.00019438937306404114, -0.00018519163131713867, -0.0001759938895702362, -0.00016679614782333374, -0.00015759840607643127, -0.0001484006643295288, -0.00013920292258262634, -0.00013000518083572388, -0.00012080743908882141, -0.00011160969734191895, -0.00010241195559501648, -9.321421384811401e-05, -8.401647210121155e-05, -7.481873035430908e-05, -6.562098860740662e-05, -5.642324686050415e-05, -4.7225505113601685e-05, -3.802776336669922e-05, -2.8830021619796753e-05, -1.9632279872894287e-05, -1.0434538125991821e-05, -1.2367963790893555e-06, 7.96094536781311e-06, 1.7158687114715576e-05, 2.6356428861618042e-05, 3.555417060852051e-05, 4.4751912355422974e-05, 5.394965410232544e-05, 6.31473958492279e-05, 7.234513759613037e-05, 8.154287934303284e-05, 9.07406210899353e-05, 9.993836283683777e-05, 0.00010913610458374023, 0.0001183338463306427, 0.00012753158807754517, 0.00013672932982444763, 0.0001459270715713501, 0.00015512481331825256, 0.00016432255506515503, 0.0001735202968120575, 0.00018271803855895996, 0.00019191578030586243, 0.0002011135220527649, 0.00021031126379966736, 0.00021950900554656982, 0.0002287067472934723, 0.00023790448904037476, 0.0002471022307872772, 0.0002562999725341797]}, "gradients/encoder.encoder.layers.9.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 3.0, 0.0, 5.0, 7.0, 7.0, 12.0, 18.0, 14.0, 42.0, 50.0, 94.0, 157.0, 302.0, 686.0, 2013.0, 9640.0, 130107.0, 836979.0, 59710.0, 6067.0, 1498.0, 532.0, 217.0, 153.0, 88.0, 57.0, 31.0, 19.0, 12.0, 16.0, 5.0, 3.0, 4.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 1.0, 1.0, 1.0, 2.0], "bins": [-3.919921875, -3.817779541015625, -3.71563720703125, -3.613494873046875, -3.5113525390625, -3.409210205078125, -3.30706787109375, -3.204925537109375, -3.102783203125, -3.000640869140625, -2.89849853515625, -2.796356201171875, -2.6942138671875, -2.592071533203125, -2.48992919921875, -2.387786865234375, -2.28564453125, -2.183502197265625, -2.08135986328125, -1.979217529296875, -1.8770751953125, -1.774932861328125, -1.67279052734375, -1.570648193359375, -1.468505859375, -1.366363525390625, -1.26422119140625, -1.162078857421875, -1.0599365234375, -0.957794189453125, -0.85565185546875, -0.753509521484375, -0.6513671875, -0.549224853515625, -0.44708251953125, -0.344940185546875, -0.2427978515625, -0.140655517578125, -0.03851318359375, 0.063629150390625, 0.165771484375, 0.267913818359375, 0.37005615234375, 0.472198486328125, 0.5743408203125, 0.676483154296875, 0.77862548828125, 0.880767822265625, 0.98291015625, 1.085052490234375, 1.18719482421875, 1.289337158203125, 1.3914794921875, 1.493621826171875, 1.59576416015625, 1.697906494140625, 1.800048828125, 1.902191162109375, 2.00433349609375, 2.106475830078125, 2.2086181640625, 2.310760498046875, 2.41290283203125, 2.515045166015625, 2.6171875]}, "gradients/encoder.encoder.layers.9.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 5.0, 6.0, 11.0, 20.0, 24.0, 33.0, 55.0, 87.0, 129.0, 161.0, 154.0, 112.0, 78.0, 43.0, 34.0, 27.0, 15.0, 5.0, 3.0, 3.0, 2.0, 0.0, 2.0, 3.0, 1.0, 0.0, 0.0, 1.0], "bins": [-5.64453125, -5.521270751953125, -5.39801025390625, -5.274749755859375, -5.1514892578125, -5.028228759765625, -4.90496826171875, -4.781707763671875, -4.658447265625, -4.535186767578125, -4.41192626953125, -4.288665771484375, -4.1654052734375, -4.042144775390625, -3.91888427734375, -3.795623779296875, -3.67236328125, -3.549102783203125, -3.42584228515625, -3.302581787109375, -3.1793212890625, -3.056060791015625, -2.93280029296875, -2.809539794921875, -2.686279296875, -2.563018798828125, -2.43975830078125, -2.316497802734375, -2.1932373046875, -2.069976806640625, -1.94671630859375, -1.823455810546875, -1.7001953125, -1.576934814453125, -1.45367431640625, -1.330413818359375, -1.2071533203125, -1.083892822265625, -0.96063232421875, -0.837371826171875, -0.714111328125, -0.590850830078125, -0.46759033203125, -0.344329833984375, -0.2210693359375, -0.097808837890625, 0.02545166015625, 0.148712158203125, 0.27197265625, 0.395233154296875, 0.51849365234375, 0.641754150390625, 0.7650146484375, 0.888275146484375, 1.01153564453125, 1.134796142578125, 1.258056640625, 1.381317138671875, 1.50457763671875, 1.627838134765625, 1.7510986328125, 1.874359130859375, 1.99761962890625, 2.120880126953125, 2.244140625]}, "gradients/encoder.encoder.layers.9.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 4.0, 4.0, 15.0, 14.0, 35.0, 51.0, 88.0, 136.0, 146.0, 143.0, 144.0, 99.0, 53.0, 29.0, 23.0, 14.0, 4.0, 4.0, 3.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-61.3626708984375, -60.002540588378906, -58.64241027832031, -57.28227996826172, -55.922149658203125, -54.5620231628418, -53.2018928527832, -51.84176254272461, -50.481632232666016, -49.12150192260742, -47.76137161254883, -46.401241302490234, -45.041114807128906, -43.68098449707031, -42.32085418701172, -40.960723876953125, -39.60059356689453, -38.24046325683594, -36.880332946777344, -35.52020263671875, -34.160072326660156, -32.79994583129883, -31.439815521240234, -30.07968521118164, -28.719554901123047, -27.359424591064453, -25.99929428100586, -24.6391658782959, -23.279035568237305, -21.91890525817871, -20.55877685546875, -19.198646545410156, -17.838516235351562, -16.47838592529297, -15.118256568908691, -13.758127212524414, -12.39799690246582, -11.037866592407227, -9.67773723602295, -8.317607879638672, -6.957477569580078, -5.597347736358643, -4.237217903137207, -2.8770880699157715, -1.516958236694336, -0.1568284034729004, 1.2033014297485352, 2.5634307861328125, 3.9235610961914062, 5.283690929412842, 6.643820762634277, 8.003950119018555, 9.364080429077148, 10.724210739135742, 12.08434009552002, 13.444469451904297, 14.80459976196289, 16.164730072021484, 17.524860382080078, 18.88498878479004, 20.245119094848633, 21.605249404907227, 22.965377807617188, 24.32550811767578, 25.685638427734375]}, "gradients/encoder.encoder.layers.9.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 3.0, 1.0, 4.0, 3.0, 4.0, 1.0, 6.0, 3.0, 6.0, 7.0, 4.0, 9.0, 15.0, 9.0, 15.0, 22.0, 17.0, 21.0, 18.0, 27.0, 24.0, 33.0, 39.0, 42.0, 44.0, 50.0, 50.0, 49.0, 55.0, 37.0, 44.0, 35.0, 36.0, 38.0, 30.0, 27.0, 30.0, 24.0, 22.0, 17.0, 15.0, 15.0, 13.0, 8.0, 7.0, 4.0, 6.0, 7.0, 6.0, 2.0, 5.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-25.166027069091797, -24.3118953704834, -23.457763671875, -22.6036319732666, -21.749500274658203, -20.895366668701172, -20.041234970092773, -19.187103271484375, -18.332971572875977, -17.478839874267578, -16.62470817565918, -15.770575523376465, -14.916443824768066, -14.062312126159668, -13.208179473876953, -12.354047775268555, -11.499916076660156, -10.645784378051758, -9.79165267944336, -8.937520027160645, -8.083388328552246, -7.229256629943848, -6.375124454498291, -5.520992279052734, -4.666860580444336, -3.8127286434173584, -2.958596706390381, -2.1044647693634033, -1.2503328323364258, -0.39620113372802734, 0.4579310417175293, 1.312063217163086, 2.1661930084228516, 3.020324945449829, 3.8744568824768066, 4.728589057922363, 5.582720756530762, 6.43685245513916, 7.290984630584717, 8.145116806030273, 8.999248504638672, 9.85338020324707, 10.707511901855469, 11.561644554138184, 12.415776252746582, 13.26990795135498, 14.124040603637695, 14.978172302246094, 15.832304000854492, 16.68643569946289, 17.54056739807129, 18.394699096679688, 19.24883270263672, 20.102962493896484, 20.957096099853516, 21.811227798461914, 22.665359497070312, 23.51949119567871, 24.37362289428711, 25.227754592895508, 26.081886291503906, 26.936019897460938, 27.790151596069336, 28.644283294677734, 29.498414993286133]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 1.0, 3.0, 2.0, 5.0, 7.0, 7.0, 5.0, 8.0, 9.0, 15.0, 19.0, 26.0, 35.0, 51.0, 76.0, 118.0, 195.0, 328.0, 622.0, 1301.0, 3325.0, 11223.0, 3986869.0, 174877.0, 9544.0, 3031.0, 1296.0, 596.0, 279.0, 174.0, 82.0, 61.0, 39.0, 19.0, 12.0, 14.0, 7.0, 5.0, 6.0, 0.0, 0.0, 1.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.98828125, -6.7823486328125, -6.576416015625, -6.3704833984375, -6.16455078125, -5.9586181640625, -5.752685546875, -5.5467529296875, -5.3408203125, -5.1348876953125, -4.928955078125, -4.7230224609375, -4.51708984375, -4.3111572265625, -4.105224609375, -3.8992919921875, -3.693359375, -3.4874267578125, -3.281494140625, -3.0755615234375, -2.86962890625, -2.6636962890625, -2.457763671875, -2.2518310546875, -2.0458984375, -1.8399658203125, -1.634033203125, -1.4281005859375, -1.22216796875, -1.0162353515625, -0.810302734375, -0.6043701171875, -0.3984375, -0.1925048828125, 0.013427734375, 0.2193603515625, 0.42529296875, 0.6312255859375, 0.837158203125, 1.0430908203125, 1.2490234375, 1.4549560546875, 1.660888671875, 1.8668212890625, 2.07275390625, 2.2786865234375, 2.484619140625, 2.6905517578125, 2.896484375, 3.1024169921875, 3.308349609375, 3.5142822265625, 3.72021484375, 3.9261474609375, 4.132080078125, 4.3380126953125, 4.5439453125, 4.7498779296875, 4.955810546875, 5.1617431640625, 5.36767578125, 5.5736083984375, 5.779541015625, 5.9854736328125, 6.19140625]}, "gradients/encoder.encoder.layers.8.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 6.0, 11.0, 9.0, 13.0, 28.0, 30.0, 40.0, 54.0, 76.0, 91.0, 89.0, 90.0, 101.0, 83.0, 74.0, 54.0, 41.0, 30.0, 24.0, 11.0, 13.0, 8.0, 10.0, 6.0, 3.0, 4.0, 3.0, 3.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.876953125, -2.798309326171875, -2.71966552734375, -2.641021728515625, -2.5623779296875, -2.483734130859375, -2.40509033203125, -2.326446533203125, -2.247802734375, -2.169158935546875, -2.09051513671875, -2.011871337890625, -1.9332275390625, -1.854583740234375, -1.77593994140625, -1.697296142578125, -1.61865234375, -1.540008544921875, -1.46136474609375, -1.382720947265625, -1.3040771484375, -1.225433349609375, -1.14678955078125, -1.068145751953125, -0.989501953125, -0.910858154296875, -0.83221435546875, -0.753570556640625, -0.6749267578125, -0.596282958984375, -0.51763916015625, -0.438995361328125, -0.3603515625, -0.281707763671875, -0.20306396484375, -0.124420166015625, -0.0457763671875, 0.032867431640625, 0.11151123046875, 0.190155029296875, 0.268798828125, 0.347442626953125, 0.42608642578125, 0.504730224609375, 0.5833740234375, 0.662017822265625, 0.74066162109375, 0.819305419921875, 0.89794921875, 0.976593017578125, 1.05523681640625, 1.133880615234375, 1.2125244140625, 1.291168212890625, 1.36981201171875, 1.448455810546875, 1.527099609375, 1.605743408203125, 1.68438720703125, 1.763031005859375, 1.8416748046875, 1.920318603515625, 1.99896240234375, 2.077606201171875, 2.15625]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 1.0, 4.0, 5.0, 9.0, 10.0, 17.0, 18.0, 46.0, 57.0, 80.0, 97.0, 136.0, 206.0, 285.0, 419.0, 658.0, 1031.0, 1733.0, 3210.0, 6236.0, 14456.0, 67636.0, 4013651.0, 57105.0, 13449.0, 6031.0, 2964.0, 1705.0, 1012.0, 629.0, 443.0, 283.0, 204.0, 132.0, 90.0, 71.0, 36.0, 33.0, 37.0, 18.0, 12.0, 5.0, 5.0, 3.0, 9.0, 3.0, 1.0, 3.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-4.0390625, -3.9019775390625, -3.764892578125, -3.6278076171875, -3.49072265625, -3.3536376953125, -3.216552734375, -3.0794677734375, -2.9423828125, -2.8052978515625, -2.668212890625, -2.5311279296875, -2.39404296875, -2.2569580078125, -2.119873046875, -1.9827880859375, -1.845703125, -1.7086181640625, -1.571533203125, -1.4344482421875, -1.29736328125, -1.1602783203125, -1.023193359375, -0.8861083984375, -0.7490234375, -0.6119384765625, -0.474853515625, -0.3377685546875, -0.20068359375, -0.0635986328125, 0.073486328125, 0.2105712890625, 0.34765625, 0.4847412109375, 0.621826171875, 0.7589111328125, 0.89599609375, 1.0330810546875, 1.170166015625, 1.3072509765625, 1.4443359375, 1.5814208984375, 1.718505859375, 1.8555908203125, 1.99267578125, 2.1297607421875, 2.266845703125, 2.4039306640625, 2.541015625, 2.6781005859375, 2.815185546875, 2.9522705078125, 3.08935546875, 3.2264404296875, 3.363525390625, 3.5006103515625, 3.6376953125, 3.7747802734375, 3.911865234375, 4.0489501953125, 4.18603515625, 4.3231201171875, 4.460205078125, 4.5972900390625, 4.734375]}, "gradients/encoder.encoder.layers.8.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 3.0, 6.0, 3.0, 9.0, 8.0, 20.0, 38.0, 98.0, 3479.0, 258.0, 51.0, 32.0, 16.0, 15.0, 9.0, 10.0, 4.0, 1.0, 4.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.1328125, -2.049957275390625, -1.96710205078125, -1.884246826171875, -1.8013916015625, -1.718536376953125, -1.63568115234375, -1.552825927734375, -1.469970703125, -1.387115478515625, -1.30426025390625, -1.221405029296875, -1.1385498046875, -1.055694580078125, -0.97283935546875, -0.889984130859375, -0.80712890625, -0.724273681640625, -0.64141845703125, -0.558563232421875, -0.4757080078125, -0.392852783203125, -0.30999755859375, -0.227142333984375, -0.144287109375, -0.061431884765625, 0.02142333984375, 0.104278564453125, 0.1871337890625, 0.269989013671875, 0.35284423828125, 0.435699462890625, 0.5185546875, 0.601409912109375, 0.68426513671875, 0.767120361328125, 0.8499755859375, 0.932830810546875, 1.01568603515625, 1.098541259765625, 1.181396484375, 1.264251708984375, 1.34710693359375, 1.429962158203125, 1.5128173828125, 1.595672607421875, 1.67852783203125, 1.761383056640625, 1.84423828125, 1.927093505859375, 2.00994873046875, 2.092803955078125, 2.1756591796875, 2.258514404296875, 2.34136962890625, 2.424224853515625, 2.507080078125, 2.589935302734375, 2.67279052734375, 2.755645751953125, 2.8385009765625, 2.921356201171875, 3.00421142578125, 3.087066650390625, 3.169921875]}, "gradients/encoder.encoder.layers.8.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 1.0, 7.0, 12.0, 26.0, 28.0, 63.0, 106.0, 146.0, 161.0, 149.0, 128.0, 70.0, 32.0, 28.0, 15.0, 8.0, 5.0, 4.0, 5.0, 3.0, 2.0, 2.0, 2.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.927201271057129, -6.6313910484313965, -6.335580348968506, -6.039770126342773, -5.743959426879883, -5.44814920425415, -5.152338981628418, -4.856528282165527, -4.560718059539795, -4.2649078369140625, -3.969097137451172, -3.6732869148254395, -3.377476453781128, -3.0816659927368164, -2.785855770111084, -2.4900453090667725, -2.194234848022461, -1.8984243869781494, -1.6026140451431274, -1.3068037033081055, -1.010993242263794, -0.7151827812194824, -0.41937243938446045, -0.12356209754943848, 0.17224836349487305, 0.4680587649345398, 0.7638691663742065, 1.0596795082092285, 1.35548996925354, 1.6513004302978516, 1.9471107721328735, 2.2429211139678955, 2.5387325286865234, 2.834542989730835, 3.1303534507751465, 3.426163673400879, 3.7219741344451904, 4.017784595489502, 4.313594818115234, 4.609405517578125, 4.905215740203857, 5.20102596282959, 5.4968366622924805, 5.792646884918213, 6.088457107543945, 6.384267807006836, 6.680078029632568, 6.975888252258301, 7.271698951721191, 7.567509174346924, 7.8633198738098145, 8.159130096435547, 8.454940795898438, 8.750751495361328, 9.046561241149902, 9.342371940612793, 9.638181686401367, 9.933992385864258, 10.229802131652832, 10.525612831115723, 10.821423530578613, 11.117233276367188, 11.413043975830078, 11.708854675292969, 12.00466537475586]}, "gradients/encoder.encoder.layers.8.final_layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 3.0, 0.0, 1.0, 0.0, 3.0, 1.0, 9.0, 7.0, 7.0, 8.0, 14.0, 12.0, 16.0, 17.0, 17.0, 27.0, 33.0, 37.0, 45.0, 53.0, 40.0, 45.0, 62.0, 64.0, 60.0, 50.0, 47.0, 57.0, 48.0, 38.0, 29.0, 29.0, 20.0, 30.0, 20.0, 12.0, 16.0, 4.0, 8.0, 4.0, 7.0, 3.0, 5.0, 5.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.17314338684082, -4.01095724105835, -3.8487708568573, -3.686584711074829, -3.5243985652923584, -3.3622121810913086, -3.200026035308838, -3.037839889526367, -2.8756537437438965, -2.713467597961426, -2.551281213760376, -2.3890950679779053, -2.2269089221954346, -2.0647225379943848, -1.902536392211914, -1.7403502464294434, -1.5781638622283936, -1.4159775972366333, -1.2537914514541626, -1.0916051864624023, -0.9294189810752869, -0.7672327756881714, -0.6050465106964111, -0.44286036491394043, -0.2806740999221802, -0.1184878796339035, 0.04369834065437317, 0.20588457584381104, 0.3680707812309265, 0.530256986618042, 0.6924432516098022, 0.854629397392273, 1.0168156623840332, 1.1790019273757935, 1.3411880731582642, 1.5033743381500244, 1.6655604839324951, 1.8277467489242554, 1.9899330139160156, 2.1521191596984863, 2.314305305480957, 2.4764914512634277, 2.6386778354644775, 2.8008639812469482, 2.963050127029419, 3.1252365112304688, 3.2874226570129395, 3.44960880279541, 3.61179518699646, 3.7739813327789307, 3.9361677169799805, 4.098353862762451, 4.260540008544922, 4.422726154327393, 4.584912300109863, 4.747098922729492, 4.909285068511963, 5.071471214294434, 5.233657360076904, 5.395843505859375, 5.558030128479004, 5.720216274261475, 5.882402420043945, 6.044588565826416, 6.206774711608887]}, "gradients/encoder.encoder.layers.8.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 4.0, 4.0, 10.0, 13.0, 16.0, 19.0, 68.0, 79.0, 155.0, 292.0, 572.0, 1298.0, 3350.0, 11206.0, 50079.0, 302517.0, 544102.0, 105466.0, 20244.0, 5467.0, 1903.0, 811.0, 382.0, 236.0, 100.0, 62.0, 36.0, 25.0, 15.0, 9.0, 4.0, 5.0, 4.0, 0.0, 3.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.19921875, -5.03265380859375, -4.8660888671875, -4.69952392578125, -4.532958984375, -4.36639404296875, -4.1998291015625, -4.03326416015625, -3.86669921875, -3.70013427734375, -3.5335693359375, -3.36700439453125, -3.200439453125, -3.03387451171875, -2.8673095703125, -2.70074462890625, -2.5341796875, -2.36761474609375, -2.2010498046875, -2.03448486328125, -1.867919921875, -1.70135498046875, -1.5347900390625, -1.36822509765625, -1.20166015625, -1.03509521484375, -0.8685302734375, -0.70196533203125, -0.535400390625, -0.36883544921875, -0.2022705078125, -0.03570556640625, 0.130859375, 0.29742431640625, 0.4639892578125, 0.63055419921875, 0.797119140625, 0.96368408203125, 1.1302490234375, 1.29681396484375, 1.46337890625, 1.62994384765625, 1.7965087890625, 1.96307373046875, 2.129638671875, 2.29620361328125, 2.4627685546875, 2.62933349609375, 2.7958984375, 2.96246337890625, 3.1290283203125, 3.29559326171875, 3.462158203125, 3.62872314453125, 3.7952880859375, 3.96185302734375, 4.12841796875, 4.29498291015625, 4.4615478515625, 4.62811279296875, 4.794677734375, 4.96124267578125, 5.1278076171875, 5.29437255859375, 5.4609375]}, "gradients/encoder.encoder.layers.8.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 2.0, 8.0, 15.0, 10.0, 11.0, 24.0, 25.0, 42.0, 40.0, 69.0, 89.0, 85.0, 104.0, 87.0, 85.0, 75.0, 54.0, 50.0, 35.0, 27.0, 14.0, 16.0, 9.0, 11.0, 8.0, 5.0, 5.0, 2.0, 3.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-3.248046875, -3.166839599609375, -3.08563232421875, -3.004425048828125, -2.9232177734375, -2.842010498046875, -2.76080322265625, -2.679595947265625, -2.598388671875, -2.517181396484375, -2.43597412109375, -2.354766845703125, -2.2735595703125, -2.192352294921875, -2.11114501953125, -2.029937744140625, -1.94873046875, -1.867523193359375, -1.78631591796875, -1.705108642578125, -1.6239013671875, -1.542694091796875, -1.46148681640625, -1.380279541015625, -1.299072265625, -1.217864990234375, -1.13665771484375, -1.055450439453125, -0.9742431640625, -0.893035888671875, -0.81182861328125, -0.730621337890625, -0.6494140625, -0.568206787109375, -0.48699951171875, -0.405792236328125, -0.3245849609375, -0.243377685546875, -0.16217041015625, -0.080963134765625, 0.000244140625, 0.081451416015625, 0.16265869140625, 0.243865966796875, 0.3250732421875, 0.406280517578125, 0.48748779296875, 0.568695068359375, 0.64990234375, 0.731109619140625, 0.81231689453125, 0.893524169921875, 0.9747314453125, 1.055938720703125, 1.13714599609375, 1.218353271484375, 1.299560546875, 1.380767822265625, 1.46197509765625, 1.543182373046875, 1.6243896484375, 1.705596923828125, 1.78680419921875, 1.868011474609375, 1.94921875]}, "gradients/encoder.encoder.layers.8.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 5.0, 8.0, 5.0, 9.0, 20.0, 35.0, 35.0, 64.0, 82.0, 182.0, 320.0, 801.0, 1764.0, 6091.0, 31543.0, 320423.0, 611255.0, 61617.0, 9773.0, 2627.0, 912.0, 446.0, 232.0, 98.0, 76.0, 31.0, 33.0, 25.0, 13.0, 14.0, 10.0, 6.0, 4.0, 3.0, 1.0, 3.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-6.2578125, -6.043212890625, -5.82861328125, -5.614013671875, -5.3994140625, -5.184814453125, -4.97021484375, -4.755615234375, -4.541015625, -4.326416015625, -4.11181640625, -3.897216796875, -3.6826171875, -3.468017578125, -3.25341796875, -3.038818359375, -2.82421875, -2.609619140625, -2.39501953125, -2.180419921875, -1.9658203125, -1.751220703125, -1.53662109375, -1.322021484375, -1.107421875, -0.892822265625, -0.67822265625, -0.463623046875, -0.2490234375, -0.034423828125, 0.18017578125, 0.394775390625, 0.609375, 0.823974609375, 1.03857421875, 1.253173828125, 1.4677734375, 1.682373046875, 1.89697265625, 2.111572265625, 2.326171875, 2.540771484375, 2.75537109375, 2.969970703125, 3.1845703125, 3.399169921875, 3.61376953125, 3.828369140625, 4.04296875, 4.257568359375, 4.47216796875, 4.686767578125, 4.9013671875, 5.115966796875, 5.33056640625, 5.545166015625, 5.759765625, 5.974365234375, 6.18896484375, 6.403564453125, 6.6181640625, 6.832763671875, 7.04736328125, 7.261962890625, 7.4765625]}, "gradients/encoder.encoder.layers.8.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 0.0, 0.0, 1.0, 0.0, 5.0, 7.0, 3.0, 7.0, 15.0, 15.0, 20.0, 20.0, 35.0, 34.0, 37.0, 59.0, 63.0, 61.0, 57.0, 80.0, 84.0, 68.0, 68.0, 65.0, 42.0, 42.0, 35.0, 26.0, 14.0, 11.0, 15.0, 5.0, 4.0, 6.0, 4.0, 1.0, 2.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.4609375, -9.1510009765625, -8.841064453125, -8.5311279296875, -8.22119140625, -7.9112548828125, -7.601318359375, -7.2913818359375, -6.9814453125, -6.6715087890625, -6.361572265625, -6.0516357421875, -5.74169921875, -5.4317626953125, -5.121826171875, -4.8118896484375, -4.501953125, -4.1920166015625, -3.882080078125, -3.5721435546875, -3.26220703125, -2.9522705078125, -2.642333984375, -2.3323974609375, -2.0224609375, -1.7125244140625, -1.402587890625, -1.0926513671875, -0.78271484375, -0.4727783203125, -0.162841796875, 0.1470947265625, 0.45703125, 0.7669677734375, 1.076904296875, 1.3868408203125, 1.69677734375, 2.0067138671875, 2.316650390625, 2.6265869140625, 2.9365234375, 3.2464599609375, 3.556396484375, 3.8663330078125, 4.17626953125, 4.4862060546875, 4.796142578125, 5.1060791015625, 5.416015625, 5.7259521484375, 6.035888671875, 6.3458251953125, 6.65576171875, 6.9656982421875, 7.275634765625, 7.5855712890625, 7.8955078125, 8.2054443359375, 8.515380859375, 8.8253173828125, 9.13525390625, 9.4451904296875, 9.755126953125, 10.0650634765625, 10.375]}, "gradients/encoder.encoder.layers.8.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 3.0, 6.0, 10.0, 6.0, 8.0, 11.0, 14.0, 23.0, 22.0, 44.0, 69.0, 100.0, 202.0, 361.0, 859.0, 2760.0, 13867.0, 211604.0, 767637.0, 42835.0, 5330.0, 1500.0, 588.0, 281.0, 151.0, 92.0, 68.0, 34.0, 20.0, 18.0, 10.0, 6.0, 5.0, 4.0, 4.0, 1.0, 1.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.34765625, -2.261474609375, -2.17529296875, -2.089111328125, -2.0029296875, -1.916748046875, -1.83056640625, -1.744384765625, -1.658203125, -1.572021484375, -1.48583984375, -1.399658203125, -1.3134765625, -1.227294921875, -1.14111328125, -1.054931640625, -0.96875, -0.882568359375, -0.79638671875, -0.710205078125, -0.6240234375, -0.537841796875, -0.45166015625, -0.365478515625, -0.279296875, -0.193115234375, -0.10693359375, -0.020751953125, 0.0654296875, 0.151611328125, 0.23779296875, 0.323974609375, 0.41015625, 0.496337890625, 0.58251953125, 0.668701171875, 0.7548828125, 0.841064453125, 0.92724609375, 1.013427734375, 1.099609375, 1.185791015625, 1.27197265625, 1.358154296875, 1.4443359375, 1.530517578125, 1.61669921875, 1.702880859375, 1.7890625, 1.875244140625, 1.96142578125, 2.047607421875, 2.1337890625, 2.219970703125, 2.30615234375, 2.392333984375, 2.478515625, 2.564697265625, 2.65087890625, 2.737060546875, 2.8232421875, 2.909423828125, 2.99560546875, 3.081787109375, 3.16796875]}, "gradients/encoder.encoder.layers.8.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 3.0, 3.0, 4.0, 9.0, 2.0, 6.0, 13.0, 9.0, 23.0, 30.0, 46.0, 69.0, 75.0, 111.0, 100.0, 138.0, 98.0, 72.0, 50.0, 44.0, 26.0, 22.0, 20.0, 12.0, 8.0, 6.0, 4.0, 4.0, 0.0, 5.0, 0.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.000278472900390625, -0.00026776641607284546, -0.0002570599317550659, -0.0002463534474372864, -0.00023564696311950684, -0.0002249404788017273, -0.00021423399448394775, -0.0002035275101661682, -0.00019282102584838867, -0.00018211454153060913, -0.0001714080572128296, -0.00016070157289505005, -0.0001499950885772705, -0.00013928860425949097, -0.00012858211994171143, -0.00011787563562393188, -0.00010716915130615234, -9.64626669883728e-05, -8.575618267059326e-05, -7.504969835281372e-05, -6.434321403503418e-05, -5.363672971725464e-05, -4.29302453994751e-05, -3.222376108169556e-05, -2.1517276763916016e-05, -1.0810792446136475e-05, -1.043081283569336e-07, 1.0602176189422607e-05, 2.130866050720215e-05, 3.201514482498169e-05, 4.272162914276123e-05, 5.342811346054077e-05, 6.413459777832031e-05, 7.484108209609985e-05, 8.55475664138794e-05, 9.625405073165894e-05, 0.00010696053504943848, 0.00011766701936721802, 0.00012837350368499756, 0.0001390799880027771, 0.00014978647232055664, 0.00016049295663833618, 0.00017119944095611572, 0.00018190592527389526, 0.0001926124095916748, 0.00020331889390945435, 0.0002140253782272339, 0.00022473186254501343, 0.00023543834686279297, 0.0002461448311805725, 0.00025685131549835205, 0.0002675577998161316, 0.00027826428413391113, 0.0002889707684516907, 0.0002996772527694702, 0.00031038373708724976, 0.0003210902214050293, 0.00033179670572280884, 0.0003425031900405884, 0.0003532096743583679, 0.00036391615867614746, 0.000374622642993927, 0.00038532912731170654, 0.0003960356116294861, 0.0004067420959472656]}, "gradients/encoder.encoder.layers.8.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 3.0, 1.0, 5.0, 1.0, 3.0, 3.0, 6.0, 8.0, 15.0, 22.0, 27.0, 59.0, 84.0, 186.0, 337.0, 680.0, 1822.0, 6754.0, 50257.0, 745389.0, 221314.0, 16083.0, 3376.0, 1078.0, 482.0, 255.0, 133.0, 56.0, 50.0, 26.0, 19.0, 4.0, 6.0, 6.0, 3.0, 6.0, 0.0, 2.0, 1.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 1.0], "bins": [-2.14453125, -2.064361572265625, -1.98419189453125, -1.904022216796875, -1.8238525390625, -1.743682861328125, -1.66351318359375, -1.583343505859375, -1.503173828125, -1.423004150390625, -1.34283447265625, -1.262664794921875, -1.1824951171875, -1.102325439453125, -1.02215576171875, -0.941986083984375, -0.86181640625, -0.781646728515625, -0.70147705078125, -0.621307373046875, -0.5411376953125, -0.460968017578125, -0.38079833984375, -0.300628662109375, -0.220458984375, -0.140289306640625, -0.06011962890625, 0.020050048828125, 0.1002197265625, 0.180389404296875, 0.26055908203125, 0.340728759765625, 0.4208984375, 0.501068115234375, 0.58123779296875, 0.661407470703125, 0.7415771484375, 0.821746826171875, 0.90191650390625, 0.982086181640625, 1.062255859375, 1.142425537109375, 1.22259521484375, 1.302764892578125, 1.3829345703125, 1.463104248046875, 1.54327392578125, 1.623443603515625, 1.70361328125, 1.783782958984375, 1.86395263671875, 1.944122314453125, 2.0242919921875, 2.104461669921875, 2.18463134765625, 2.264801025390625, 2.344970703125, 2.425140380859375, 2.50531005859375, 2.585479736328125, 2.6656494140625, 2.745819091796875, 2.82598876953125, 2.906158447265625, 2.986328125]}, "gradients/encoder.encoder.layers.8.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 0.0, 10.0, 6.0, 14.0, 27.0, 51.0, 92.0, 109.0, 166.0, 150.0, 163.0, 84.0, 56.0, 34.0, 23.0, 5.0, 9.0, 4.0, 3.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.37109375, -3.255859375, -3.140625, -3.025390625, -2.91015625, -2.794921875, -2.6796875, -2.564453125, -2.44921875, -2.333984375, -2.21875, -2.103515625, -1.98828125, -1.873046875, -1.7578125, -1.642578125, -1.52734375, -1.412109375, -1.296875, -1.181640625, -1.06640625, -0.951171875, -0.8359375, -0.720703125, -0.60546875, -0.490234375, -0.375, -0.259765625, -0.14453125, -0.029296875, 0.0859375, 0.201171875, 0.31640625, 0.431640625, 0.546875, 0.662109375, 0.77734375, 0.892578125, 1.0078125, 1.123046875, 1.23828125, 1.353515625, 1.46875, 1.583984375, 1.69921875, 1.814453125, 1.9296875, 2.044921875, 2.16015625, 2.275390625, 2.390625, 2.505859375, 2.62109375, 2.736328125, 2.8515625, 2.966796875, 3.08203125, 3.197265625, 3.3125, 3.427734375, 3.54296875, 3.658203125, 3.7734375, 3.888671875, 4.00390625]}, "gradients/encoder.encoder.layers.8.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 4.0, 3.0, 7.0, 16.0, 35.0, 58.0, 134.0, 189.0, 222.0, 160.0, 97.0, 37.0, 20.0, 18.0, 5.0, 2.0, 1.0, 0.0, 3.0, 0.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-48.40748596191406, -46.488380432128906, -44.56927490234375, -42.65017318725586, -40.7310676574707, -38.81196212768555, -36.892860412597656, -34.9737548828125, -33.054649353027344, -31.135543823242188, -29.216440200805664, -27.29733657836914, -25.378231048583984, -23.459125518798828, -21.540021896362305, -19.62091827392578, -17.701812744140625, -15.782708168029785, -13.863603591918945, -11.944499015808105, -10.025394439697266, -8.106289863586426, -6.187185287475586, -4.268080711364746, -2.3489761352539062, -0.4298715591430664, 1.4892330169677734, 3.4083375930786133, 5.327442169189453, 7.246546745300293, 9.165651321411133, 11.084755897521973, 13.003860473632812, 14.922965049743652, 16.842069625854492, 18.761173248291016, 20.680278778076172, 22.599384307861328, 24.51848793029785, 26.437591552734375, 28.35669708251953, 30.275802612304688, 32.194908142089844, 34.114009857177734, 36.03311538696289, 37.95222091674805, 39.87132263183594, 41.790428161621094, 43.70953369140625, 45.628639221191406, 47.54774475097656, 49.46684646606445, 51.38595199584961, 53.305057525634766, 55.224159240722656, 57.14326477050781, 59.06237030029297, 60.981475830078125, 62.90058135986328, 64.81968688964844, 66.73878479003906, 68.65789031982422, 70.57699584960938, 72.49610137939453, 74.41520690917969]}, "gradients/encoder.encoder.layers.8.layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 3.0, 2.0, 3.0, 4.0, 3.0, 5.0, 11.0, 11.0, 16.0, 20.0, 28.0, 34.0, 45.0, 53.0, 58.0, 75.0, 66.0, 86.0, 91.0, 77.0, 77.0, 49.0, 42.0, 42.0, 31.0, 21.0, 21.0, 14.0, 8.0, 8.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.65980529785156, -37.1434440612793, -35.6270866394043, -34.11072540283203, -32.594364166259766, -31.078004837036133, -29.5616455078125, -28.045284271240234, -26.5289249420166, -25.01256561279297, -23.496204376220703, -21.97984504699707, -20.463485717773438, -18.947124481201172, -17.43076515197754, -15.91440486907959, -14.39804458618164, -12.881684303283691, -11.365324020385742, -9.84896469116211, -8.33260440826416, -6.816244125366211, -5.299884796142578, -3.783524513244629, -2.2671642303466797, -0.7508041858673096, 0.7655558586120605, 2.2819156646728516, 3.798275947570801, 5.31463623046875, 6.830995559692383, 8.347355842590332, 9.863712310791016, 11.380072593688965, 12.896432876586914, 14.412792205810547, 15.929152488708496, 17.445512771606445, 18.961872100830078, 20.478233337402344, 21.994592666625977, 23.51095199584961, 25.027313232421875, 26.543672561645508, 28.06003189086914, 29.576393127441406, 31.09275245666504, 32.60911178588867, 34.12547302246094, 35.6418342590332, 37.1581916809082, 38.67455291748047, 40.190914154052734, 41.707275390625, 43.2236328125, 44.739994049072266, 46.25635528564453, 47.7727165222168, 49.2890739440918, 50.80543518066406, 52.32179641723633, 53.838157653808594, 55.354515075683594, 56.87087631225586, 58.38723373413086]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 2.0, 0.0, 2.0, 0.0, 7.0, 10.0, 9.0, 32.0, 68.0, 115.0, 276.0, 675.0, 1941.0, 6278.0, 28473.0, 534300.0, 3558239.0, 50355.0, 9134.0, 2586.0, 899.0, 379.0, 188.0, 94.0, 60.0, 36.0, 29.0, 19.0, 11.0, 12.0, 9.0, 4.0, 9.0, 5.0, 5.0, 5.0, 3.0, 1.0, 6.0, 4.0, 1.0, 0.0, 1.0, 4.0, 0.0, 4.0, 1.0, 3.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0], "bins": [-3.71875, -3.5343017578125, -3.349853515625, -3.1654052734375, -2.98095703125, -2.7965087890625, -2.612060546875, -2.4276123046875, -2.2431640625, -2.0587158203125, -1.874267578125, -1.6898193359375, -1.50537109375, -1.3209228515625, -1.136474609375, -0.9520263671875, -0.767578125, -0.5831298828125, -0.398681640625, -0.2142333984375, -0.02978515625, 0.1546630859375, 0.339111328125, 0.5235595703125, 0.7080078125, 0.8924560546875, 1.076904296875, 1.2613525390625, 1.44580078125, 1.6302490234375, 1.814697265625, 1.9991455078125, 2.18359375, 2.3680419921875, 2.552490234375, 2.7369384765625, 2.92138671875, 3.1058349609375, 3.290283203125, 3.4747314453125, 3.6591796875, 3.8436279296875, 4.028076171875, 4.2125244140625, 4.39697265625, 4.5814208984375, 4.765869140625, 4.9503173828125, 5.134765625, 5.3192138671875, 5.503662109375, 5.6881103515625, 5.87255859375, 6.0570068359375, 6.241455078125, 6.4259033203125, 6.6103515625, 6.7947998046875, 6.979248046875, 7.1636962890625, 7.34814453125, 7.5325927734375, 7.717041015625, 7.9014892578125, 8.0859375]}, "gradients/encoder.encoder.layers.7.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 4.0, 6.0, 16.0, 30.0, 68.0, 116.0, 159.0, 176.0, 161.0, 114.0, 69.0, 51.0, 24.0, 11.0, 10.0, 5.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.552734375, -1.409210205078125, -1.26568603515625, -1.122161865234375, -0.9786376953125, -0.835113525390625, -0.69158935546875, -0.548065185546875, -0.404541015625, -0.261016845703125, -0.11749267578125, 0.026031494140625, 0.1695556640625, 0.313079833984375, 0.45660400390625, 0.600128173828125, 0.74365234375, 0.887176513671875, 1.03070068359375, 1.174224853515625, 1.3177490234375, 1.461273193359375, 1.60479736328125, 1.748321533203125, 1.891845703125, 2.035369873046875, 2.17889404296875, 2.322418212890625, 2.4659423828125, 2.609466552734375, 2.75299072265625, 2.896514892578125, 3.0400390625, 3.183563232421875, 3.32708740234375, 3.470611572265625, 3.6141357421875, 3.757659912109375, 3.90118408203125, 4.044708251953125, 4.188232421875, 4.331756591796875, 4.47528076171875, 4.618804931640625, 4.7623291015625, 4.905853271484375, 5.04937744140625, 5.192901611328125, 5.33642578125, 5.479949951171875, 5.62347412109375, 5.766998291015625, 5.9105224609375, 6.054046630859375, 6.19757080078125, 6.341094970703125, 6.484619140625, 6.628143310546875, 6.77166748046875, 6.915191650390625, 7.0587158203125, 7.202239990234375, 7.34576416015625, 7.489288330078125, 7.6328125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 5.0, 4.0, 3.0, 4.0, 9.0, 12.0, 11.0, 15.0, 21.0, 37.0, 69.0, 102.0, 199.0, 296.0, 606.0, 1497.0, 3456.0, 9991.0, 38537.0, 294650.0, 3647932.0, 157911.0, 26650.0, 7270.0, 2636.0, 1134.0, 526.0, 306.0, 142.0, 83.0, 54.0, 39.0, 20.0, 22.0, 11.0, 9.0, 3.0, 4.0, 4.0, 3.0, 3.0, 3.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-4.58984375, -4.443603515625, -4.29736328125, -4.151123046875, -4.0048828125, -3.858642578125, -3.71240234375, -3.566162109375, -3.419921875, -3.273681640625, -3.12744140625, -2.981201171875, -2.8349609375, -2.688720703125, -2.54248046875, -2.396240234375, -2.25, -2.103759765625, -1.95751953125, -1.811279296875, -1.6650390625, -1.518798828125, -1.37255859375, -1.226318359375, -1.080078125, -0.933837890625, -0.78759765625, -0.641357421875, -0.4951171875, -0.348876953125, -0.20263671875, -0.056396484375, 0.08984375, 0.236083984375, 0.38232421875, 0.528564453125, 0.6748046875, 0.821044921875, 0.96728515625, 1.113525390625, 1.259765625, 1.406005859375, 1.55224609375, 1.698486328125, 1.8447265625, 1.990966796875, 2.13720703125, 2.283447265625, 2.4296875, 2.575927734375, 2.72216796875, 2.868408203125, 3.0146484375, 3.160888671875, 3.30712890625, 3.453369140625, 3.599609375, 3.745849609375, 3.89208984375, 4.038330078125, 4.1845703125, 4.330810546875, 4.47705078125, 4.623291015625, 4.76953125]}, "gradients/encoder.encoder.layers.7.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 3.0, 1.0, 0.0, 2.0, 3.0, 2.0, 1.0, 2.0, 5.0, 3.0, 10.0, 7.0, 15.0, 20.0, 17.0, 24.0, 38.0, 58.0, 100.0, 162.0, 395.0, 1170.0, 1192.0, 434.0, 160.0, 93.0, 55.0, 38.0, 20.0, 19.0, 9.0, 7.0, 9.0, 4.0, 3.0, 1.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.3046875, -4.1453857421875, -3.986083984375, -3.8267822265625, -3.66748046875, -3.5081787109375, -3.348876953125, -3.1895751953125, -3.0302734375, -2.8709716796875, -2.711669921875, -2.5523681640625, -2.39306640625, -2.2337646484375, -2.074462890625, -1.9151611328125, -1.755859375, -1.5965576171875, -1.437255859375, -1.2779541015625, -1.11865234375, -0.9593505859375, -0.800048828125, -0.6407470703125, -0.4814453125, -0.3221435546875, -0.162841796875, -0.0035400390625, 0.15576171875, 0.3150634765625, 0.474365234375, 0.6336669921875, 0.79296875, 0.9522705078125, 1.111572265625, 1.2708740234375, 1.43017578125, 1.5894775390625, 1.748779296875, 1.9080810546875, 2.0673828125, 2.2266845703125, 2.385986328125, 2.5452880859375, 2.70458984375, 2.8638916015625, 3.023193359375, 3.1824951171875, 3.341796875, 3.5010986328125, 3.660400390625, 3.8197021484375, 3.97900390625, 4.1383056640625, 4.297607421875, 4.4569091796875, 4.6162109375, 4.7755126953125, 4.934814453125, 5.0941162109375, 5.25341796875, 5.4127197265625, 5.572021484375, 5.7313232421875, 5.890625]}, "gradients/encoder.encoder.layers.7.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 3.0, 4.0, 3.0, 2.0, 16.0, 31.0, 80.0, 200.0, 313.0, 218.0, 90.0, 28.0, 10.0, 3.0, 6.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-99.85432434082031, -97.70513916015625, -95.55594635009766, -93.4067611694336, -91.25757598876953, -89.10838317871094, -86.95919799804688, -84.81001281738281, -82.66082000732422, -80.51163482666016, -78.36244201660156, -76.2132568359375, -74.06407165527344, -71.91487884521484, -69.76569366455078, -67.61650848388672, -65.46731567382812, -63.3181266784668, -61.168941497802734, -59.019752502441406, -56.87056350708008, -54.72137451171875, -52.57218933105469, -50.42300033569336, -48.27381896972656, -46.124629974365234, -43.97544479370117, -41.826255798339844, -39.677066802978516, -37.52787780761719, -35.378692626953125, -33.2295036315918, -31.08031463623047, -28.931127548217773, -26.781938552856445, -24.63275146484375, -22.483562469482422, -20.334375381469727, -18.18518829345703, -16.035999298095703, -13.886812210083008, -11.737624168395996, -9.588436126708984, -7.439249038696289, -5.290060997009277, -3.1408729553222656, -0.9916858673095703, 1.1575021743774414, 3.306690216064453, 5.455878257751465, 7.605065822601318, 9.754253387451172, 11.903441429138184, 14.052629470825195, 16.20181655883789, 18.35100555419922, 20.500192642211914, 22.64937973022461, 24.798568725585938, 26.947755813598633, 29.096942901611328, 31.246131896972656, 33.39531707763672, 35.54450607299805, 37.693695068359375]}, "gradients/encoder.encoder.layers.7.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 3.0, 7.0, 6.0, 8.0, 15.0, 26.0, 25.0, 22.0, 37.0, 54.0, 74.0, 73.0, 68.0, 77.0, 81.0, 67.0, 65.0, 71.0, 43.0, 51.0, 41.0, 22.0, 27.0, 17.0, 9.0, 11.0, 7.0, 2.0, 1.0, 1.0, 5.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-38.652130126953125, -37.7086181640625, -36.765106201171875, -35.82159423828125, -34.87808609008789, -33.934574127197266, -32.99106216430664, -32.047550201416016, -31.10403823852539, -30.160526275634766, -29.217016220092773, -28.27350425720215, -27.329992294311523, -26.38648223876953, -25.442970275878906, -24.49945831298828, -23.55594825744629, -22.612436294555664, -21.668926239013672, -20.725414276123047, -19.781902313232422, -18.838390350341797, -17.894880294799805, -16.95136833190918, -16.007858276367188, -15.064347267150879, -14.120835304260254, -13.177324295043945, -12.23381233215332, -11.290301322937012, -10.346790313720703, -9.403278350830078, -8.45976448059082, -7.5162529945373535, -6.572741508483887, -5.629230499267578, -4.685719013214111, -3.7422075271606445, -2.798696517944336, -1.8551850318908691, -0.9116735458374023, 0.0318378210067749, 0.9753491878509521, 1.9188604354858398, 2.8623719215393066, 3.8058834075927734, 4.749394416809082, 5.692905902862549, 6.636417388916016, 7.579928874969482, 8.52344036102295, 9.466951370239258, 10.410463333129883, 11.353974342346191, 12.2974853515625, 13.240997314453125, 14.184508323669434, 15.128019332885742, 16.071531295776367, 17.01504135131836, 17.958553314208984, 18.90206527709961, 19.845577239990234, 20.789087295532227, 21.73259925842285]}, "gradients/encoder.encoder.layers.7.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 3.0, 7.0, 6.0, 1.0, 8.0, 8.0, 20.0, 15.0, 29.0, 45.0, 65.0, 144.0, 304.0, 615.0, 1471.0, 3717.0, 11556.0, 42219.0, 176336.0, 496541.0, 236642.0, 56280.0, 14728.0, 4639.0, 1689.0, 759.0, 336.0, 150.0, 83.0, 44.0, 33.0, 26.0, 19.0, 9.0, 6.0, 5.0, 3.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-3.783203125, -3.659576416015625, -3.53594970703125, -3.412322998046875, -3.2886962890625, -3.165069580078125, -3.04144287109375, -2.917816162109375, -2.794189453125, -2.670562744140625, -2.54693603515625, -2.423309326171875, -2.2996826171875, -2.176055908203125, -2.05242919921875, -1.928802490234375, -1.80517578125, -1.681549072265625, -1.55792236328125, -1.434295654296875, -1.3106689453125, -1.187042236328125, -1.06341552734375, -0.939788818359375, -0.816162109375, -0.692535400390625, -0.56890869140625, -0.445281982421875, -0.3216552734375, -0.198028564453125, -0.07440185546875, 0.049224853515625, 0.1728515625, 0.296478271484375, 0.42010498046875, 0.543731689453125, 0.6673583984375, 0.790985107421875, 0.91461181640625, 1.038238525390625, 1.161865234375, 1.285491943359375, 1.40911865234375, 1.532745361328125, 1.6563720703125, 1.779998779296875, 1.90362548828125, 2.027252197265625, 2.15087890625, 2.274505615234375, 2.39813232421875, 2.521759033203125, 2.6453857421875, 2.769012451171875, 2.89263916015625, 3.016265869140625, 3.139892578125, 3.263519287109375, 3.38714599609375, 3.510772705078125, 3.6343994140625, 3.758026123046875, 3.88165283203125, 4.005279541015625, 4.12890625]}, "gradients/encoder.encoder.layers.7.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 9.0, 16.0, 17.0, 21.0, 44.0, 69.0, 73.0, 88.0, 133.0, 122.0, 98.0, 89.0, 68.0, 55.0, 34.0, 36.0, 19.0, 12.0, 7.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.84765625, -1.75726318359375, -1.6668701171875, -1.57647705078125, -1.486083984375, -1.39569091796875, -1.3052978515625, -1.21490478515625, -1.12451171875, -1.03411865234375, -0.9437255859375, -0.85333251953125, -0.762939453125, -0.67254638671875, -0.5821533203125, -0.49176025390625, -0.4013671875, -0.31097412109375, -0.2205810546875, -0.13018798828125, -0.039794921875, 0.05059814453125, 0.1409912109375, 0.23138427734375, 0.32177734375, 0.41217041015625, 0.5025634765625, 0.59295654296875, 0.683349609375, 0.77374267578125, 0.8641357421875, 0.95452880859375, 1.044921875, 1.13531494140625, 1.2257080078125, 1.31610107421875, 1.406494140625, 1.49688720703125, 1.5872802734375, 1.67767333984375, 1.76806640625, 1.85845947265625, 1.9488525390625, 2.03924560546875, 2.129638671875, 2.22003173828125, 2.3104248046875, 2.40081787109375, 2.4912109375, 2.58160400390625, 2.6719970703125, 2.76239013671875, 2.852783203125, 2.94317626953125, 3.0335693359375, 3.12396240234375, 3.21435546875, 3.30474853515625, 3.3951416015625, 3.48553466796875, 3.575927734375, 3.66632080078125, 3.7567138671875, 3.84710693359375, 3.9375]}, "gradients/encoder.encoder.layers.7.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 3.0, 3.0, 3.0, 6.0, 3.0, 7.0, 13.0, 13.0, 15.0, 22.0, 27.0, 78.0, 70.0, 129.0, 234.0, 384.0, 714.0, 1426.0, 2909.0, 8031.0, 28464.0, 152739.0, 625475.0, 179920.0, 32951.0, 8730.0, 3085.0, 1365.0, 694.0, 438.0, 224.0, 145.0, 86.0, 57.0, 39.0, 16.0, 15.0, 8.0, 7.0, 1.0, 2.0, 3.0, 3.0, 4.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-4.84765625, -4.718536376953125, -4.58941650390625, -4.460296630859375, -4.3311767578125, -4.202056884765625, -4.07293701171875, -3.943817138671875, -3.814697265625, -3.685577392578125, -3.55645751953125, -3.427337646484375, -3.2982177734375, -3.169097900390625, -3.03997802734375, -2.910858154296875, -2.78173828125, -2.652618408203125, -2.52349853515625, -2.394378662109375, -2.2652587890625, -2.136138916015625, -2.00701904296875, -1.877899169921875, -1.748779296875, -1.619659423828125, -1.49053955078125, -1.361419677734375, -1.2322998046875, -1.103179931640625, -0.97406005859375, -0.844940185546875, -0.7158203125, -0.586700439453125, -0.45758056640625, -0.328460693359375, -0.1993408203125, -0.070220947265625, 0.05889892578125, 0.188018798828125, 0.317138671875, 0.446258544921875, 0.57537841796875, 0.704498291015625, 0.8336181640625, 0.962738037109375, 1.09185791015625, 1.220977783203125, 1.35009765625, 1.479217529296875, 1.60833740234375, 1.737457275390625, 1.8665771484375, 1.995697021484375, 2.12481689453125, 2.253936767578125, 2.383056640625, 2.512176513671875, 2.64129638671875, 2.770416259765625, 2.8995361328125, 3.028656005859375, 3.15777587890625, 3.286895751953125, 3.416015625]}, "gradients/encoder.encoder.layers.7.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 1.0, 3.0, 3.0, 4.0, 6.0, 9.0, 14.0, 11.0, 17.0, 21.0, 28.0, 21.0, 23.0, 31.0, 36.0, 39.0, 37.0, 38.0, 59.0, 49.0, 69.0, 66.0, 51.0, 57.0, 47.0, 39.0, 41.0, 46.0, 27.0, 22.0, 23.0, 10.0, 13.0, 12.0, 6.0, 10.0, 7.0, 5.0, 3.0, 1.0, 2.0, 1.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-6.09375, -5.89471435546875, -5.6956787109375, -5.49664306640625, -5.297607421875, -5.09857177734375, -4.8995361328125, -4.70050048828125, -4.50146484375, -4.30242919921875, -4.1033935546875, -3.90435791015625, -3.705322265625, -3.50628662109375, -3.3072509765625, -3.10821533203125, -2.9091796875, -2.71014404296875, -2.5111083984375, -2.31207275390625, -2.113037109375, -1.91400146484375, -1.7149658203125, -1.51593017578125, -1.31689453125, -1.11785888671875, -0.9188232421875, -0.71978759765625, -0.520751953125, -0.32171630859375, -0.1226806640625, 0.07635498046875, 0.275390625, 0.47442626953125, 0.6734619140625, 0.87249755859375, 1.071533203125, 1.27056884765625, 1.4696044921875, 1.66864013671875, 1.86767578125, 2.06671142578125, 2.2657470703125, 2.46478271484375, 2.663818359375, 2.86285400390625, 3.0618896484375, 3.26092529296875, 3.4599609375, 3.65899658203125, 3.8580322265625, 4.05706787109375, 4.256103515625, 4.45513916015625, 4.6541748046875, 4.85321044921875, 5.05224609375, 5.25128173828125, 5.4503173828125, 5.64935302734375, 5.848388671875, 6.04742431640625, 6.2464599609375, 6.44549560546875, 6.64453125]}, "gradients/encoder.encoder.layers.7.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 3.0, 0.0, 1.0, 5.0, 4.0, 1.0, 9.0, 12.0, 16.0, 20.0, 20.0, 41.0, 71.0, 85.0, 155.0, 279.0, 599.0, 1333.0, 4007.0, 16788.0, 129918.0, 742276.0, 129471.0, 16821.0, 3944.0, 1352.0, 627.0, 263.0, 156.0, 94.0, 59.0, 41.0, 25.0, 17.0, 16.0, 9.0, 10.0, 5.0, 4.0, 5.0, 1.0, 3.0, 1.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.966796875, -1.906280517578125, -1.84576416015625, -1.785247802734375, -1.7247314453125, -1.664215087890625, -1.60369873046875, -1.543182373046875, -1.482666015625, -1.422149658203125, -1.36163330078125, -1.301116943359375, -1.2406005859375, -1.180084228515625, -1.11956787109375, -1.059051513671875, -0.99853515625, -0.938018798828125, -0.87750244140625, -0.816986083984375, -0.7564697265625, -0.695953369140625, -0.63543701171875, -0.574920654296875, -0.514404296875, -0.453887939453125, -0.39337158203125, -0.332855224609375, -0.2723388671875, -0.211822509765625, -0.15130615234375, -0.090789794921875, -0.0302734375, 0.030242919921875, 0.09075927734375, 0.151275634765625, 0.2117919921875, 0.272308349609375, 0.33282470703125, 0.393341064453125, 0.453857421875, 0.514373779296875, 0.57489013671875, 0.635406494140625, 0.6959228515625, 0.756439208984375, 0.81695556640625, 0.877471923828125, 0.93798828125, 0.998504638671875, 1.05902099609375, 1.119537353515625, 1.1800537109375, 1.240570068359375, 1.30108642578125, 1.361602783203125, 1.422119140625, 1.482635498046875, 1.54315185546875, 1.603668212890625, 1.6641845703125, 1.724700927734375, 1.78521728515625, 1.845733642578125, 1.90625]}, "gradients/encoder.encoder.layers.7.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 2.0, 2.0, 1.0, 0.0, 6.0, 3.0, 3.0, 2.0, 2.0, 8.0, 6.0, 14.0, 15.0, 21.0, 23.0, 39.0, 41.0, 55.0, 64.0, 73.0, 101.0, 109.0, 108.0, 68.0, 52.0, 54.0, 32.0, 23.0, 25.0, 15.0, 20.0, 7.0, 6.0, 4.0, 5.0, 5.0, 2.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00023484230041503906, -0.0002243146300315857, -0.00021378695964813232, -0.00020325928926467896, -0.00019273161888122559, -0.00018220394849777222, -0.00017167627811431885, -0.00016114860773086548, -0.0001506209373474121, -0.00014009326696395874, -0.00012956559658050537, -0.000119037926197052, -0.00010851025581359863, -9.798258543014526e-05, -8.74549150466919e-05, -7.692724466323853e-05, -6.639957427978516e-05, -5.587190389633179e-05, -4.534423351287842e-05, -3.481656312942505e-05, -2.428889274597168e-05, -1.376122236251831e-05, -3.2335519790649414e-06, 7.294118404388428e-06, 1.7821788787841797e-05, 2.8349459171295166e-05, 3.8877129554748535e-05, 4.9404799938201904e-05, 5.9932470321655273e-05, 7.046014070510864e-05, 8.098781108856201e-05, 9.151548147201538e-05, 0.00010204315185546875, 0.00011257082223892212, 0.0001230984926223755, 0.00013362616300582886, 0.00014415383338928223, 0.0001546815037727356, 0.00016520917415618896, 0.00017573684453964233, 0.0001862645149230957, 0.00019679218530654907, 0.00020731985569000244, 0.0002178475260734558, 0.00022837519645690918, 0.00023890286684036255, 0.0002494305372238159, 0.0002599582076072693, 0.00027048587799072266, 0.000281013548374176, 0.0002915412187576294, 0.00030206888914108276, 0.00031259655952453613, 0.0003231242299079895, 0.00033365190029144287, 0.00034417957067489624, 0.0003547072410583496, 0.000365234911441803, 0.00037576258182525635, 0.0003862902522087097, 0.0003968179225921631, 0.00040734559297561646, 0.0004178732633590698, 0.0004284009337425232, 0.00043892860412597656]}, "gradients/encoder.encoder.layers.7.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 2.0, 0.0, 1.0, 2.0, 2.0, 8.0, 8.0, 13.0, 16.0, 28.0, 43.0, 77.0, 138.0, 308.0, 753.0, 2270.0, 10690.0, 119772.0, 818136.0, 84285.0, 8650.0, 2078.0, 679.0, 279.0, 141.0, 75.0, 43.0, 24.0, 16.0, 10.0, 6.0, 4.0, 2.0, 2.0, 3.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.06640625, -1.988250732421875, -1.91009521484375, -1.831939697265625, -1.7537841796875, -1.675628662109375, -1.59747314453125, -1.519317626953125, -1.441162109375, -1.363006591796875, -1.28485107421875, -1.206695556640625, -1.1285400390625, -1.050384521484375, -0.97222900390625, -0.894073486328125, -0.81591796875, -0.737762451171875, -0.65960693359375, -0.581451416015625, -0.5032958984375, -0.425140380859375, -0.34698486328125, -0.268829345703125, -0.190673828125, -0.112518310546875, -0.03436279296875, 0.043792724609375, 0.1219482421875, 0.200103759765625, 0.27825927734375, 0.356414794921875, 0.4345703125, 0.512725830078125, 0.59088134765625, 0.669036865234375, 0.7471923828125, 0.825347900390625, 0.90350341796875, 0.981658935546875, 1.059814453125, 1.137969970703125, 1.21612548828125, 1.294281005859375, 1.3724365234375, 1.450592041015625, 1.52874755859375, 1.606903076171875, 1.68505859375, 1.763214111328125, 1.84136962890625, 1.919525146484375, 1.9976806640625, 2.075836181640625, 2.15399169921875, 2.232147216796875, 2.310302734375, 2.388458251953125, 2.46661376953125, 2.544769287109375, 2.6229248046875, 2.701080322265625, 2.77923583984375, 2.857391357421875, 2.935546875]}, "gradients/encoder.encoder.layers.7.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 1.0, 5.0, 8.0, 12.0, 14.0, 27.0, 45.0, 69.0, 96.0, 149.0, 180.0, 127.0, 102.0, 63.0, 36.0, 18.0, 21.0, 11.0, 11.0, 9.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.638671875, -2.53887939453125, -2.4390869140625, -2.33929443359375, -2.239501953125, -2.13970947265625, -2.0399169921875, -1.94012451171875, -1.84033203125, -1.74053955078125, -1.6407470703125, -1.54095458984375, -1.441162109375, -1.34136962890625, -1.2415771484375, -1.14178466796875, -1.0419921875, -0.94219970703125, -0.8424072265625, -0.74261474609375, -0.642822265625, -0.54302978515625, -0.4432373046875, -0.34344482421875, -0.24365234375, -0.14385986328125, -0.0440673828125, 0.05572509765625, 0.155517578125, 0.25531005859375, 0.3551025390625, 0.45489501953125, 0.5546875, 0.65447998046875, 0.7542724609375, 0.85406494140625, 0.953857421875, 1.05364990234375, 1.1534423828125, 1.25323486328125, 1.35302734375, 1.45281982421875, 1.5526123046875, 1.65240478515625, 1.752197265625, 1.85198974609375, 1.9517822265625, 2.05157470703125, 2.1513671875, 2.25115966796875, 2.3509521484375, 2.45074462890625, 2.550537109375, 2.65032958984375, 2.7501220703125, 2.84991455078125, 2.94970703125, 3.04949951171875, 3.1492919921875, 3.24908447265625, 3.348876953125, 3.44866943359375, 3.5484619140625, 3.64825439453125, 3.748046875]}, "gradients/encoder.encoder.layers.7.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 1.0, 3.0, 3.0, 8.0, 12.0, 16.0, 32.0, 43.0, 64.0, 110.0, 149.0, 161.0, 139.0, 112.0, 63.0, 44.0, 13.0, 14.0, 9.0, 3.0, 3.0, 4.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 1.0, 1.0], "bins": [-44.44267654418945, -43.4490966796875, -42.45552062988281, -41.46194076538086, -40.468360900878906, -39.47478103637695, -38.481204986572266, -37.48762512207031, -36.49404525756836, -35.500465393066406, -34.50688934326172, -33.513309478759766, -32.51972961425781, -31.526151657104492, -30.532573699951172, -29.53899383544922, -28.5454158782959, -27.551837921142578, -26.558258056640625, -25.564680099487305, -24.57110023498535, -23.57752227783203, -22.583942413330078, -21.590364456176758, -20.596786499023438, -19.603208541870117, -18.609628677368164, -17.616050720214844, -16.62247085571289, -15.62889289855957, -14.635313987731934, -13.641735076904297, -12.648155212402344, -11.654576301574707, -10.66099739074707, -9.66741943359375, -8.673839569091797, -7.680261135101318, -6.68668270111084, -5.693103790283203, -4.699524879455566, -3.7059459686279297, -2.712367296218872, -1.7187886238098145, -0.7252097129821777, 0.268369197845459, 1.2619476318359375, 2.255526542663574, 3.249105453491211, 4.242684364318848, 5.236263275146484, 6.229841709136963, 7.2234206199646, 8.216999053955078, 9.210577964782715, 10.204156875610352, 11.197735786437988, 12.191314697265625, 13.184893608093262, 14.178472518920898, 15.172050476074219, 16.165630340576172, 17.159208297729492, 18.152786254882812, 19.146366119384766]}, "gradients/encoder.encoder.layers.7.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 2.0, 1.0, 6.0, 8.0, 9.0, 6.0, 11.0, 14.0, 11.0, 19.0, 27.0, 31.0, 33.0, 51.0, 38.0, 42.0, 54.0, 80.0, 79.0, 73.0, 60.0, 58.0, 50.0, 44.0, 47.0, 32.0, 23.0, 19.0, 17.0, 16.0, 12.0, 12.0, 11.0, 3.0, 4.0, 3.0, 3.0, 0.0, 4.0, 1.0, 1.0, 0.0, 2.0], "bins": [-38.483909606933594, -37.52277755737305, -36.5616455078125, -35.60051727294922, -34.63938522338867, -33.678253173828125, -32.71712112426758, -31.755990982055664, -30.79486083984375, -29.833728790283203, -28.87259864807129, -27.911466598510742, -26.950336456298828, -25.98920440673828, -25.028072357177734, -24.06694221496582, -23.105810165405273, -22.144678115844727, -21.183547973632812, -20.222415924072266, -19.26128578186035, -18.300153732299805, -17.33902359008789, -16.377891540527344, -15.416760444641113, -14.455629348754883, -13.494498252868652, -12.533367156982422, -11.572235107421875, -10.611104965209961, -9.649972915649414, -8.688841819763184, -7.727710723876953, -6.766579627990723, -5.805448532104492, -4.8443169593811035, -3.883185863494873, -2.9220547676086426, -1.960923194885254, -0.9997920989990234, -0.03866100311279297, 0.922470211982727, 1.883601427078247, 2.8447327613830566, 3.805863857269287, 4.766994953155518, 5.728126525878906, 6.689257621765137, 7.650388717651367, 8.611519813537598, 9.572650909423828, 10.533782958984375, 11.494913101196289, 12.456045150756836, 13.417176246643066, 14.378307342529297, 15.339438438415527, 16.300569534301758, 17.261701583862305, 18.22283172607422, 19.183963775634766, 20.14509391784668, 21.106225967407227, 22.06735610961914, 23.028488159179688]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 3.0, 2.0, 4.0, 6.0, 6.0, 9.0, 21.0, 23.0, 43.0, 73.0, 125.0, 252.0, 476.0, 1148.0, 3210.0, 12013.0, 77374.0, 3362446.0, 691658.0, 34512.0, 7186.0, 2088.0, 818.0, 390.0, 161.0, 93.0, 56.0, 27.0, 27.0, 11.0, 11.0, 7.0, 4.0, 4.0, 1.0, 2.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.220703125, -3.104888916015625, -2.98907470703125, -2.873260498046875, -2.7574462890625, -2.641632080078125, -2.52581787109375, -2.410003662109375, -2.294189453125, -2.178375244140625, -2.06256103515625, -1.946746826171875, -1.8309326171875, -1.715118408203125, -1.59930419921875, -1.483489990234375, -1.36767578125, -1.251861572265625, -1.13604736328125, -1.020233154296875, -0.9044189453125, -0.788604736328125, -0.67279052734375, -0.556976318359375, -0.441162109375, -0.325347900390625, -0.20953369140625, -0.093719482421875, 0.0220947265625, 0.137908935546875, 0.25372314453125, 0.369537353515625, 0.4853515625, 0.601165771484375, 0.71697998046875, 0.832794189453125, 0.9486083984375, 1.064422607421875, 1.18023681640625, 1.296051025390625, 1.411865234375, 1.527679443359375, 1.64349365234375, 1.759307861328125, 1.8751220703125, 1.990936279296875, 2.10675048828125, 2.222564697265625, 2.33837890625, 2.454193115234375, 2.57000732421875, 2.685821533203125, 2.8016357421875, 2.917449951171875, 3.03326416015625, 3.149078369140625, 3.264892578125, 3.380706787109375, 3.49652099609375, 3.612335205078125, 3.7281494140625, 3.843963623046875, 3.95977783203125, 4.075592041015625, 4.19140625]}, "gradients/encoder.encoder.layers.6.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 1.0, 2.0, 3.0, 1.0, 5.0, 5.0, 3.0, 6.0, 11.0, 8.0, 13.0, 28.0, 29.0, 35.0, 45.0, 52.0, 62.0, 56.0, 62.0, 76.0, 69.0, 68.0, 49.0, 58.0, 40.0, 45.0, 29.0, 32.0, 20.0, 25.0, 19.0, 22.0, 9.0, 5.0, 5.0, 5.0, 6.0, 4.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.060546875, -1.01092529296875, -0.9613037109375, -0.91168212890625, -0.862060546875, -0.81243896484375, -0.7628173828125, -0.71319580078125, -0.66357421875, -0.61395263671875, -0.5643310546875, -0.51470947265625, -0.465087890625, -0.41546630859375, -0.3658447265625, -0.31622314453125, -0.2666015625, -0.21697998046875, -0.1673583984375, -0.11773681640625, -0.068115234375, -0.01849365234375, 0.0311279296875, 0.08074951171875, 0.13037109375, 0.17999267578125, 0.2296142578125, 0.27923583984375, 0.328857421875, 0.37847900390625, 0.4281005859375, 0.47772216796875, 0.52734375, 0.57696533203125, 0.6265869140625, 0.67620849609375, 0.725830078125, 0.77545166015625, 0.8250732421875, 0.87469482421875, 0.92431640625, 0.97393798828125, 1.0235595703125, 1.07318115234375, 1.122802734375, 1.17242431640625, 1.2220458984375, 1.27166748046875, 1.3212890625, 1.37091064453125, 1.4205322265625, 1.47015380859375, 1.519775390625, 1.56939697265625, 1.6190185546875, 1.66864013671875, 1.71826171875, 1.76788330078125, 1.8175048828125, 1.86712646484375, 1.916748046875, 1.96636962890625, 2.0159912109375, 2.06561279296875, 2.115234375]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 1.0, 4.0, 1.0, 5.0, 12.0, 29.0, 55.0, 144.0, 325.0, 1025.0, 4320.0, 24496.0, 299693.0, 3728574.0, 116839.0, 14912.0, 2779.0, 695.0, 205.0, 86.0, 47.0, 24.0, 14.0, 5.0, 2.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.46484375, -3.30255126953125, -3.1402587890625, -2.97796630859375, -2.815673828125, -2.65338134765625, -2.4910888671875, -2.32879638671875, -2.16650390625, -2.00421142578125, -1.8419189453125, -1.67962646484375, -1.517333984375, -1.35504150390625, -1.1927490234375, -1.03045654296875, -0.8681640625, -0.70587158203125, -0.5435791015625, -0.38128662109375, -0.218994140625, -0.05670166015625, 0.1055908203125, 0.26788330078125, 0.43017578125, 0.59246826171875, 0.7547607421875, 0.91705322265625, 1.079345703125, 1.24163818359375, 1.4039306640625, 1.56622314453125, 1.728515625, 1.89080810546875, 2.0531005859375, 2.21539306640625, 2.377685546875, 2.53997802734375, 2.7022705078125, 2.86456298828125, 3.02685546875, 3.18914794921875, 3.3514404296875, 3.51373291015625, 3.676025390625, 3.83831787109375, 4.0006103515625, 4.16290283203125, 4.3251953125, 4.48748779296875, 4.6497802734375, 4.81207275390625, 4.974365234375, 5.13665771484375, 5.2989501953125, 5.46124267578125, 5.62353515625, 5.78582763671875, 5.9481201171875, 6.11041259765625, 6.272705078125, 6.43499755859375, 6.5972900390625, 6.75958251953125, 6.921875]}, "gradients/encoder.encoder.layers.6.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 3.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 3.0, 3.0, 4.0, 5.0, 2.0, 15.0, 13.0, 18.0, 23.0, 30.0, 41.0, 73.0, 90.0, 197.0, 451.0, 865.0, 987.0, 547.0, 287.0, 129.0, 63.0, 47.0, 31.0, 35.0, 29.0, 22.0, 17.0, 16.0, 5.0, 11.0, 5.0, 5.0, 2.0, 1.0, 2.0, 1.0, 0.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.740234375, -2.635955810546875, -2.53167724609375, -2.427398681640625, -2.3231201171875, -2.218841552734375, -2.11456298828125, -2.010284423828125, -1.906005859375, -1.801727294921875, -1.69744873046875, -1.593170166015625, -1.4888916015625, -1.384613037109375, -1.28033447265625, -1.176055908203125, -1.07177734375, -0.967498779296875, -0.86322021484375, -0.758941650390625, -0.6546630859375, -0.550384521484375, -0.44610595703125, -0.341827392578125, -0.237548828125, -0.133270263671875, -0.02899169921875, 0.075286865234375, 0.1795654296875, 0.283843994140625, 0.38812255859375, 0.492401123046875, 0.5966796875, 0.700958251953125, 0.80523681640625, 0.909515380859375, 1.0137939453125, 1.118072509765625, 1.22235107421875, 1.326629638671875, 1.430908203125, 1.535186767578125, 1.63946533203125, 1.743743896484375, 1.8480224609375, 1.952301025390625, 2.05657958984375, 2.160858154296875, 2.26513671875, 2.369415283203125, 2.47369384765625, 2.577972412109375, 2.6822509765625, 2.786529541015625, 2.89080810546875, 2.995086669921875, 3.099365234375, 3.203643798828125, 3.30792236328125, 3.412200927734375, 3.5164794921875, 3.620758056640625, 3.72503662109375, 3.829315185546875, 3.93359375]}, "gradients/encoder.encoder.layers.6.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 3.0, 2.0, 5.0, 8.0, 11.0, 21.0, 26.0, 72.0, 99.0, 175.0, 242.0, 160.0, 108.0, 39.0, 17.0, 10.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-23.220149993896484, -22.087230682373047, -20.954313278198242, -19.821395874023438, -18.6884765625, -17.555557250976562, -16.422639846801758, -15.289721488952637, -14.156803131103516, -13.023884773254395, -11.890966415405273, -10.758048057556152, -9.625129699707031, -8.49221134185791, -7.359292984008789, -6.226374626159668, -5.093456268310547, -3.960537910461426, -2.8276195526123047, -1.6947011947631836, -0.5617828369140625, 0.5711355209350586, 1.7040538787841797, 2.836972236633301, 3.969890594482422, 5.102808952331543, 6.235727310180664, 7.368645668029785, 8.501564025878906, 9.634482383728027, 10.767400741577148, 11.90031909942627, 13.033241271972656, 14.166159629821777, 15.299077987670898, 16.431995391845703, 17.56491470336914, 18.697834014892578, 19.830751419067383, 20.963668823242188, 22.096588134765625, 23.229507446289062, 24.362424850463867, 25.495342254638672, 26.62826156616211, 27.761180877685547, 28.89409828186035, 30.027015686035156, 31.159934997558594, 32.29285430908203, 33.42577362060547, 34.55868911743164, 35.69160842895508, 36.824527740478516, 37.95744323730469, 39.090362548828125, 40.22328186035156, 41.356201171875, 42.48912048339844, 43.62203598022461, 44.75495529174805, 45.887874603271484, 47.020790100097656, 48.153709411621094, 49.28662872314453]}, "gradients/encoder.encoder.layers.6.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 3.0, 1.0, 4.0, 7.0, 6.0, 11.0, 23.0, 25.0, 31.0, 37.0, 32.0, 59.0, 73.0, 40.0, 53.0, 76.0, 62.0, 71.0, 64.0, 56.0, 59.0, 52.0, 40.0, 30.0, 31.0, 19.0, 18.0, 12.0, 4.0, 4.0, 4.0, 5.0, 1.0, 0.0, 0.0, 0.0, 3.0, 1.0], "bins": [-26.497116088867188, -25.8597469329834, -25.222379684448242, -24.585010528564453, -23.947641372680664, -23.310272216796875, -22.67290496826172, -22.03553581237793, -21.39816665649414, -20.76079750061035, -20.123430252075195, -19.486061096191406, -18.848691940307617, -18.211322784423828, -17.573955535888672, -16.936586380004883, -16.299217224121094, -15.661849021911621, -15.024479866027832, -14.38711166381836, -13.74974250793457, -13.112374305725098, -12.475006103515625, -11.837636947631836, -11.20026969909668, -10.562901496887207, -9.925532341003418, -9.288164138793945, -8.650794982910156, -8.013426780700684, -7.376058101654053, -6.738689422607422, -6.101320266723633, -5.463951587677002, -4.826582908630371, -4.189214706420898, -3.5518457889556885, -2.9144771099090576, -2.277108669281006, -1.639739990234375, -1.0023713111877441, -0.36500269174575806, 0.272365927696228, 0.9097344875335693, 1.5471031665802002, 2.184471845626831, 2.821840286254883, 3.4592089653015137, 4.0965776443481445, 4.733946323394775, 5.371315002441406, 6.008683204650879, 6.646052360534668, 7.283420562744141, 7.9207892417907715, 8.558157920837402, 9.195526123046875, 9.832894325256348, 10.470263481140137, 11.10763168334961, 11.745000839233398, 12.382369041442871, 13.019737243652344, 13.657106399536133, 14.294475555419922]}, "gradients/encoder.encoder.layers.6.attention.out_proj.weight": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 3.0, 5.0, 7.0, 3.0, 9.0, 18.0, 17.0, 33.0, 50.0, 64.0, 88.0, 167.0, 277.0, 427.0, 650.0, 1158.0, 1940.0, 3320.0, 6222.0, 12196.0, 24258.0, 52112.0, 115204.0, 243829.0, 292614.0, 156301.0, 70325.0, 32894.0, 15972.0, 8170.0, 4266.0, 2364.0, 1307.0, 848.0, 511.0, 306.0, 206.0, 138.0, 105.0, 54.0, 46.0, 22.0, 16.0, 14.0, 9.0, 5.0, 5.0, 2.0, 2.0, 0.0, 1.0, 2.0, 2.0, 0.0, 1.0, 1.0, 2.0], "bins": [-1.96875, -1.9056396484375, -1.842529296875, -1.7794189453125, -1.71630859375, -1.6531982421875, -1.590087890625, -1.5269775390625, -1.4638671875, -1.4007568359375, -1.337646484375, -1.2745361328125, -1.21142578125, -1.1483154296875, -1.085205078125, -1.0220947265625, -0.958984375, -0.8958740234375, -0.832763671875, -0.7696533203125, -0.70654296875, -0.6434326171875, -0.580322265625, -0.5172119140625, -0.4541015625, -0.3909912109375, -0.327880859375, -0.2647705078125, -0.20166015625, -0.1385498046875, -0.075439453125, -0.0123291015625, 0.05078125, 0.1138916015625, 0.177001953125, 0.2401123046875, 0.30322265625, 0.3663330078125, 0.429443359375, 0.4925537109375, 0.5556640625, 0.6187744140625, 0.681884765625, 0.7449951171875, 0.80810546875, 0.8712158203125, 0.934326171875, 0.9974365234375, 1.060546875, 1.1236572265625, 1.186767578125, 1.2498779296875, 1.31298828125, 1.3760986328125, 1.439208984375, 1.5023193359375, 1.5654296875, 1.6285400390625, 1.691650390625, 1.7547607421875, 1.81787109375, 1.8809814453125, 1.944091796875, 2.0072021484375, 2.0703125]}, "gradients/encoder.encoder.layers.6.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 2.0, 4.0, 2.0, 3.0, 1.0, 0.0, 3.0, 3.0, 6.0, 9.0, 12.0, 6.0, 14.0, 18.0, 18.0, 32.0, 22.0, 25.0, 35.0, 36.0, 31.0, 41.0, 32.0, 45.0, 42.0, 38.0, 46.0, 48.0, 46.0, 35.0, 34.0, 33.0, 39.0, 37.0, 26.0, 28.0, 18.0, 18.0, 24.0, 14.0, 13.0, 13.0, 13.0, 12.0, 8.0, 4.0, 5.0, 6.0, 2.0, 5.0, 1.0, 5.0, 1.0, 1.0, 2.0, 2.0], "bins": [-1.1982421875, -1.1637115478515625, -1.129180908203125, -1.0946502685546875, -1.06011962890625, -1.0255889892578125, -0.991058349609375, -0.9565277099609375, -0.9219970703125, -0.8874664306640625, -0.852935791015625, -0.8184051513671875, -0.78387451171875, -0.7493438720703125, -0.714813232421875, -0.6802825927734375, -0.645751953125, -0.6112213134765625, -0.576690673828125, -0.5421600341796875, -0.50762939453125, -0.4730987548828125, -0.438568115234375, -0.4040374755859375, -0.3695068359375, -0.3349761962890625, -0.300445556640625, -0.2659149169921875, -0.23138427734375, -0.1968536376953125, -0.162322998046875, -0.1277923583984375, -0.09326171875, -0.0587310791015625, -0.024200439453125, 0.0103302001953125, 0.04486083984375, 0.0793914794921875, 0.113922119140625, 0.1484527587890625, 0.1829833984375, 0.2175140380859375, 0.252044677734375, 0.2865753173828125, 0.32110595703125, 0.3556365966796875, 0.390167236328125, 0.4246978759765625, 0.459228515625, 0.4937591552734375, 0.528289794921875, 0.5628204345703125, 0.59735107421875, 0.6318817138671875, 0.666412353515625, 0.7009429931640625, 0.7354736328125, 0.7700042724609375, 0.804534912109375, 0.8390655517578125, 0.87359619140625, 0.9081268310546875, 0.942657470703125, 0.9771881103515625, 1.01171875]}, "gradients/encoder.encoder.layers.6.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 1.0, 0.0, 4.0, 1.0, 3.0, 3.0, 3.0, 3.0, 7.0, 10.0, 14.0, 20.0, 26.0, 38.0, 56.0, 113.0, 162.0, 279.0, 449.0, 862.0, 2059.0, 6372.0, 24384.0, 125797.0, 616035.0, 218109.0, 39168.0, 9240.0, 2837.0, 1158.0, 556.0, 271.0, 179.0, 121.0, 66.0, 44.0, 38.0, 16.0, 20.0, 13.0, 7.0, 9.0, 6.0, 3.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.62890625, -3.4976806640625, -3.366455078125, -3.2352294921875, -3.10400390625, -2.9727783203125, -2.841552734375, -2.7103271484375, -2.5791015625, -2.4478759765625, -2.316650390625, -2.1854248046875, -2.05419921875, -1.9229736328125, -1.791748046875, -1.6605224609375, -1.529296875, -1.3980712890625, -1.266845703125, -1.1356201171875, -1.00439453125, -0.8731689453125, -0.741943359375, -0.6107177734375, -0.4794921875, -0.3482666015625, -0.217041015625, -0.0858154296875, 0.04541015625, 0.1766357421875, 0.307861328125, 0.4390869140625, 0.5703125, 0.7015380859375, 0.832763671875, 0.9639892578125, 1.09521484375, 1.2264404296875, 1.357666015625, 1.4888916015625, 1.6201171875, 1.7513427734375, 1.882568359375, 2.0137939453125, 2.14501953125, 2.2762451171875, 2.407470703125, 2.5386962890625, 2.669921875, 2.8011474609375, 2.932373046875, 3.0635986328125, 3.19482421875, 3.3260498046875, 3.457275390625, 3.5885009765625, 3.7197265625, 3.8509521484375, 3.982177734375, 4.1134033203125, 4.24462890625, 4.3758544921875, 4.507080078125, 4.6383056640625, 4.76953125]}, "gradients/encoder.encoder.layers.6.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 1.0, 1.0, 2.0, 4.0, 5.0, 0.0, 6.0, 4.0, 9.0, 10.0, 12.0, 12.0, 14.0, 18.0, 22.0, 23.0, 34.0, 27.0, 32.0, 37.0, 40.0, 39.0, 46.0, 59.0, 34.0, 51.0, 46.0, 36.0, 45.0, 41.0, 37.0, 35.0, 29.0, 20.0, 21.0, 24.0, 26.0, 18.0, 22.0, 15.0, 22.0, 7.0, 4.0, 4.0, 4.0, 4.0, 3.0, 6.0, 2.0, 1.0, 0.0, 4.0], "bins": [-5.30078125, -5.158599853515625, -5.01641845703125, -4.874237060546875, -4.7320556640625, -4.589874267578125, -4.44769287109375, -4.305511474609375, -4.163330078125, -4.021148681640625, -3.87896728515625, -3.736785888671875, -3.5946044921875, -3.452423095703125, -3.31024169921875, -3.168060302734375, -3.02587890625, -2.883697509765625, -2.74151611328125, -2.599334716796875, -2.4571533203125, -2.314971923828125, -2.17279052734375, -2.030609130859375, -1.888427734375, -1.746246337890625, -1.60406494140625, -1.461883544921875, -1.3197021484375, -1.177520751953125, -1.03533935546875, -0.893157958984375, -0.7509765625, -0.608795166015625, -0.46661376953125, -0.324432373046875, -0.1822509765625, -0.040069580078125, 0.10211181640625, 0.244293212890625, 0.386474609375, 0.528656005859375, 0.67083740234375, 0.813018798828125, 0.9552001953125, 1.097381591796875, 1.23956298828125, 1.381744384765625, 1.52392578125, 1.666107177734375, 1.80828857421875, 1.950469970703125, 2.0926513671875, 2.234832763671875, 2.37701416015625, 2.519195556640625, 2.661376953125, 2.803558349609375, 2.94573974609375, 3.087921142578125, 3.2301025390625, 3.372283935546875, 3.51446533203125, 3.656646728515625, 3.798828125]}, "gradients/encoder.encoder.layers.6.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 1.0, 1.0, 4.0, 4.0, 8.0, 10.0, 6.0, 12.0, 20.0, 15.0, 25.0, 39.0, 70.0, 120.0, 206.0, 366.0, 927.0, 2237.0, 8783.0, 52906.0, 529328.0, 397451.0, 44564.0, 7574.0, 2140.0, 812.0, 404.0, 189.0, 114.0, 75.0, 36.0, 24.0, 29.0, 20.0, 11.0, 12.0, 7.0, 2.0, 2.0, 1.0, 0.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.912109375, -1.855804443359375, -1.79949951171875, -1.743194580078125, -1.6868896484375, -1.630584716796875, -1.57427978515625, -1.517974853515625, -1.461669921875, -1.405364990234375, -1.34906005859375, -1.292755126953125, -1.2364501953125, -1.180145263671875, -1.12384033203125, -1.067535400390625, -1.01123046875, -0.954925537109375, -0.89862060546875, -0.842315673828125, -0.7860107421875, -0.729705810546875, -0.67340087890625, -0.617095947265625, -0.560791015625, -0.504486083984375, -0.44818115234375, -0.391876220703125, -0.3355712890625, -0.279266357421875, -0.22296142578125, -0.166656494140625, -0.1103515625, -0.054046630859375, 0.00225830078125, 0.058563232421875, 0.1148681640625, 0.171173095703125, 0.22747802734375, 0.283782958984375, 0.340087890625, 0.396392822265625, 0.45269775390625, 0.509002685546875, 0.5653076171875, 0.621612548828125, 0.67791748046875, 0.734222412109375, 0.79052734375, 0.846832275390625, 0.90313720703125, 0.959442138671875, 1.0157470703125, 1.072052001953125, 1.12835693359375, 1.184661865234375, 1.240966796875, 1.297271728515625, 1.35357666015625, 1.409881591796875, 1.4661865234375, 1.522491455078125, 1.57879638671875, 1.635101318359375, 1.69140625]}, "gradients/encoder.encoder.layers.6.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 5.0, 13.0, 9.0, 23.0, 44.0, 69.0, 102.0, 174.0, 179.0, 155.0, 92.0, 51.0, 33.0, 23.0, 22.0, 7.0, 9.0, 0.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0007905960083007812, -0.0007714889943599701, -0.0007523819804191589, -0.0007332749664783478, -0.0007141679525375366, -0.0006950609385967255, -0.0006759539246559143, -0.0006568469107151031, -0.000637739896774292, -0.0006186328828334808, -0.0005995258688926697, -0.0005804188549518585, -0.0005613118410110474, -0.0005422048270702362, -0.000523097813129425, -0.0005039907991886139, -0.00048488378524780273, -0.0004657767713069916, -0.0004466697573661804, -0.00042756274342536926, -0.0004084557294845581, -0.00038934871554374695, -0.0003702417016029358, -0.00035113468766212463, -0.0003320276737213135, -0.0003129206597805023, -0.00029381364583969116, -0.00027470663189888, -0.00025559961795806885, -0.0002364926040172577, -0.00021738559007644653, -0.00019827857613563538, -0.00017917156219482422, -0.00016006454825401306, -0.0001409575343132019, -0.00012185052037239075, -0.00010274350643157959, -8.363649249076843e-05, -6.452947854995728e-05, -4.542246460914612e-05, -2.631545066833496e-05, -7.208436727523804e-06, 1.1898577213287354e-05, 3.100559115409851e-05, 5.011260509490967e-05, 6.921961903572083e-05, 8.832663297653198e-05, 0.00010743364691734314, 0.0001265406608581543, 0.00014564767479896545, 0.0001647546887397766, 0.00018386170268058777, 0.00020296871662139893, 0.00022207573056221008, 0.00024118274450302124, 0.0002602897584438324, 0.00027939677238464355, 0.0002985037863254547, 0.00031761080026626587, 0.000336717814207077, 0.0003558248281478882, 0.00037493184208869934, 0.0003940388560295105, 0.00041314586997032166, 0.0004322528839111328]}, "gradients/encoder.encoder.layers.6.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 2.0, 0.0, 2.0, 2.0, 1.0, 5.0, 4.0, 5.0, 7.0, 8.0, 18.0, 25.0, 36.0, 42.0, 85.0, 163.0, 309.0, 715.0, 1714.0, 5921.0, 37976.0, 432244.0, 518644.0, 41041.0, 6393.0, 1777.0, 687.0, 335.0, 169.0, 87.0, 61.0, 37.0, 12.0, 14.0, 7.0, 5.0, 6.0, 2.0, 4.0, 1.0, 2.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.21875, -2.1571502685546875, -2.095550537109375, -2.0339508056640625, -1.97235107421875, -1.9107513427734375, -1.849151611328125, -1.7875518798828125, -1.7259521484375, -1.6643524169921875, -1.602752685546875, -1.5411529541015625, -1.47955322265625, -1.4179534912109375, -1.356353759765625, -1.2947540283203125, -1.233154296875, -1.1715545654296875, -1.109954833984375, -1.0483551025390625, -0.98675537109375, -0.9251556396484375, -0.863555908203125, -0.8019561767578125, -0.7403564453125, -0.6787567138671875, -0.617156982421875, -0.5555572509765625, -0.49395751953125, -0.4323577880859375, -0.370758056640625, -0.3091583251953125, -0.24755859375, -0.1859588623046875, -0.124359130859375, -0.0627593994140625, -0.00115966796875, 0.0604400634765625, 0.122039794921875, 0.1836395263671875, 0.2452392578125, 0.3068389892578125, 0.368438720703125, 0.4300384521484375, 0.49163818359375, 0.5532379150390625, 0.614837646484375, 0.6764373779296875, 0.738037109375, 0.7996368408203125, 0.861236572265625, 0.9228363037109375, 0.98443603515625, 1.0460357666015625, 1.107635498046875, 1.1692352294921875, 1.2308349609375, 1.2924346923828125, 1.354034423828125, 1.4156341552734375, 1.47723388671875, 1.5388336181640625, 1.600433349609375, 1.6620330810546875, 1.7236328125]}, "gradients/encoder.encoder.layers.6.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 6.0, 3.0, 5.0, 2.0, 9.0, 7.0, 8.0, 17.0, 14.0, 27.0, 41.0, 56.0, 58.0, 80.0, 91.0, 111.0, 95.0, 97.0, 64.0, 59.0, 46.0, 34.0, 27.0, 13.0, 11.0, 12.0, 11.0, 2.0, 2.0, 2.0, 5.0, 3.0, 1.0, 1.0, 1.0], "bins": [-2.64453125, -2.585540771484375, -2.52655029296875, -2.467559814453125, -2.4085693359375, -2.349578857421875, -2.29058837890625, -2.231597900390625, -2.172607421875, -2.113616943359375, -2.05462646484375, -1.995635986328125, -1.9366455078125, -1.877655029296875, -1.81866455078125, -1.759674072265625, -1.70068359375, -1.641693115234375, -1.58270263671875, -1.523712158203125, -1.4647216796875, -1.405731201171875, -1.34674072265625, -1.287750244140625, -1.228759765625, -1.169769287109375, -1.11077880859375, -1.051788330078125, -0.9927978515625, -0.933807373046875, -0.87481689453125, -0.815826416015625, -0.7568359375, -0.697845458984375, -0.63885498046875, -0.579864501953125, -0.5208740234375, -0.461883544921875, -0.40289306640625, -0.343902587890625, -0.284912109375, -0.225921630859375, -0.16693115234375, -0.107940673828125, -0.0489501953125, 0.010040283203125, 0.06903076171875, 0.128021240234375, 0.18701171875, 0.246002197265625, 0.30499267578125, 0.363983154296875, 0.4229736328125, 0.481964111328125, 0.54095458984375, 0.599945068359375, 0.658935546875, 0.717926025390625, 0.77691650390625, 0.835906982421875, 0.8948974609375, 0.953887939453125, 1.01287841796875, 1.071868896484375, 1.130859375]}, "gradients/encoder.encoder.layers.6.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 3.0, 2.0, 3.0, 2.0, 1.0, 2.0, 6.0, 5.0, 13.0, 15.0, 41.0, 70.0, 125.0, 194.0, 214.0, 131.0, 96.0, 45.0, 20.0, 10.0, 6.0, 4.0, 2.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0], "bins": [-41.853790283203125, -40.68950653076172, -39.52522277832031, -38.360939025878906, -37.1966552734375, -36.03237533569336, -34.86809158325195, -33.70380783081055, -32.53952407836914, -31.375240325927734, -30.210956573486328, -29.046674728393555, -27.88239097595215, -26.718107223510742, -25.55382537841797, -24.389541625976562, -23.225257873535156, -22.06097412109375, -20.896690368652344, -19.73240852355957, -18.568124771118164, -17.403841018676758, -16.239559173583984, -15.075275421142578, -13.910991668701172, -12.746707916259766, -11.582425117492676, -10.418142318725586, -9.25385856628418, -8.089574813842773, -6.925292015075684, -5.761009216308594, -4.5967254638671875, -3.4324421882629395, -2.2681589126586914, -1.1038756370544434, 0.06040763854980469, 1.2246909141540527, 2.388974189758301, 3.5532569885253906, 4.717540740966797, 5.881824016571045, 7.046107292175293, 8.210390090942383, 9.374673843383789, 10.538957595825195, 11.703240394592285, 12.867523193359375, 14.031806945800781, 15.196090698242188, 16.360374450683594, 17.524656295776367, 18.688940048217773, 19.85322380065918, 21.017505645751953, 22.18178939819336, 23.346073150634766, 24.510356903076172, 25.674640655517578, 26.83892250061035, 28.003206253051758, 29.167490005493164, 30.331771850585938, 31.496055603027344, 32.66033935546875]}, "gradients/encoder.encoder.layers.6.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 5.0, 1.0, 1.0, 3.0, 4.0, 6.0, 7.0, 11.0, 16.0, 19.0, 12.0, 21.0, 24.0, 31.0, 35.0, 38.0, 26.0, 30.0, 38.0, 46.0, 47.0, 64.0, 67.0, 59.0, 56.0, 42.0, 45.0, 42.0, 36.0, 29.0, 20.0, 23.0, 25.0, 16.0, 18.0, 7.0, 8.0, 9.0, 6.0, 11.0, 2.0, 4.0, 1.0, 0.0, 4.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-19.22872543334961, -18.54726791381836, -17.86581039428711, -17.18435287475586, -16.50289535522461, -15.821436882019043, -15.139978408813477, -14.458520889282227, -13.777063369750977, -13.095605850219727, -12.414148330688477, -11.73268985748291, -11.05123233795166, -10.36977481842041, -9.688316345214844, -9.006858825683594, -8.325401306152344, -7.643943786621094, -6.9624857902526855, -6.281027793884277, -5.599570274353027, -4.918112754821777, -4.236654758453369, -3.555196762084961, -2.873739242553711, -2.192281484603882, -1.5108237266540527, -0.8293659687042236, -0.14790821075439453, 0.5335495471954346, 1.2150073051452637, 1.8964653015136719, 2.577922821044922, 3.259380578994751, 3.94083833694458, 4.622296333312988, 5.303753852844238, 5.985211372375488, 6.6666693687438965, 7.348127365112305, 8.029584884643555, 8.711042404174805, 9.392499923706055, 10.073958396911621, 10.755415916442871, 11.436873435974121, 12.118331909179688, 12.799789428710938, 13.481246948242188, 14.162704467773438, 14.844161987304688, 15.525620460510254, 16.207077026367188, 16.88853645324707, 17.56999397277832, 18.25145149230957, 18.93290901184082, 19.61436653137207, 20.29582405090332, 20.97728157043457, 21.658740997314453, 22.340198516845703, 23.021656036376953, 23.703113555908203, 24.384571075439453]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 2.0, 5.0, 6.0, 2.0, 10.0, 14.0, 25.0, 53.0, 86.0, 142.0, 266.0, 545.0, 1404.0, 4145.0, 16270.0, 90470.0, 1323966.0, 2554673.0, 169335.0, 24605.0, 5583.0, 1614.0, 588.0, 238.0, 124.0, 43.0, 34.0, 11.0, 8.0, 9.0, 7.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 1.0, 0.0, 1.0], "bins": [-3.48828125, -3.4034881591796875, -3.318695068359375, -3.2339019775390625, -3.14910888671875, -3.0643157958984375, -2.979522705078125, -2.8947296142578125, -2.8099365234375, -2.7251434326171875, -2.640350341796875, -2.5555572509765625, -2.47076416015625, -2.3859710693359375, -2.301177978515625, -2.2163848876953125, -2.131591796875, -2.0467987060546875, -1.962005615234375, -1.8772125244140625, -1.79241943359375, -1.7076263427734375, -1.622833251953125, -1.5380401611328125, -1.4532470703125, -1.3684539794921875, -1.283660888671875, -1.1988677978515625, -1.11407470703125, -1.0292816162109375, -0.944488525390625, -0.8596954345703125, -0.77490234375, -0.6901092529296875, -0.605316162109375, -0.5205230712890625, -0.43572998046875, -0.3509368896484375, -0.266143798828125, -0.1813507080078125, -0.0965576171875, -0.0117645263671875, 0.073028564453125, 0.1578216552734375, 0.24261474609375, 0.3274078369140625, 0.412200927734375, 0.4969940185546875, 0.581787109375, 0.6665802001953125, 0.751373291015625, 0.8361663818359375, 0.92095947265625, 1.0057525634765625, 1.090545654296875, 1.1753387451171875, 1.2601318359375, 1.3449249267578125, 1.429718017578125, 1.5145111083984375, 1.59930419921875, 1.6840972900390625, 1.768890380859375, 1.8536834716796875, 1.9384765625]}, "gradients/encoder.encoder.layers.5.feed_forward.output_dense.bias": {"_type": "histogram", "values": [4.0, 2.0, 1.0, 4.0, 9.0, 6.0, 10.0, 6.0, 14.0, 19.0, 22.0, 23.0, 39.0, 57.0, 43.0, 68.0, 69.0, 68.0, 73.0, 67.0, 66.0, 59.0, 47.0, 54.0, 36.0, 39.0, 23.0, 19.0, 18.0, 21.0, 10.0, 13.0, 3.0, 4.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.92724609375, -0.8779678344726562, -0.8286895751953125, -0.7794113159179688, -0.730133056640625, -0.6808547973632812, -0.6315765380859375, -0.5822982788085938, -0.53302001953125, -0.48374176025390625, -0.4344635009765625, -0.38518524169921875, -0.335906982421875, -0.28662872314453125, -0.2373504638671875, -0.18807220458984375, -0.1387939453125, -0.08951568603515625, -0.0402374267578125, 0.00904083251953125, 0.058319091796875, 0.10759735107421875, 0.1568756103515625, 0.20615386962890625, 0.25543212890625, 0.30471038818359375, 0.3539886474609375, 0.40326690673828125, 0.452545166015625, 0.5018234252929688, 0.5511016845703125, 0.6003799438476562, 0.649658203125, 0.6989364624023438, 0.7482147216796875, 0.7974929809570312, 0.846771240234375, 0.8960494995117188, 0.9453277587890625, 0.9946060180664062, 1.04388427734375, 1.0931625366210938, 1.1424407958984375, 1.1917190551757812, 1.240997314453125, 1.2902755737304688, 1.3395538330078125, 1.3888320922851562, 1.4381103515625, 1.4873886108398438, 1.5366668701171875, 1.5859451293945312, 1.635223388671875, 1.6845016479492188, 1.7337799072265625, 1.7830581665039062, 1.83233642578125, 1.8816146850585938, 1.9308929443359375, 1.9801712036132812, 2.029449462890625, 2.0787277221679688, 2.1280059814453125, 2.1772842407226562, 2.2265625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 5.0, 1.0, 2.0, 2.0, 6.0, 6.0, 14.0, 17.0, 26.0, 44.0, 62.0, 83.0, 150.0, 249.0, 499.0, 1297.0, 3920.0, 14644.0, 77187.0, 846200.0, 2991212.0, 218272.0, 30198.0, 6432.0, 2071.0, 808.0, 411.0, 172.0, 104.0, 66.0, 40.0, 25.0, 19.0, 14.0, 11.0, 7.0, 4.0, 6.0, 1.0, 2.0, 2.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.845703125, -2.744964599609375, -2.64422607421875, -2.543487548828125, -2.4427490234375, -2.342010498046875, -2.24127197265625, -2.140533447265625, -2.039794921875, -1.939056396484375, -1.83831787109375, -1.737579345703125, -1.6368408203125, -1.536102294921875, -1.43536376953125, -1.334625244140625, -1.23388671875, -1.133148193359375, -1.03240966796875, -0.931671142578125, -0.8309326171875, -0.730194091796875, -0.62945556640625, -0.528717041015625, -0.427978515625, -0.327239990234375, -0.22650146484375, -0.125762939453125, -0.0250244140625, 0.075714111328125, 0.17645263671875, 0.277191162109375, 0.3779296875, 0.478668212890625, 0.57940673828125, 0.680145263671875, 0.7808837890625, 0.881622314453125, 0.98236083984375, 1.083099365234375, 1.183837890625, 1.284576416015625, 1.38531494140625, 1.486053466796875, 1.5867919921875, 1.687530517578125, 1.78826904296875, 1.889007568359375, 1.98974609375, 2.090484619140625, 2.19122314453125, 2.291961669921875, 2.3927001953125, 2.493438720703125, 2.59417724609375, 2.694915771484375, 2.795654296875, 2.896392822265625, 2.99713134765625, 3.097869873046875, 3.1986083984375, 3.299346923828125, 3.40008544921875, 3.500823974609375, 3.6015625]}, "gradients/encoder.encoder.layers.5.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 8.0, 2.0, 4.0, 7.0, 5.0, 8.0, 17.0, 26.0, 12.0, 29.0, 36.0, 53.0, 74.0, 123.0, 164.0, 211.0, 351.0, 565.0, 647.0, 561.0, 364.0, 252.0, 168.0, 101.0, 83.0, 63.0, 44.0, 29.0, 19.0, 20.0, 8.0, 8.0, 6.0, 5.0, 1.0, 2.0, 3.0, 1.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.015625, -2.920166015625, -2.82470703125, -2.729248046875, -2.6337890625, -2.538330078125, -2.44287109375, -2.347412109375, -2.251953125, -2.156494140625, -2.06103515625, -1.965576171875, -1.8701171875, -1.774658203125, -1.67919921875, -1.583740234375, -1.48828125, -1.392822265625, -1.29736328125, -1.201904296875, -1.1064453125, -1.010986328125, -0.91552734375, -0.820068359375, -0.724609375, -0.629150390625, -0.53369140625, -0.438232421875, -0.3427734375, -0.247314453125, -0.15185546875, -0.056396484375, 0.0390625, 0.134521484375, 0.22998046875, 0.325439453125, 0.4208984375, 0.516357421875, 0.61181640625, 0.707275390625, 0.802734375, 0.898193359375, 0.99365234375, 1.089111328125, 1.1845703125, 1.280029296875, 1.37548828125, 1.470947265625, 1.56640625, 1.661865234375, 1.75732421875, 1.852783203125, 1.9482421875, 2.043701171875, 2.13916015625, 2.234619140625, 2.330078125, 2.425537109375, 2.52099609375, 2.616455078125, 2.7119140625, 2.807373046875, 2.90283203125, 2.998291015625, 3.09375]}, "gradients/encoder.encoder.layers.5.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 1.0, 1.0, 4.0, 21.0, 57.0, 178.0, 333.0, 264.0, 96.0, 31.0, 8.0, 3.0, 2.0, 2.0, 2.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-76.65087890625, -74.4437484741211, -72.23661804199219, -70.02947998046875, -67.82234954833984, -65.61521911621094, -63.408084869384766, -61.200950622558594, -58.99382019042969, -56.78668975830078, -54.57955551147461, -52.37242126464844, -50.16529083251953, -47.958160400390625, -45.75102615356445, -43.54389190673828, -41.336761474609375, -39.12963104248047, -36.9224967956543, -34.715362548828125, -32.50823211669922, -30.30109977722168, -28.09396743774414, -25.8868350982666, -23.679702758789062, -21.472570419311523, -19.265438079833984, -17.058305740356445, -14.851173400878906, -12.644041061401367, -10.436908721923828, -8.229776382446289, -6.02264404296875, -3.815511703491211, -1.6083793640136719, 0.5987529754638672, 2.8058853149414062, 5.013017654418945, 7.220149993896484, 9.427282333374023, 11.634414672851562, 13.841547012329102, 16.04867935180664, 18.25581169128418, 20.46294403076172, 22.670076370239258, 24.877208709716797, 27.084341049194336, 29.291473388671875, 31.498605728149414, 33.70573806762695, 35.912872314453125, 38.12000274658203, 40.32713317871094, 42.53426742553711, 44.74140167236328, 46.94853210449219, 49.155662536621094, 51.362796783447266, 53.56993103027344, 55.777061462402344, 57.98419189453125, 60.19132614135742, 62.398460388183594, 64.6055908203125]}, "gradients/encoder.encoder.layers.5.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 4.0, 2.0, 3.0, 1.0, 5.0, 7.0, 12.0, 7.0, 14.0, 16.0, 19.0, 30.0, 30.0, 27.0, 53.0, 42.0, 40.0, 50.0, 67.0, 53.0, 49.0, 54.0, 54.0, 56.0, 53.0, 41.0, 44.0, 28.0, 31.0, 25.0, 28.0, 16.0, 13.0, 10.0, 6.0, 6.0, 2.0, 3.0, 7.0, 2.0, 1.0, 2.0, 0.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-18.493680953979492, -17.888896942138672, -17.28411102294922, -16.6793270111084, -16.074541091918945, -15.469757080078125, -14.864972114562988, -14.260187149047852, -13.655402183532715, -13.050617218017578, -12.445832252502441, -11.841047286987305, -11.236263275146484, -10.631477355957031, -10.026693344116211, -9.421908378601074, -8.817123413085938, -8.2123384475708, -7.607553482055664, -7.0027689933776855, -6.397984027862549, -5.793199062347412, -5.188414573669434, -4.583629608154297, -3.97884464263916, -3.3740596771240234, -2.769274950027466, -2.164490222930908, -1.5597052574157715, -0.9549202919006348, -0.35013556480407715, 0.25464916229248047, 0.8594341278076172, 1.4642189741134644, 2.0690038204193115, 2.673788547515869, 3.278573513031006, 3.8833584785461426, 4.488142967224121, 5.092927932739258, 5.6977128982543945, 6.302497863769531, 6.907282829284668, 7.5120673179626465, 8.116851806640625, 8.721637725830078, 9.326421737670898, 9.931206703186035, 10.535991668701172, 11.140776634216309, 11.745561599731445, 12.350346565246582, 12.955131530761719, 13.559915542602539, 14.164700508117676, 14.769485473632812, 15.37427043914795, 15.979055404663086, 16.583839416503906, 17.18862533569336, 17.79340934753418, 18.398195266723633, 19.002979278564453, 19.607765197753906, 20.212549209594727]}, "gradients/encoder.encoder.layers.5.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 4.0, 4.0, 2.0, 4.0, 7.0, 13.0, 21.0, 21.0, 41.0, 55.0, 87.0, 126.0, 239.0, 340.0, 606.0, 1082.0, 1982.0, 3594.0, 6767.0, 12679.0, 24397.0, 45660.0, 84910.0, 151093.0, 223879.0, 207943.0, 129722.0, 71705.0, 38187.0, 20273.0, 10582.0, 5549.0, 3018.0, 1667.0, 929.0, 535.0, 322.0, 186.0, 125.0, 81.0, 42.0, 28.0, 18.0, 9.0, 7.0, 9.0, 9.0, 3.0, 1.0, 4.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.4130859375, -1.3672943115234375, -1.321502685546875, -1.2757110595703125, -1.22991943359375, -1.1841278076171875, -1.138336181640625, -1.0925445556640625, -1.0467529296875, -1.0009613037109375, -0.955169677734375, -0.9093780517578125, -0.86358642578125, -0.8177947998046875, -0.772003173828125, -0.7262115478515625, -0.680419921875, -0.6346282958984375, -0.588836669921875, -0.5430450439453125, -0.49725341796875, -0.4514617919921875, -0.405670166015625, -0.3598785400390625, -0.3140869140625, -0.2682952880859375, -0.222503662109375, -0.1767120361328125, -0.13092041015625, -0.0851287841796875, -0.039337158203125, 0.0064544677734375, 0.05224609375, 0.0980377197265625, 0.143829345703125, 0.1896209716796875, 0.23541259765625, 0.2812042236328125, 0.326995849609375, 0.3727874755859375, 0.4185791015625, 0.4643707275390625, 0.510162353515625, 0.5559539794921875, 0.60174560546875, 0.6475372314453125, 0.693328857421875, 0.7391204833984375, 0.784912109375, 0.8307037353515625, 0.876495361328125, 0.9222869873046875, 0.96807861328125, 1.0138702392578125, 1.059661865234375, 1.1054534912109375, 1.1512451171875, 1.1970367431640625, 1.242828369140625, 1.2886199951171875, 1.33441162109375, 1.3802032470703125, 1.425994873046875, 1.4717864990234375, 1.517578125]}, "gradients/encoder.encoder.layers.5.attention.out_proj.bias": {"_type": "histogram", "values": [3.0, 1.0, 2.0, 2.0, 2.0, 7.0, 4.0, 3.0, 4.0, 6.0, 6.0, 3.0, 7.0, 11.0, 14.0, 17.0, 19.0, 20.0, 18.0, 12.0, 21.0, 32.0, 22.0, 33.0, 42.0, 42.0, 42.0, 36.0, 27.0, 35.0, 48.0, 47.0, 50.0, 38.0, 40.0, 32.0, 31.0, 34.0, 15.0, 20.0, 20.0, 21.0, 17.0, 19.0, 18.0, 12.0, 10.0, 12.0, 14.0, 4.0, 5.0, 5.0, 4.0, 5.0, 1.0, 4.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-0.875, -0.8459091186523438, -0.8168182373046875, -0.7877273559570312, -0.758636474609375, -0.7295455932617188, -0.7004547119140625, -0.6713638305664062, -0.64227294921875, -0.6131820678710938, -0.5840911865234375, -0.5550003051757812, -0.525909423828125, -0.49681854248046875, -0.4677276611328125, -0.43863677978515625, -0.4095458984375, -0.38045501708984375, -0.3513641357421875, -0.32227325439453125, -0.293182373046875, -0.26409149169921875, -0.2350006103515625, -0.20590972900390625, -0.17681884765625, -0.14772796630859375, -0.1186370849609375, -0.08954620361328125, -0.060455322265625, -0.03136444091796875, -0.0022735595703125, 0.02681732177734375, 0.055908203125, 0.08499908447265625, 0.1140899658203125, 0.14318084716796875, 0.172271728515625, 0.20136260986328125, 0.2304534912109375, 0.25954437255859375, 0.28863525390625, 0.31772613525390625, 0.3468170166015625, 0.37590789794921875, 0.404998779296875, 0.43408966064453125, 0.4631805419921875, 0.49227142333984375, 0.5213623046875, 0.5504531860351562, 0.5795440673828125, 0.6086349487304688, 0.637725830078125, 0.6668167114257812, 0.6959075927734375, 0.7249984741210938, 0.75408935546875, 0.7831802368164062, 0.8122711181640625, 0.8413619995117188, 0.870452880859375, 0.8995437622070312, 0.9286346435546875, 0.9577255249023438, 0.98681640625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 4.0, 1.0, 5.0, 6.0, 11.0, 25.0, 16.0, 29.0, 38.0, 41.0, 52.0, 69.0, 110.0, 141.0, 168.0, 280.0, 395.0, 586.0, 912.0, 1721.0, 3575.0, 9593.0, 34332.0, 155049.0, 580522.0, 197142.0, 43147.0, 11397.0, 4111.0, 1935.0, 1004.0, 696.0, 423.0, 288.0, 207.0, 130.0, 118.0, 66.0, 55.0, 47.0, 31.0, 21.0, 14.0, 12.0, 18.0, 5.0, 4.0, 6.0, 2.0, 1.0, 5.0, 0.0, 3.0], "bins": [-3.552734375, -3.452880859375, -3.35302734375, -3.253173828125, -3.1533203125, -3.053466796875, -2.95361328125, -2.853759765625, -2.75390625, -2.654052734375, -2.55419921875, -2.454345703125, -2.3544921875, -2.254638671875, -2.15478515625, -2.054931640625, -1.955078125, -1.855224609375, -1.75537109375, -1.655517578125, -1.5556640625, -1.455810546875, -1.35595703125, -1.256103515625, -1.15625, -1.056396484375, -0.95654296875, -0.856689453125, -0.7568359375, -0.656982421875, -0.55712890625, -0.457275390625, -0.357421875, -0.257568359375, -0.15771484375, -0.057861328125, 0.0419921875, 0.141845703125, 0.24169921875, 0.341552734375, 0.44140625, 0.541259765625, 0.64111328125, 0.740966796875, 0.8408203125, 0.940673828125, 1.04052734375, 1.140380859375, 1.240234375, 1.340087890625, 1.43994140625, 1.539794921875, 1.6396484375, 1.739501953125, 1.83935546875, 1.939208984375, 2.0390625, 2.138916015625, 2.23876953125, 2.338623046875, 2.4384765625, 2.538330078125, 2.63818359375, 2.738037109375, 2.837890625]}, "gradients/encoder.encoder.layers.5.attention.v_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 3.0, 3.0, 6.0, 8.0, 6.0, 5.0, 10.0, 13.0, 9.0, 18.0, 17.0, 22.0, 28.0, 31.0, 33.0, 40.0, 25.0, 37.0, 31.0, 42.0, 38.0, 52.0, 42.0, 48.0, 54.0, 36.0, 39.0, 39.0, 25.0, 34.0, 24.0, 26.0, 31.0, 22.0, 16.0, 15.0, 9.0, 11.0, 11.0, 6.0, 8.0, 8.0, 4.0, 0.0, 9.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0, 2.0, 1.0, 0.0, 2.0], "bins": [-4.25, -4.11419677734375, -3.9783935546875, -3.84259033203125, -3.706787109375, -3.57098388671875, -3.4351806640625, -3.29937744140625, -3.16357421875, -3.02777099609375, -2.8919677734375, -2.75616455078125, -2.620361328125, -2.48455810546875, -2.3487548828125, -2.21295166015625, -2.0771484375, -1.94134521484375, -1.8055419921875, -1.66973876953125, -1.533935546875, -1.39813232421875, -1.2623291015625, -1.12652587890625, -0.99072265625, -0.85491943359375, -0.7191162109375, -0.58331298828125, -0.447509765625, -0.31170654296875, -0.1759033203125, -0.04010009765625, 0.095703125, 0.23150634765625, 0.3673095703125, 0.50311279296875, 0.638916015625, 0.77471923828125, 0.9105224609375, 1.04632568359375, 1.18212890625, 1.31793212890625, 1.4537353515625, 1.58953857421875, 1.725341796875, 1.86114501953125, 1.9969482421875, 2.13275146484375, 2.2685546875, 2.40435791015625, 2.5401611328125, 2.67596435546875, 2.811767578125, 2.94757080078125, 3.0833740234375, 3.21917724609375, 3.35498046875, 3.49078369140625, 3.6265869140625, 3.76239013671875, 3.898193359375, 4.03399658203125, 4.1697998046875, 4.30560302734375, 4.44140625]}, "gradients/encoder.encoder.layers.5.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 1.0, 3.0, 3.0, 6.0, 4.0, 9.0, 11.0, 17.0, 30.0, 38.0, 73.0, 93.0, 180.0, 369.0, 795.0, 2339.0, 8724.0, 51206.0, 562141.0, 368880.0, 42391.0, 7613.0, 2088.0, 740.0, 352.0, 184.0, 82.0, 81.0, 31.0, 23.0, 19.0, 8.0, 11.0, 3.0, 7.0, 3.0, 4.0, 3.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.625, -1.582183837890625, -1.53936767578125, -1.496551513671875, -1.4537353515625, -1.410919189453125, -1.36810302734375, -1.325286865234375, -1.282470703125, -1.239654541015625, -1.19683837890625, -1.154022216796875, -1.1112060546875, -1.068389892578125, -1.02557373046875, -0.982757568359375, -0.93994140625, -0.897125244140625, -0.85430908203125, -0.811492919921875, -0.7686767578125, -0.725860595703125, -0.68304443359375, -0.640228271484375, -0.597412109375, -0.554595947265625, -0.51177978515625, -0.468963623046875, -0.4261474609375, -0.383331298828125, -0.34051513671875, -0.297698974609375, -0.2548828125, -0.212066650390625, -0.16925048828125, -0.126434326171875, -0.0836181640625, -0.040802001953125, 0.00201416015625, 0.044830322265625, 0.087646484375, 0.130462646484375, 0.17327880859375, 0.216094970703125, 0.2589111328125, 0.301727294921875, 0.34454345703125, 0.387359619140625, 0.43017578125, 0.472991943359375, 0.51580810546875, 0.558624267578125, 0.6014404296875, 0.644256591796875, 0.68707275390625, 0.729888916015625, 0.772705078125, 0.815521240234375, 0.85833740234375, 0.901153564453125, 0.9439697265625, 0.986785888671875, 1.02960205078125, 1.072418212890625, 1.115234375]}, "gradients/encoder.encoder.layers.5.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 2.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 5.0, 6.0, 6.0, 8.0, 14.0, 9.0, 16.0, 13.0, 36.0, 33.0, 50.0, 52.0, 52.0, 68.0, 65.0, 77.0, 59.0, 72.0, 58.0, 54.0, 46.0, 32.0, 39.0, 24.0, 19.0, 20.0, 15.0, 10.0, 10.0, 5.0, 4.0, 5.0, 8.0, 5.0, 3.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0], "bins": [-0.0002455711364746094, -0.00023787468671798706, -0.00023017823696136475, -0.00022248178720474243, -0.00021478533744812012, -0.0002070888876914978, -0.0001993924379348755, -0.00019169598817825317, -0.00018399953842163086, -0.00017630308866500854, -0.00016860663890838623, -0.00016091018915176392, -0.0001532137393951416, -0.0001455172896385193, -0.00013782083988189697, -0.00013012439012527466, -0.00012242794036865234, -0.00011473149061203003, -0.00010703504085540771, -9.93385910987854e-05, -9.164214134216309e-05, -8.394569158554077e-05, -7.624924182891846e-05, -6.855279207229614e-05, -6.085634231567383e-05, -5.3159892559051514e-05, -4.54634428024292e-05, -3.7766993045806885e-05, -3.007054328918457e-05, -2.2374093532562256e-05, -1.4677643775939941e-05, -6.981194019317627e-06, 7.152557373046875e-07, 8.411705493927002e-06, 1.6108155250549316e-05, 2.380460500717163e-05, 3.1501054763793945e-05, 3.919750452041626e-05, 4.6893954277038574e-05, 5.459040403366089e-05, 6.22868537902832e-05, 6.998330354690552e-05, 7.767975330352783e-05, 8.537620306015015e-05, 9.307265281677246e-05, 0.00010076910257339478, 0.00010846555233001709, 0.0001161620020866394, 0.00012385845184326172, 0.00013155490159988403, 0.00013925135135650635, 0.00014694780111312866, 0.00015464425086975098, 0.0001623407006263733, 0.0001700371503829956, 0.00017773360013961792, 0.00018543004989624023, 0.00019312649965286255, 0.00020082294940948486, 0.00020851939916610718, 0.0002162158489227295, 0.0002239122986793518, 0.00023160874843597412, 0.00023930519819259644, 0.00024700164794921875]}, "gradients/encoder.encoder.layers.5.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 4.0, 5.0, 3.0, 6.0, 12.0, 10.0, 26.0, 23.0, 41.0, 91.0, 156.0, 293.0, 766.0, 2067.0, 9088.0, 89196.0, 800293.0, 130725.0, 11603.0, 2563.0, 821.0, 367.0, 196.0, 99.0, 41.0, 28.0, 19.0, 9.0, 4.0, 5.0, 6.0, 2.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.99267578125, -0.9419479370117188, -0.8912200927734375, -0.8404922485351562, -0.789764404296875, -0.7390365600585938, -0.6883087158203125, -0.6375808715820312, -0.58685302734375, -0.5361251831054688, -0.4853973388671875, -0.43466949462890625, -0.383941650390625, -0.33321380615234375, -0.2824859619140625, -0.23175811767578125, -0.1810302734375, -0.13030242919921875, -0.0795745849609375, -0.02884674072265625, 0.021881103515625, 0.07260894775390625, 0.1233367919921875, 0.17406463623046875, 0.22479248046875, 0.27552032470703125, 0.3262481689453125, 0.37697601318359375, 0.427703857421875, 0.47843170166015625, 0.5291595458984375, 0.5798873901367188, 0.630615234375, 0.6813430786132812, 0.7320709228515625, 0.7827987670898438, 0.833526611328125, 0.8842544555664062, 0.9349822998046875, 0.9857101440429688, 1.03643798828125, 1.0871658325195312, 1.1378936767578125, 1.1886215209960938, 1.239349365234375, 1.2900772094726562, 1.3408050537109375, 1.3915328979492188, 1.4422607421875, 1.4929885864257812, 1.5437164306640625, 1.5944442749023438, 1.645172119140625, 1.6958999633789062, 1.7466278076171875, 1.7973556518554688, 1.84808349609375, 1.8988113403320312, 1.9495391845703125, 2.0002670288085938, 2.050994873046875, 2.1017227172851562, 2.1524505615234375, 2.2031784057617188, 2.25390625]}, "gradients/encoder.encoder.layers.5.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 5.0, 3.0, 6.0, 9.0, 11.0, 12.0, 13.0, 10.0, 18.0, 27.0, 25.0, 35.0, 35.0, 55.0, 42.0, 52.0, 54.0, 57.0, 48.0, 55.0, 49.0, 64.0, 46.0, 45.0, 33.0, 32.0, 24.0, 28.0, 26.0, 23.0, 12.0, 9.0, 7.0, 8.0, 6.0, 4.0, 5.0, 5.0, 0.0, 2.0, 1.0, 3.0, 3.0, 0.0, 0.0, 2.0], "bins": [-1.0498046875, -1.0211944580078125, -0.992584228515625, -0.9639739990234375, -0.93536376953125, -0.9067535400390625, -0.878143310546875, -0.8495330810546875, -0.8209228515625, -0.7923126220703125, -0.763702392578125, -0.7350921630859375, -0.70648193359375, -0.6778717041015625, -0.649261474609375, -0.6206512451171875, -0.592041015625, -0.5634307861328125, -0.534820556640625, -0.5062103271484375, -0.47760009765625, -0.4489898681640625, -0.420379638671875, -0.3917694091796875, -0.3631591796875, -0.3345489501953125, -0.305938720703125, -0.2773284912109375, -0.24871826171875, -0.2201080322265625, -0.191497802734375, -0.1628875732421875, -0.13427734375, -0.1056671142578125, -0.077056884765625, -0.0484466552734375, -0.01983642578125, 0.0087738037109375, 0.037384033203125, 0.0659942626953125, 0.0946044921875, 0.1232147216796875, 0.151824951171875, 0.1804351806640625, 0.20904541015625, 0.2376556396484375, 0.266265869140625, 0.2948760986328125, 0.323486328125, 0.3520965576171875, 0.380706787109375, 0.4093170166015625, 0.43792724609375, 0.4665374755859375, 0.495147705078125, 0.5237579345703125, 0.5523681640625, 0.5809783935546875, 0.609588623046875, 0.6381988525390625, 0.66680908203125, 0.6954193115234375, 0.724029541015625, 0.7526397705078125, 0.78125]}, "gradients/encoder.encoder.layers.5.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 3.0, 3.0, 15.0, 57.0, 165.0, 323.0, 256.0, 125.0, 41.0, 9.0, 4.0, 3.0, 2.0, 1.0, 3.0, 0.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-62.32345199584961, -60.5822639465332, -58.84107208251953, -57.099884033203125, -55.35869598388672, -53.61750411987305, -51.87631607055664, -50.13512420654297, -48.39393615722656, -46.652748107910156, -44.911556243896484, -43.17036819458008, -41.429176330566406, -39.68798828125, -37.946800231933594, -36.20561218261719, -34.464420318603516, -32.72323226928711, -30.982040405273438, -29.24085235595703, -27.499662399291992, -25.758472442626953, -24.017284393310547, -22.276094436645508, -20.53490447998047, -18.79371452331543, -17.05252456665039, -15.311336517333984, -13.570146560668945, -11.828956604003906, -10.087767601013184, -8.346578598022461, -6.6053924560546875, -4.864202976226807, -3.123013496398926, -1.381824016571045, 0.35936546325683594, 2.100555419921875, 3.8417444229125977, 5.58293342590332, 7.324123382568359, 9.065313339233398, 10.806502342224121, 12.547691345214844, 14.288881301879883, 16.030071258544922, 17.771259307861328, 19.512449264526367, 21.253639221191406, 22.994829177856445, 24.736019134521484, 26.47720718383789, 28.21839714050293, 29.95958709716797, 31.700775146484375, 33.44196319580078, 35.18315505981445, 36.92434310913086, 38.66553497314453, 40.40672302246094, 42.147911071777344, 43.889102935791016, 45.63029098510742, 47.371482849121094, 49.1126708984375]}, "gradients/encoder.encoder.layers.5.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 3.0, 1.0, 3.0, 1.0, 5.0, 3.0, 3.0, 4.0, 6.0, 8.0, 11.0, 9.0, 15.0, 7.0, 13.0, 19.0, 15.0, 21.0, 30.0, 39.0, 15.0, 24.0, 32.0, 33.0, 38.0, 62.0, 57.0, 66.0, 54.0, 39.0, 41.0, 40.0, 32.0, 24.0, 37.0, 32.0, 26.0, 20.0, 19.0, 9.0, 17.0, 10.0, 13.0, 16.0, 12.0, 7.0, 5.0, 3.0, 3.0, 2.0, 3.0, 4.0, 2.0, 2.0, 1.0, 0.0, 4.0], "bins": [-18.59769630432129, -18.057756423950195, -17.5178165435791, -16.977876663208008, -16.437936782836914, -15.89799690246582, -15.35805606842041, -14.818116188049316, -14.278176307678223, -13.738236427307129, -13.198296546936035, -12.658356666564941, -12.118415832519531, -11.578475952148438, -11.038536071777344, -10.49859619140625, -9.958656311035156, -9.418716430664062, -8.878776550292969, -8.338836669921875, -7.798896312713623, -7.258956432342529, -6.719016075134277, -6.179076194763184, -5.63913631439209, -5.099196434020996, -4.559256553649902, -4.01931619644165, -3.4793763160705566, -2.939436435699463, -2.39949631690979, -1.8595561981201172, -1.3196144104003906, -0.7796744108200073, -0.23973441123962402, 0.3002055883407593, 0.8401455879211426, 1.3800854682922363, 1.9200255870819092, 2.459965705871582, 2.999905586242676, 3.5398454666137695, 4.079785346984863, 4.619725704193115, 5.159665584564209, 5.699605464935303, 6.239545822143555, 6.779485702514648, 7.319425582885742, 7.859365463256836, 8.39930534362793, 8.939245223999023, 9.479185104370117, 10.019124984741211, 10.559065818786621, 11.099005699157715, 11.638945579528809, 12.178885459899902, 12.718825340270996, 13.25876522064209, 13.7987060546875, 14.338645935058594, 14.878585815429688, 15.418525695800781, 15.958465576171875]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 2.0, 7.0, 3.0, 7.0, 13.0, 10.0, 20.0, 34.0, 45.0, 78.0, 119.0, 160.0, 325.0, 689.0, 1680.0, 5184.0, 19449.0, 101503.0, 998580.0, 2687704.0, 318540.0, 45020.0, 10317.0, 2944.0, 994.0, 391.0, 176.0, 111.0, 77.0, 32.0, 15.0, 18.0, 13.0, 4.0, 12.0, 7.0, 2.0, 3.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0], "bins": [-2.78515625, -2.7142333984375, -2.643310546875, -2.5723876953125, -2.50146484375, -2.4305419921875, -2.359619140625, -2.2886962890625, -2.2177734375, -2.1468505859375, -2.075927734375, -2.0050048828125, -1.93408203125, -1.8631591796875, -1.792236328125, -1.7213134765625, -1.650390625, -1.5794677734375, -1.508544921875, -1.4376220703125, -1.36669921875, -1.2957763671875, -1.224853515625, -1.1539306640625, -1.0830078125, -1.0120849609375, -0.941162109375, -0.8702392578125, -0.79931640625, -0.7283935546875, -0.657470703125, -0.5865478515625, -0.515625, -0.4447021484375, -0.373779296875, -0.3028564453125, -0.23193359375, -0.1610107421875, -0.090087890625, -0.0191650390625, 0.0517578125, 0.1226806640625, 0.193603515625, 0.2645263671875, 0.33544921875, 0.4063720703125, 0.477294921875, 0.5482177734375, 0.619140625, 0.6900634765625, 0.760986328125, 0.8319091796875, 0.90283203125, 0.9737548828125, 1.044677734375, 1.1156005859375, 1.1865234375, 1.2574462890625, 1.328369140625, 1.3992919921875, 1.47021484375, 1.5411376953125, 1.612060546875, 1.6829833984375, 1.75390625]}, "gradients/encoder.encoder.layers.4.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 6.0, 3.0, 5.0, 13.0, 11.0, 15.0, 23.0, 20.0, 27.0, 33.0, 41.0, 42.0, 52.0, 62.0, 60.0, 73.0, 68.0, 66.0, 65.0, 58.0, 60.0, 46.0, 32.0, 24.0, 22.0, 20.0, 15.0, 19.0, 8.0, 8.0, 7.0, 3.0, 3.0, 2.0, 1.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.7451171875, -1.6994781494140625, -1.653839111328125, -1.6082000732421875, -1.56256103515625, -1.5169219970703125, -1.471282958984375, -1.4256439208984375, -1.3800048828125, -1.3343658447265625, -1.288726806640625, -1.2430877685546875, -1.19744873046875, -1.1518096923828125, -1.106170654296875, -1.0605316162109375, -1.014892578125, -0.9692535400390625, -0.923614501953125, -0.8779754638671875, -0.83233642578125, -0.7866973876953125, -0.741058349609375, -0.6954193115234375, -0.6497802734375, -0.6041412353515625, -0.558502197265625, -0.5128631591796875, -0.46722412109375, -0.4215850830078125, -0.375946044921875, -0.3303070068359375, -0.28466796875, -0.2390289306640625, -0.193389892578125, -0.1477508544921875, -0.10211181640625, -0.0564727783203125, -0.010833740234375, 0.0348052978515625, 0.0804443359375, 0.1260833740234375, 0.171722412109375, 0.2173614501953125, 0.26300048828125, 0.3086395263671875, 0.354278564453125, 0.3999176025390625, 0.445556640625, 0.4911956787109375, 0.536834716796875, 0.5824737548828125, 0.62811279296875, 0.6737518310546875, 0.719390869140625, 0.7650299072265625, 0.8106689453125, 0.8563079833984375, 0.901947021484375, 0.9475860595703125, 0.99322509765625, 1.0388641357421875, 1.084503173828125, 1.1301422119140625, 1.17578125]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 2.0, 3.0, 9.0, 19.0, 22.0, 38.0, 63.0, 147.0, 232.0, 503.0, 1143.0, 3769.0, 15920.0, 115474.0, 2521481.0, 1448061.0, 72658.0, 10567.0, 2580.0, 852.0, 336.0, 161.0, 106.0, 57.0, 39.0, 13.0, 10.0, 7.0, 5.0, 3.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.79296875, -2.6851806640625, -2.577392578125, -2.4696044921875, -2.36181640625, -2.2540283203125, -2.146240234375, -2.0384521484375, -1.9306640625, -1.8228759765625, -1.715087890625, -1.6072998046875, -1.49951171875, -1.3917236328125, -1.283935546875, -1.1761474609375, -1.068359375, -0.9605712890625, -0.852783203125, -0.7449951171875, -0.63720703125, -0.5294189453125, -0.421630859375, -0.3138427734375, -0.2060546875, -0.0982666015625, 0.009521484375, 0.1173095703125, 0.22509765625, 0.3328857421875, 0.440673828125, 0.5484619140625, 0.65625, 0.7640380859375, 0.871826171875, 0.9796142578125, 1.08740234375, 1.1951904296875, 1.302978515625, 1.4107666015625, 1.5185546875, 1.6263427734375, 1.734130859375, 1.8419189453125, 1.94970703125, 2.0574951171875, 2.165283203125, 2.2730712890625, 2.380859375, 2.4886474609375, 2.596435546875, 2.7042236328125, 2.81201171875, 2.9197998046875, 3.027587890625, 3.1353759765625, 3.2431640625, 3.3509521484375, 3.458740234375, 3.5665283203125, 3.67431640625, 3.7821044921875, 3.889892578125, 3.9976806640625, 4.10546875]}, "gradients/encoder.encoder.layers.4.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 4.0, 1.0, 1.0, 7.0, 9.0, 3.0, 12.0, 16.0, 18.0, 33.0, 39.0, 66.0, 122.0, 188.0, 350.0, 553.0, 894.0, 684.0, 475.0, 229.0, 135.0, 103.0, 56.0, 29.0, 14.0, 20.0, 7.0, 7.0, 4.0, 2.0, 3.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.375, -4.25604248046875, -4.1370849609375, -4.01812744140625, -3.899169921875, -3.78021240234375, -3.6612548828125, -3.54229736328125, -3.42333984375, -3.30438232421875, -3.1854248046875, -3.06646728515625, -2.947509765625, -2.82855224609375, -2.7095947265625, -2.59063720703125, -2.4716796875, -2.35272216796875, -2.2337646484375, -2.11480712890625, -1.995849609375, -1.87689208984375, -1.7579345703125, -1.63897705078125, -1.52001953125, -1.40106201171875, -1.2821044921875, -1.16314697265625, -1.044189453125, -0.92523193359375, -0.8062744140625, -0.68731689453125, -0.568359375, -0.44940185546875, -0.3304443359375, -0.21148681640625, -0.092529296875, 0.02642822265625, 0.1453857421875, 0.26434326171875, 0.38330078125, 0.50225830078125, 0.6212158203125, 0.74017333984375, 0.859130859375, 0.97808837890625, 1.0970458984375, 1.21600341796875, 1.3349609375, 1.45391845703125, 1.5728759765625, 1.69183349609375, 1.810791015625, 1.92974853515625, 2.0487060546875, 2.16766357421875, 2.28662109375, 2.40557861328125, 2.5245361328125, 2.64349365234375, 2.762451171875, 2.88140869140625, 3.0003662109375, 3.11932373046875, 3.23828125]}, "gradients/encoder.encoder.layers.4.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 0.0, 1.0, 3.0, 5.0, 15.0, 24.0, 86.0, 163.0, 247.0, 223.0, 134.0, 52.0, 26.0, 14.0, 4.0, 3.0, 2.0, 1.0, 3.0, 1.0, 0.0, 1.0, 1.0, 3.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-65.60090637207031, -64.03793334960938, -62.474952697753906, -60.9119758605957, -59.3489990234375, -57.7860221862793, -56.223045349121094, -54.66006851196289, -53.09709167480469, -51.534114837646484, -49.97113800048828, -48.40816116333008, -46.845184326171875, -45.28220748901367, -43.71923065185547, -42.156253814697266, -40.59327697753906, -39.03030014038086, -37.467323303222656, -35.90434646606445, -34.34136962890625, -32.77839279174805, -31.215415954589844, -29.65243911743164, -28.089462280273438, -26.526485443115234, -24.96350860595703, -23.400531768798828, -21.837554931640625, -20.274578094482422, -18.71160125732422, -17.148624420166016, -15.585643768310547, -14.022666931152344, -12.45969009399414, -10.896713256835938, -9.333736419677734, -7.770759582519531, -6.207782745361328, -4.644805908203125, -3.081829071044922, -1.5188522338867188, 0.044124603271484375, 1.6071014404296875, 3.1700782775878906, 4.733055114746094, 6.296031951904297, 7.8590087890625, 9.421985626220703, 10.984962463378906, 12.54793930053711, 14.110916137695312, 15.673892974853516, 17.23686981201172, 18.799846649169922, 20.362823486328125, 21.925800323486328, 23.48877716064453, 25.051753997802734, 26.614730834960938, 28.17770767211914, 29.740684509277344, 31.303661346435547, 32.86663818359375, 34.42961502075195]}, "gradients/encoder.encoder.layers.4.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 3.0, 4.0, 5.0, 8.0, 4.0, 6.0, 6.0, 8.0, 13.0, 25.0, 26.0, 31.0, 39.0, 50.0, 51.0, 56.0, 47.0, 59.0, 65.0, 57.0, 66.0, 59.0, 50.0, 49.0, 38.0, 48.0, 38.0, 29.0, 22.0, 15.0, 10.0, 7.0, 6.0, 5.0, 5.0, 5.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-17.67677116394043, -17.081113815307617, -16.485456466674805, -15.889799118041992, -15.29414176940918, -14.698484420776367, -14.102828025817871, -13.507170677185059, -12.911513328552246, -12.315855979919434, -11.720198631286621, -11.124541282653809, -10.528884887695312, -9.9332275390625, -9.337570190429688, -8.741912841796875, -8.146255493164062, -7.55059814453125, -6.9549407958984375, -6.359283924102783, -5.763626575469971, -5.167969226837158, -4.572312355041504, -3.9766550064086914, -3.380997657775879, -2.7853403091430664, -2.189683198928833, -1.59402596950531, -0.9983687400817871, -0.4027113914489746, 0.1929457187652588, 0.7886028289794922, 1.3842601776123047, 1.9799174070358276, 2.5755746364593506, 3.171231746673584, 3.7668890953063965, 4.362546443939209, 4.958203315734863, 5.553860664367676, 6.149518013000488, 6.745175361633301, 7.340832710266113, 7.936489582061768, 8.532146453857422, 9.127803802490234, 9.723461151123047, 10.31911849975586, 10.914775848388672, 11.510433197021484, 12.106090545654297, 12.70174789428711, 13.297405242919922, 13.893062591552734, 14.48871898651123, 15.084376335144043, 15.680033683776855, 16.27569007873535, 16.871347427368164, 17.467004776000977, 18.06266212463379, 18.6583194732666, 19.253976821899414, 19.849634170532227, 20.44529151916504]}, "gradients/encoder.encoder.layers.4.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 1.0, 0.0, 2.0, 0.0, 5.0, 3.0, 1.0, 4.0, 6.0, 12.0, 19.0, 35.0, 52.0, 62.0, 114.0, 171.0, 255.0, 426.0, 722.0, 1173.0, 1794.0, 3151.0, 5189.0, 8803.0, 15116.0, 26367.0, 45991.0, 80023.0, 135297.0, 202056.0, 199861.0, 134885.0, 79411.0, 45103.0, 25753.0, 15000.0, 8631.0, 4970.0, 3095.0, 1841.0, 1159.0, 741.0, 455.0, 294.0, 199.0, 118.0, 66.0, 49.0, 31.0, 27.0, 9.0, 7.0, 4.0, 5.0, 2.0, 2.0, 4.0, 0.0, 1.0, 0.0, 1.0], "bins": [-1.4169921875, -1.3740386962890625, -1.331085205078125, -1.2881317138671875, -1.24517822265625, -1.2022247314453125, -1.159271240234375, -1.1163177490234375, -1.0733642578125, -1.0304107666015625, -0.987457275390625, -0.9445037841796875, -0.90155029296875, -0.8585968017578125, -0.815643310546875, -0.7726898193359375, -0.729736328125, -0.6867828369140625, -0.643829345703125, -0.6008758544921875, -0.55792236328125, -0.5149688720703125, -0.472015380859375, -0.4290618896484375, -0.3861083984375, -0.3431549072265625, -0.300201416015625, -0.2572479248046875, -0.21429443359375, -0.1713409423828125, -0.128387451171875, -0.0854339599609375, -0.04248046875, 0.0004730224609375, 0.043426513671875, 0.0863800048828125, 0.12933349609375, 0.1722869873046875, 0.215240478515625, 0.2581939697265625, 0.3011474609375, 0.3441009521484375, 0.387054443359375, 0.4300079345703125, 0.47296142578125, 0.5159149169921875, 0.558868408203125, 0.6018218994140625, 0.644775390625, 0.6877288818359375, 0.730682373046875, 0.7736358642578125, 0.81658935546875, 0.8595428466796875, 0.902496337890625, 0.9454498291015625, 0.9884033203125, 1.0313568115234375, 1.074310302734375, 1.1172637939453125, 1.16021728515625, 1.2031707763671875, 1.246124267578125, 1.2890777587890625, 1.33203125]}, "gradients/encoder.encoder.layers.4.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 1.0, 0.0, 1.0, 3.0, 3.0, 1.0, 0.0, 1.0, 0.0, 2.0, 7.0, 8.0, 5.0, 9.0, 9.0, 8.0, 11.0, 6.0, 15.0, 26.0, 15.0, 28.0, 32.0, 32.0, 49.0, 44.0, 41.0, 36.0, 41.0, 51.0, 40.0, 50.0, 40.0, 47.0, 45.0, 50.0, 31.0, 37.0, 31.0, 18.0, 19.0, 22.0, 17.0, 18.0, 14.0, 15.0, 13.0, 6.0, 6.0, 1.0, 5.0, 1.0, 3.0, 4.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.09765625, -1.063873291015625, -1.03009033203125, -0.996307373046875, -0.9625244140625, -0.928741455078125, -0.89495849609375, -0.861175537109375, -0.827392578125, -0.793609619140625, -0.75982666015625, -0.726043701171875, -0.6922607421875, -0.658477783203125, -0.62469482421875, -0.590911865234375, -0.55712890625, -0.523345947265625, -0.48956298828125, -0.455780029296875, -0.4219970703125, -0.388214111328125, -0.35443115234375, -0.320648193359375, -0.286865234375, -0.253082275390625, -0.21929931640625, -0.185516357421875, -0.1517333984375, -0.117950439453125, -0.08416748046875, -0.050384521484375, -0.0166015625, 0.017181396484375, 0.05096435546875, 0.084747314453125, 0.1185302734375, 0.152313232421875, 0.18609619140625, 0.219879150390625, 0.253662109375, 0.287445068359375, 0.32122802734375, 0.355010986328125, 0.3887939453125, 0.422576904296875, 0.45635986328125, 0.490142822265625, 0.52392578125, 0.557708740234375, 0.59149169921875, 0.625274658203125, 0.6590576171875, 0.692840576171875, 0.72662353515625, 0.760406494140625, 0.794189453125, 0.827972412109375, 0.86175537109375, 0.895538330078125, 0.9293212890625, 0.963104248046875, 0.99688720703125, 1.030670166015625, 1.064453125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 3.0, 2.0, 1.0, 5.0, 8.0, 13.0, 8.0, 17.0, 29.0, 34.0, 43.0, 80.0, 89.0, 122.0, 193.0, 300.0, 422.0, 713.0, 1419.0, 3150.0, 9755.0, 43646.0, 246290.0, 613550.0, 99187.0, 19386.0, 5255.0, 2068.0, 1039.0, 592.0, 370.0, 254.0, 156.0, 111.0, 89.0, 56.0, 38.0, 20.0, 13.0, 14.0, 8.0, 8.0, 5.0, 3.0, 0.0, 3.0, 2.0, 2.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-4.2578125, -4.129730224609375, -4.00164794921875, -3.873565673828125, -3.7454833984375, -3.617401123046875, -3.48931884765625, -3.361236572265625, -3.233154296875, -3.105072021484375, -2.97698974609375, -2.848907470703125, -2.7208251953125, -2.592742919921875, -2.46466064453125, -2.336578369140625, -2.20849609375, -2.080413818359375, -1.95233154296875, -1.824249267578125, -1.6961669921875, -1.568084716796875, -1.44000244140625, -1.311920166015625, -1.183837890625, -1.055755615234375, -0.92767333984375, -0.799591064453125, -0.6715087890625, -0.543426513671875, -0.41534423828125, -0.287261962890625, -0.1591796875, -0.031097412109375, 0.09698486328125, 0.225067138671875, 0.3531494140625, 0.481231689453125, 0.60931396484375, 0.737396240234375, 0.865478515625, 0.993560791015625, 1.12164306640625, 1.249725341796875, 1.3778076171875, 1.505889892578125, 1.63397216796875, 1.762054443359375, 1.89013671875, 2.018218994140625, 2.14630126953125, 2.274383544921875, 2.4024658203125, 2.530548095703125, 2.65863037109375, 2.786712646484375, 2.914794921875, 3.042877197265625, 3.17095947265625, 3.299041748046875, 3.4271240234375, 3.555206298828125, 3.68328857421875, 3.811370849609375, 3.939453125]}, "gradients/encoder.encoder.layers.4.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 2.0, 4.0, 5.0, 5.0, 4.0, 7.0, 8.0, 10.0, 12.0, 18.0, 26.0, 31.0, 25.0, 33.0, 48.0, 48.0, 56.0, 39.0, 75.0, 65.0, 62.0, 67.0, 40.0, 39.0, 57.0, 34.0, 34.0, 31.0, 29.0, 16.0, 26.0, 18.0, 12.0, 7.0, 7.0, 4.0, 3.0, 4.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-4.65234375, -4.47662353515625, -4.3009033203125, -4.12518310546875, -3.949462890625, -3.77374267578125, -3.5980224609375, -3.42230224609375, -3.24658203125, -3.07086181640625, -2.8951416015625, -2.71942138671875, -2.543701171875, -2.36798095703125, -2.1922607421875, -2.01654052734375, -1.8408203125, -1.66510009765625, -1.4893798828125, -1.31365966796875, -1.137939453125, -0.96221923828125, -0.7864990234375, -0.61077880859375, -0.43505859375, -0.25933837890625, -0.0836181640625, 0.09210205078125, 0.267822265625, 0.44354248046875, 0.6192626953125, 0.79498291015625, 0.970703125, 1.14642333984375, 1.3221435546875, 1.49786376953125, 1.673583984375, 1.84930419921875, 2.0250244140625, 2.20074462890625, 2.37646484375, 2.55218505859375, 2.7279052734375, 2.90362548828125, 3.079345703125, 3.25506591796875, 3.4307861328125, 3.60650634765625, 3.7822265625, 3.95794677734375, 4.1336669921875, 4.30938720703125, 4.485107421875, 4.66082763671875, 4.8365478515625, 5.01226806640625, 5.18798828125, 5.36370849609375, 5.5394287109375, 5.71514892578125, 5.890869140625, 6.06658935546875, 6.2423095703125, 6.41802978515625, 6.59375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 1.0, 4.0, 4.0, 3.0, 2.0, 5.0, 9.0, 13.0, 13.0, 19.0, 35.0, 44.0, 84.0, 104.0, 165.0, 262.0, 507.0, 950.0, 2103.0, 5694.0, 17773.0, 63377.0, 229201.0, 539332.0, 134299.0, 36833.0, 10838.0, 3725.0, 1476.0, 658.0, 378.0, 229.0, 130.0, 82.0, 58.0, 47.0, 28.0, 20.0, 12.0, 11.0, 8.0, 9.0, 9.0, 3.0, 1.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.849609375, -0.8224563598632812, -0.7953033447265625, -0.7681503295898438, -0.740997314453125, -0.7138442993164062, -0.6866912841796875, -0.6595382690429688, -0.63238525390625, -0.6052322387695312, -0.5780792236328125, -0.5509262084960938, -0.523773193359375, -0.49662017822265625, -0.4694671630859375, -0.44231414794921875, -0.4151611328125, -0.38800811767578125, -0.3608551025390625, -0.33370208740234375, -0.306549072265625, -0.27939605712890625, -0.2522430419921875, -0.22509002685546875, -0.19793701171875, -0.17078399658203125, -0.1436309814453125, -0.11647796630859375, -0.089324951171875, -0.06217193603515625, -0.0350189208984375, -0.00786590576171875, 0.019287109375, 0.04644012451171875, 0.0735931396484375, 0.10074615478515625, 0.127899169921875, 0.15505218505859375, 0.1822052001953125, 0.20935821533203125, 0.23651123046875, 0.26366424560546875, 0.2908172607421875, 0.31797027587890625, 0.345123291015625, 0.37227630615234375, 0.3994293212890625, 0.42658233642578125, 0.4537353515625, 0.48088836669921875, 0.5080413818359375, 0.5351943969726562, 0.562347412109375, 0.5895004272460938, 0.6166534423828125, 0.6438064575195312, 0.67095947265625, 0.6981124877929688, 0.7252655029296875, 0.7524185180664062, 0.779571533203125, 0.8067245483398438, 0.8338775634765625, 0.8610305786132812, 0.88818359375]}, "gradients/encoder.encoder.layers.4.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 2.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 3.0, 2.0, 4.0, 11.0, 6.0, 13.0, 13.0, 20.0, 23.0, 28.0, 48.0, 65.0, 71.0, 86.0, 98.0, 108.0, 83.0, 70.0, 57.0, 46.0, 32.0, 37.0, 19.0, 12.0, 15.0, 16.0, 5.0, 2.0, 3.0, 4.0, 0.0, 4.0, 0.0, 2.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.00029659271240234375, -0.0002851225435733795, -0.0002736523747444153, -0.00026218220591545105, -0.0002507120370864868, -0.00023924186825752258, -0.00022777169942855835, -0.00021630153059959412, -0.00020483136177062988, -0.00019336119294166565, -0.00018189102411270142, -0.00017042085528373718, -0.00015895068645477295, -0.00014748051762580872, -0.00013601034879684448, -0.00012454017996788025, -0.00011307001113891602, -0.00010159984230995178, -9.012967348098755e-05, -7.865950465202332e-05, -6.718933582305908e-05, -5.571916699409485e-05, -4.4248998165130615e-05, -3.277882933616638e-05, -2.130866050720215e-05, -9.838491678237915e-06, 1.6316771507263184e-06, 1.3101845979690552e-05, 2.4572014808654785e-05, 3.604218363761902e-05, 4.751235246658325e-05, 5.8982521295547485e-05, 7.045269012451172e-05, 8.192285895347595e-05, 9.339302778244019e-05, 0.00010486319661140442, 0.00011633336544036865, 0.00012780353426933289, 0.00013927370309829712, 0.00015074387192726135, 0.00016221404075622559, 0.00017368420958518982, 0.00018515437841415405, 0.00019662454724311829, 0.00020809471607208252, 0.00021956488490104675, 0.00023103505373001099, 0.00024250522255897522, 0.00025397539138793945, 0.0002654455602169037, 0.0002769157290458679, 0.00028838589787483215, 0.0002998560667037964, 0.0003113262355327606, 0.00032279640436172485, 0.0003342665731906891, 0.0003457367420196533, 0.00035720691084861755, 0.0003686770796775818, 0.000380147248506546, 0.00039161741733551025, 0.0004030875861644745, 0.0004145577549934387, 0.00042602792382240295, 0.0004374980926513672]}, "gradients/encoder.encoder.layers.4.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 8.0, 3.0, 4.0, 7.0, 7.0, 13.0, 17.0, 25.0, 28.0, 38.0, 51.0, 81.0, 116.0, 166.0, 271.0, 370.0, 616.0, 1143.0, 2220.0, 4888.0, 13255.0, 41215.0, 140173.0, 505251.0, 231988.0, 71015.0, 21343.0, 7360.0, 3107.0, 1492.0, 768.0, 476.0, 322.0, 203.0, 150.0, 94.0, 58.0, 60.0, 40.0, 33.0, 30.0, 16.0, 14.0, 8.0, 5.0, 6.0, 4.0, 4.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0], "bins": [-0.7841796875, -0.76092529296875, -0.7376708984375, -0.71441650390625, -0.691162109375, -0.66790771484375, -0.6446533203125, -0.62139892578125, -0.59814453125, -0.57489013671875, -0.5516357421875, -0.52838134765625, -0.505126953125, -0.48187255859375, -0.4586181640625, -0.43536376953125, -0.412109375, -0.38885498046875, -0.3656005859375, -0.34234619140625, -0.319091796875, -0.29583740234375, -0.2725830078125, -0.24932861328125, -0.22607421875, -0.20281982421875, -0.1795654296875, -0.15631103515625, -0.133056640625, -0.10980224609375, -0.0865478515625, -0.06329345703125, -0.0400390625, -0.01678466796875, 0.0064697265625, 0.02972412109375, 0.052978515625, 0.07623291015625, 0.0994873046875, 0.12274169921875, 0.14599609375, 0.16925048828125, 0.1925048828125, 0.21575927734375, 0.239013671875, 0.26226806640625, 0.2855224609375, 0.30877685546875, 0.33203125, 0.35528564453125, 0.3785400390625, 0.40179443359375, 0.425048828125, 0.44830322265625, 0.4715576171875, 0.49481201171875, 0.51806640625, 0.54132080078125, 0.5645751953125, 0.58782958984375, 0.611083984375, 0.63433837890625, 0.6575927734375, 0.68084716796875, 0.7041015625]}, "gradients/encoder.encoder.layers.4.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 3.0, 2.0, 3.0, 2.0, 4.0, 4.0, 8.0, 7.0, 9.0, 8.0, 9.0, 14.0, 12.0, 13.0, 30.0, 26.0, 37.0, 42.0, 48.0, 60.0, 47.0, 54.0, 54.0, 47.0, 51.0, 42.0, 44.0, 45.0, 50.0, 27.0, 31.0, 32.0, 19.0, 27.0, 16.0, 12.0, 12.0, 13.0, 13.0, 11.0, 4.0, 5.0, 3.0, 2.0, 4.0, 1.0, 1.0, 3.0, 1.0, 1.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-0.74951171875, -0.7248992919921875, -0.700286865234375, -0.6756744384765625, -0.65106201171875, -0.6264495849609375, -0.601837158203125, -0.5772247314453125, -0.5526123046875, -0.5279998779296875, -0.503387451171875, -0.4787750244140625, -0.45416259765625, -0.4295501708984375, -0.404937744140625, -0.3803253173828125, -0.355712890625, -0.3311004638671875, -0.306488037109375, -0.2818756103515625, -0.25726318359375, -0.2326507568359375, -0.208038330078125, -0.1834259033203125, -0.1588134765625, -0.1342010498046875, -0.109588623046875, -0.0849761962890625, -0.06036376953125, -0.0357513427734375, -0.011138916015625, 0.0134735107421875, 0.0380859375, 0.0626983642578125, 0.087310791015625, 0.1119232177734375, 0.13653564453125, 0.1611480712890625, 0.185760498046875, 0.2103729248046875, 0.2349853515625, 0.2595977783203125, 0.284210205078125, 0.3088226318359375, 0.33343505859375, 0.3580474853515625, 0.382659912109375, 0.4072723388671875, 0.431884765625, 0.4564971923828125, 0.481109619140625, 0.5057220458984375, 0.53033447265625, 0.5549468994140625, 0.579559326171875, 0.6041717529296875, 0.6287841796875, 0.6533966064453125, 0.678009033203125, 0.7026214599609375, 0.72723388671875, 0.7518463134765625, 0.776458740234375, 0.8010711669921875, 0.82568359375]}, "gradients/encoder.encoder.layers.4.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 3.0, 5.0, 5.0, 8.0, 15.0, 30.0, 59.0, 96.0, 144.0, 249.0, 145.0, 116.0, 61.0, 27.0, 23.0, 9.0, 2.0, 7.0, 1.0, 2.0, 1.0, 2.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 1.0], "bins": [-42.741580963134766, -41.780296325683594, -40.81901550292969, -39.857730865478516, -38.89645004272461, -37.93516540527344, -36.97388458251953, -36.01259994506836, -35.05131912231445, -34.09003448486328, -33.128753662109375, -32.1674690246582, -31.206188201904297, -30.244905471801758, -29.28362274169922, -28.32234001159668, -27.36105728149414, -26.3997745513916, -25.438491821289062, -24.477209091186523, -23.515926361083984, -22.554643630981445, -21.593360900878906, -20.632078170776367, -19.670793533325195, -18.709510803222656, -17.748228073120117, -16.786945343017578, -15.825662612915039, -14.8643798828125, -13.903097152709961, -12.941814422607422, -11.980531692504883, -11.019248962402344, -10.057966232299805, -9.096683502197266, -8.135400772094727, -7.174117565155029, -6.21283483505249, -5.251552104949951, -4.290269374847412, -3.328986644744873, -2.367703914642334, -1.4064209461212158, -0.44513821601867676, 0.5161447525024414, 1.4774274826049805, 2.4387102127075195, 3.3999929428100586, 4.361275672912598, 5.322558403015137, 6.283841133117676, 7.245123863220215, 8.20640754699707, 9.16769027709961, 10.128973007202148, 11.090255737304688, 12.051538467407227, 13.012821197509766, 13.974103927612305, 14.935386657714844, 15.896669387817383, 16.857952117919922, 17.81923484802246, 18.780517578125]}, "gradients/encoder.encoder.layers.4.layer_norm.bias": {"_type": "histogram", "values": [2.0, 1.0, 1.0, 1.0, 2.0, 0.0, 3.0, 2.0, 5.0, 1.0, 7.0, 7.0, 5.0, 4.0, 10.0, 11.0, 11.0, 18.0, 12.0, 20.0, 16.0, 20.0, 27.0, 29.0, 26.0, 44.0, 37.0, 45.0, 47.0, 62.0, 68.0, 67.0, 61.0, 50.0, 33.0, 35.0, 33.0, 21.0, 24.0, 18.0, 16.0, 14.0, 20.0, 12.0, 15.0, 18.0, 6.0, 5.0, 2.0, 7.0, 4.0, 1.0, 7.0, 3.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-16.809316635131836, -16.25734519958496, -15.705373764038086, -15.153402328491211, -14.601430892944336, -14.049459457397461, -13.497488021850586, -12.945516586303711, -12.393545150756836, -11.841573715209961, -11.289602279663086, -10.737630844116211, -10.185659408569336, -9.633687973022461, -9.081716537475586, -8.529745101928711, -7.977773666381836, -7.425802230834961, -6.873830795288086, -6.321859359741211, -5.769887924194336, -5.217916488647461, -4.665945053100586, -4.113973617553711, -3.562002182006836, -3.010030746459961, -2.458059310913086, -1.906087875366211, -1.354116439819336, -0.8021450042724609, -0.25017356872558594, 0.30179786682128906, 0.8537673950195312, 1.4057388305664062, 1.9577102661132812, 2.5096817016601562, 3.0616531372070312, 3.6136245727539062, 4.165596008300781, 4.717567443847656, 5.269538879394531, 5.821510314941406, 6.373481750488281, 6.925453186035156, 7.477424621582031, 8.029396057128906, 8.581367492675781, 9.133338928222656, 9.685310363769531, 10.237281799316406, 10.789253234863281, 11.341224670410156, 11.893196105957031, 12.445167541503906, 12.997138977050781, 13.549110412597656, 14.101081848144531, 14.653053283691406, 15.205024719238281, 15.756996154785156, 16.30896759033203, 16.860939025878906, 17.41291046142578, 17.964881896972656, 18.51685333251953]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 4.0, 2.0, 4.0, 3.0, 6.0, 14.0, 7.0, 19.0, 36.0, 41.0, 71.0, 154.0, 314.0, 483.0, 891.0, 1687.0, 3526.0, 8393.0, 24919.0, 114128.0, 942106.0, 2557304.0, 447799.0, 63971.0, 16765.0, 6042.0, 2644.0, 1331.0, 715.0, 394.0, 219.0, 108.0, 81.0, 47.0, 30.0, 14.0, 11.0, 4.0, 6.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-2.05078125, -1.9986419677734375, -1.946502685546875, -1.8943634033203125, -1.84222412109375, -1.7900848388671875, -1.737945556640625, -1.6858062744140625, -1.6336669921875, -1.5815277099609375, -1.529388427734375, -1.4772491455078125, -1.42510986328125, -1.3729705810546875, -1.320831298828125, -1.2686920166015625, -1.216552734375, -1.1644134521484375, -1.112274169921875, -1.0601348876953125, -1.00799560546875, -0.9558563232421875, -0.903717041015625, -0.8515777587890625, -0.7994384765625, -0.7472991943359375, -0.695159912109375, -0.6430206298828125, -0.59088134765625, -0.5387420654296875, -0.486602783203125, -0.4344635009765625, -0.38232421875, -0.3301849365234375, -0.278045654296875, -0.2259063720703125, -0.17376708984375, -0.1216278076171875, -0.069488525390625, -0.0173492431640625, 0.0347900390625, 0.0869293212890625, 0.139068603515625, 0.1912078857421875, 0.24334716796875, 0.2954864501953125, 0.347625732421875, 0.3997650146484375, 0.451904296875, 0.5040435791015625, 0.556182861328125, 0.6083221435546875, 0.66046142578125, 0.7126007080078125, 0.764739990234375, 0.8168792724609375, 0.8690185546875, 0.9211578369140625, 0.973297119140625, 1.0254364013671875, 1.07757568359375, 1.1297149658203125, 1.181854248046875, 1.2339935302734375, 1.2861328125]}, "gradients/encoder.encoder.layers.3.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 2.0, 2.0, 0.0, 6.0, 3.0, 6.0, 6.0, 10.0, 11.0, 12.0, 13.0, 20.0, 19.0, 19.0, 27.0, 18.0, 35.0, 37.0, 41.0, 42.0, 39.0, 38.0, 48.0, 53.0, 47.0, 40.0, 45.0, 35.0, 37.0, 38.0, 39.0, 29.0, 34.0, 20.0, 23.0, 16.0, 12.0, 23.0, 10.0, 17.0, 7.0, 7.0, 10.0, 5.0, 2.0, 0.0, 2.0, 2.0, 3.0, 2.0, 2.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-0.99267578125, -0.9618072509765625, -0.930938720703125, -0.9000701904296875, -0.86920166015625, -0.8383331298828125, -0.807464599609375, -0.7765960693359375, -0.7457275390625, -0.7148590087890625, -0.683990478515625, -0.6531219482421875, -0.62225341796875, -0.5913848876953125, -0.560516357421875, -0.5296478271484375, -0.498779296875, -0.4679107666015625, -0.437042236328125, -0.4061737060546875, -0.37530517578125, -0.3444366455078125, -0.313568115234375, -0.2826995849609375, -0.2518310546875, -0.2209625244140625, -0.190093994140625, -0.1592254638671875, -0.12835693359375, -0.0974884033203125, -0.066619873046875, -0.0357513427734375, -0.0048828125, 0.0259857177734375, 0.056854248046875, 0.0877227783203125, 0.11859130859375, 0.1494598388671875, 0.180328369140625, 0.2111968994140625, 0.2420654296875, 0.2729339599609375, 0.303802490234375, 0.3346710205078125, 0.36553955078125, 0.3964080810546875, 0.427276611328125, 0.4581451416015625, 0.489013671875, 0.5198822021484375, 0.550750732421875, 0.5816192626953125, 0.61248779296875, 0.6433563232421875, 0.674224853515625, 0.7050933837890625, 0.7359619140625, 0.7668304443359375, 0.797698974609375, 0.8285675048828125, 0.85943603515625, 0.8903045654296875, 0.921173095703125, 0.9520416259765625, 0.98291015625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 5.0, 3.0, 5.0, 5.0, 13.0, 15.0, 28.0, 27.0, 69.0, 119.0, 195.0, 389.0, 739.0, 1596.0, 4275.0, 16738.0, 125856.0, 3305435.0, 680652.0, 44663.0, 8624.0, 2675.0, 1040.0, 533.0, 270.0, 140.0, 87.0, 31.0, 24.0, 19.0, 5.0, 3.0, 4.0, 2.0, 4.0, 1.0, 0.0, 3.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0], "bins": [-3.650390625, -3.54534912109375, -3.4403076171875, -3.33526611328125, -3.230224609375, -3.12518310546875, -3.0201416015625, -2.91510009765625, -2.81005859375, -2.70501708984375, -2.5999755859375, -2.49493408203125, -2.389892578125, -2.28485107421875, -2.1798095703125, -2.07476806640625, -1.9697265625, -1.86468505859375, -1.7596435546875, -1.65460205078125, -1.549560546875, -1.44451904296875, -1.3394775390625, -1.23443603515625, -1.12939453125, -1.02435302734375, -0.9193115234375, -0.81427001953125, -0.709228515625, -0.60418701171875, -0.4991455078125, -0.39410400390625, -0.2890625, -0.18402099609375, -0.0789794921875, 0.02606201171875, 0.131103515625, 0.23614501953125, 0.3411865234375, 0.44622802734375, 0.55126953125, 0.65631103515625, 0.7613525390625, 0.86639404296875, 0.971435546875, 1.07647705078125, 1.1815185546875, 1.28656005859375, 1.3916015625, 1.49664306640625, 1.6016845703125, 1.70672607421875, 1.811767578125, 1.91680908203125, 2.0218505859375, 2.12689208984375, 2.23193359375, 2.33697509765625, 2.4420166015625, 2.54705810546875, 2.652099609375, 2.75714111328125, 2.8621826171875, 2.96722412109375, 3.072265625]}, "gradients/encoder.encoder.layers.3.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 4.0, 2.0, 3.0, 3.0, 7.0, 5.0, 8.0, 15.0, 12.0, 24.0, 23.0, 51.0, 62.0, 99.0, 164.0, 249.0, 467.0, 725.0, 703.0, 548.0, 307.0, 191.0, 120.0, 66.0, 61.0, 39.0, 44.0, 19.0, 16.0, 13.0, 11.0, 6.0, 6.0, 7.0, 2.0, 0.0, 1.0, 0.0, 3.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.423828125, -2.3372802734375, -2.250732421875, -2.1641845703125, -2.07763671875, -1.9910888671875, -1.904541015625, -1.8179931640625, -1.7314453125, -1.6448974609375, -1.558349609375, -1.4718017578125, -1.38525390625, -1.2987060546875, -1.212158203125, -1.1256103515625, -1.0390625, -0.9525146484375, -0.865966796875, -0.7794189453125, -0.69287109375, -0.6063232421875, -0.519775390625, -0.4332275390625, -0.3466796875, -0.2601318359375, -0.173583984375, -0.0870361328125, -0.00048828125, 0.0860595703125, 0.172607421875, 0.2591552734375, 0.345703125, 0.4322509765625, 0.518798828125, 0.6053466796875, 0.69189453125, 0.7784423828125, 0.864990234375, 0.9515380859375, 1.0380859375, 1.1246337890625, 1.211181640625, 1.2977294921875, 1.38427734375, 1.4708251953125, 1.557373046875, 1.6439208984375, 1.73046875, 1.8170166015625, 1.903564453125, 1.9901123046875, 2.07666015625, 2.1632080078125, 2.249755859375, 2.3363037109375, 2.4228515625, 2.5093994140625, 2.595947265625, 2.6824951171875, 2.76904296875, 2.8555908203125, 2.942138671875, 3.0286865234375, 3.115234375]}, "gradients/encoder.encoder.layers.3.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 4.0, 1.0, 2.0, 10.0, 12.0, 25.0, 88.0, 254.0, 307.0, 164.0, 75.0, 31.0, 24.0, 5.0, 2.0, 2.0, 3.0, 3.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-59.70853042602539, -57.643943786621094, -55.57935333251953, -53.514766693115234, -51.45018005371094, -49.385589599609375, -47.32100296020508, -45.25641632080078, -43.19182586669922, -41.12723922729492, -39.06264877319336, -36.99806213378906, -34.9334716796875, -32.8688850402832, -30.804298400878906, -28.739709854125977, -26.675121307373047, -24.610532760620117, -22.545944213867188, -20.48135757446289, -18.41676902770996, -16.35218048095703, -14.287592887878418, -12.223005294799805, -10.158416748046875, -8.093828201293945, -6.029240608215332, -3.9646525382995605, -1.900064468383789, 0.16452407836914062, 2.229111671447754, 4.293699264526367, 6.3582916259765625, 8.422880172729492, 10.487467765808105, 12.552055358886719, 14.616643905639648, 16.681232452392578, 18.745819091796875, 20.810407638549805, 22.874996185302734, 24.939584732055664, 27.004173278808594, 29.06875991821289, 31.13334846496582, 33.19793701171875, 35.26252365112305, 37.327110290527344, 39.391700744628906, 41.4562873840332, 43.520877838134766, 45.58546447753906, 47.650054931640625, 49.71464157104492, 51.77922821044922, 53.84381866455078, 55.90840530395508, 57.972991943359375, 60.03758239746094, 62.102169036865234, 64.16675567626953, 66.2313461303711, 68.29593658447266, 70.36051940917969, 72.42510986328125]}, "gradients/encoder.encoder.layers.3.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 3.0, 4.0, 1.0, 3.0, 4.0, 1.0, 6.0, 10.0, 17.0, 10.0, 14.0, 21.0, 24.0, 25.0, 33.0, 30.0, 42.0, 41.0, 43.0, 36.0, 46.0, 45.0, 36.0, 35.0, 42.0, 41.0, 41.0, 32.0, 41.0, 31.0, 38.0, 25.0, 23.0, 21.0, 18.0, 19.0, 19.0, 23.0, 18.0, 15.0, 7.0, 4.0, 4.0, 6.0, 4.0, 3.0, 1.0, 6.0, 2.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.588845252990723, -14.091793060302734, -13.59473991394043, -13.097687721252441, -12.600634574890137, -12.103582382202148, -11.606529235839844, -11.109477043151855, -10.612424850463867, -10.115372657775879, -9.618319511413574, -9.121267318725586, -8.624214172363281, -8.127161979675293, -7.6301093101501465, -7.133056640625, -6.636003494262695, -6.138950824737549, -5.641898155212402, -5.144845962524414, -4.647792816162109, -4.150740623474121, -3.6536879539489746, -3.156635284423828, -2.6595826148986816, -2.162529945373535, -1.6654773950576782, -1.1684248447418213, -0.6713721752166748, -0.17431950569152832, 0.32273292541503906, 0.8197855949401855, 1.3168373107910156, 1.813889980316162, 2.3109426498413086, 2.807995080947876, 3.3050477504730225, 3.802100419998169, 4.299152851104736, 4.796205520629883, 5.293258190155029, 5.790310859680176, 6.287363529205322, 6.784416198730469, 7.281468391418457, 7.778521537780762, 8.27557373046875, 8.772626876831055, 9.269679069519043, 9.766731262207031, 10.263784408569336, 10.760836601257324, 11.257889747619629, 11.754941940307617, 12.251995086669922, 12.74904727935791, 13.246099472045898, 13.743151664733887, 14.240204811096191, 14.73725700378418, 15.234310150146484, 15.731362342834473, 16.22841453552246, 16.725467681884766, 17.22252082824707]}, "gradients/encoder.encoder.layers.3.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 10.0, 17.0, 13.0, 27.0, 48.0, 37.0, 86.0, 90.0, 151.0, 220.0, 326.0, 458.0, 719.0, 1216.0, 1819.0, 2776.0, 4618.0, 7898.0, 13113.0, 22967.0, 40832.0, 71903.0, 123974.0, 188590.0, 206310.0, 149755.0, 90316.0, 50725.0, 28416.0, 16368.0, 9526.0, 5674.0, 3426.0, 2151.0, 1392.0, 825.0, 573.0, 376.0, 245.0, 186.0, 115.0, 68.0, 55.0, 39.0, 39.0, 19.0, 9.0, 10.0, 11.0, 6.0, 6.0, 3.0, 4.0, 5.0, 0.0, 2.0], "bins": [-1.3671875, -1.3247222900390625, -1.282257080078125, -1.2397918701171875, -1.19732666015625, -1.1548614501953125, -1.112396240234375, -1.0699310302734375, -1.0274658203125, -0.9850006103515625, -0.942535400390625, -0.9000701904296875, -0.85760498046875, -0.8151397705078125, -0.772674560546875, -0.7302093505859375, -0.687744140625, -0.6452789306640625, -0.602813720703125, -0.5603485107421875, -0.51788330078125, -0.4754180908203125, -0.432952880859375, -0.3904876708984375, -0.3480224609375, -0.3055572509765625, -0.263092041015625, -0.2206268310546875, -0.17816162109375, -0.1356964111328125, -0.093231201171875, -0.0507659912109375, -0.00830078125, 0.0341644287109375, 0.076629638671875, 0.1190948486328125, 0.16156005859375, 0.2040252685546875, 0.246490478515625, 0.2889556884765625, 0.3314208984375, 0.3738861083984375, 0.416351318359375, 0.4588165283203125, 0.50128173828125, 0.5437469482421875, 0.586212158203125, 0.6286773681640625, 0.671142578125, 0.7136077880859375, 0.756072998046875, 0.7985382080078125, 0.84100341796875, 0.8834686279296875, 0.925933837890625, 0.9683990478515625, 1.0108642578125, 1.0533294677734375, 1.095794677734375, 1.1382598876953125, 1.18072509765625, 1.2231903076171875, 1.265655517578125, 1.3081207275390625, 1.3505859375]}, "gradients/encoder.encoder.layers.3.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 1.0, 2.0, 2.0, 2.0, 1.0, 3.0, 2.0, 5.0, 3.0, 2.0, 3.0, 10.0, 8.0, 11.0, 11.0, 15.0, 15.0, 21.0, 11.0, 19.0, 26.0, 34.0, 27.0, 28.0, 31.0, 34.0, 33.0, 39.0, 34.0, 39.0, 60.0, 45.0, 38.0, 30.0, 29.0, 38.0, 40.0, 27.0, 33.0, 20.0, 25.0, 21.0, 20.0, 13.0, 19.0, 18.0, 17.0, 5.0, 8.0, 6.0, 12.0, 3.0, 5.0, 1.0, 3.0, 5.0, 1.0, 3.0, 1.0, 1.0, 1.0, 1.0, 1.0], "bins": [-0.97509765625, -0.9443206787109375, -0.913543701171875, -0.8827667236328125, -0.85198974609375, -0.8212127685546875, -0.790435791015625, -0.7596588134765625, -0.7288818359375, -0.6981048583984375, -0.667327880859375, -0.6365509033203125, -0.60577392578125, -0.5749969482421875, -0.544219970703125, -0.5134429931640625, -0.482666015625, -0.4518890380859375, -0.421112060546875, -0.3903350830078125, -0.35955810546875, -0.3287811279296875, -0.298004150390625, -0.2672271728515625, -0.2364501953125, -0.2056732177734375, -0.174896240234375, -0.1441192626953125, -0.11334228515625, -0.0825653076171875, -0.051788330078125, -0.0210113525390625, 0.009765625, 0.0405426025390625, 0.071319580078125, 0.1020965576171875, 0.13287353515625, 0.1636505126953125, 0.194427490234375, 0.2252044677734375, 0.2559814453125, 0.2867584228515625, 0.317535400390625, 0.3483123779296875, 0.37908935546875, 0.4098663330078125, 0.440643310546875, 0.4714202880859375, 0.502197265625, 0.5329742431640625, 0.563751220703125, 0.5945281982421875, 0.62530517578125, 0.6560821533203125, 0.686859130859375, 0.7176361083984375, 0.7484130859375, 0.7791900634765625, 0.809967041015625, 0.8407440185546875, 0.87152099609375, 0.9022979736328125, 0.933074951171875, 0.9638519287109375, 0.99462890625]}, "gradients/encoder.encoder.layers.3.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 4.0, 1.0, 7.0, 1.0, 5.0, 8.0, 13.0, 10.0, 21.0, 26.0, 45.0, 62.0, 98.0, 139.0, 231.0, 442.0, 843.0, 1899.0, 4865.0, 14304.0, 50475.0, 197062.0, 572147.0, 149125.0, 38108.0, 11318.0, 3939.0, 1606.0, 708.0, 412.0, 222.0, 130.0, 84.0, 53.0, 35.0, 31.0, 19.0, 19.0, 8.0, 9.0, 7.0, 12.0, 3.0, 2.0, 4.0, 3.0, 1.0, 1.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.0546875, -2.954193115234375, -2.85369873046875, -2.753204345703125, -2.6527099609375, -2.552215576171875, -2.45172119140625, -2.351226806640625, -2.250732421875, -2.150238037109375, -2.04974365234375, -1.949249267578125, -1.8487548828125, -1.748260498046875, -1.64776611328125, -1.547271728515625, -1.44677734375, -1.346282958984375, -1.24578857421875, -1.145294189453125, -1.0447998046875, -0.944305419921875, -0.84381103515625, -0.743316650390625, -0.642822265625, -0.542327880859375, -0.44183349609375, -0.341339111328125, -0.2408447265625, -0.140350341796875, -0.03985595703125, 0.060638427734375, 0.1611328125, 0.261627197265625, 0.36212158203125, 0.462615966796875, 0.5631103515625, 0.663604736328125, 0.76409912109375, 0.864593505859375, 0.965087890625, 1.065582275390625, 1.16607666015625, 1.266571044921875, 1.3670654296875, 1.467559814453125, 1.56805419921875, 1.668548583984375, 1.76904296875, 1.869537353515625, 1.97003173828125, 2.070526123046875, 2.1710205078125, 2.271514892578125, 2.37200927734375, 2.472503662109375, 2.572998046875, 2.673492431640625, 2.77398681640625, 2.874481201171875, 2.9749755859375, 3.075469970703125, 3.17596435546875, 3.276458740234375, 3.376953125]}, "gradients/encoder.encoder.layers.3.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 2.0, 3.0, 7.0, 7.0, 6.0, 9.0, 8.0, 7.0, 13.0, 17.0, 26.0, 15.0, 26.0, 24.0, 36.0, 36.0, 44.0, 36.0, 44.0, 44.0, 43.0, 39.0, 44.0, 66.0, 42.0, 54.0, 43.0, 25.0, 33.0, 42.0, 29.0, 23.0, 19.0, 15.0, 16.0, 17.0, 14.0, 5.0, 9.0, 7.0, 1.0, 4.0, 2.0, 2.0, 1.0, 4.0, 0.0, 1.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 2.0, 1.0], "bins": [-3.9921875, -3.858154296875, -3.72412109375, -3.590087890625, -3.4560546875, -3.322021484375, -3.18798828125, -3.053955078125, -2.919921875, -2.785888671875, -2.65185546875, -2.517822265625, -2.3837890625, -2.249755859375, -2.11572265625, -1.981689453125, -1.84765625, -1.713623046875, -1.57958984375, -1.445556640625, -1.3115234375, -1.177490234375, -1.04345703125, -0.909423828125, -0.775390625, -0.641357421875, -0.50732421875, -0.373291015625, -0.2392578125, -0.105224609375, 0.02880859375, 0.162841796875, 0.296875, 0.430908203125, 0.56494140625, 0.698974609375, 0.8330078125, 0.967041015625, 1.10107421875, 1.235107421875, 1.369140625, 1.503173828125, 1.63720703125, 1.771240234375, 1.9052734375, 2.039306640625, 2.17333984375, 2.307373046875, 2.44140625, 2.575439453125, 2.70947265625, 2.843505859375, 2.9775390625, 3.111572265625, 3.24560546875, 3.379638671875, 3.513671875, 3.647705078125, 3.78173828125, 3.915771484375, 4.0498046875, 4.183837890625, 4.31787109375, 4.451904296875, 4.5859375]}, "gradients/encoder.encoder.layers.3.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 3.0, 3.0, 5.0, 8.0, 8.0, 19.0, 19.0, 23.0, 33.0, 43.0, 65.0, 86.0, 151.0, 224.0, 365.0, 591.0, 920.0, 1612.0, 2728.0, 5474.0, 12038.0, 29137.0, 81205.0, 256207.0, 486426.0, 106149.0, 36302.0, 14403.0, 6528.0, 3237.0, 1701.0, 992.0, 633.0, 399.0, 274.0, 169.0, 103.0, 83.0, 47.0, 39.0, 34.0, 24.0, 9.0, 17.0, 14.0, 8.0, 3.0, 2.0, 1.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.8984375, -0.8686065673828125, -0.838775634765625, -0.8089447021484375, -0.77911376953125, -0.7492828369140625, -0.719451904296875, -0.6896209716796875, -0.6597900390625, -0.6299591064453125, -0.600128173828125, -0.5702972412109375, -0.54046630859375, -0.5106353759765625, -0.480804443359375, -0.4509735107421875, -0.421142578125, -0.3913116455078125, -0.361480712890625, -0.3316497802734375, -0.30181884765625, -0.2719879150390625, -0.242156982421875, -0.2123260498046875, -0.1824951171875, -0.1526641845703125, -0.122833251953125, -0.0930023193359375, -0.06317138671875, -0.0333404541015625, -0.003509521484375, 0.0263214111328125, 0.05615234375, 0.0859832763671875, 0.115814208984375, 0.1456451416015625, 0.17547607421875, 0.2053070068359375, 0.235137939453125, 0.2649688720703125, 0.2947998046875, 0.3246307373046875, 0.354461669921875, 0.3842926025390625, 0.41412353515625, 0.4439544677734375, 0.473785400390625, 0.5036163330078125, 0.533447265625, 0.5632781982421875, 0.593109130859375, 0.6229400634765625, 0.65277099609375, 0.6826019287109375, 0.712432861328125, 0.7422637939453125, 0.7720947265625, 0.8019256591796875, 0.831756591796875, 0.8615875244140625, 0.89141845703125, 0.9212493896484375, 0.951080322265625, 0.9809112548828125, 1.0107421875]}, "gradients/encoder.encoder.layers.3.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 3.0, 6.0, 4.0, 1.0, 5.0, 2.0, 6.0, 7.0, 15.0, 6.0, 21.0, 27.0, 28.0, 38.0, 54.0, 61.0, 81.0, 97.0, 118.0, 85.0, 101.0, 59.0, 46.0, 36.0, 22.0, 20.0, 15.0, 13.0, 8.0, 10.0, 9.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0003418922424316406, -0.00032940879464149475, -0.0003169253468513489, -0.000304441899061203, -0.00029195845127105713, -0.00027947500348091125, -0.0002669915556907654, -0.0002545081079006195, -0.00024202466011047363, -0.00022954121232032776, -0.00021705776453018188, -0.000204574316740036, -0.00019209086894989014, -0.00017960742115974426, -0.0001671239733695984, -0.00015464052557945251, -0.00014215707778930664, -0.00012967362999916077, -0.00011719018220901489, -0.00010470673441886902, -9.222328662872314e-05, -7.973983883857727e-05, -6.72563910484314e-05, -5.477294325828552e-05, -4.228949546813965e-05, -2.9806047677993774e-05, -1.73225998878479e-05, -4.839152097702026e-06, 7.644295692443848e-06, 2.012774348258972e-05, 3.2611191272735596e-05, 4.509463906288147e-05, 5.7578086853027344e-05, 7.006153464317322e-05, 8.254498243331909e-05, 9.502843022346497e-05, 0.00010751187801361084, 0.00011999532580375671, 0.0001324787735939026, 0.00014496222138404846, 0.00015744566917419434, 0.0001699291169643402, 0.00018241256475448608, 0.00019489601254463196, 0.00020737946033477783, 0.0002198629081249237, 0.00023234635591506958, 0.00024482980370521545, 0.00025731325149536133, 0.0002697966992855072, 0.0002822801470756531, 0.00029476359486579895, 0.0003072470426559448, 0.0003197304904460907, 0.00033221393823623657, 0.00034469738602638245, 0.0003571808338165283, 0.0003696642816066742, 0.00038214772939682007, 0.00039463117718696594, 0.0004071146249771118, 0.0004195980727672577, 0.00043208152055740356, 0.00044456496834754944, 0.0004570484161376953]}, "gradients/encoder.encoder.layers.3.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 4.0, 0.0, 1.0, 2.0, 3.0, 3.0, 6.0, 21.0, 13.0, 35.0, 37.0, 63.0, 116.0, 236.0, 328.0, 565.0, 1072.0, 1939.0, 4331.0, 10453.0, 29362.0, 99508.0, 506710.0, 278184.0, 76035.0, 23328.0, 8617.0, 3633.0, 1750.0, 897.0, 506.0, 293.0, 188.0, 124.0, 73.0, 51.0, 28.0, 9.0, 16.0, 9.0, 4.0, 9.0, 1.0, 0.0, 3.0, 4.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.142578125, -1.1088714599609375, -1.075164794921875, -1.0414581298828125, -1.00775146484375, -0.9740447998046875, -0.940338134765625, -0.9066314697265625, -0.8729248046875, -0.8392181396484375, -0.805511474609375, -0.7718048095703125, -0.73809814453125, -0.7043914794921875, -0.670684814453125, -0.6369781494140625, -0.603271484375, -0.5695648193359375, -0.535858154296875, -0.5021514892578125, -0.46844482421875, -0.4347381591796875, -0.401031494140625, -0.3673248291015625, -0.3336181640625, -0.2999114990234375, -0.266204833984375, -0.2324981689453125, -0.19879150390625, -0.1650848388671875, -0.131378173828125, -0.0976715087890625, -0.06396484375, -0.0302581787109375, 0.003448486328125, 0.0371551513671875, 0.07086181640625, 0.1045684814453125, 0.138275146484375, 0.1719818115234375, 0.2056884765625, 0.2393951416015625, 0.273101806640625, 0.3068084716796875, 0.34051513671875, 0.3742218017578125, 0.407928466796875, 0.4416351318359375, 0.475341796875, 0.5090484619140625, 0.542755126953125, 0.5764617919921875, 0.61016845703125, 0.6438751220703125, 0.677581787109375, 0.7112884521484375, 0.7449951171875, 0.7787017822265625, 0.812408447265625, 0.8461151123046875, 0.87982177734375, 0.9135284423828125, 0.947235107421875, 0.9809417724609375, 1.0146484375]}, "gradients/encoder.encoder.layers.3.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 4.0, 1.0, 5.0, 6.0, 5.0, 8.0, 14.0, 10.0, 11.0, 18.0, 32.0, 32.0, 45.0, 62.0, 70.0, 66.0, 78.0, 76.0, 73.0, 69.0, 64.0, 61.0, 44.0, 35.0, 33.0, 27.0, 9.0, 14.0, 8.0, 5.0, 6.0, 2.0, 8.0, 4.0, 5.0, 2.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.00390625, -0.96453857421875, -0.9251708984375, -0.88580322265625, -0.846435546875, -0.80706787109375, -0.7677001953125, -0.72833251953125, -0.68896484375, -0.64959716796875, -0.6102294921875, -0.57086181640625, -0.531494140625, -0.49212646484375, -0.4527587890625, -0.41339111328125, -0.3740234375, -0.33465576171875, -0.2952880859375, -0.25592041015625, -0.216552734375, -0.17718505859375, -0.1378173828125, -0.09844970703125, -0.05908203125, -0.01971435546875, 0.0196533203125, 0.05902099609375, 0.098388671875, 0.13775634765625, 0.1771240234375, 0.21649169921875, 0.255859375, 0.29522705078125, 0.3345947265625, 0.37396240234375, 0.413330078125, 0.45269775390625, 0.4920654296875, 0.53143310546875, 0.57080078125, 0.61016845703125, 0.6495361328125, 0.68890380859375, 0.728271484375, 0.76763916015625, 0.8070068359375, 0.84637451171875, 0.8857421875, 0.92510986328125, 0.9644775390625, 1.00384521484375, 1.043212890625, 1.08258056640625, 1.1219482421875, 1.16131591796875, 1.20068359375, 1.24005126953125, 1.2794189453125, 1.31878662109375, 1.358154296875, 1.39752197265625, 1.4368896484375, 1.47625732421875, 1.515625]}, "gradients/encoder.encoder.layers.3.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 6.0, 1.0, 13.0, 18.0, 25.0, 65.0, 120.0, 225.0, 293.0, 134.0, 64.0, 23.0, 14.0, 3.0, 2.0, 2.0, 2.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-49.14048767089844, -47.78323745727539, -46.425987243652344, -45.0687370300293, -43.71148681640625, -42.35423278808594, -40.996986389160156, -39.639732360839844, -38.2824821472168, -36.92523193359375, -35.5679817199707, -34.210731506347656, -32.85348129272461, -31.49622917175293, -30.138978958129883, -28.781726837158203, -27.42447853088379, -26.067228317260742, -24.709978103637695, -23.352725982666016, -21.99547576904297, -20.638225555419922, -19.280975341796875, -17.923725128173828, -16.56647491455078, -15.209224700927734, -13.851973533630371, -12.494723320007324, -11.137472152709961, -9.780221939086914, -8.422971725463867, -7.065720558166504, -5.708469390869141, -4.3512187004089355, -2.9939682483673096, -1.6367177963256836, -0.2794671058654785, 1.0777835845947266, 2.4350337982177734, 3.7922849655151367, 5.149535179138184, 6.506785869598389, 7.864036560058594, 9.22128677368164, 10.578536987304688, 11.93578815460205, 13.293038368225098, 14.650289535522461, 16.007539749145508, 17.364789962768555, 18.7220401763916, 20.07929229736328, 21.436542510986328, 22.793792724609375, 24.151042938232422, 25.50829315185547, 26.865543365478516, 28.222793579101562, 29.58004379272461, 30.937294006347656, 32.2945442199707, 33.65179443359375, 35.00904846191406, 36.36629867553711, 37.723548889160156]}, "gradients/encoder.encoder.layers.3.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 0.0, 2.0, 2.0, 2.0, 2.0, 1.0, 9.0, 6.0, 9.0, 6.0, 9.0, 20.0, 18.0, 24.0, 29.0, 32.0, 35.0, 58.0, 55.0, 58.0, 96.0, 96.0, 63.0, 61.0, 48.0, 53.0, 37.0, 40.0, 31.0, 24.0, 24.0, 15.0, 18.0, 10.0, 6.0, 4.0, 6.0, 5.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-25.599811553955078, -24.875669479370117, -24.151527404785156, -23.427385330200195, -22.703243255615234, -21.979103088378906, -21.254959106445312, -20.530818939208984, -19.806676864624023, -19.082534790039062, -18.3583927154541, -17.63425064086914, -16.91010856628418, -16.18596649169922, -15.461825370788574, -14.73768424987793, -14.013541221618652, -13.289399147033691, -12.56525707244873, -11.841115951538086, -11.116973876953125, -10.392831802368164, -9.668689727783203, -8.944547653198242, -8.220405578613281, -7.49626350402832, -6.772121906280518, -6.047979831695557, -5.323838233947754, -4.599696159362793, -3.875554084777832, -3.1514124870300293, -2.4272708892822266, -1.7031290531158447, -0.9789870977401733, -0.25484514236450195, 0.4692966938018799, 1.1934385299682617, 1.9175806045532227, 2.6417222023010254, 3.3658642768859863, 4.090006351470947, 4.81414794921875, 5.538290023803711, 6.262432098388672, 6.986573696136475, 7.7107157707214355, 8.434857368469238, 9.1589994430542, 9.88314151763916, 10.607283592224121, 11.331424713134766, 12.055566787719727, 12.779708862304688, 13.503850936889648, 14.22799301147461, 14.95213508605957, 15.676277160644531, 16.400419235229492, 17.124561309814453, 17.848703384399414, 18.572845458984375, 19.296985626220703, 20.021127700805664, 20.745269775390625]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 2.0, 3.0, 2.0, 6.0, 4.0, 7.0, 8.0, 16.0, 23.0, 28.0, 33.0, 55.0, 90.0, 110.0, 197.0, 331.0, 544.0, 1004.0, 1895.0, 3956.0, 9741.0, 30758.0, 248044.0, 2895418.0, 908286.0, 66881.0, 15716.0, 5637.0, 2556.0, 1292.0, 646.0, 404.0, 196.0, 133.0, 85.0, 56.0, 43.0, 31.0, 18.0, 9.0, 5.0, 7.0, 9.0, 4.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.64453125, -2.568359375, -2.4921875, -2.416015625, -2.33984375, -2.263671875, -2.1875, -2.111328125, -2.03515625, -1.958984375, -1.8828125, -1.806640625, -1.73046875, -1.654296875, -1.578125, -1.501953125, -1.42578125, -1.349609375, -1.2734375, -1.197265625, -1.12109375, -1.044921875, -0.96875, -0.892578125, -0.81640625, -0.740234375, -0.6640625, -0.587890625, -0.51171875, -0.435546875, -0.359375, -0.283203125, -0.20703125, -0.130859375, -0.0546875, 0.021484375, 0.09765625, 0.173828125, 0.25, 0.326171875, 0.40234375, 0.478515625, 0.5546875, 0.630859375, 0.70703125, 0.783203125, 0.859375, 0.935546875, 1.01171875, 1.087890625, 1.1640625, 1.240234375, 1.31640625, 1.392578125, 1.46875, 1.544921875, 1.62109375, 1.697265625, 1.7734375, 1.849609375, 1.92578125, 2.001953125, 2.078125, 2.154296875, 2.23046875]}, "gradients/encoder.encoder.layers.2.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 0.0, 2.0, 5.0, 5.0, 4.0, 4.0, 9.0, 9.0, 17.0, 12.0, 21.0, 16.0, 18.0, 20.0, 22.0, 26.0, 35.0, 43.0, 30.0, 56.0, 45.0, 47.0, 49.0, 50.0, 41.0, 51.0, 43.0, 42.0, 44.0, 27.0, 33.0, 27.0, 29.0, 26.0, 17.0, 18.0, 14.0, 15.0, 7.0, 10.0, 6.0, 7.0, 3.0, 0.0, 3.0, 3.0, 1.0, 2.0, 1.0], "bins": [-1.271484375, -1.2380828857421875, -1.204681396484375, -1.1712799072265625, -1.13787841796875, -1.1044769287109375, -1.071075439453125, -1.0376739501953125, -1.0042724609375, -0.9708709716796875, -0.937469482421875, -0.9040679931640625, -0.87066650390625, -0.8372650146484375, -0.803863525390625, -0.7704620361328125, -0.737060546875, -0.7036590576171875, -0.670257568359375, -0.6368560791015625, -0.60345458984375, -0.5700531005859375, -0.536651611328125, -0.5032501220703125, -0.4698486328125, -0.4364471435546875, -0.403045654296875, -0.3696441650390625, -0.33624267578125, -0.3028411865234375, -0.269439697265625, -0.2360382080078125, -0.20263671875, -0.1692352294921875, -0.135833740234375, -0.1024322509765625, -0.06903076171875, -0.0356292724609375, -0.002227783203125, 0.0311737060546875, 0.0645751953125, 0.0979766845703125, 0.131378173828125, 0.1647796630859375, 0.19818115234375, 0.2315826416015625, 0.264984130859375, 0.2983856201171875, 0.331787109375, 0.3651885986328125, 0.398590087890625, 0.4319915771484375, 0.46539306640625, 0.4987945556640625, 0.532196044921875, 0.5655975341796875, 0.5989990234375, 0.6324005126953125, 0.665802001953125, 0.6992034912109375, 0.73260498046875, 0.7660064697265625, 0.799407958984375, 0.8328094482421875, 0.8662109375]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 5.0, 4.0, 11.0, 21.0, 47.0, 95.0, 148.0, 361.0, 853.0, 3416.0, 165036.0, 4009397.0, 12291.0, 1438.0, 605.0, 279.0, 135.0, 67.0, 37.0, 19.0, 12.0, 8.0, 0.0, 3.0, 1.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.1953125, -11.8492431640625, -11.503173828125, -11.1571044921875, -10.81103515625, -10.4649658203125, -10.118896484375, -9.7728271484375, -9.4267578125, -9.0806884765625, -8.734619140625, -8.3885498046875, -8.04248046875, -7.6964111328125, -7.350341796875, -7.0042724609375, -6.658203125, -6.3121337890625, -5.966064453125, -5.6199951171875, -5.27392578125, -4.9278564453125, -4.581787109375, -4.2357177734375, -3.8896484375, -3.5435791015625, -3.197509765625, -2.8514404296875, -2.50537109375, -2.1593017578125, -1.813232421875, -1.4671630859375, -1.12109375, -0.7750244140625, -0.428955078125, -0.0828857421875, 0.26318359375, 0.6092529296875, 0.955322265625, 1.3013916015625, 1.6474609375, 1.9935302734375, 2.339599609375, 2.6856689453125, 3.03173828125, 3.3778076171875, 3.723876953125, 4.0699462890625, 4.416015625, 4.7620849609375, 5.108154296875, 5.4542236328125, 5.80029296875, 6.1463623046875, 6.492431640625, 6.8385009765625, 7.1845703125, 7.5306396484375, 7.876708984375, 8.2227783203125, 8.56884765625, 8.9149169921875, 9.260986328125, 9.6070556640625, 9.953125]}, "gradients/encoder.encoder.layers.2.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 3.0, 0.0, 3.0, 2.0, 3.0, 6.0, 4.0, 14.0, 17.0, 29.0, 49.0, 81.0, 148.0, 234.0, 579.0, 1143.0, 978.0, 441.0, 166.0, 81.0, 53.0, 18.0, 14.0, 9.0, 4.0, 4.0, 1.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.62890625, -2.4722900390625, -2.315673828125, -2.1590576171875, -2.00244140625, -1.8458251953125, -1.689208984375, -1.5325927734375, -1.3759765625, -1.2193603515625, -1.062744140625, -0.9061279296875, -0.74951171875, -0.5928955078125, -0.436279296875, -0.2796630859375, -0.123046875, 0.0335693359375, 0.190185546875, 0.3468017578125, 0.50341796875, 0.6600341796875, 0.816650390625, 0.9732666015625, 1.1298828125, 1.2864990234375, 1.443115234375, 1.5997314453125, 1.75634765625, 1.9129638671875, 2.069580078125, 2.2261962890625, 2.3828125, 2.5394287109375, 2.696044921875, 2.8526611328125, 3.00927734375, 3.1658935546875, 3.322509765625, 3.4791259765625, 3.6357421875, 3.7923583984375, 3.948974609375, 4.1055908203125, 4.26220703125, 4.4188232421875, 4.575439453125, 4.7320556640625, 4.888671875, 5.0452880859375, 5.201904296875, 5.3585205078125, 5.51513671875, 5.6717529296875, 5.828369140625, 5.9849853515625, 6.1416015625, 6.2982177734375, 6.454833984375, 6.6114501953125, 6.76806640625, 6.9246826171875, 7.081298828125, 7.2379150390625, 7.39453125]}, "gradients/encoder.encoder.layers.2.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 3.0, 4.0, 0.0, 6.0, 9.0, 25.0, 66.0, 168.0, 320.0, 233.0, 118.0, 38.0, 10.0, 5.0, 4.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-90.71321868896484, -88.59353637695312, -86.47384643554688, -84.35416412353516, -82.23448181152344, -80.11479187011719, -77.99510955810547, -75.87541961669922, -73.7557373046875, -71.63605499267578, -69.51636505126953, -67.39668273925781, -65.27699279785156, -63.157310485839844, -61.037628173828125, -58.91794204711914, -56.798255920410156, -54.67856979370117, -52.55888366699219, -50.43920135498047, -48.319515228271484, -46.1998291015625, -44.08014678955078, -41.9604606628418, -39.84077453613281, -37.72108840942383, -35.601402282714844, -33.481719970703125, -31.36203384399414, -29.242347717285156, -27.122663497924805, -25.002979278564453, -22.88330078125, -20.763614654541016, -18.643930435180664, -16.524246215820312, -14.404560089111328, -12.28487491607666, -10.165189743041992, -8.045504570007324, -5.925819396972656, -3.8061342239379883, -1.6864490509033203, 0.43323612213134766, 2.5529212951660156, 4.672606468200684, 6.792291641235352, 8.91197681427002, 11.031661987304688, 13.151347160339355, 15.271032333374023, 17.390716552734375, 19.51040267944336, 21.630088806152344, 23.749773025512695, 25.869457244873047, 27.98914337158203, 30.108829498291016, 32.228515625, 34.34819793701172, 36.4678840637207, 38.58757019042969, 40.707252502441406, 42.82693862915039, 44.946624755859375]}, "gradients/encoder.encoder.layers.2.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 2.0, 1.0, 2.0, 4.0, 2.0, 3.0, 6.0, 11.0, 16.0, 15.0, 11.0, 28.0, 20.0, 31.0, 37.0, 41.0, 43.0, 37.0, 63.0, 54.0, 54.0, 81.0, 53.0, 58.0, 54.0, 43.0, 44.0, 37.0, 33.0, 26.0, 23.0, 24.0, 16.0, 13.0, 8.0, 8.0, 3.0, 5.0, 3.0, 0.0, 2.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-21.478548049926758, -20.798233032226562, -20.117916107177734, -19.43760108947754, -18.757286071777344, -18.07697105407715, -17.396656036376953, -16.716339111328125, -16.03602409362793, -15.355709075927734, -14.675393104553223, -13.995077133178711, -13.314762115478516, -12.63444709777832, -11.954131126403809, -11.273815155029297, -10.593500137329102, -9.913185119628906, -9.232869148254395, -8.552553176879883, -7.8722381591796875, -7.191922664642334, -6.5116071701049805, -5.831291675567627, -5.150976181030273, -4.47066068649292, -3.7903451919555664, -3.110029697418213, -2.4297142028808594, -1.7493987083435059, -1.0690832138061523, -0.38876771926879883, 0.2915458679199219, 0.9718613624572754, 1.652176856994629, 2.3324923515319824, 3.012807846069336, 3.6931233406066895, 4.373438835144043, 5.0537543296813965, 5.73406982421875, 6.4143853187561035, 7.094700813293457, 7.7750163078308105, 8.455331802368164, 9.13564682006836, 9.815962791442871, 10.496278762817383, 11.176593780517578, 11.856908798217773, 12.537224769592285, 13.217540740966797, 13.897855758666992, 14.578170776367188, 15.2584867477417, 15.938802719116211, 16.619117736816406, 17.2994327545166, 17.979747772216797, 18.660064697265625, 19.34037971496582, 20.020694732666016, 20.701011657714844, 21.38132667541504, 22.061641693115234]}, "gradients/encoder.encoder.layers.2.attention.out_proj.weight": {"_type": "histogram", "values": [2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 2.0, 5.0, 8.0, 7.0, 11.0, 11.0, 20.0, 31.0, 37.0, 50.0, 87.0, 131.0, 161.0, 242.0, 356.0, 535.0, 814.0, 1404.0, 2254.0, 3595.0, 6074.0, 10528.0, 18748.0, 34318.0, 64987.0, 124318.0, 216415.0, 240062.0, 149693.0, 78780.0, 41600.0, 22315.0, 12649.0, 7034.0, 4253.0, 2546.0, 1637.0, 974.0, 602.0, 403.0, 272.0, 159.0, 134.0, 79.0, 54.0, 44.0, 33.0, 27.0, 19.0, 14.0, 10.0, 9.0, 6.0, 2.0, 6.0, 1.0, 0.0, 1.0], "bins": [-1.6181640625, -1.5693511962890625, -1.520538330078125, -1.4717254638671875, -1.42291259765625, -1.3740997314453125, -1.325286865234375, -1.2764739990234375, -1.2276611328125, -1.1788482666015625, -1.130035400390625, -1.0812225341796875, -1.03240966796875, -0.9835968017578125, -0.934783935546875, -0.8859710693359375, -0.837158203125, -0.7883453369140625, -0.739532470703125, -0.6907196044921875, -0.64190673828125, -0.5930938720703125, -0.544281005859375, -0.4954681396484375, -0.4466552734375, -0.3978424072265625, -0.349029541015625, -0.3002166748046875, -0.25140380859375, -0.2025909423828125, -0.153778076171875, -0.1049652099609375, -0.05615234375, -0.0073394775390625, 0.041473388671875, 0.0902862548828125, 0.13909912109375, 0.1879119873046875, 0.236724853515625, 0.2855377197265625, 0.3343505859375, 0.3831634521484375, 0.431976318359375, 0.4807891845703125, 0.52960205078125, 0.5784149169921875, 0.627227783203125, 0.6760406494140625, 0.724853515625, 0.7736663818359375, 0.822479248046875, 0.8712921142578125, 0.92010498046875, 0.9689178466796875, 1.017730712890625, 1.0665435791015625, 1.1153564453125, 1.1641693115234375, 1.212982177734375, 1.2617950439453125, 1.31060791015625, 1.3594207763671875, 1.408233642578125, 1.4570465087890625, 1.505859375]}, "gradients/encoder.encoder.layers.2.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 3.0, 2.0, 0.0, 4.0, 3.0, 8.0, 9.0, 9.0, 11.0, 15.0, 13.0, 13.0, 21.0, 17.0, 28.0, 32.0, 33.0, 33.0, 40.0, 51.0, 50.0, 63.0, 50.0, 57.0, 56.0, 50.0, 53.0, 34.0, 33.0, 31.0, 32.0, 24.0, 20.0, 18.0, 23.0, 13.0, 17.0, 7.0, 19.0, 6.0, 3.0, 4.0, 6.0, 3.0, 2.0, 0.0, 0.0, 1.0], "bins": [-1.748046875, -1.7032318115234375, -1.658416748046875, -1.6136016845703125, -1.56878662109375, -1.5239715576171875, -1.479156494140625, -1.4343414306640625, -1.3895263671875, -1.3447113037109375, -1.299896240234375, -1.2550811767578125, -1.21026611328125, -1.1654510498046875, -1.120635986328125, -1.0758209228515625, -1.031005859375, -0.9861907958984375, -0.941375732421875, -0.8965606689453125, -0.85174560546875, -0.8069305419921875, -0.762115478515625, -0.7173004150390625, -0.6724853515625, -0.6276702880859375, -0.582855224609375, -0.5380401611328125, -0.49322509765625, -0.4484100341796875, -0.403594970703125, -0.3587799072265625, -0.31396484375, -0.2691497802734375, -0.224334716796875, -0.1795196533203125, -0.13470458984375, -0.0898895263671875, -0.045074462890625, -0.0002593994140625, 0.0445556640625, 0.0893707275390625, 0.134185791015625, 0.1790008544921875, 0.22381591796875, 0.2686309814453125, 0.313446044921875, 0.3582611083984375, 0.403076171875, 0.4478912353515625, 0.492706298828125, 0.5375213623046875, 0.58233642578125, 0.6271514892578125, 0.671966552734375, 0.7167816162109375, 0.7615966796875, 0.8064117431640625, 0.851226806640625, 0.8960418701171875, 0.94085693359375, 0.9856719970703125, 1.030487060546875, 1.0753021240234375, 1.1201171875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 2.0, 3.0, 7.0, 0.0, 0.0, 4.0, 3.0, 7.0, 9.0, 14.0, 21.0, 27.0, 46.0, 65.0, 118.0, 179.0, 299.0, 616.0, 1410.0, 4448.0, 24106.0, 237083.0, 715325.0, 52941.0, 8036.0, 2066.0, 763.0, 376.0, 225.0, 131.0, 73.0, 54.0, 32.0, 14.0, 16.0, 16.0, 12.0, 5.0, 6.0, 4.0, 2.0, 1.0, 2.0, 0.0, 1.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.92578125, -5.74169921875, -5.5576171875, -5.37353515625, -5.189453125, -5.00537109375, -4.8212890625, -4.63720703125, -4.453125, -4.26904296875, -4.0849609375, -3.90087890625, -3.716796875, -3.53271484375, -3.3486328125, -3.16455078125, -2.98046875, -2.79638671875, -2.6123046875, -2.42822265625, -2.244140625, -2.06005859375, -1.8759765625, -1.69189453125, -1.5078125, -1.32373046875, -1.1396484375, -0.95556640625, -0.771484375, -0.58740234375, -0.4033203125, -0.21923828125, -0.03515625, 0.14892578125, 0.3330078125, 0.51708984375, 0.701171875, 0.88525390625, 1.0693359375, 1.25341796875, 1.4375, 1.62158203125, 1.8056640625, 1.98974609375, 2.173828125, 2.35791015625, 2.5419921875, 2.72607421875, 2.91015625, 3.09423828125, 3.2783203125, 3.46240234375, 3.646484375, 3.83056640625, 4.0146484375, 4.19873046875, 4.3828125, 4.56689453125, 4.7509765625, 4.93505859375, 5.119140625, 5.30322265625, 5.4873046875, 5.67138671875, 5.85546875]}, "gradients/encoder.encoder.layers.2.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 2.0, 2.0, 4.0, 1.0, 3.0, 4.0, 2.0, 4.0, 9.0, 5.0, 13.0, 14.0, 17.0, 11.0, 8.0, 22.0, 21.0, 21.0, 26.0, 31.0, 43.0, 52.0, 55.0, 40.0, 42.0, 48.0, 60.0, 50.0, 45.0, 45.0, 41.0, 40.0, 35.0, 21.0, 29.0, 22.0, 24.0, 22.0, 18.0, 13.0, 7.0, 5.0, 6.0, 6.0, 7.0, 2.0, 4.0, 7.0, 3.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0], "bins": [-5.69140625, -5.52947998046875, -5.3675537109375, -5.20562744140625, -5.043701171875, -4.88177490234375, -4.7198486328125, -4.55792236328125, -4.39599609375, -4.23406982421875, -4.0721435546875, -3.91021728515625, -3.748291015625, -3.58636474609375, -3.4244384765625, -3.26251220703125, -3.1005859375, -2.93865966796875, -2.7767333984375, -2.61480712890625, -2.452880859375, -2.29095458984375, -2.1290283203125, -1.96710205078125, -1.80517578125, -1.64324951171875, -1.4813232421875, -1.31939697265625, -1.157470703125, -0.99554443359375, -0.8336181640625, -0.67169189453125, -0.509765625, -0.34783935546875, -0.1859130859375, -0.02398681640625, 0.137939453125, 0.29986572265625, 0.4617919921875, 0.62371826171875, 0.78564453125, 0.94757080078125, 1.1094970703125, 1.27142333984375, 1.433349609375, 1.59527587890625, 1.7572021484375, 1.91912841796875, 2.0810546875, 2.24298095703125, 2.4049072265625, 2.56683349609375, 2.728759765625, 2.89068603515625, 3.0526123046875, 3.21453857421875, 3.37646484375, 3.53839111328125, 3.7003173828125, 3.86224365234375, 4.024169921875, 4.18609619140625, 4.3480224609375, 4.50994873046875, 4.671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 3.0, 1.0, 1.0, 1.0, 1.0, 3.0, 1.0, 3.0, 5.0, 7.0, 6.0, 11.0, 11.0, 20.0, 24.0, 33.0, 58.0, 116.0, 207.0, 432.0, 965.0, 2733.0, 11017.0, 87092.0, 844383.0, 85878.0, 10927.0, 2780.0, 922.0, 398.0, 201.0, 115.0, 56.0, 51.0, 28.0, 13.0, 18.0, 10.0, 10.0, 6.0, 3.0, 7.0, 4.0, 3.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.8330078125, -1.7729034423828125, -1.712799072265625, -1.6526947021484375, -1.59259033203125, -1.5324859619140625, -1.472381591796875, -1.4122772216796875, -1.3521728515625, -1.2920684814453125, -1.231964111328125, -1.1718597412109375, -1.11175537109375, -1.0516510009765625, -0.991546630859375, -0.9314422607421875, -0.871337890625, -0.8112335205078125, -0.751129150390625, -0.6910247802734375, -0.63092041015625, -0.5708160400390625, -0.510711669921875, -0.4506072998046875, -0.3905029296875, -0.3303985595703125, -0.270294189453125, -0.2101898193359375, -0.15008544921875, -0.0899810791015625, -0.029876708984375, 0.0302276611328125, 0.09033203125, 0.1504364013671875, 0.210540771484375, 0.2706451416015625, 0.33074951171875, 0.3908538818359375, 0.450958251953125, 0.5110626220703125, 0.5711669921875, 0.6312713623046875, 0.691375732421875, 0.7514801025390625, 0.81158447265625, 0.8716888427734375, 0.931793212890625, 0.9918975830078125, 1.052001953125, 1.1121063232421875, 1.172210693359375, 1.2323150634765625, 1.29241943359375, 1.3525238037109375, 1.412628173828125, 1.4727325439453125, 1.5328369140625, 1.5929412841796875, 1.653045654296875, 1.7131500244140625, 1.77325439453125, 1.8333587646484375, 1.893463134765625, 1.9535675048828125, 2.013671875]}, "gradients/encoder.encoder.layers.2.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 1.0, 1.0, 4.0, 1.0, 2.0, 2.0, 5.0, 10.0, 4.0, 6.0, 2.0, 4.0, 6.0, 6.0, 19.0, 9.0, 11.0, 18.0, 28.0, 22.0, 41.0, 56.0, 67.0, 85.0, 85.0, 119.0, 70.0, 82.0, 53.0, 38.0, 30.0, 19.0, 24.0, 16.0, 12.0, 10.0, 11.0, 4.0, 6.0, 4.0, 3.0, 4.0, 1.0, 4.0, 2.0, 1.0, 3.0, 0.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-0.0002727508544921875, -0.00026455894112586975, -0.000256367027759552, -0.00024817511439323425, -0.0002399832010269165, -0.00023179128766059875, -0.000223599374294281, -0.00021540746092796326, -0.0002072155475616455, -0.00019902363419532776, -0.00019083172082901, -0.00018263980746269226, -0.0001744478940963745, -0.00016625598073005676, -0.00015806406736373901, -0.00014987215399742126, -0.00014168024063110352, -0.00013348832726478577, -0.00012529641389846802, -0.00011710450053215027, -0.00010891258716583252, -0.00010072067379951477, -9.252876043319702e-05, -8.433684706687927e-05, -7.614493370056152e-05, -6.795302033424377e-05, -5.9761106967926025e-05, -5.1569193601608276e-05, -4.337728023529053e-05, -3.518536686897278e-05, -2.699345350265503e-05, -1.880154013633728e-05, -1.0609626770019531e-05, -2.4177134037017822e-06, 5.774199962615967e-06, 1.3966113328933716e-05, 2.2158026695251465e-05, 3.0349940061569214e-05, 3.854185342788696e-05, 4.673376679420471e-05, 5.492568016052246e-05, 6.311759352684021e-05, 7.130950689315796e-05, 7.950142025947571e-05, 8.769333362579346e-05, 9.58852469921112e-05, 0.00010407716035842896, 0.0001122690737247467, 0.00012046098709106445, 0.0001286529004573822, 0.00013684481382369995, 0.0001450367271900177, 0.00015322864055633545, 0.0001614205539226532, 0.00016961246728897095, 0.0001778043806552887, 0.00018599629402160645, 0.0001941882073879242, 0.00020238012075424194, 0.0002105720341205597, 0.00021876394748687744, 0.0002269558608531952, 0.00023514777421951294, 0.0002433396875858307, 0.00025153160095214844]}, "gradients/encoder.encoder.layers.2.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 2.0, 4.0, 2.0, 7.0, 4.0, 4.0, 14.0, 20.0, 29.0, 52.0, 126.0, 271.0, 703.0, 2211.0, 11846.0, 154673.0, 832252.0, 39168.0, 5159.0, 1211.0, 440.0, 164.0, 81.0, 49.0, 21.0, 19.0, 14.0, 7.0, 7.0, 2.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.7744140625, -1.7068634033203125, -1.639312744140625, -1.5717620849609375, -1.50421142578125, -1.4366607666015625, -1.369110107421875, -1.3015594482421875, -1.2340087890625, -1.1664581298828125, -1.098907470703125, -1.0313568115234375, -0.96380615234375, -0.8962554931640625, -0.828704833984375, -0.7611541748046875, -0.693603515625, -0.6260528564453125, -0.558502197265625, -0.4909515380859375, -0.42340087890625, -0.3558502197265625, -0.288299560546875, -0.2207489013671875, -0.1531982421875, -0.0856475830078125, -0.018096923828125, 0.0494537353515625, 0.11700439453125, 0.1845550537109375, 0.252105712890625, 0.3196563720703125, 0.38720703125, 0.4547576904296875, 0.522308349609375, 0.5898590087890625, 0.65740966796875, 0.7249603271484375, 0.792510986328125, 0.8600616455078125, 0.9276123046875, 0.9951629638671875, 1.062713623046875, 1.1302642822265625, 1.19781494140625, 1.2653656005859375, 1.332916259765625, 1.4004669189453125, 1.468017578125, 1.5355682373046875, 1.603118896484375, 1.6706695556640625, 1.73822021484375, 1.8057708740234375, 1.873321533203125, 1.9408721923828125, 2.0084228515625, 2.0759735107421875, 2.143524169921875, 2.2110748291015625, 2.27862548828125, 2.3461761474609375, 2.413726806640625, 2.4812774658203125, 2.548828125]}, "gradients/encoder.encoder.layers.2.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 4.0, 1.0, 0.0, 0.0, 1.0, 0.0, 2.0, 3.0, 0.0, 4.0, 2.0, 1.0, 1.0, 3.0, 9.0, 10.0, 9.0, 12.0, 13.0, 14.0, 19.0, 24.0, 34.0, 32.0, 64.0, 56.0, 57.0, 69.0, 73.0, 61.0, 72.0, 65.0, 52.0, 51.0, 34.0, 39.0, 26.0, 18.0, 18.0, 13.0, 12.0, 7.0, 7.0, 8.0, 3.0, 4.0, 2.0, 1.0, 6.0, 1.0, 0.0, 1.0, 3.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-0.87744140625, -0.8484268188476562, -0.8194122314453125, -0.7903976440429688, -0.761383056640625, -0.7323684692382812, -0.7033538818359375, -0.6743392944335938, -0.64532470703125, -0.6163101196289062, -0.5872955322265625, -0.5582809448242188, -0.529266357421875, -0.5002517700195312, -0.4712371826171875, -0.44222259521484375, -0.4132080078125, -0.38419342041015625, -0.3551788330078125, -0.32616424560546875, -0.297149658203125, -0.26813507080078125, -0.2391204833984375, -0.21010589599609375, -0.18109130859375, -0.15207672119140625, -0.1230621337890625, -0.09404754638671875, -0.065032958984375, -0.03601837158203125, -0.0070037841796875, 0.02201080322265625, 0.051025390625, 0.08003997802734375, 0.1090545654296875, 0.13806915283203125, 0.167083740234375, 0.19609832763671875, 0.2251129150390625, 0.25412750244140625, 0.28314208984375, 0.31215667724609375, 0.3411712646484375, 0.37018585205078125, 0.399200439453125, 0.42821502685546875, 0.4572296142578125, 0.48624420166015625, 0.5152587890625, 0.5442733764648438, 0.5732879638671875, 0.6023025512695312, 0.631317138671875, 0.6603317260742188, 0.6893463134765625, 0.7183609008789062, 0.74737548828125, 0.7763900756835938, 0.8054046630859375, 0.8344192504882812, 0.863433837890625, 0.8924484252929688, 0.9214630126953125, 0.9504776000976562, 0.9794921875]}, "gradients/encoder.encoder.layers.2.layer_norm.weight": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 3.0, 2.0, 3.0, 7.0, 12.0, 15.0, 24.0, 34.0, 48.0, 88.0, 139.0, 268.0, 124.0, 77.0, 75.0, 28.0, 21.0, 19.0, 4.0, 6.0, 4.0, 3.0, 5.0, 1.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-17.634052276611328, -16.80976104736328, -15.98547077178955, -15.161179542541504, -14.336889266967773, -13.512598037719727, -12.68830680847168, -11.864015579223633, -11.039725303649902, -10.215434074401855, -9.391143798828125, -8.566852569580078, -7.7425618171691895, -6.918271064758301, -6.093979835510254, -5.269689083099365, -4.445398330688477, -3.621107578277588, -2.79681658744812, -1.9725255966186523, -1.1482348442077637, -0.323944091796875, 0.5003471374511719, 1.3246378898620605, 2.148928642272949, 2.973219394683838, 3.7975103855133057, 4.621801376342773, 5.446092128753662, 6.270382881164551, 7.094674110412598, 7.918964862823486, 8.743255615234375, 9.567546844482422, 10.391837120056152, 11.2161283493042, 12.04041862487793, 12.864709854125977, 13.689001083374023, 14.51329231262207, 15.3375825881958, 16.16187286376953, 16.986164093017578, 17.810455322265625, 18.634746551513672, 19.45903778076172, 20.283329010009766, 21.10761833190918, 21.931909561157227, 22.756200790405273, 23.58049201965332, 24.404781341552734, 25.22907257080078, 26.053363800048828, 26.877655029296875, 27.701946258544922, 28.52623748779297, 29.350528717041016, 30.174819946289062, 30.99911117553711, 31.823400497436523, 32.64768981933594, 33.47198486328125, 34.29627227783203, 35.12056350708008]}, "gradients/encoder.encoder.layers.2.layer_norm.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 2.0, 5.0, 2.0, 7.0, 3.0, 5.0, 6.0, 17.0, 15.0, 17.0, 14.0, 16.0, 24.0, 31.0, 30.0, 43.0, 35.0, 46.0, 73.0, 113.0, 102.0, 79.0, 42.0, 37.0, 33.0, 29.0, 32.0, 27.0, 20.0, 21.0, 25.0, 11.0, 14.0, 10.0, 8.0, 1.0, 8.0, 2.0, 3.0, 2.0, 2.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0], "bins": [-23.476234436035156, -22.722492218017578, -21.96875, -21.215007781982422, -20.461265563964844, -19.707523345947266, -18.953781127929688, -18.20003890991211, -17.44629669189453, -16.692554473876953, -15.938812255859375, -15.185070037841797, -14.431327819824219, -13.67758560180664, -12.923843383789062, -12.170101165771484, -11.416359901428223, -10.662617683410645, -9.908875465393066, -9.155133247375488, -8.40139102935791, -7.647648811340332, -6.893907070159912, -6.140164852142334, -5.386422634124756, -4.632680416107178, -3.8789381980895996, -3.1251962184906006, -2.3714540004730225, -1.6177117824554443, -0.8639698028564453, -0.11022758483886719, 0.6435146331787109, 1.397256851196289, 2.150999069213867, 2.904741048812866, 3.6584832668304443, 4.412225723266602, 5.1659674644470215, 5.9197096824646, 6.673451900482178, 7.427194118499756, 8.180935859680176, 8.934678077697754, 9.688420295715332, 10.44216251373291, 11.195904731750488, 11.949646949768066, 12.703389167785645, 13.457131385803223, 14.2108736038208, 14.964615821838379, 15.718358039855957, 16.47209930419922, 17.225841522216797, 17.979583740234375, 18.733325958251953, 19.48706817626953, 20.24081039428711, 20.994552612304688, 21.748294830322266, 22.502037048339844, 23.255779266357422, 24.009521484375, 24.763263702392578]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 5.0, 1.0, 4.0, 8.0, 8.0, 22.0, 13.0, 26.0, 36.0, 38.0, 60.0, 121.0, 146.0, 244.0, 373.0, 635.0, 1150.0, 2135.0, 4165.0, 10720.0, 49723.0, 500653.0, 2773148.0, 754072.0, 72767.0, 13681.0, 4928.0, 2309.0, 1205.0, 725.0, 419.0, 245.0, 154.0, 126.0, 72.0, 44.0, 37.0, 18.0, 15.0, 15.0, 13.0, 7.0, 4.0, 2.0, 2.0, 3.0, 0.0, 1.0, 1.0], "bins": [-2.615234375, -2.545654296875, -2.47607421875, -2.406494140625, -2.3369140625, -2.267333984375, -2.19775390625, -2.128173828125, -2.05859375, -1.989013671875, -1.91943359375, -1.849853515625, -1.7802734375, -1.710693359375, -1.64111328125, -1.571533203125, -1.501953125, -1.432373046875, -1.36279296875, -1.293212890625, -1.2236328125, -1.154052734375, -1.08447265625, -1.014892578125, -0.9453125, -0.875732421875, -0.80615234375, -0.736572265625, -0.6669921875, -0.597412109375, -0.52783203125, -0.458251953125, -0.388671875, -0.319091796875, -0.24951171875, -0.179931640625, -0.1103515625, -0.040771484375, 0.02880859375, 0.098388671875, 0.16796875, 0.237548828125, 0.30712890625, 0.376708984375, 0.4462890625, 0.515869140625, 0.58544921875, 0.655029296875, 0.724609375, 0.794189453125, 0.86376953125, 0.933349609375, 1.0029296875, 1.072509765625, 1.14208984375, 1.211669921875, 1.28125, 1.350830078125, 1.42041015625, 1.489990234375, 1.5595703125, 1.629150390625, 1.69873046875, 1.768310546875, 1.837890625]}, "gradients/encoder.encoder.layers.1.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 2.0, 3.0, 2.0, 3.0, 9.0, 6.0, 10.0, 14.0, 9.0, 15.0, 16.0, 22.0, 17.0, 29.0, 33.0, 35.0, 36.0, 44.0, 40.0, 54.0, 45.0, 45.0, 49.0, 42.0, 52.0, 49.0, 39.0, 33.0, 34.0, 31.0, 27.0, 23.0, 25.0, 20.0, 27.0, 14.0, 11.0, 8.0, 2.0, 11.0, 2.0, 7.0, 6.0, 3.0, 4.0, 1.0, 1.0, 1.0, 1.0, 0.0, 2.0], "bins": [-1.462890625, -1.4214935302734375, -1.380096435546875, -1.3386993408203125, -1.29730224609375, -1.2559051513671875, -1.214508056640625, -1.1731109619140625, -1.1317138671875, -1.0903167724609375, -1.048919677734375, -1.0075225830078125, -0.96612548828125, -0.9247283935546875, -0.883331298828125, -0.8419342041015625, -0.800537109375, -0.7591400146484375, -0.717742919921875, -0.6763458251953125, -0.63494873046875, -0.5935516357421875, -0.552154541015625, -0.5107574462890625, -0.4693603515625, -0.4279632568359375, -0.386566162109375, -0.3451690673828125, -0.30377197265625, -0.2623748779296875, -0.220977783203125, -0.1795806884765625, -0.13818359375, -0.0967864990234375, -0.055389404296875, -0.0139923095703125, 0.02740478515625, 0.0688018798828125, 0.110198974609375, 0.1515960693359375, 0.1929931640625, 0.2343902587890625, 0.275787353515625, 0.3171844482421875, 0.35858154296875, 0.3999786376953125, 0.441375732421875, 0.4827728271484375, 0.524169921875, 0.5655670166015625, 0.606964111328125, 0.6483612060546875, 0.68975830078125, 0.7311553955078125, 0.772552490234375, 0.8139495849609375, 0.8553466796875, 0.8967437744140625, 0.938140869140625, 0.9795379638671875, 1.02093505859375, 1.0623321533203125, 1.103729248046875, 1.1451263427734375, 1.1865234375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 5.0, 10.0, 22.0, 42.0, 60.0, 139.0, 268.0, 482.0, 1333.0, 33394.0, 4138969.0, 17251.0, 1208.0, 501.0, 264.0, 172.0, 95.0, 32.0, 23.0, 7.0, 6.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.7734375, -12.3795166015625, -11.985595703125, -11.5916748046875, -11.19775390625, -10.8038330078125, -10.409912109375, -10.0159912109375, -9.6220703125, -9.2281494140625, -8.834228515625, -8.4403076171875, -8.04638671875, -7.6524658203125, -7.258544921875, -6.8646240234375, -6.470703125, -6.0767822265625, -5.682861328125, -5.2889404296875, -4.89501953125, -4.5010986328125, -4.107177734375, -3.7132568359375, -3.3193359375, -2.9254150390625, -2.531494140625, -2.1375732421875, -1.74365234375, -1.3497314453125, -0.955810546875, -0.5618896484375, -0.16796875, 0.2259521484375, 0.619873046875, 1.0137939453125, 1.40771484375, 1.8016357421875, 2.195556640625, 2.5894775390625, 2.9833984375, 3.3773193359375, 3.771240234375, 4.1651611328125, 4.55908203125, 4.9530029296875, 5.346923828125, 5.7408447265625, 6.134765625, 6.5286865234375, 6.922607421875, 7.3165283203125, 7.71044921875, 8.1043701171875, 8.498291015625, 8.8922119140625, 9.2861328125, 9.6800537109375, 10.073974609375, 10.4678955078125, 10.86181640625, 11.2557373046875, 11.649658203125, 12.0435791015625, 12.4375]}, "gradients/encoder.encoder.layers.1.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 3.0, 0.0, 2.0, 4.0, 4.0, 13.0, 32.0, 44.0, 99.0, 215.0, 546.0, 1125.0, 1095.0, 486.0, 207.0, 82.0, 56.0, 31.0, 9.0, 9.0, 6.0, 9.0, 4.0, 5.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.806640625, -2.631072998046875, -2.45550537109375, -2.279937744140625, -2.1043701171875, -1.928802490234375, -1.75323486328125, -1.577667236328125, -1.402099609375, -1.226531982421875, -1.05096435546875, -0.875396728515625, -0.6998291015625, -0.524261474609375, -0.34869384765625, -0.173126220703125, 0.00244140625, 0.178009033203125, 0.35357666015625, 0.529144287109375, 0.7047119140625, 0.880279541015625, 1.05584716796875, 1.231414794921875, 1.406982421875, 1.582550048828125, 1.75811767578125, 1.933685302734375, 2.1092529296875, 2.284820556640625, 2.46038818359375, 2.635955810546875, 2.8115234375, 2.987091064453125, 3.16265869140625, 3.338226318359375, 3.5137939453125, 3.689361572265625, 3.86492919921875, 4.040496826171875, 4.216064453125, 4.391632080078125, 4.56719970703125, 4.742767333984375, 4.9183349609375, 5.093902587890625, 5.26947021484375, 5.445037841796875, 5.62060546875, 5.796173095703125, 5.97174072265625, 6.147308349609375, 6.3228759765625, 6.498443603515625, 6.67401123046875, 6.849578857421875, 7.025146484375, 7.200714111328125, 7.37628173828125, 7.551849365234375, 7.7274169921875, 7.902984619140625, 8.07855224609375, 8.254119873046875, 8.4296875]}, "gradients/encoder.encoder.layers.1.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 3.0, 7.0, 9.0, 13.0, 41.0, 63.0, 138.0, 229.0, 229.0, 124.0, 67.0, 36.0, 25.0, 10.0, 8.0, 4.0, 1.0, 6.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-28.824981689453125, -27.37922477722168, -25.933467864990234, -24.487709045410156, -23.041954040527344, -21.596195220947266, -20.15043830871582, -18.704681396484375, -17.25892448425293, -15.813167572021484, -14.367410659790039, -12.921652793884277, -11.475895881652832, -10.030138969421387, -8.584381103515625, -7.13862419128418, -5.692867279052734, -4.247110366821289, -2.8013529777526855, -1.355595588684082, 0.09016132354736328, 1.5359182357788086, 2.9816761016845703, 4.427433013916016, 5.873189926147461, 7.318946838378906, 8.764703750610352, 10.210461616516113, 11.656218528747559, 13.101975440979004, 14.547733306884766, 15.993490219116211, 17.439247131347656, 18.8850040435791, 20.330760955810547, 21.776519775390625, 23.222274780273438, 24.668033599853516, 26.11379051208496, 27.559547424316406, 29.00530433654785, 30.451061248779297, 31.896818161010742, 33.34257507324219, 34.788333892822266, 36.23408889770508, 37.679847717285156, 39.12560272216797, 40.57136154174805, 42.017120361328125, 43.46287536621094, 44.908634185791016, 46.35438919067383, 47.800148010253906, 49.24590301513672, 50.6916618347168, 52.137420654296875, 53.58317947387695, 55.028934478759766, 56.474693298339844, 57.920448303222656, 59.366207122802734, 60.81196594238281, 62.257720947265625, 63.70347595214844]}, "gradients/encoder.encoder.layers.1.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 3.0, 2.0, 2.0, 6.0, 8.0, 8.0, 8.0, 12.0, 13.0, 21.0, 20.0, 23.0, 25.0, 35.0, 32.0, 54.0, 56.0, 43.0, 54.0, 69.0, 73.0, 72.0, 48.0, 47.0, 46.0, 43.0, 30.0, 32.0, 28.0, 23.0, 17.0, 10.0, 13.0, 10.0, 7.0, 5.0, 5.0, 5.0, 1.0, 2.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0], "bins": [-24.54575538635254, -23.855375289916992, -23.164995193481445, -22.47461700439453, -21.784236907958984, -21.093856811523438, -20.40347671508789, -19.713096618652344, -19.022716522216797, -18.33233642578125, -17.641956329345703, -16.951576232910156, -16.261198043823242, -15.570817947387695, -14.880437850952148, -14.190057754516602, -13.499679565429688, -12.80929946899414, -12.11892032623291, -11.428540229797363, -10.738161087036133, -10.047780990600586, -9.357400894165039, -8.667020797729492, -7.976641654968262, -7.286262035369873, -6.595882415771484, -5.9055023193359375, -5.215122699737549, -4.52474308013916, -3.8343629837036133, -3.1439833641052246, -2.453601837158203, -1.763222098350525, -1.0728423595428467, -0.3824625015258789, 0.30791711807250977, 0.9982967376708984, 1.6886768341064453, 2.379056453704834, 3.0694360733032227, 3.7598156929016113, 4.4501953125, 5.140575408935547, 5.8309550285339355, 6.521334648132324, 7.211714744567871, 7.90209436416626, 8.592473983764648, 9.282854080200195, 9.973233222961426, 10.663613319396973, 11.353992462158203, 12.04437255859375, 12.734752655029297, 13.425132751464844, 14.115511894226074, 14.805891990661621, 15.496271133422852, 16.1866512298584, 16.877031326293945, 17.56740951538086, 18.257789611816406, 18.948169708251953, 19.6385498046875]}, "gradients/encoder.encoder.layers.1.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 2.0, 6.0, 8.0, 7.0, 11.0, 9.0, 19.0, 29.0, 39.0, 51.0, 96.0, 127.0, 180.0, 261.0, 402.0, 592.0, 934.0, 1459.0, 2248.0, 3839.0, 6628.0, 11750.0, 22192.0, 45594.0, 101486.0, 231026.0, 313738.0, 161857.0, 70969.0, 33622.0, 16991.0, 8951.0, 5070.0, 2984.0, 1965.0, 1148.0, 721.0, 518.0, 333.0, 233.0, 145.0, 100.0, 71.0, 45.0, 38.0, 20.0, 19.0, 8.0, 11.0, 5.0, 3.0, 5.0, 4.0, 2.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.005859375, -1.9349365234375, -1.864013671875, -1.7930908203125, -1.72216796875, -1.6512451171875, -1.580322265625, -1.5093994140625, -1.4384765625, -1.3675537109375, -1.296630859375, -1.2257080078125, -1.15478515625, -1.0838623046875, -1.012939453125, -0.9420166015625, -0.87109375, -0.8001708984375, -0.729248046875, -0.6583251953125, -0.58740234375, -0.5164794921875, -0.445556640625, -0.3746337890625, -0.3037109375, -0.2327880859375, -0.161865234375, -0.0909423828125, -0.02001953125, 0.0509033203125, 0.121826171875, 0.1927490234375, 0.263671875, 0.3345947265625, 0.405517578125, 0.4764404296875, 0.54736328125, 0.6182861328125, 0.689208984375, 0.7601318359375, 0.8310546875, 0.9019775390625, 0.972900390625, 1.0438232421875, 1.11474609375, 1.1856689453125, 1.256591796875, 1.3275146484375, 1.3984375, 1.4693603515625, 1.540283203125, 1.6112060546875, 1.68212890625, 1.7530517578125, 1.823974609375, 1.8948974609375, 1.9658203125, 2.0367431640625, 2.107666015625, 2.1785888671875, 2.24951171875, 2.3204345703125, 2.391357421875, 2.4622802734375, 2.533203125]}, "gradients/encoder.encoder.layers.1.attention.out_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0, 2.0, 2.0, 2.0, 5.0, 5.0, 5.0, 5.0, 4.0, 4.0, 9.0, 7.0, 11.0, 13.0, 20.0, 24.0, 25.0, 29.0, 33.0, 40.0, 40.0, 37.0, 41.0, 52.0, 65.0, 41.0, 61.0, 39.0, 47.0, 47.0, 37.0, 37.0, 44.0, 27.0, 22.0, 29.0, 21.0, 17.0, 17.0, 12.0, 8.0, 6.0, 9.0, 4.0, 7.0, 3.0, 1.0, 3.0, 0.0, 1.0], "bins": [-2.01171875, -1.9609375, -1.91015625, -1.859375, -1.80859375, -1.7578125, -1.70703125, -1.65625, -1.60546875, -1.5546875, -1.50390625, -1.453125, -1.40234375, -1.3515625, -1.30078125, -1.25, -1.19921875, -1.1484375, -1.09765625, -1.046875, -0.99609375, -0.9453125, -0.89453125, -0.84375, -0.79296875, -0.7421875, -0.69140625, -0.640625, -0.58984375, -0.5390625, -0.48828125, -0.4375, -0.38671875, -0.3359375, -0.28515625, -0.234375, -0.18359375, -0.1328125, -0.08203125, -0.03125, 0.01953125, 0.0703125, 0.12109375, 0.171875, 0.22265625, 0.2734375, 0.32421875, 0.375, 0.42578125, 0.4765625, 0.52734375, 0.578125, 0.62890625, 0.6796875, 0.73046875, 0.78125, 0.83203125, 0.8828125, 0.93359375, 0.984375, 1.03515625, 1.0859375, 1.13671875, 1.1875, 1.23828125]}, "gradients/encoder.encoder.layers.1.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 2.0, 0.0, 4.0, 3.0, 3.0, 1.0, 0.0, 4.0, 6.0, 5.0, 5.0, 6.0, 12.0, 13.0, 26.0, 26.0, 37.0, 31.0, 67.0, 61.0, 114.0, 170.0, 248.0, 394.0, 689.0, 1398.0, 3842.0, 19182.0, 233499.0, 741852.0, 36946.0, 5842.0, 1817.0, 814.0, 494.0, 288.0, 186.0, 128.0, 81.0, 78.0, 44.0, 32.0, 30.0, 16.0, 13.0, 15.0, 9.0, 8.0, 7.0, 6.0, 2.0, 2.0, 3.0, 3.0, 2.0, 3.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0], "bins": [-6.3828125, -6.17791748046875, -5.9730224609375, -5.76812744140625, -5.563232421875, -5.35833740234375, -5.1534423828125, -4.94854736328125, -4.74365234375, -4.53875732421875, -4.3338623046875, -4.12896728515625, -3.924072265625, -3.71917724609375, -3.5142822265625, -3.30938720703125, -3.1044921875, -2.89959716796875, -2.6947021484375, -2.48980712890625, -2.284912109375, -2.08001708984375, -1.8751220703125, -1.67022705078125, -1.46533203125, -1.26043701171875, -1.0555419921875, -0.85064697265625, -0.645751953125, -0.44085693359375, -0.2359619140625, -0.03106689453125, 0.173828125, 0.37872314453125, 0.5836181640625, 0.78851318359375, 0.993408203125, 1.19830322265625, 1.4031982421875, 1.60809326171875, 1.81298828125, 2.01788330078125, 2.2227783203125, 2.42767333984375, 2.632568359375, 2.83746337890625, 3.0423583984375, 3.24725341796875, 3.4521484375, 3.65704345703125, 3.8619384765625, 4.06683349609375, 4.271728515625, 4.47662353515625, 4.6815185546875, 4.88641357421875, 5.09130859375, 5.29620361328125, 5.5010986328125, 5.70599365234375, 5.910888671875, 6.11578369140625, 6.3206787109375, 6.52557373046875, 6.73046875]}, "gradients/encoder.encoder.layers.1.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 3.0, 3.0, 4.0, 5.0, 2.0, 5.0, 7.0, 5.0, 12.0, 13.0, 17.0, 10.0, 34.0, 27.0, 30.0, 40.0, 36.0, 44.0, 64.0, 56.0, 66.0, 77.0, 64.0, 62.0, 66.0, 52.0, 39.0, 47.0, 26.0, 22.0, 20.0, 13.0, 13.0, 5.0, 8.0, 6.0, 6.0, 3.0, 1.0, 0.0, 0.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-5.75390625, -5.53265380859375, -5.3114013671875, -5.09014892578125, -4.868896484375, -4.64764404296875, -4.4263916015625, -4.20513916015625, -3.98388671875, -3.76263427734375, -3.5413818359375, -3.32012939453125, -3.098876953125, -2.87762451171875, -2.6563720703125, -2.43511962890625, -2.2138671875, -1.99261474609375, -1.7713623046875, -1.55010986328125, -1.328857421875, -1.10760498046875, -0.8863525390625, -0.66510009765625, -0.44384765625, -0.22259521484375, -0.0013427734375, 0.21990966796875, 0.441162109375, 0.66241455078125, 0.8836669921875, 1.10491943359375, 1.326171875, 1.54742431640625, 1.7686767578125, 1.98992919921875, 2.211181640625, 2.43243408203125, 2.6536865234375, 2.87493896484375, 3.09619140625, 3.31744384765625, 3.5386962890625, 3.75994873046875, 3.981201171875, 4.20245361328125, 4.4237060546875, 4.64495849609375, 4.8662109375, 5.08746337890625, 5.3087158203125, 5.52996826171875, 5.751220703125, 5.97247314453125, 6.1937255859375, 6.41497802734375, 6.63623046875, 6.85748291015625, 7.0787353515625, 7.29998779296875, 7.521240234375, 7.74249267578125, 7.9637451171875, 8.18499755859375, 8.40625]}, "gradients/encoder.encoder.layers.1.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 3.0, 1.0, 1.0, 4.0, 3.0, 5.0, 4.0, 8.0, 5.0, 10.0, 26.0, 37.0, 44.0, 92.0, 116.0, 233.0, 461.0, 1079.0, 3053.0, 10803.0, 70336.0, 854345.0, 89762.0, 12576.0, 3311.0, 1153.0, 466.0, 244.0, 161.0, 66.0, 43.0, 37.0, 22.0, 15.0, 8.0, 8.0, 4.0, 3.0, 5.0, 3.0, 1.0, 4.0, 3.0, 2.0, 4.0, 1.0, 0.0, 1.0, 0.0, 1.0], "bins": [-2.201171875, -2.139251708984375, -2.07733154296875, -2.015411376953125, -1.9534912109375, -1.891571044921875, -1.82965087890625, -1.767730712890625, -1.705810546875, -1.643890380859375, -1.58197021484375, -1.520050048828125, -1.4581298828125, -1.396209716796875, -1.33428955078125, -1.272369384765625, -1.21044921875, -1.148529052734375, -1.08660888671875, -1.024688720703125, -0.9627685546875, -0.900848388671875, -0.83892822265625, -0.777008056640625, -0.715087890625, -0.653167724609375, -0.59124755859375, -0.529327392578125, -0.4674072265625, -0.405487060546875, -0.34356689453125, -0.281646728515625, -0.2197265625, -0.157806396484375, -0.09588623046875, -0.033966064453125, 0.0279541015625, 0.089874267578125, 0.15179443359375, 0.213714599609375, 0.275634765625, 0.337554931640625, 0.39947509765625, 0.461395263671875, 0.5233154296875, 0.585235595703125, 0.64715576171875, 0.709075927734375, 0.77099609375, 0.832916259765625, 0.89483642578125, 0.956756591796875, 1.0186767578125, 1.080596923828125, 1.14251708984375, 1.204437255859375, 1.266357421875, 1.328277587890625, 1.39019775390625, 1.452117919921875, 1.5140380859375, 1.575958251953125, 1.63787841796875, 1.699798583984375, 1.76171875]}, "gradients/encoder.encoder.layers.1.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 2.0, 3.0, 1.0, 1.0, 3.0, 3.0, 0.0, 3.0, 5.0, 9.0, 18.0, 22.0, 21.0, 46.0, 101.0, 140.0, 251.0, 161.0, 87.0, 52.0, 34.0, 12.0, 14.0, 9.0, 6.0, 0.0, 4.0, 3.0, 1.0, 1.0, 2.0, 0.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0008168220520019531, -0.0007892102003097534, -0.0007615983486175537, -0.000733986496925354, -0.0007063746452331543, -0.0006787627935409546, -0.0006511509418487549, -0.0006235390901565552, -0.0005959272384643555, -0.0005683153867721558, -0.0005407035350799561, -0.0005130916833877563, -0.00048547983169555664, -0.00045786798000335693, -0.0004302561283111572, -0.0004026442766189575, -0.0003750324249267578, -0.0003474205732345581, -0.0003198087215423584, -0.0002921968698501587, -0.000264585018157959, -0.00023697316646575928, -0.00020936131477355957, -0.00018174946308135986, -0.00015413761138916016, -0.00012652575969696045, -9.891390800476074e-05, -7.130205631256104e-05, -4.369020462036133e-05, -1.607835292816162e-05, 1.1533498764038086e-05, 3.914535045623779e-05, 6.67572021484375e-05, 9.436905384063721e-05, 0.00012198090553283691, 0.00014959275722503662, 0.00017720460891723633, 0.00020481646060943604, 0.00023242831230163574, 0.00026004016399383545, 0.00028765201568603516, 0.00031526386737823486, 0.00034287571907043457, 0.0003704875707626343, 0.000398099422454834, 0.0004257112741470337, 0.0004533231258392334, 0.0004809349775314331, 0.0005085468292236328, 0.0005361586809158325, 0.0005637705326080322, 0.0005913823843002319, 0.0006189942359924316, 0.0006466060876846313, 0.0006742179393768311, 0.0007018297910690308, 0.0007294416427612305, 0.0007570534944534302, 0.0007846653461456299, 0.0008122771978378296, 0.0008398890495300293, 0.000867500901222229, 0.0008951127529144287, 0.0009227246046066284, 0.0009503364562988281]}, "gradients/encoder.encoder.layers.1.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 2.0, 5.0, 8.0, 3.0, 4.0, 7.0, 8.0, 11.0, 15.0, 20.0, 32.0, 43.0, 44.0, 60.0, 100.0, 126.0, 237.0, 495.0, 1348.0, 5295.0, 39386.0, 877422.0, 110872.0, 9413.0, 2002.0, 679.0, 328.0, 171.0, 113.0, 89.0, 59.0, 36.0, 35.0, 29.0, 16.0, 12.0, 11.0, 9.0, 8.0, 4.0, 2.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 2.0], "bins": [-2.361328125, -2.2890625, -2.216796875, -2.14453125, -2.072265625, -2.0, -1.927734375, -1.85546875, -1.783203125, -1.7109375, -1.638671875, -1.56640625, -1.494140625, -1.421875, -1.349609375, -1.27734375, -1.205078125, -1.1328125, -1.060546875, -0.98828125, -0.916015625, -0.84375, -0.771484375, -0.69921875, -0.626953125, -0.5546875, -0.482421875, -0.41015625, -0.337890625, -0.265625, -0.193359375, -0.12109375, -0.048828125, 0.0234375, 0.095703125, 0.16796875, 0.240234375, 0.3125, 0.384765625, 0.45703125, 0.529296875, 0.6015625, 0.673828125, 0.74609375, 0.818359375, 0.890625, 0.962890625, 1.03515625, 1.107421875, 1.1796875, 1.251953125, 1.32421875, 1.396484375, 1.46875, 1.541015625, 1.61328125, 1.685546875, 1.7578125, 1.830078125, 1.90234375, 1.974609375, 2.046875, 2.119140625, 2.19140625, 2.263671875]}, "gradients/encoder.encoder.layers.1.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 1.0, 4.0, 8.0, 6.0, 5.0, 5.0, 6.0, 13.0, 7.0, 11.0, 16.0, 18.0, 27.0, 34.0, 46.0, 45.0, 67.0, 86.0, 90.0, 83.0, 83.0, 68.0, 53.0, 30.0, 34.0, 38.0, 26.0, 13.0, 13.0, 10.0, 18.0, 8.0, 14.0, 2.0, 5.0, 6.0, 4.0, 5.0, 1.0, 1.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.3525390625, -1.3103790283203125, -1.268218994140625, -1.2260589599609375, -1.18389892578125, -1.1417388916015625, -1.099578857421875, -1.0574188232421875, -1.0152587890625, -0.9730987548828125, -0.930938720703125, -0.8887786865234375, -0.84661865234375, -0.8044586181640625, -0.762298583984375, -0.7201385498046875, -0.677978515625, -0.6358184814453125, -0.593658447265625, -0.5514984130859375, -0.50933837890625, -0.4671783447265625, -0.425018310546875, -0.3828582763671875, -0.3406982421875, -0.2985382080078125, -0.256378173828125, -0.2142181396484375, -0.17205810546875, -0.1298980712890625, -0.087738037109375, -0.0455780029296875, -0.00341796875, 0.0387420654296875, 0.080902099609375, 0.1230621337890625, 0.16522216796875, 0.2073822021484375, 0.249542236328125, 0.2917022705078125, 0.3338623046875, 0.3760223388671875, 0.418182373046875, 0.4603424072265625, 0.50250244140625, 0.5446624755859375, 0.586822509765625, 0.6289825439453125, 0.671142578125, 0.7133026123046875, 0.755462646484375, 0.7976226806640625, 0.83978271484375, 0.8819427490234375, 0.924102783203125, 0.9662628173828125, 1.0084228515625, 1.0505828857421875, 1.092742919921875, 1.1349029541015625, 1.17706298828125, 1.2192230224609375, 1.261383056640625, 1.3035430908203125, 1.345703125]}, "gradients/encoder.encoder.layers.1.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 2.0, 3.0, 13.0, 193.0, 650.0, 112.0, 29.0, 7.0, 3.0, 0.0, 2.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-54.13117980957031, -50.056297302246094, -45.981414794921875, -41.90653610229492, -37.8316535949707, -33.756771087646484, -29.6818904876709, -25.607009887695312, -21.532127380371094, -17.457244873046875, -13.382364273071289, -9.307482719421387, -5.232601165771484, -1.1577186584472656, 2.9171619415283203, 6.992042541503906, 11.066925048828125, 15.141806602478027, 19.21668815612793, 23.291568756103516, 27.366451263427734, 31.441333770751953, 35.516212463378906, 39.591094970703125, 43.665977478027344, 47.74085998535156, 51.81574249267578, 55.890621185302734, 59.96550369262695, 64.04039001464844, 68.11526489257812, 72.19014739990234, 76.26502990722656, 80.33991241455078, 84.414794921875, 88.48967742919922, 92.56455993652344, 96.63943481445312, 100.71431732177734, 104.78919982910156, 108.86408233642578, 112.93896484375, 117.01384735107422, 121.08872985839844, 125.16360473632812, 129.23849487304688, 133.31336975097656, 137.38824462890625, 141.463134765625, 145.5380096435547, 149.61289978027344, 153.68777465820312, 157.76266479492188, 161.83753967285156, 165.9124298095703, 169.9873046875, 174.06219482421875, 178.13706970214844, 182.2119598388672, 186.28683471679688, 190.36172485351562, 194.4365997314453, 198.51148986816406, 202.58636474609375, 206.66123962402344]}, "gradients/encoder.encoder.layers.1.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 3.0, 2.0, 3.0, 8.0, 3.0, 5.0, 6.0, 5.0, 8.0, 9.0, 12.0, 8.0, 9.0, 18.0, 16.0, 23.0, 17.0, 20.0, 39.0, 26.0, 23.0, 41.0, 55.0, 92.0, 146.0, 92.0, 53.0, 30.0, 25.0, 32.0, 28.0, 25.0, 21.0, 21.0, 16.0, 11.0, 10.0, 12.0, 6.0, 5.0, 2.0, 6.0, 5.0, 2.0, 6.0, 3.0, 3.0, 3.0, 3.0], "bins": [-27.875879287719727, -27.167110443115234, -26.45833969116211, -25.749570846557617, -25.040802001953125, -24.33203125, -23.623262405395508, -22.914493560791016, -22.20572280883789, -21.4969539642334, -20.788183212280273, -20.07941436767578, -19.37064552307129, -18.661876678466797, -17.953105926513672, -17.24433708190918, -16.535568237304688, -15.826798439025879, -15.118029594421387, -14.409259796142578, -13.700490951538086, -12.991721153259277, -12.282951354980469, -11.574182510375977, -10.865412712097168, -10.15664291381836, -9.447874069213867, -8.739104270935059, -8.03033447265625, -7.321565628051758, -6.612795829772949, -5.904026508331299, -5.195255279541016, -4.486485958099365, -3.7777163982391357, -3.0689468383789062, -2.360177516937256, -1.6514081954956055, -0.9426383972167969, -0.23386907577514648, 0.4749002456665039, 1.1836696863174438, 1.8924391269683838, 2.6012086868286133, 3.3099780082702637, 4.018747329711914, 4.727517127990723, 5.436286449432373, 6.145055770874023, 6.853825092315674, 7.562594413757324, 8.271364212036133, 8.980133056640625, 9.688902854919434, 10.397672653198242, 11.106441497802734, 11.815211296081543, 12.523981094360352, 13.232749938964844, 13.941519737243652, 14.650289535522461, 15.359058380126953, 16.067829132080078, 16.77659797668457, 17.485366821289062]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.weight": {"_type": "histogram", "values": [3.0, 0.0, 2.0, 2.0, 4.0, 3.0, 1.0, 6.0, 7.0, 17.0, 25.0, 27.0, 33.0, 41.0, 62.0, 85.0, 127.0, 163.0, 269.0, 396.0, 562.0, 870.0, 1349.0, 2332.0, 4048.0, 7840.0, 17931.0, 56200.0, 260186.0, 1095330.0, 1838547.0, 673597.0, 162423.0, 43012.0, 14219.0, 6309.0, 3275.0, 1852.0, 1084.0, 691.0, 426.0, 292.0, 190.0, 125.0, 117.0, 62.0, 48.0, 32.0, 27.0, 15.0, 10.0, 10.0, 6.0, 2.0, 2.0, 3.0, 4.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-1.87890625, -1.81695556640625, -1.7550048828125, -1.69305419921875, -1.631103515625, -1.56915283203125, -1.5072021484375, -1.44525146484375, -1.38330078125, -1.32135009765625, -1.2593994140625, -1.19744873046875, -1.135498046875, -1.07354736328125, -1.0115966796875, -0.94964599609375, -0.8876953125, -0.82574462890625, -0.7637939453125, -0.70184326171875, -0.639892578125, -0.57794189453125, -0.5159912109375, -0.45404052734375, -0.39208984375, -0.33013916015625, -0.2681884765625, -0.20623779296875, -0.144287109375, -0.08233642578125, -0.0203857421875, 0.04156494140625, 0.103515625, 0.16546630859375, 0.2274169921875, 0.28936767578125, 0.351318359375, 0.41326904296875, 0.4752197265625, 0.53717041015625, 0.59912109375, 0.66107177734375, 0.7230224609375, 0.78497314453125, 0.846923828125, 0.90887451171875, 0.9708251953125, 1.03277587890625, 1.0947265625, 1.15667724609375, 1.2186279296875, 1.28057861328125, 1.342529296875, 1.40447998046875, 1.4664306640625, 1.52838134765625, 1.59033203125, 1.65228271484375, 1.7142333984375, 1.77618408203125, 1.838134765625, 1.90008544921875, 1.9620361328125, 2.02398681640625, 2.0859375]}, "gradients/encoder.encoder.layers.0.feed_forward.output_dense.bias": {"_type": "histogram", "values": [1.0, 5.0, 1.0, 3.0, 1.0, 0.0, 1.0, 5.0, 3.0, 2.0, 5.0, 3.0, 6.0, 6.0, 2.0, 8.0, 5.0, 9.0, 12.0, 11.0, 11.0, 13.0, 10.0, 19.0, 23.0, 25.0, 30.0, 27.0, 29.0, 35.0, 24.0, 30.0, 34.0, 34.0, 48.0, 36.0, 49.0, 43.0, 33.0, 26.0, 36.0, 44.0, 27.0, 23.0, 34.0, 20.0, 22.0, 17.0, 20.0, 19.0, 11.0, 13.0, 13.0, 12.0, 11.0, 7.0, 4.0, 3.0, 4.0, 6.0, 5.0, 2.0, 1.0, 2.0], "bins": [-1.23828125, -1.20330810546875, -1.1683349609375, -1.13336181640625, -1.098388671875, -1.06341552734375, -1.0284423828125, -0.99346923828125, -0.95849609375, -0.92352294921875, -0.8885498046875, -0.85357666015625, -0.818603515625, -0.78363037109375, -0.7486572265625, -0.71368408203125, -0.6787109375, -0.64373779296875, -0.6087646484375, -0.57379150390625, -0.538818359375, -0.50384521484375, -0.4688720703125, -0.43389892578125, -0.39892578125, -0.36395263671875, -0.3289794921875, -0.29400634765625, -0.259033203125, -0.22406005859375, -0.1890869140625, -0.15411376953125, -0.119140625, -0.08416748046875, -0.0491943359375, -0.01422119140625, 0.020751953125, 0.05572509765625, 0.0906982421875, 0.12567138671875, 0.16064453125, 0.19561767578125, 0.2305908203125, 0.26556396484375, 0.300537109375, 0.33551025390625, 0.3704833984375, 0.40545654296875, 0.4404296875, 0.47540283203125, 0.5103759765625, 0.54534912109375, 0.580322265625, 0.61529541015625, 0.6502685546875, 0.68524169921875, 0.72021484375, 0.75518798828125, 0.7901611328125, 0.82513427734375, 0.860107421875, 0.89508056640625, 0.9300537109375, 0.96502685546875, 1.0]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 6.0, 2.0, 5.0, 13.0, 56.0, 192.0, 609.0, 4466.0, 4132914.0, 53890.0, 1623.0, 342.0, 105.0, 34.0, 18.0, 8.0, 7.0, 3.0, 0.0, 0.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-22.0625, -21.34521484375, -20.6279296875, -19.91064453125, -19.193359375, -18.47607421875, -17.7587890625, -17.04150390625, -16.32421875, -15.60693359375, -14.8896484375, -14.17236328125, -13.455078125, -12.73779296875, -12.0205078125, -11.30322265625, -10.5859375, -9.86865234375, -9.1513671875, -8.43408203125, -7.716796875, -6.99951171875, -6.2822265625, -5.56494140625, -4.84765625, -4.13037109375, -3.4130859375, -2.69580078125, -1.978515625, -1.26123046875, -0.5439453125, 0.17333984375, 0.890625, 1.60791015625, 2.3251953125, 3.04248046875, 3.759765625, 4.47705078125, 5.1943359375, 5.91162109375, 6.62890625, 7.34619140625, 8.0634765625, 8.78076171875, 9.498046875, 10.21533203125, 10.9326171875, 11.64990234375, 12.3671875, 13.08447265625, 13.8017578125, 14.51904296875, 15.236328125, 15.95361328125, 16.6708984375, 17.38818359375, 18.10546875, 18.82275390625, 19.5400390625, 20.25732421875, 20.974609375, 21.69189453125, 22.4091796875, 23.12646484375, 23.84375]}, "gradients/encoder.encoder.layers.0.feed_forward.intermediate_dense.bias": {"_type": "histogram", "values": [2.0, 2.0, 1.0, 2.0, 4.0, 3.0, 7.0, 15.0, 22.0, 37.0, 73.0, 152.0, 285.0, 646.0, 1077.0, 866.0, 447.0, 197.0, 100.0, 69.0, 40.0, 20.0, 14.0, 3.0, 3.0, 1.0, 4.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.94921875, -3.68170166015625, -3.4141845703125, -3.14666748046875, -2.879150390625, -2.61163330078125, -2.3441162109375, -2.07659912109375, -1.80908203125, -1.54156494140625, -1.2740478515625, -1.00653076171875, -0.739013671875, -0.47149658203125, -0.2039794921875, 0.06353759765625, 0.3310546875, 0.59857177734375, 0.8660888671875, 1.13360595703125, 1.401123046875, 1.66864013671875, 1.9361572265625, 2.20367431640625, 2.47119140625, 2.73870849609375, 3.0062255859375, 3.27374267578125, 3.541259765625, 3.80877685546875, 4.0762939453125, 4.34381103515625, 4.611328125, 4.87884521484375, 5.1463623046875, 5.41387939453125, 5.681396484375, 5.94891357421875, 6.2164306640625, 6.48394775390625, 6.75146484375, 7.01898193359375, 7.2864990234375, 7.55401611328125, 7.821533203125, 8.08905029296875, 8.3565673828125, 8.62408447265625, 8.8916015625, 9.15911865234375, 9.4266357421875, 9.69415283203125, 9.961669921875, 10.22918701171875, 10.4967041015625, 10.76422119140625, 11.03173828125, 11.29925537109375, 11.5667724609375, 11.83428955078125, 12.101806640625, 12.36932373046875, 12.6368408203125, 12.90435791015625, 13.171875]}, "gradients/encoder.encoder.layers.0.final_layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 3.0, 0.0, 1.0, 3.0, 6.0, 15.0, 45.0, 146.0, 400.0, 265.0, 81.0, 23.0, 10.0, 8.0, 4.0, 3.0, 3.0, 1.0, 1.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-82.39708709716797, -78.61478424072266, -74.83247375488281, -71.0501708984375, -67.26786804199219, -63.485557556152344, -59.70325469970703, -55.92094802856445, -52.138641357421875, -48.3563346862793, -44.57402801513672, -40.791725158691406, -37.00941848754883, -33.22711181640625, -29.444807052612305, -25.66250228881836, -21.88019561767578, -18.097888946533203, -14.315584182739258, -10.533278465270996, -6.750972747802734, -2.9686660766601562, 0.8136386871337891, 4.595943450927734, 8.378250122070312, 12.160555839538574, 15.942861557006836, 19.72516632080078, 23.50747299194336, 27.289779663085938, 31.072084426879883, 34.85438919067383, 38.636688232421875, 42.41899490356445, 46.20130157470703, 49.983604431152344, 53.76591110229492, 57.5482177734375, 61.33052062988281, 65.11282348632812, 68.89513397216797, 72.67743682861328, 76.45974731445312, 80.24205017089844, 84.02435302734375, 87.8066635131836, 91.5889663696289, 95.37127685546875, 99.15357971191406, 102.93588256835938, 106.71819305419922, 110.50049591064453, 114.28280639648438, 118.06510925292969, 121.847412109375, 125.62971496582031, 129.41201782226562, 133.19432067871094, 136.97662353515625, 140.75894165039062, 144.54124450683594, 148.32354736328125, 152.10585021972656, 155.88815307617188, 159.67047119140625]}, "gradients/encoder.encoder.layers.0.final_layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 1.0, 3.0, 2.0, 2.0, 1.0, 1.0, 1.0, 4.0, 2.0, 3.0, 10.0, 10.0, 8.0, 20.0, 18.0, 19.0, 23.0, 31.0, 37.0, 36.0, 37.0, 49.0, 68.0, 65.0, 53.0, 60.0, 77.0, 46.0, 47.0, 45.0, 48.0, 47.0, 34.0, 21.0, 20.0, 22.0, 13.0, 8.0, 3.0, 3.0, 3.0, 3.0, 5.0, 3.0, 0.0, 4.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 1.0], "bins": [-38.04997634887695, -36.936824798583984, -35.823673248291016, -34.71052169799805, -33.59736633300781, -32.484214782714844, -31.371063232421875, -30.257911682128906, -29.144760131835938, -28.03160858154297, -26.91845703125, -25.8053035736084, -24.69215202331543, -23.57900047302246, -22.46584701538086, -21.35269546508789, -20.239543914794922, -19.126392364501953, -18.013240814208984, -16.900087356567383, -15.786935806274414, -14.673784255981445, -13.56063175201416, -12.447479248046875, -11.334327697753906, -10.221176147460938, -9.108023643493652, -7.994871616363525, -6.881719589233398, -5.7685675621032715, -4.6554155349731445, -3.5422635078430176, -2.4291114807128906, -1.3159594535827637, -0.20280742645263672, 0.9103446006774902, 2.023496627807617, 3.136648654937744, 4.249800682067871, 5.362952709197998, 6.476104736328125, 7.589256763458252, 8.702408790588379, 9.815561294555664, 10.928712844848633, 12.041864395141602, 13.155016899108887, 14.268169403076172, 15.38132095336914, 16.49447250366211, 17.607624053955078, 18.72077751159668, 19.83392906188965, 20.947080612182617, 22.06023406982422, 23.173385620117188, 24.286537170410156, 25.399688720703125, 26.512840270996094, 27.625993728637695, 28.739145278930664, 29.852296829223633, 30.965450286865234, 32.0786018371582, 33.19175338745117]}, "gradients/encoder.encoder.layers.0.attention.out_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 3.0, 3.0, 3.0, 0.0, 6.0, 7.0, 6.0, 8.0, 13.0, 18.0, 23.0, 50.0, 57.0, 103.0, 150.0, 299.0, 544.0, 1189.0, 2547.0, 6204.0, 18066.0, 73579.0, 544944.0, 325650.0, 52177.0, 13864.0, 4909.0, 2022.0, 925.0, 482.0, 268.0, 186.0, 104.0, 48.0, 39.0, 19.0, 15.0, 8.0, 8.0, 4.0, 5.0, 3.0, 3.0, 3.0, 0.0, 1.0, 0.0, 0.0, 3.0, 2.0, 1.0], "bins": [-4.5703125, -4.442962646484375, -4.31561279296875, -4.188262939453125, -4.0609130859375, -3.933563232421875, -3.80621337890625, -3.678863525390625, -3.551513671875, -3.424163818359375, -3.29681396484375, -3.169464111328125, -3.0421142578125, -2.914764404296875, -2.78741455078125, -2.660064697265625, -2.53271484375, -2.405364990234375, -2.27801513671875, -2.150665283203125, -2.0233154296875, -1.895965576171875, -1.76861572265625, -1.641265869140625, -1.513916015625, -1.386566162109375, -1.25921630859375, -1.131866455078125, -1.0045166015625, -0.877166748046875, -0.74981689453125, -0.622467041015625, -0.4951171875, -0.367767333984375, -0.24041748046875, -0.113067626953125, 0.0142822265625, 0.141632080078125, 0.26898193359375, 0.396331787109375, 0.523681640625, 0.651031494140625, 0.77838134765625, 0.905731201171875, 1.0330810546875, 1.160430908203125, 1.28778076171875, 1.415130615234375, 1.54248046875, 1.669830322265625, 1.79718017578125, 1.924530029296875, 2.0518798828125, 2.179229736328125, 2.30657958984375, 2.433929443359375, 2.561279296875, 2.688629150390625, 2.81597900390625, 2.943328857421875, 3.0706787109375, 3.198028564453125, 3.32537841796875, 3.452728271484375, 3.580078125]}, "gradients/encoder.encoder.layers.0.attention.out_proj.bias": {"_type": "histogram", "values": [2.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 2.0, 1.0, 2.0, 5.0, 6.0, 7.0, 8.0, 12.0, 14.0, 24.0, 20.0, 26.0, 40.0, 38.0, 58.0, 54.0, 66.0, 71.0, 68.0, 69.0, 72.0, 63.0, 58.0, 51.0, 45.0, 24.0, 23.0, 20.0, 27.0, 14.0, 4.0, 5.0, 5.0, 7.0, 2.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.166015625, -3.083953857421875, -3.00189208984375, -2.919830322265625, -2.8377685546875, -2.755706787109375, -2.67364501953125, -2.591583251953125, -2.509521484375, -2.427459716796875, -2.34539794921875, -2.263336181640625, -2.1812744140625, -2.099212646484375, -2.01715087890625, -1.935089111328125, -1.85302734375, -1.770965576171875, -1.68890380859375, -1.606842041015625, -1.5247802734375, -1.442718505859375, -1.36065673828125, -1.278594970703125, -1.196533203125, -1.114471435546875, -1.03240966796875, -0.950347900390625, -0.8682861328125, -0.786224365234375, -0.70416259765625, -0.622100830078125, -0.5400390625, -0.457977294921875, -0.37591552734375, -0.293853759765625, -0.2117919921875, -0.129730224609375, -0.04766845703125, 0.034393310546875, 0.116455078125, 0.198516845703125, 0.28057861328125, 0.362640380859375, 0.4447021484375, 0.526763916015625, 0.60882568359375, 0.690887451171875, 0.77294921875, 0.855010986328125, 0.93707275390625, 1.019134521484375, 1.1011962890625, 1.183258056640625, 1.26531982421875, 1.347381591796875, 1.429443359375, 1.511505126953125, 1.59356689453125, 1.675628662109375, 1.7576904296875, 1.839752197265625, 1.92181396484375, 2.003875732421875, 2.0859375]}, "gradients/encoder.encoder.layers.0.attention.v_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 1.0, 3.0, 0.0, 2.0, 5.0, 4.0, 2.0, 2.0, 7.0, 6.0, 8.0, 12.0, 18.0, 22.0, 39.0, 61.0, 83.0, 189.0, 450.0, 1263.0, 7204.0, 904134.0, 128834.0, 4516.0, 945.0, 376.0, 166.0, 102.0, 39.0, 26.0, 14.0, 14.0, 6.0, 4.0, 6.0, 4.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-13.921875, -13.5638427734375, -13.205810546875, -12.8477783203125, -12.48974609375, -12.1317138671875, -11.773681640625, -11.4156494140625, -11.0576171875, -10.6995849609375, -10.341552734375, -9.9835205078125, -9.62548828125, -9.2674560546875, -8.909423828125, -8.5513916015625, -8.193359375, -7.8353271484375, -7.477294921875, -7.1192626953125, -6.76123046875, -6.4031982421875, -6.045166015625, -5.6871337890625, -5.3291015625, -4.9710693359375, -4.613037109375, -4.2550048828125, -3.89697265625, -3.5389404296875, -3.180908203125, -2.8228759765625, -2.46484375, -2.1068115234375, -1.748779296875, -1.3907470703125, -1.03271484375, -0.6746826171875, -0.316650390625, 0.0413818359375, 0.3994140625, 0.7574462890625, 1.115478515625, 1.4735107421875, 1.83154296875, 2.1895751953125, 2.547607421875, 2.9056396484375, 3.263671875, 3.6217041015625, 3.979736328125, 4.3377685546875, 4.69580078125, 5.0538330078125, 5.411865234375, 5.7698974609375, 6.1279296875, 6.4859619140625, 6.843994140625, 7.2020263671875, 7.56005859375, 7.9180908203125, 8.276123046875, 8.6341552734375, 8.9921875]}, "gradients/encoder.encoder.layers.0.attention.v_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 3.0, 2.0, 2.0, 3.0, 1.0, 3.0, 5.0, 9.0, 6.0, 11.0, 16.0, 15.0, 24.0, 28.0, 39.0, 48.0, 60.0, 84.0, 112.0, 119.0, 89.0, 81.0, 55.0, 29.0, 46.0, 31.0, 23.0, 16.0, 16.0, 10.0, 9.0, 5.0, 6.0, 7.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-12.2421875, -11.86376953125, -11.4853515625, -11.10693359375, -10.728515625, -10.35009765625, -9.9716796875, -9.59326171875, -9.21484375, -8.83642578125, -8.4580078125, -8.07958984375, -7.701171875, -7.32275390625, -6.9443359375, -6.56591796875, -6.1875, -5.80908203125, -5.4306640625, -5.05224609375, -4.673828125, -4.29541015625, -3.9169921875, -3.53857421875, -3.16015625, -2.78173828125, -2.4033203125, -2.02490234375, -1.646484375, -1.26806640625, -0.8896484375, -0.51123046875, -0.1328125, 0.24560546875, 0.6240234375, 1.00244140625, 1.380859375, 1.75927734375, 2.1376953125, 2.51611328125, 2.89453125, 3.27294921875, 3.6513671875, 4.02978515625, 4.408203125, 4.78662109375, 5.1650390625, 5.54345703125, 5.921875, 6.30029296875, 6.6787109375, 7.05712890625, 7.435546875, 7.81396484375, 8.1923828125, 8.57080078125, 8.94921875, 9.32763671875, 9.7060546875, 10.08447265625, 10.462890625, 10.84130859375, 11.2197265625, 11.59814453125, 11.9765625]}, "gradients/encoder.encoder.layers.0.attention.k_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 2.0, 2.0, 3.0, 0.0, 0.0, 6.0, 10.0, 8.0, 13.0, 16.0, 20.0, 28.0, 36.0, 44.0, 79.0, 125.0, 161.0, 307.0, 568.0, 1099.0, 2414.0, 6071.0, 20931.0, 162759.0, 808705.0, 31002.0, 8095.0, 2976.0, 1440.0, 690.0, 332.0, 211.0, 102.0, 88.0, 59.0, 48.0, 30.0, 24.0, 15.0, 9.0, 13.0, 10.0, 4.0, 4.0, 2.0, 2.0, 1.0, 1.0, 0.0, 4.0, 1.0, 1.0], "bins": [-1.224609375, -1.1907196044921875, -1.156829833984375, -1.1229400634765625, -1.08905029296875, -1.0551605224609375, -1.021270751953125, -0.9873809814453125, -0.9534912109375, -0.9196014404296875, -0.885711669921875, -0.8518218994140625, -0.81793212890625, -0.7840423583984375, -0.750152587890625, -0.7162628173828125, -0.682373046875, -0.6484832763671875, -0.614593505859375, -0.5807037353515625, -0.54681396484375, -0.5129241943359375, -0.479034423828125, -0.4451446533203125, -0.4112548828125, -0.3773651123046875, -0.343475341796875, -0.3095855712890625, -0.27569580078125, -0.2418060302734375, -0.207916259765625, -0.1740264892578125, -0.14013671875, -0.1062469482421875, -0.072357177734375, -0.0384674072265625, -0.00457763671875, 0.0293121337890625, 0.063201904296875, 0.0970916748046875, 0.1309814453125, 0.1648712158203125, 0.198760986328125, 0.2326507568359375, 0.26654052734375, 0.3004302978515625, 0.334320068359375, 0.3682098388671875, 0.402099609375, 0.4359893798828125, 0.469879150390625, 0.5037689208984375, 0.53765869140625, 0.5715484619140625, 0.605438232421875, 0.6393280029296875, 0.6732177734375, 0.7071075439453125, 0.740997314453125, 0.7748870849609375, 0.80877685546875, 0.8426666259765625, 0.876556396484375, 0.9104461669921875, 0.9443359375]}, "gradients/encoder.encoder.layers.0.attention.k_proj.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 0.0, 2.0, 2.0, 7.0, 4.0, 6.0, 8.0, 5.0, 6.0, 12.0, 23.0, 42.0, 71.0, 108.0, 258.0, 220.0, 85.0, 48.0, 36.0, 20.0, 14.0, 8.0, 8.0, 3.0, 4.0, 4.0, 3.0, 1.0, 0.0, 1.0, 3.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 2.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-0.0005950927734375, -0.0005774572491645813, -0.0005598217248916626, -0.0005421862006187439, -0.0005245506763458252, -0.0005069151520729065, -0.0004892796277999878, -0.0004716441035270691, -0.0004540085792541504, -0.0004363730549812317, -0.000418737530708313, -0.0004011020064353943, -0.0003834664821624756, -0.0003658309578895569, -0.0003481954336166382, -0.0003305599093437195, -0.0003129243850708008, -0.0002952888607978821, -0.0002776533365249634, -0.0002600178122520447, -0.00024238228797912598, -0.00022474676370620728, -0.00020711123943328857, -0.00018947571516036987, -0.00017184019088745117, -0.00015420466661453247, -0.00013656914234161377, -0.00011893361806869507, -0.00010129809379577637, -8.366256952285767e-05, -6.602704524993896e-05, -4.8391520977020264e-05, -3.075599670410156e-05, -1.3120472431182861e-05, 4.51505184173584e-06, 2.215057611465454e-05, 3.978610038757324e-05, 5.742162466049194e-05, 7.505714893341064e-05, 9.269267320632935e-05, 0.00011032819747924805, 0.00012796372175216675, 0.00014559924602508545, 0.00016323477029800415, 0.00018087029457092285, 0.00019850581884384155, 0.00021614134311676025, 0.00023377686738967896, 0.00025141239166259766, 0.00026904791593551636, 0.00028668344020843506, 0.00030431896448135376, 0.00032195448875427246, 0.00033959001302719116, 0.00035722553730010986, 0.00037486106157302856, 0.00039249658584594727, 0.00041013211011886597, 0.00042776763439178467, 0.00044540315866470337, 0.00046303868293762207, 0.00048067420721054077, 0.0004983097314834595, 0.0005159452557563782, 0.0005335807800292969]}, "gradients/encoder.encoder.layers.0.attention.q_proj.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 2.0, 0.0, 1.0, 1.0, 3.0, 2.0, 1.0, 2.0, 4.0, 3.0, 12.0, 7.0, 20.0, 21.0, 40.0, 67.0, 113.0, 246.0, 520.0, 1516.0, 6621.0, 68249.0, 936248.0, 28999.0, 4006.0, 1038.0, 403.0, 172.0, 96.0, 40.0, 32.0, 20.0, 16.0, 19.0, 10.0, 4.0, 3.0, 3.0, 5.0, 2.0, 0.0, 2.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0], "bins": [-1.443359375, -1.39874267578125, -1.3541259765625, -1.30950927734375, -1.264892578125, -1.22027587890625, -1.1756591796875, -1.13104248046875, -1.08642578125, -1.04180908203125, -0.9971923828125, -0.95257568359375, -0.907958984375, -0.86334228515625, -0.8187255859375, -0.77410888671875, -0.7294921875, -0.68487548828125, -0.6402587890625, -0.59564208984375, -0.551025390625, -0.50640869140625, -0.4617919921875, -0.41717529296875, -0.37255859375, -0.32794189453125, -0.2833251953125, -0.23870849609375, -0.194091796875, -0.14947509765625, -0.1048583984375, -0.06024169921875, -0.015625, 0.02899169921875, 0.0736083984375, 0.11822509765625, 0.162841796875, 0.20745849609375, 0.2520751953125, 0.29669189453125, 0.34130859375, 0.38592529296875, 0.4305419921875, 0.47515869140625, 0.519775390625, 0.56439208984375, 0.6090087890625, 0.65362548828125, 0.6982421875, 0.74285888671875, 0.7874755859375, 0.83209228515625, 0.876708984375, 0.92132568359375, 0.9659423828125, 1.01055908203125, 1.05517578125, 1.09979248046875, 1.1444091796875, 1.18902587890625, 1.233642578125, 1.27825927734375, 1.3228759765625, 1.36749267578125, 1.412109375]}, "gradients/encoder.encoder.layers.0.attention.q_proj.bias": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 2.0, 2.0, 3.0, 5.0, 1.0, 5.0, 7.0, 5.0, 10.0, 13.0, 14.0, 21.0, 22.0, 23.0, 36.0, 59.0, 81.0, 89.0, 136.0, 127.0, 79.0, 58.0, 52.0, 32.0, 28.0, 26.0, 15.0, 10.0, 10.0, 12.0, 6.0, 7.0, 4.0, 3.0, 1.0, 2.0, 3.0, 0.0, 1.0, 3.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-1.0654296875, -1.02728271484375, -0.9891357421875, -0.95098876953125, -0.912841796875, -0.87469482421875, -0.8365478515625, -0.79840087890625, -0.76025390625, -0.72210693359375, -0.6839599609375, -0.64581298828125, -0.607666015625, -0.56951904296875, -0.5313720703125, -0.49322509765625, -0.455078125, -0.41693115234375, -0.3787841796875, -0.34063720703125, -0.302490234375, -0.26434326171875, -0.2261962890625, -0.18804931640625, -0.14990234375, -0.11175537109375, -0.0736083984375, -0.03546142578125, 0.002685546875, 0.04083251953125, 0.0789794921875, 0.11712646484375, 0.1552734375, 0.19342041015625, 0.2315673828125, 0.26971435546875, 0.307861328125, 0.34600830078125, 0.3841552734375, 0.42230224609375, 0.46044921875, 0.49859619140625, 0.5367431640625, 0.57489013671875, 0.613037109375, 0.65118408203125, 0.6893310546875, 0.72747802734375, 0.765625, 0.80377197265625, 0.8419189453125, 0.88006591796875, 0.918212890625, 0.95635986328125, 0.9945068359375, 1.03265380859375, 1.07080078125, 1.10894775390625, 1.1470947265625, 1.18524169921875, 1.223388671875, 1.26153564453125, 1.2996826171875, 1.33782958984375, 1.3759765625]}, "gradients/encoder.encoder.layers.0.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 1.0, 5.0, 5.0, 17.0, 38.0, 91.0, 617.0, 163.0, 50.0, 10.0, 8.0, 4.0, 2.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-114.14292907714844, -111.64790344238281, -109.15287780761719, -106.65784454345703, -104.1628189086914, -101.66779327392578, -99.17276763916016, -96.677734375, -94.18270874023438, -91.68768310546875, -89.19265747070312, -86.69762420654297, -84.20259857177734, -81.70757293701172, -79.2125473022461, -76.71751403808594, -74.22248840332031, -71.72746276855469, -69.23243713378906, -66.7374038696289, -64.24237823486328, -61.747352600097656, -59.25232696533203, -56.75729751586914, -54.26227569580078, -51.767250061035156, -49.272220611572266, -46.77719497680664, -44.28216552734375, -41.787139892578125, -39.2921142578125, -36.79708480834961, -34.30205535888672, -31.80702781677246, -29.312000274658203, -26.816974639892578, -24.321945190429688, -21.826919555664062, -19.331892013549805, -16.836864471435547, -14.341836929321289, -11.846809387207031, -9.351781845092773, -6.856755256652832, -4.361727714538574, -1.8667001724243164, 0.628326416015625, 3.123353958129883, 5.618381500244141, 8.113409042358398, 10.608436584472656, 13.103463172912598, 15.598490715026855, 18.093517303466797, 20.588544845581055, 23.083572387695312, 25.57859992980957, 28.073627471923828, 30.568655014038086, 33.063682556152344, 35.55870819091797, 38.05373764038086, 40.548763275146484, 43.043792724609375, 45.538818359375]}, "gradients/encoder.encoder.layers.0.layer_norm.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 3.0, 1.0, 1.0, 3.0, 3.0, 5.0, 5.0, 4.0, 1.0, 8.0, 1.0, 6.0, 10.0, 10.0, 10.0, 15.0, 14.0, 16.0, 19.0, 19.0, 20.0, 21.0, 19.0, 35.0, 60.0, 198.0, 219.0, 48.0, 36.0, 26.0, 27.0, 28.0, 17.0, 19.0, 12.0, 12.0, 14.0, 5.0, 6.0, 5.0, 5.0, 7.0, 7.0, 4.0, 6.0, 2.0, 1.0, 0.0, 0.0, 4.0, 0.0, 2.0], "bins": [-28.064186096191406, -27.322744369506836, -26.581302642822266, -25.839862823486328, -25.098421096801758, -24.356979370117188, -23.615537643432617, -22.874095916748047, -22.13265609741211, -21.39121437072754, -20.64977264404297, -19.90833282470703, -19.16689109802246, -18.42544937133789, -17.68400764465332, -16.94256591796875, -16.20112419128418, -15.45968246459961, -14.718241691589355, -13.976799964904785, -13.235359191894531, -12.493917465209961, -11.75247573852539, -11.01103401184082, -10.269593238830566, -9.528151512145996, -8.786710739135742, -8.045269012451172, -7.30382776260376, -6.562386512756348, -5.820944786071777, -5.079503536224365, -4.338062286376953, -3.596621036529541, -2.85517954826355, -2.1137380599975586, -1.3722968101501465, -0.6308555603027344, 0.11058616638183594, 0.852027416229248, 1.5934686660766602, 2.3349099159240723, 3.0763514041900635, 3.8177928924560547, 4.559234142303467, 5.300675392150879, 6.042117118835449, 6.783558368682861, 7.524999618530273, 8.266441345214844, 9.007882118225098, 9.749323844909668, 10.490764617919922, 11.232206344604492, 11.973648071289062, 12.715089797973633, 13.456530570983887, 14.197972297668457, 14.939413070678711, 15.680854797363281, 16.42229652404785, 17.163738250732422, 17.90517807006836, 18.64661979675293, 19.3880615234375]}, "gradients/encoder.encoder.pos_conv_embed.conv.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 2.0, 1.0, 0.0, 3.0, 4.0, 0.0, 3.0, 3.0, 6.0, 9.0, 14.0, 15.0, 18.0, 19.0, 21.0, 20.0, 23.0, 30.0, 38.0, 47.0, 116.0, 246.0, 97.0, 43.0, 33.0, 40.0, 36.0, 25.0, 21.0, 14.0, 14.0, 9.0, 12.0, 10.0, 6.0, 6.0, 0.0, 3.0, 6.0, 2.0, 1.0, 1.0, 1.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-2.095703125, -2.034942626953125, -1.97418212890625, -1.913421630859375, -1.8526611328125, -1.791900634765625, -1.73114013671875, -1.670379638671875, -1.609619140625, -1.548858642578125, -1.48809814453125, -1.427337646484375, -1.3665771484375, -1.305816650390625, -1.24505615234375, -1.184295654296875, -1.12353515625, -1.062774658203125, -1.00201416015625, -0.941253662109375, -0.8804931640625, -0.819732666015625, -0.75897216796875, -0.698211669921875, -0.637451171875, -0.576690673828125, -0.51593017578125, -0.455169677734375, -0.3944091796875, -0.333648681640625, -0.27288818359375, -0.212127685546875, -0.1513671875, -0.090606689453125, -0.02984619140625, 0.030914306640625, 0.0916748046875, 0.152435302734375, 0.21319580078125, 0.273956298828125, 0.334716796875, 0.395477294921875, 0.45623779296875, 0.516998291015625, 0.5777587890625, 0.638519287109375, 0.69927978515625, 0.760040283203125, 0.82080078125, 0.881561279296875, 0.94232177734375, 1.003082275390625, 1.0638427734375, 1.124603271484375, 1.18536376953125, 1.246124267578125, 1.306884765625, 1.367645263671875, 1.42840576171875, 1.489166259765625, 1.5499267578125, 1.610687255859375, 1.67144775390625, 1.732208251953125, 1.79296875]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_v": {"_type": "histogram", "values": [1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 2.0, 3.0, 3.0, 4.0, 0.0, 0.0, 2.0, 3.0, 8.0, 18.0, 14.0, 21.0, 16.0, 34.0, 40.0, 107.0, 185.0, 465.0, 1235.0, 4527.0, 69750.0, 8301943.0, 7289.0, 1734.0, 564.0, 263.0, 139.0, 63.0, 48.0, 29.0, 16.0, 7.0, 14.0, 13.0, 4.0, 13.0, 6.0, 2.0, 2.0, 0.0, 0.0, 2.0, 1.0, 1.0, 2.0, 5.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 3.0, 2.0], "bins": [-15.027771949768066, -14.511971473693848, -13.996170997619629, -13.48037052154541, -12.964570045471191, -12.448769569396973, -11.93297004699707, -11.417169570922852, -10.901369094848633, -10.385568618774414, -9.869768142700195, -9.353967666625977, -8.838167190551758, -8.322366714477539, -7.8065667152404785, -7.29076623916626, -6.774965286254883, -6.259164810180664, -5.743364334106445, -5.227563858032227, -4.711763381958008, -4.195962905883789, -3.6801629066467285, -3.1643624305725098, -2.648561954498291, -2.1327614784240723, -1.616961121559143, -1.1011607646942139, -0.5853602886199951, -0.06955981254577637, 0.4462404251098633, 0.962040901184082, 1.4778423309326172, 1.993642807006836, 2.5094432830810547, 3.0252435207366943, 3.541043996810913, 4.056844711303711, 4.5726447105407715, 5.08844518661499, 5.604245662689209, 6.120046138763428, 6.6358466148376465, 7.151646614074707, 7.667447090148926, 8.183247566223145, 8.699048042297363, 9.214848518371582, 9.7306489944458, 10.24644947052002, 10.762249946594238, 11.278050422668457, 11.793850898742676, 12.309651374816895, 12.825450897216797, 13.341251373291016, 13.857051849365234, 14.372852325439453, 14.888652801513672, 15.40445327758789, 15.92025375366211, 16.436054229736328, 16.951854705810547, 17.467655181884766, 17.983455657958984]}, "gradients/encoder.encoder.pos_conv_embed.conv.weight_g": {"_type": "histogram", "values": [3.0, 0.0, 0.0, 0.0, 2.0, 0.0, 0.0, 0.0, 0.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 2.0, 0.0, 1.0, 2.0, 1.0, 1.0, 1.0, 6.0, 4.0, 4.0, 1.0, 3.0, 2.0, 6.0, 1.0, 3.0, 2.0, 3.0, 5.0, 7.0, 4.0, 7.0, 6.0, 5.0, 5.0, 3.0, 3.0, 5.0, 4.0, 0.0, 1.0, 3.0, 5.0, 3.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0], "bins": [-14.410181045532227, -14.031996726989746, -13.653812408447266, -13.275628089904785, -12.897443771362305, -12.519259452819824, -12.141075134277344, -11.76289176940918, -11.384706497192383, -11.006522178649902, -10.628337860107422, -10.250153541564941, -9.871969223022461, -9.49378490447998, -9.1156005859375, -8.737417221069336, -8.359232902526855, -7.981048583984375, -7.6028642654418945, -7.224679946899414, -6.846495628356934, -6.468311309814453, -6.090127468109131, -5.71194314956665, -5.33375883102417, -4.9555745124816895, -4.577390193939209, -4.199206352233887, -3.821021795272827, -3.4428374767303467, -3.0646533966064453, -2.686469078063965, -2.308283805847168, -1.9300994873046875, -1.5519152879714966, -1.1737310886383057, -0.7955467700958252, -0.4173624515533447, -0.03917837142944336, 0.3390059471130371, 0.7171902656555176, 1.095374584197998, 1.473558783531189, 1.8517429828643799, 2.2299273014068604, 2.608111619949341, 2.986295700073242, 3.3644800186157227, 3.742664337158203, 4.120848655700684, 4.499032974243164, 4.8772172927856445, 5.255401611328125, 5.6335859298706055, 6.011769771575928, 6.389954090118408, 6.768138408660889, 7.146322727203369, 7.52450704574585, 7.902690887451172, 8.280875205993652, 8.659059524536133, 9.037243843078613, 9.415428161621094, 9.793612480163574]}, "gradients/encoder.feature_projection.projection.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 2.0, 1.0, 0.0, 2.0, 4.0, 0.0, 3.0, 3.0, 1.0, 8.0, 5.0, 5.0, 12.0, 21.0, 20.0, 48.0, 84.0, 158.0, 202.0, 464.0, 1050.0, 2784.0, 12009.0, 82892.0, 333055.0, 75621.0, 11199.0, 2689.0, 950.0, 437.0, 236.0, 141.0, 79.0, 36.0, 22.0, 15.0, 7.0, 7.0, 6.0, 0.0, 0.0, 2.0, 1.0, 1.0, 0.0, 0.0, 1.0], "bins": [-31.171875, -30.42041015625, -29.6689453125, -28.91748046875, -28.166015625, -27.41455078125, -26.6630859375, -25.91162109375, -25.16015625, -24.40869140625, -23.6572265625, -22.90576171875, -22.154296875, -21.40283203125, -20.6513671875, -19.89990234375, -19.1484375, -18.39697265625, -17.6455078125, -16.89404296875, -16.142578125, -15.39111328125, -14.6396484375, -13.88818359375, -13.13671875, -12.38525390625, -11.6337890625, -10.88232421875, -10.130859375, -9.37939453125, -8.6279296875, -7.87646484375, -7.125, -6.37353515625, -5.6220703125, -4.87060546875, -4.119140625, -3.36767578125, -2.6162109375, -1.86474609375, -1.11328125, -0.36181640625, 0.3896484375, 1.14111328125, 1.892578125, 2.64404296875, 3.3955078125, 4.14697265625, 4.8984375, 5.64990234375, 6.4013671875, 7.15283203125, 7.904296875, 8.65576171875, 9.4072265625, 10.15869140625, 10.91015625, 11.66162109375, 12.4130859375, 13.16455078125, 13.916015625, 14.66748046875, 15.4189453125, 16.17041015625, 16.921875]}, "gradients/encoder.feature_projection.projection.bias": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 2.0, 1.0, 2.0, 3.0, 0.0, 8.0, 9.0, 14.0, 10.0, 17.0, 26.0, 16.0, 33.0, 41.0, 66.0, 73.0, 91.0, 92.0, 80.0, 88.0, 68.0, 53.0, 51.0, 46.0, 31.0, 29.0, 14.0, 11.0, 19.0, 8.0, 6.0, 5.0, 3.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-3.439453125, -3.3560791015625, -3.272705078125, -3.1893310546875, -3.10595703125, -3.0225830078125, -2.939208984375, -2.8558349609375, -2.7724609375, -2.6890869140625, -2.605712890625, -2.5223388671875, -2.43896484375, -2.3555908203125, -2.272216796875, -2.1888427734375, -2.10546875, -2.0220947265625, -1.938720703125, -1.8553466796875, -1.77197265625, -1.6885986328125, -1.605224609375, -1.5218505859375, -1.4384765625, -1.3551025390625, -1.271728515625, -1.1883544921875, -1.10498046875, -1.0216064453125, -0.938232421875, -0.8548583984375, -0.771484375, -0.6881103515625, -0.604736328125, -0.5213623046875, -0.43798828125, -0.3546142578125, -0.271240234375, -0.1878662109375, -0.1044921875, -0.0211181640625, 0.062255859375, 0.1456298828125, 0.22900390625, 0.3123779296875, 0.395751953125, 0.4791259765625, 0.5625, 0.6458740234375, 0.729248046875, 0.8126220703125, 0.89599609375, 0.9793701171875, 1.062744140625, 1.1461181640625, 1.2294921875, 1.3128662109375, 1.396240234375, 1.4796142578125, 1.56298828125, 1.6463623046875, 1.729736328125, 1.8131103515625, 1.896484375]}, "gradients/encoder.feature_projection.layer_norm.weight": {"_type": "histogram", "values": [1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 0.0, 1.0, 1.0, 0.0, 0.0, 0.0, 0.0, 1.0, 4.0, 3.0, 2.0, 3.0, 7.0, 7.0, 8.0, 8.0, 4.0, 21.0, 18.0, 35.0, 33.0, 67.0, 69.0, 66.0, 63.0, 34.0, 22.0, 5.0, 10.0, 4.0, 2.0, 3.0, 3.0, 1.0, 1.0, 0.0, 2.0, 0.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-13.699359893798828, -13.20518970489502, -12.711020469665527, -12.216850280761719, -11.722681045532227, -11.228510856628418, -10.73434066772461, -10.240171432495117, -9.746002197265625, -9.251832008361816, -8.757662773132324, -8.263492584228516, -7.769323348999023, -7.275153160095215, -6.7809834480285645, -6.286813735961914, -5.7926435470581055, -5.298473834991455, -4.804304122924805, -4.310133934020996, -3.815964460372925, -3.3217947483062744, -2.827624797821045, -2.3334550857543945, -1.8392853736877441, -1.3451156616210938, -0.8509458303451538, -0.35677599906921387, 0.13739371299743652, 0.6315634250640869, 1.1257333755493164, 1.6199030876159668, 2.114072799682617, 2.6082425117492676, 3.102412223815918, 3.5965821743011475, 4.090751647949219, 4.584921836853027, 5.079091548919678, 5.573261260986328, 6.0674309730529785, 6.561600685119629, 7.055770397186279, 7.54994010925293, 8.044110298156738, 8.53827953338623, 9.032449722290039, 9.526618957519531, 10.02078914642334, 10.514959335327148, 11.00912857055664, 11.50329875946045, 11.997467994689941, 12.49163818359375, 12.985807418823242, 13.47997760772705, 13.97414779663086, 14.468317985534668, 14.96248722076416, 15.456657409667969, 15.950826644897461, 16.444995880126953, 16.939167022705078, 17.43333625793457, 17.927505493164062]}, "gradients/encoder.feature_projection.layer_norm.bias": {"_type": "histogram", "values": [1.0, 2.0, 1.0, 3.0, 2.0, 1.0, 1.0, 1.0, 0.0, 2.0, 1.0, 5.0, 7.0, 4.0, 5.0, 4.0, 10.0, 7.0, 19.0, 29.0, 51.0, 70.0, 87.0, 69.0, 54.0, 19.0, 8.0, 12.0, 5.0, 3.0, 2.0, 2.0, 2.0, 4.0, 4.0, 2.0, 1.0, 2.0, 1.0, 4.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 1.0, 0.0, 1.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 0.0, 1.0], "bins": [-9.68094539642334, -9.310079574584961, -8.939213752746582, -8.568347930908203, -8.197481155395508, -7.826615810394287, -7.45574951171875, -7.084883689880371, -6.714017868041992, -6.343152046203613, -5.972286224365234, -5.601419925689697, -5.230554103851318, -4.8596882820129395, -4.488821983337402, -4.117956161499023, -3.7470903396606445, -3.3762245178222656, -3.0053584575653076, -2.6344923973083496, -2.2636265754699707, -1.8927606344223022, -1.5218946933746338, -1.1510286331176758, -0.7801628112792969, -0.4092968702316284, -0.03843092918395996, 0.3324350118637085, 0.703300952911377, 1.0741668939590454, 1.4450328350067139, 1.8158988952636719, 2.186764717102051, 2.5576305389404297, 2.9284965991973877, 3.2993626594543457, 3.6702284812927246, 4.0410943031311035, 4.411960601806641, 4.7828264236450195, 5.153692245483398, 5.524558067321777, 5.895423889160156, 6.266290187835693, 6.637156009674072, 7.008021831512451, 7.378888130187988, 7.749753952026367, 8.120619773864746, 8.491485595703125, 8.862351417541504, 9.233217239379883, 9.604084014892578, 9.974949836730957, 10.345815658569336, 10.716681480407715, 11.087547302246094, 11.458413124084473, 11.829278945922852, 12.20014476776123, 12.57101058959961, 12.941877365112305, 13.312743186950684, 13.683609008789062, 14.054474830627441]}, "_wandb": {"runtime": 3721}} \ No newline at end of file